diff --git a/README.md b/README.md index 21e21c6294ec2e7cff22e189e086a3765ff27581..bdeeff679b5cf386a67c62b47b34c6a95c8a77e3 100644 --- a/README.md +++ b/README.md @@ -3,44 +3,31 @@ license: apache-2.0 tags: - generated_from_trainer model-index: -- name: bart-base-spelling-nl-1m +- name: bart-base-spelling-nl-2m results: [] --- -This model is a Dutch fine-tuned version of -[facebook/bart-base](https://huggingface.co/facebook/bart-base). + -It achieves the following results on the evaluation set: +# bart-base-spelling-nl-2m -- Loss: 0.0221 -- Cer: 0.0145 +This model is a fine-tuned version of [facebook/bart-base](https://huggingface.co/facebook/bart-base) on an unknown dataset. +It achieves the following results on the evaluation set: +- Loss: 0.0248 +- Cer: 0.0133 ## Model description -This is a text-to-text fine-tuned version of -[facebook/bart-base](https://huggingface.co/facebook/bart-base) -trained on spelling correction. It leans on the excellent work by -Oliver Guhr ([github](https://github.com/oliverguhr/spelling), -[huggingface](https://huggingface.co/oliverguhr/spelling-correction-english-base)). Training -was performed on an AWS EC2 instance (g5.xlarge) on a single GPU. +More information needed ## Intended uses & limitations -The intended use for this model is to be a component of the -[Valkuil.net](https://valkuil.net) context-sensitive spelling -checker. +More information needed ## Training and evaluation data -The model was trained on a Dutch dataset composed of 2,964,203 (nearly -3m) lines of text from three public Dutch sources, downloaded from the -[Opus corpus](https://opus.nlpl.eu/): - -- nl-europarlv7.1m.txt (1,000,000 lines) -- nl-opensubtitles2016.1m.txt (1,000,000 lines) -- nl-wikipedia.txt (964,203 lines) - -Together these texts comprise 45,308,056 tokens. +More information needed ## Training procedure @@ -61,190 +48,315 @@ The following hyperparameters were used during training: | Training Loss | Epoch | Step | Validation Loss | Cer | |:-------------:|:-----:|:------:|:---------------:|:------:| -| 0.2824 | 0.01 | 1000 | 0.2129 | 0.9219 | -| 0.1971 | 0.02 | 2000 | 0.1600 | 0.9217 | -| 0.171 | 0.03 | 3000 | 0.1273 | 0.9217 | -| 0.1586 | 0.04 | 4000 | 0.1110 | 0.9216 | -| 0.1288 | 0.05 | 5000 | 0.0991 | 0.9214 | -| 0.1338 | 0.06 | 6000 | 0.0910 | 0.9215 | -| 0.1279 | 0.08 | 7000 | 0.0831 | 0.9215 | -| 0.1147 | 0.09 | 8000 | 0.0789 | 0.9215 | -| 0.1091 | 0.1 | 9000 | 0.0769 | 0.9216 | -| 0.0935 | 0.11 | 10000 | 0.0700 | 0.9214 | -| 0.0963 | 0.12 | 11000 | 0.0678 | 0.9215 | -| 0.0969 | 0.13 | 12000 | 0.0654 | 0.9214 | -| 0.0957 | 0.14 | 13000 | 0.0627 | 0.9215 | -| 0.0886 | 0.15 | 14000 | 0.0644 | 0.9215 | -| 0.0911 | 0.16 | 15000 | 0.0604 | 0.9215 | -| 0.0955 | 0.17 | 16000 | 0.0595 | 0.9215 | -| 0.0875 | 0.18 | 17000 | 0.0587 | 0.9213 | -| 0.0879 | 0.19 | 18000 | 0.0576 | 0.9214 | -| 0.079 | 0.21 | 19000 | 0.0550 | 0.9213 | -| 0.0808 | 0.22 | 20000 | 0.0536 | 0.9215 | -| 0.0684 | 0.23 | 21000 | 0.0536 | 0.9214 | -| 0.0789 | 0.24 | 22000 | 0.0530 | 0.9214 | -| 0.088 | 0.25 | 23000 | 0.0524 | 0.9215 | -| 0.076 | 0.26 | 24000 | 0.0519 | 0.9214 | -| 0.0714 | 0.27 | 25000 | 0.0506 | 0.9213 | -| 0.0664 | 0.28 | 26000 | 0.0495 | 0.9213 | -| 0.0791 | 0.29 | 27000 | 0.0492 | 0.9215 | -| 0.0702 | 0.3 | 28000 | 0.0485 | 0.9215 | -| 0.0709 | 0.31 | 29000 | 0.0493 | 0.9213 | -| 0.0676 | 0.32 | 30000 | 0.0480 | 0.9214 | -| 0.0692 | 0.34 | 31000 | 0.0468 | 0.9215 | -| 0.0633 | 0.35 | 32000 | 0.0473 | 0.9213 | -| 0.0732 | 0.36 | 33000 | 0.0455 | 0.9213 | -| 0.0809 | 0.37 | 34000 | 0.0455 | 0.9214 | -| 0.0562 | 0.38 | 35000 | 0.0451 | 0.9214 | -| 0.0715 | 0.39 | 36000 | 0.0440 | 0.9214 | -| 0.0596 | 0.4 | 37000 | 0.0441 | 0.9214 | -| 0.0534 | 0.41 | 38000 | 0.0430 | 0.9213 | -| 0.0657 | 0.42 | 39000 | 0.0427 | 0.9214 | -| 0.0643 | 0.43 | 40000 | 0.0441 | 0.9212 | -| 0.0579 | 0.44 | 41000 | 0.0414 | 0.9213 | -| 0.0695 | 0.45 | 42000 | 0.0430 | 0.9212 | -| 0.0566 | 0.47 | 43000 | 0.0413 | 0.9212 | -| 0.0646 | 0.48 | 44000 | 0.0415 | 0.9213 | -| 0.0573 | 0.49 | 45000 | 0.0410 | 0.9212 | -| 0.0568 | 0.5 | 46000 | 0.0406 | 0.9213 | -| 0.065 | 0.51 | 47000 | 0.0405 | 0.9213 | -| 0.063 | 0.52 | 48000 | 0.0396 | 0.9213 | -| 0.0654 | 0.53 | 49000 | 0.0397 | 0.9213 | -| 0.0506 | 0.54 | 50000 | 0.0391 | 0.9212 | -| 0.0573 | 0.55 | 51000 | 0.0382 | 0.9213 | -| 0.0569 | 0.56 | 52000 | 0.0381 | 0.9214 | -| 0.0597 | 0.57 | 53000 | 0.0381 | 0.9212 | -| 0.0543 | 0.58 | 54000 | 0.0374 | 0.9213 | -| 0.057 | 0.59 | 55000 | 0.0381 | 0.9213 | -| 0.058 | 0.61 | 56000 | 0.0380 | 0.9212 | -| 0.0481 | 0.62 | 57000 | 0.0366 | 0.9213 | -| 0.0581 | 0.63 | 58000 | 0.0367 | 0.9212 | -| 0.0521 | 0.64 | 59000 | 0.0363 | 0.9213 | -| 0.0543 | 0.65 | 60000 | 0.0358 | 0.9212 | -| 0.0594 | 0.66 | 61000 | 0.0359 | 0.9214 | -| 0.0479 | 0.67 | 62000 | 0.0354 | 0.9212 | -| 0.0512 | 0.68 | 63000 | 0.0357 | 0.9211 | -| 0.0488 | 0.69 | 64000 | 0.0341 | 0.9213 | -| 0.0485 | 0.7 | 65000 | 0.0346 | 0.9213 | -| 0.052 | 0.71 | 66000 | 0.0343 | 0.9213 | -| 0.0427 | 0.72 | 67000 | 0.0341 | 0.9212 | -| 0.0502 | 0.74 | 68000 | 0.0343 | 0.9211 | -| 0.0434 | 0.75 | 69000 | 0.0337 | 0.9213 | -| 0.0579 | 0.76 | 70000 | 0.0337 | 0.9213 | -| 0.0534 | 0.77 | 71000 | 0.0330 | 0.9212 | -| 0.0437 | 0.78 | 72000 | 0.0334 | 0.9212 | -| 0.05 | 0.79 | 73000 | 0.0332 | 0.9213 | -| 0.043 | 0.8 | 74000 | 0.0329 | 0.9212 | -| 0.0554 | 0.81 | 75000 | 0.0323 | 0.9212 | -| 0.0418 | 0.82 | 76000 | 0.0326 | 0.9212 | -| 0.0461 | 0.83 | 77000 | 0.0326 | 0.9212 | -| 0.0435 | 0.84 | 78000 | 0.0319 | 0.9212 | -| 0.0453 | 0.85 | 79000 | 0.0317 | 0.9212 | -| 0.0434 | 0.87 | 80000 | 0.0318 | 0.9212 | -| 0.0466 | 0.88 | 81000 | 0.0321 | 0.9212 | -| 0.0461 | 0.89 | 82000 | 0.0316 | 0.9212 | -| 0.0381 | 0.9 | 83000 | 0.0311 | 0.9213 | -| 0.0455 | 0.91 | 84000 | 0.0306 | 0.9212 | -| 0.0446 | 0.92 | 85000 | 0.0315 | 0.9212 | -| 0.0532 | 0.93 | 86000 | 0.0305 | 0.9212 | -| 0.052 | 0.94 | 87000 | 0.0305 | 0.9212 | -| 0.0353 | 0.95 | 88000 | 0.0305 | 0.9211 | -| 0.0469 | 0.96 | 89000 | 0.0304 | 0.9212 | -| 0.0387 | 0.97 | 90000 | 0.0303 | 0.9212 | -| 0.0478 | 0.98 | 91000 | 0.0302 | 0.9212 | -| 0.0395 | 1.0 | 92000 | 0.0299 | 0.9212 | -| 0.0387 | 1.01 | 93000 | 0.0290 | 0.9212 | -| 0.0356 | 1.02 | 94000 | 0.0287 | 0.9212 | -| 0.0381 | 1.03 | 95000 | 0.0295 | 0.9212 | -| 0.0386 | 1.04 | 96000 | 0.0284 | 0.9213 | -| 0.038 | 1.05 | 97000 | 0.0293 | 0.9212 | -| 0.0346 | 1.06 | 98000 | 0.0284 | 0.9212 | -| 0.0357 | 1.07 | 99000 | 0.0285 | 0.9212 | -| 0.0446 | 1.08 | 100000 | 0.0287 | 0.9211 | -| 0.0424 | 1.09 | 101000 | 0.0284 | 0.9213 | -| 0.0357 | 1.1 | 102000 | 0.0282 | 0.9211 | -| 0.0413 | 1.11 | 103000 | 0.0282 | 0.9211 | -| 0.0348 | 1.12 | 104000 | 0.0279 | 0.9212 | -| 0.0363 | 1.14 | 105000 | 0.0279 | 0.9212 | -| 0.0329 | 1.15 | 106000 | 0.0282 | 0.9211 | -| 0.0438 | 1.16 | 107000 | 0.0279 | 0.9212 | -| 0.037 | 1.17 | 108000 | 0.0274 | 0.9212 | -| 0.0311 | 1.18 | 109000 | 0.0278 | 0.9212 | -| 0.0297 | 1.19 | 110000 | 0.0275 | 0.9212 | -| 0.0323 | 1.2 | 111000 | 0.0271 | 0.9212 | -| 0.0387 | 1.21 | 112000 | 0.0275 | 0.9212 | -| 0.0366 | 1.22 | 113000 | 0.0269 | 0.9211 | -| 0.0345 | 1.23 | 114000 | 0.0269 | 0.9211 | -| 0.0389 | 1.24 | 115000 | 0.0261 | 0.9211 | -| 0.0381 | 1.25 | 116000 | 0.0265 | 0.9211 | -| 0.0324 | 1.27 | 117000 | 0.0265 | 0.9211 | -| 0.0345 | 1.28 | 118000 | 0.0260 | 0.9212 | -| 0.032 | 1.29 | 119000 | 0.0260 | 0.9211 | -| 0.0359 | 1.3 | 120000 | 0.0259 | 0.9211 | -| 0.0347 | 1.31 | 121000 | 0.0259 | 0.9212 | -| 0.0334 | 1.32 | 122000 | 0.0253 | 0.9211 | -| 0.0297 | 1.33 | 123000 | 0.0260 | 0.9210 | -| 0.0333 | 1.34 | 124000 | 0.0251 | 0.9212 | -| 0.0303 | 1.35 | 125000 | 0.0254 | 0.9211 | -| 0.0292 | 1.36 | 126000 | 0.0250 | 0.9211 | -| 0.0318 | 1.37 | 127000 | 0.0250 | 0.9212 | -| 0.0284 | 1.38 | 128000 | 0.0250 | 0.9211 | -| 0.0311 | 1.4 | 129000 | 0.0248 | 0.9211 | -| 0.0323 | 1.41 | 130000 | 0.0248 | 0.9211 | -| 0.0253 | 1.42 | 131000 | 0.0244 | 0.9211 | -| 0.0287 | 1.43 | 132000 | 0.0246 | 0.9211 | -| 0.0351 | 1.44 | 133000 | 0.0240 | 0.9212 | -| 0.0363 | 1.45 | 134000 | 0.0238 | 0.9211 | -| 0.0264 | 1.46 | 135000 | 0.0240 | 0.9211 | -| 0.0304 | 1.47 | 136000 | 0.0242 | 0.9211 | -| 0.0325 | 1.48 | 137000 | 0.0236 | 0.9212 | -| 0.033 | 1.49 | 138000 | 0.0239 | 0.9211 | -| 0.03 | 1.5 | 139000 | 0.0236 | 0.9211 | -| 0.0256 | 1.51 | 140000 | 0.0235 | 0.9211 | -| 0.0312 | 1.53 | 141000 | 0.0237 | 0.9211 | -| 0.0302 | 1.54 | 142000 | 0.0237 | 0.9211 | -| 0.0227 | 1.55 | 143000 | 0.0232 | 0.9212 | -| 0.0261 | 1.56 | 144000 | 0.0232 | 0.9211 | -| 0.0269 | 1.57 | 145000 | 0.0227 | 0.9211 | -| 0.0312 | 1.58 | 146000 | 0.0228 | 0.9211 | -| 0.0298 | 1.59 | 147000 | 0.0231 | 0.9211 | -| 0.0281 | 1.6 | 148000 | 0.0226 | 0.9212 | -| 0.029 | 1.61 | 149000 | 0.0227 | 0.9211 | -| 0.0324 | 1.62 | 150000 | 0.0225 | 0.9211 | -| 0.0251 | 1.63 | 151000 | 0.0223 | 0.9212 | -| 0.0278 | 1.64 | 152000 | 0.0223 | 0.9211 | -| 0.0284 | 1.65 | 153000 | 0.0224 | 0.9210 | -| 0.0254 | 1.67 | 154000 | 0.0220 | 0.9211 | -| 0.028 | 1.68 | 155000 | 0.0221 | 0.9210 | -| 0.0247 | 1.69 | 156000 | 0.0222 | 0.9211 | -| 0.0295 | 1.7 | 157000 | 0.0218 | 0.9211 | -| 0.0283 | 1.71 | 158000 | 0.0216 | 0.9211 | -| 0.0245 | 1.72 | 159000 | 0.0218 | 0.9211 | -| 0.0249 | 1.73 | 160000 | 0.0216 | 0.9211 | -| 0.0264 | 1.74 | 161000 | 0.0215 | 0.9211 | -| 0.0264 | 1.75 | 162000 | 0.0213 | 0.9211 | -| 0.0306 | 1.76 | 163000 | 0.0212 | 0.9211 | -| 0.0242 | 1.77 | 164000 | 0.0212 | 0.9212 | -| 0.0247 | 1.78 | 165000 | 0.0211 | 0.9211 | -| 0.0227 | 1.8 | 166000 | 0.0211 | 0.9210 | -| 0.0252 | 1.81 | 167000 | 0.0211 | 0.9211 | -| 0.0269 | 1.82 | 168000 | 0.0208 | 0.9211 | -| 0.0256 | 1.83 | 169000 | 0.0209 | 0.9211 | -| 0.0234 | 1.84 | 170000 | 0.0207 | 0.9211 | -| 0.0258 | 1.85 | 171000 | 0.0207 | 0.9211 | -| 0.0282 | 1.86 | 172000 | 0.0205 | 0.9210 | -| 0.0282 | 1.87 | 173000 | 0.0206 | 0.9210 | -| 0.0234 | 1.88 | 174000 | 0.0205 | 0.9211 | -| 0.0222 | 1.89 | 175000 | 0.0204 | 0.9211 | -| 0.0237 | 1.9 | 176000 | 0.0203 | 0.9211 | -| 0.0299 | 1.91 | 177000 | 0.0203 | 0.9211 | -| 0.0246 | 1.93 | 178000 | 0.0203 | 0.9211 | -| 0.0227 | 1.94 | 179000 | 0.0204 | 0.9211 | -| 0.0253 | 1.95 | 180000 | 0.0202 | 0.9211 | -| 0.0197 | 1.96 | 181000 | 0.0202 | 0.9211 | -| 0.0231 | 1.97 | 182000 | 0.0200 | 0.9211 | -| 0.0244 | 1.98 | 183000 | 0.0201 | 0.9211 | -| 0.0259 | 1.99 | 184000 | 0.0200 | 0.9211 | +| 0.277 | 0.01 | 1000 | 0.2337 | 0.9206 | +| 0.2349 | 0.01 | 2000 | 0.1757 | 0.9204 | +| 0.1929 | 0.02 | 3000 | 0.1482 | 0.9205 | +| 0.1686 | 0.03 | 4000 | 0.1314 | 0.9202 | +| 0.1435 | 0.03 | 5000 | 0.1175 | 0.9203 | +| 0.1505 | 0.04 | 6000 | 0.1086 | 0.9204 | +| 0.1438 | 0.05 | 7000 | 0.0984 | 0.9203 | +| 0.1362 | 0.05 | 8000 | 0.0941 | 0.9203 | +| 0.1207 | 0.06 | 9000 | 0.0890 | 0.9201 | +| 0.108 | 0.06 | 10000 | 0.0850 | 0.9203 | +| 0.1142 | 0.07 | 11000 | 0.0798 | 0.9201 | +| 0.1081 | 0.08 | 12000 | 0.0757 | 0.9203 | +| 0.0987 | 0.08 | 13000 | 0.0739 | 0.9201 | +| 0.1103 | 0.09 | 14000 | 0.0728 | 0.9202 | +| 0.0961 | 0.1 | 15000 | 0.0678 | 0.9202 | +| 0.0976 | 0.1 | 16000 | 0.0672 | 0.9202 | +| 0.0949 | 0.11 | 17000 | 0.0640 | 0.9202 | +| 0.1026 | 0.12 | 18000 | 0.0635 | 0.9203 | +| 0.1049 | 0.12 | 19000 | 0.0618 | 0.9201 | +| 0.0893 | 0.13 | 20000 | 0.0617 | 0.9201 | +| 0.0834 | 0.14 | 21000 | 0.0582 | 0.9202 | +| 0.0815 | 0.14 | 22000 | 0.0584 | 0.9202 | +| 0.0801 | 0.15 | 23000 | 0.0606 | 0.9202 | +| 0.0764 | 0.15 | 24000 | 0.0591 | 0.9201 | +| 0.0779 | 0.16 | 25000 | 0.0556 | 0.9201 | +| 0.0839 | 0.17 | 26000 | 0.0548 | 0.9202 | +| 0.0811 | 0.17 | 27000 | 0.0532 | 0.9202 | +| 0.0817 | 0.18 | 28000 | 0.0537 | 0.9202 | +| 0.0809 | 0.19 | 29000 | 0.0527 | 0.9201 | +| 0.0812 | 0.19 | 30000 | 0.0512 | 0.9202 | +| 0.0741 | 0.2 | 31000 | 0.0507 | 0.9201 | +| 0.0764 | 0.21 | 32000 | 0.0510 | 0.9201 | +| 0.0741 | 0.21 | 33000 | 0.0494 | 0.9201 | +| 0.0736 | 0.22 | 34000 | 0.0499 | 0.9201 | +| 0.0674 | 0.23 | 35000 | 0.0486 | 0.9202 | +| 0.0775 | 0.23 | 36000 | 0.0489 | 0.9201 | +| 0.0772 | 0.24 | 37000 | 0.0484 | 0.9202 | +| 0.073 | 0.25 | 38000 | 0.0487 | 0.9202 | +| 0.0675 | 0.25 | 39000 | 0.0474 | 0.9200 | +| 0.0739 | 0.26 | 40000 | 0.0460 | 0.9201 | +| 0.0694 | 0.26 | 41000 | 0.0478 | 0.9200 | +| 0.0659 | 0.27 | 42000 | 0.0451 | 0.9201 | +| 0.0638 | 0.28 | 43000 | 0.0449 | 0.9200 | +| 0.0704 | 0.28 | 44000 | 0.0447 | 0.9201 | +| 0.0657 | 0.29 | 45000 | 0.0463 | 0.9201 | +| 0.0649 | 0.3 | 46000 | 0.0445 | 0.9200 | +| 0.069 | 0.3 | 47000 | 0.0444 | 0.9201 | +| 0.0655 | 0.31 | 48000 | 0.0433 | 0.9200 | +| 0.0592 | 0.32 | 49000 | 0.0439 | 0.9201 | +| 0.0623 | 0.32 | 50000 | 0.0433 | 0.9201 | +| 0.074 | 0.33 | 51000 | 0.0419 | 0.9202 | +| 0.0602 | 0.34 | 52000 | 0.0410 | 0.9202 | +| 0.0672 | 0.34 | 53000 | 0.0418 | 0.9202 | +| 0.063 | 0.35 | 54000 | 0.0425 | 0.9200 | +| 0.0609 | 0.35 | 55000 | 0.0407 | 0.9200 | +| 0.0583 | 0.36 | 56000 | 0.0399 | 0.9200 | +| 0.0602 | 0.37 | 57000 | 0.0400 | 0.9201 | +| 0.0707 | 0.37 | 58000 | 0.0399 | 0.9200 | +| 0.0628 | 0.38 | 59000 | 0.0401 | 0.9201 | +| 0.0586 | 0.39 | 60000 | 0.0390 | 0.9201 | +| 0.061 | 0.39 | 61000 | 0.0403 | 0.9199 | +| 0.0611 | 0.4 | 62000 | 0.0388 | 0.9201 | +| 0.0569 | 0.41 | 63000 | 0.0379 | 0.9200 | +| 0.0577 | 0.41 | 64000 | 0.0382 | 0.9200 | +| 0.061 | 0.42 | 65000 | 0.0390 | 0.9202 | +| 0.0605 | 0.43 | 66000 | 0.0381 | 0.9199 | +| 0.0566 | 0.43 | 67000 | 0.0382 | 0.9200 | +| 0.0616 | 0.44 | 68000 | 0.0380 | 0.9200 | +| 0.0666 | 0.45 | 69000 | 0.0381 | 0.9201 | +| 0.052 | 0.45 | 70000 | 0.0373 | 0.9200 | +| 0.0576 | 0.46 | 71000 | 0.0376 | 0.9200 | +| 0.0529 | 0.46 | 72000 | 0.0365 | 0.9200 | +| 0.0504 | 0.47 | 73000 | 0.0371 | 0.9201 | +| 0.0499 | 0.48 | 74000 | 0.0373 | 0.9200 | +| 0.0578 | 0.48 | 75000 | 0.0367 | 0.9200 | +| 0.0545 | 0.49 | 76000 | 0.0356 | 0.9200 | +| 0.0527 | 0.5 | 77000 | 0.0358 | 0.9200 | +| 0.0464 | 0.5 | 78000 | 0.0354 | 0.9201 | +| 0.0546 | 0.51 | 79000 | 0.0354 | 0.9200 | +| 0.0536 | 0.52 | 80000 | 0.0346 | 0.9200 | +| 0.0568 | 0.52 | 81000 | 0.0355 | 0.9199 | +| 0.0486 | 0.53 | 82000 | 0.0346 | 0.9199 | +| 0.0571 | 0.54 | 83000 | 0.0338 | 0.9200 | +| 0.0526 | 0.54 | 84000 | 0.0339 | 0.9200 | +| 0.0485 | 0.55 | 85000 | 0.0338 | 0.9200 | +| 0.0489 | 0.56 | 86000 | 0.0345 | 0.9199 | +| 0.0473 | 0.56 | 87000 | 0.0338 | 0.9201 | +| 0.0449 | 0.57 | 88000 | 0.0334 | 0.9199 | +| 0.0516 | 0.57 | 89000 | 0.0331 | 0.9199 | +| 0.0537 | 0.58 | 90000 | 0.0331 | 0.9199 | +| 0.0477 | 0.59 | 91000 | 0.0326 | 0.9200 | +| 0.046 | 0.59 | 92000 | 0.0325 | 0.9201 | +| 0.0545 | 0.6 | 93000 | 0.0326 | 0.9200 | +| 0.0473 | 0.61 | 94000 | 0.0327 | 0.9201 | +| 0.0558 | 0.61 | 95000 | 0.0324 | 0.9199 | +| 0.0428 | 0.62 | 96000 | 0.0317 | 0.9200 | +| 0.0596 | 0.63 | 97000 | 0.0314 | 0.9200 | +| 0.0449 | 0.63 | 98000 | 0.0322 | 0.9200 | +| 0.041 | 0.64 | 99000 | 0.0314 | 0.9199 | +| 0.0464 | 0.65 | 100000 | 0.0319 | 0.9200 | +| 0.0519 | 0.65 | 101000 | 0.0301 | 0.9199 | +| 0.0417 | 0.66 | 102000 | 0.0305 | 0.9199 | +| 0.0456 | 0.66 | 103000 | 0.0308 | 0.9199 | +| 0.046 | 0.67 | 104000 | 0.0315 | 0.9198 | +| 0.0462 | 0.68 | 105000 | 0.0306 | 0.9199 | +| 0.0478 | 0.68 | 106000 | 0.0306 | 0.9199 | +| 0.0456 | 0.69 | 107000 | 0.0308 | 0.9199 | +| 0.0433 | 0.7 | 108000 | 0.0302 | 0.9200 | +| 0.0498 | 0.7 | 109000 | 0.0296 | 0.9200 | +| 0.0438 | 0.71 | 110000 | 0.0300 | 0.9200 | +| 0.0394 | 0.72 | 111000 | 0.0299 | 0.9198 | +| 0.0451 | 0.72 | 112000 | 0.0297 | 0.9200 | +| 0.0413 | 0.73 | 113000 | 0.0295 | 0.9199 | +| 0.0461 | 0.74 | 114000 | 0.0301 | 0.9198 | +| 0.0501 | 0.74 | 115000 | 0.0296 | 0.9199 | +| 0.0387 | 0.75 | 116000 | 0.0293 | 0.9200 | +| 0.0384 | 0.76 | 117000 | 0.0293 | 0.9199 | +| 0.0492 | 0.76 | 118000 | 0.0291 | 0.9199 | +| 0.0415 | 0.77 | 119000 | 0.0288 | 0.9200 | +| 0.0435 | 0.77 | 120000 | 0.0286 | 0.9199 | +| 0.0423 | 0.78 | 121000 | 0.0284 | 0.9198 | +| 0.0437 | 0.79 | 122000 | 0.0286 | 0.9199 | +| 0.0512 | 0.79 | 123000 | 0.0285 | 0.9200 | +| 0.0427 | 0.8 | 124000 | 0.0285 | 0.9199 | +| 0.0461 | 0.81 | 125000 | 0.0287 | 0.9199 | +| 0.0433 | 0.81 | 126000 | 0.0290 | 0.9198 | +| 0.0386 | 0.82 | 127000 | 0.0283 | 0.9199 | +| 0.0407 | 0.83 | 128000 | 0.0282 | 0.9199 | +| 0.0466 | 0.83 | 129000 | 0.0276 | 0.9199 | +| 0.048 | 0.84 | 130000 | 0.0278 | 0.9201 | +| 0.046 | 0.85 | 131000 | 0.0279 | 0.9199 | +| 0.0431 | 0.85 | 132000 | 0.0270 | 0.9199 | +| 0.047 | 0.86 | 133000 | 0.0272 | 0.9199 | +| 0.0466 | 0.86 | 134000 | 0.0266 | 0.9199 | +| 0.04 | 0.87 | 135000 | 0.0267 | 0.9199 | +| 0.038 | 0.88 | 136000 | 0.0271 | 0.9199 | +| 0.0382 | 0.88 | 137000 | 0.0271 | 0.9199 | +| 0.0422 | 0.89 | 138000 | 0.0265 | 0.9199 | +| 0.0464 | 0.9 | 139000 | 0.0265 | 0.9200 | +| 0.0372 | 0.9 | 140000 | 0.0270 | 0.9200 | +| 0.0381 | 0.91 | 141000 | 0.0266 | 0.9199 | +| 0.0359 | 0.92 | 142000 | 0.0267 | 0.9198 | +| 0.0368 | 0.92 | 143000 | 0.0270 | 0.9199 | +| 0.0365 | 0.93 | 144000 | 0.0266 | 0.9199 | +| 0.0413 | 0.94 | 145000 | 0.0268 | 0.9199 | +| 0.0383 | 0.94 | 146000 | 0.0261 | 0.9199 | +| 0.0396 | 0.95 | 147000 | 0.0259 | 0.9199 | +| 0.0405 | 0.96 | 148000 | 0.0260 | 0.9199 | +| 0.0433 | 0.96 | 149000 | 0.0258 | 0.9199 | +| 0.0378 | 0.97 | 150000 | 0.0260 | 0.9200 | +| 0.0337 | 0.97 | 151000 | 0.0258 | 0.9199 | +| 0.0456 | 0.98 | 152000 | 0.0254 | 0.9199 | +| 0.0355 | 0.99 | 153000 | 0.0256 | 0.9199 | +| 0.0396 | 0.99 | 154000 | 0.0253 | 0.9199 | +| 0.0353 | 1.0 | 155000 | 0.0256 | 0.9199 | +| 0.036 | 1.01 | 156000 | 0.0253 | 0.9200 | +| 0.0345 | 1.01 | 157000 | 0.0254 | 0.9199 | +| 0.0321 | 1.02 | 158000 | 0.0248 | 0.9198 | +| 0.0366 | 1.03 | 159000 | 0.0252 | 0.9200 | +| 0.0298 | 1.03 | 160000 | 0.0254 | 0.9198 | +| 0.0316 | 1.04 | 161000 | 0.0250 | 0.9199 | +| 0.0322 | 1.05 | 162000 | 0.0243 | 0.9199 | +| 0.0313 | 1.05 | 163000 | 0.0246 | 0.9198 | +| 0.0329 | 1.06 | 164000 | 0.0247 | 0.9200 | +| 0.0393 | 1.06 | 165000 | 0.0248 | 0.9198 | +| 0.0352 | 1.07 | 166000 | 0.0243 | 0.9198 | +| 0.0319 | 1.08 | 167000 | 0.0244 | 0.9199 | +| 0.0315 | 1.08 | 168000 | 0.0250 | 0.9198 | +| 0.0345 | 1.09 | 169000 | 0.0243 | 0.9199 | +| 0.0341 | 1.1 | 170000 | 0.0247 | 0.9199 | +| 0.0317 | 1.1 | 171000 | 0.0241 | 0.9199 | +| 0.0313 | 1.11 | 172000 | 0.0245 | 0.9199 | +| 0.033 | 1.12 | 173000 | 0.0237 | 0.9199 | +| 0.0339 | 1.12 | 174000 | 0.0237 | 0.9199 | +| 0.0319 | 1.13 | 175000 | 0.0240 | 0.9199 | +| 0.0391 | 1.14 | 176000 | 0.0241 | 0.9199 | +| 0.0325 | 1.14 | 177000 | 0.0239 | 0.9200 | +| 0.0295 | 1.15 | 178000 | 0.0240 | 0.9199 | +| 0.0288 | 1.16 | 179000 | 0.0232 | 0.9199 | +| 0.0347 | 1.16 | 180000 | 0.0234 | 0.9199 | +| 0.029 | 1.17 | 181000 | 0.0234 | 0.9198 | +| 0.0305 | 1.17 | 182000 | 0.0231 | 0.9199 | +| 0.0454 | 1.18 | 183000 | 0.0231 | 0.9200 | +| 0.0339 | 1.19 | 184000 | 0.0234 | 0.9199 | +| 0.0375 | 1.19 | 185000 | 0.0229 | 0.9199 | +| 0.0351 | 1.2 | 186000 | 0.0227 | 0.9199 | +| 0.0305 | 1.21 | 187000 | 0.0230 | 0.9199 | +| 0.0376 | 1.21 | 188000 | 0.0228 | 0.9199 | +| 0.0338 | 1.22 | 189000 | 0.0225 | 0.9200 | +| 0.0315 | 1.23 | 190000 | 0.0229 | 0.9199 | +| 0.0369 | 1.23 | 191000 | 0.0229 | 0.9199 | +| 0.0288 | 1.24 | 192000 | 0.0227 | 0.9199 | +| 0.0344 | 1.25 | 193000 | 0.0225 | 0.9199 | +| 0.0283 | 1.25 | 194000 | 0.0221 | 0.9199 | +| 0.0377 | 1.26 | 195000 | 0.0225 | 0.9198 | +| 0.0395 | 1.27 | 196000 | 0.0225 | 0.9199 | +| 0.0268 | 1.27 | 197000 | 0.0224 | 0.9199 | +| 0.032 | 1.28 | 198000 | 0.0222 | 0.9199 | +| 0.0328 | 1.28 | 199000 | 0.0221 | 0.9199 | +| 0.0278 | 1.29 | 200000 | 0.0220 | 0.9198 | +| 0.029 | 1.3 | 201000 | 0.0221 | 0.9199 | +| 0.0319 | 1.3 | 202000 | 0.0218 | 0.9199 | +| 0.0422 | 1.31 | 203000 | 0.0220 | 0.9199 | +| 0.0301 | 1.32 | 204000 | 0.0215 | 0.9198 | +| 0.0293 | 1.32 | 205000 | 0.0217 | 0.9198 | +| 0.0347 | 1.33 | 206000 | 0.0216 | 0.9199 | +| 0.0288 | 1.34 | 207000 | 0.0215 | 0.9199 | +| 0.0264 | 1.34 | 208000 | 0.0216 | 0.9199 | +| 0.0341 | 1.35 | 209000 | 0.0214 | 0.9199 | +| 0.029 | 1.36 | 210000 | 0.0213 | 0.9199 | +| 0.0281 | 1.36 | 211000 | 0.0218 | 0.9198 | +| 0.033 | 1.37 | 212000 | 0.0212 | 0.9199 | +| 0.0348 | 1.37 | 213000 | 0.0211 | 0.9199 | +| 0.0291 | 1.38 | 214000 | 0.0214 | 0.9199 | +| 0.0353 | 1.39 | 215000 | 0.0212 | 0.9199 | +| 0.0324 | 1.39 | 216000 | 0.0209 | 0.9199 | +| 0.0342 | 1.4 | 217000 | 0.0209 | 0.9199 | +| 0.0293 | 1.41 | 218000 | 0.0212 | 0.9199 | +| 0.0281 | 1.41 | 219000 | 0.0209 | 0.9199 | +| 0.0286 | 1.42 | 220000 | 0.0209 | 0.9198 | +| 0.0297 | 1.43 | 221000 | 0.0205 | 0.9200 | +| 0.0256 | 1.43 | 222000 | 0.0207 | 0.9199 | +| 0.0261 | 1.44 | 223000 | 0.0209 | 0.9198 | +| 0.0274 | 1.45 | 224000 | 0.0204 | 0.9199 | +| 0.0343 | 1.45 | 225000 | 0.0201 | 0.9199 | +| 0.0249 | 1.46 | 226000 | 0.0204 | 0.9199 | +| 0.0267 | 1.47 | 227000 | 0.0202 | 0.9199 | +| 0.0264 | 1.47 | 228000 | 0.0202 | 0.9199 | +| 0.031 | 1.48 | 229000 | 0.0201 | 0.9199 | +| 0.0273 | 1.48 | 230000 | 0.0199 | 0.9199 | +| 0.024 | 1.49 | 231000 | 0.0199 | 0.9199 | +| 0.0295 | 1.5 | 232000 | 0.0198 | 0.9199 | +| 0.0281 | 1.5 | 233000 | 0.0196 | 0.9199 | +| 0.0243 | 1.51 | 234000 | 0.0195 | 0.9198 | +| 0.0258 | 1.52 | 235000 | 0.0197 | 0.9199 | +| 0.0272 | 1.52 | 236000 | 0.0196 | 0.9198 | +| 0.0261 | 1.53 | 237000 | 0.0198 | 0.9199 | +| 0.0222 | 1.54 | 238000 | 0.0198 | 0.9199 | +| 0.0259 | 1.54 | 239000 | 0.0195 | 0.9199 | +| 0.0317 | 1.55 | 240000 | 0.0194 | 0.9199 | +| 0.0266 | 1.56 | 241000 | 0.0191 | 0.9199 | +| 0.0272 | 1.56 | 242000 | 0.0193 | 0.9199 | +| 0.0236 | 1.57 | 243000 | 0.0194 | 0.9199 | +| 0.0266 | 1.57 | 244000 | 0.0193 | 0.9198 | +| 0.027 | 1.58 | 245000 | 0.0195 | 0.9199 | +| 0.0257 | 1.59 | 246000 | 0.0192 | 0.9199 | +| 0.0276 | 1.59 | 247000 | 0.0190 | 0.9199 | +| 0.0238 | 1.6 | 248000 | 0.0188 | 0.9199 | +| 0.0301 | 1.61 | 249000 | 0.0188 | 0.9199 | +| 0.0273 | 1.61 | 250000 | 0.0189 | 0.9199 | +| 0.0246 | 1.62 | 251000 | 0.0187 | 0.9198 | +| 0.0309 | 1.63 | 252000 | 0.0187 | 0.9198 | +| 0.0237 | 1.63 | 253000 | 0.0188 | 0.9199 | +| 0.0234 | 1.64 | 254000 | 0.0184 | 0.9198 | +| 0.0246 | 1.65 | 255000 | 0.0186 | 0.9198 | +| 0.0213 | 1.65 | 256000 | 0.0182 | 0.9199 | +| 0.0251 | 1.66 | 257000 | 0.0182 | 0.9198 | +| 0.0236 | 1.67 | 258000 | 0.0184 | 0.9198 | +| 0.0276 | 1.67 | 259000 | 0.0185 | 0.9198 | +| 0.0233 | 1.68 | 260000 | 0.0182 | 0.9199 | +| 0.0205 | 1.68 | 261000 | 0.0183 | 0.9198 | +| 0.0253 | 1.69 | 262000 | 0.0181 | 0.9198 | +| 0.0221 | 1.7 | 263000 | 0.0180 | 0.9198 | +| 0.0228 | 1.7 | 264000 | 0.0182 | 0.9199 | +| 0.0209 | 1.71 | 265000 | 0.0181 | 0.9198 | +| 0.0319 | 1.72 | 266000 | 0.0179 | 0.9199 | +| 0.0236 | 1.72 | 267000 | 0.0178 | 0.9199 | +| 0.029 | 1.73 | 268000 | 0.0179 | 0.9198 | +| 0.0233 | 1.74 | 269000 | 0.0178 | 0.9198 | +| 0.0248 | 1.74 | 270000 | 0.0176 | 0.9198 | +| 0.0211 | 1.75 | 271000 | 0.0177 | 0.9198 | +| 0.0257 | 1.76 | 272000 | 0.0177 | 0.9198 | +| 0.0247 | 1.76 | 273000 | 0.0175 | 0.9199 | +| 0.0323 | 1.77 | 274000 | 0.0176 | 0.9199 | +| 0.0236 | 1.77 | 275000 | 0.0175 | 0.9198 | +| 0.0202 | 1.78 | 276000 | 0.0176 | 0.9198 | +| 0.0318 | 1.79 | 277000 | 0.0174 | 0.9199 | +| 0.0206 | 1.79 | 278000 | 0.0175 | 0.9198 | +| 0.0245 | 1.8 | 279000 | 0.0174 | 0.9199 | +| 0.0177 | 1.81 | 280000 | 0.0174 | 0.9199 | +| 0.0268 | 1.81 | 281000 | 0.0174 | 0.9199 | +| 0.0209 | 1.82 | 282000 | 0.0172 | 0.9199 | +| 0.0248 | 1.83 | 283000 | 0.0171 | 0.9198 | +| 0.0205 | 1.83 | 284000 | 0.0173 | 0.9198 | +| 0.0231 | 1.84 | 285000 | 0.0172 | 0.9199 | +| 0.0278 | 1.85 | 286000 | 0.0171 | 0.9198 | +| 0.0244 | 1.85 | 287000 | 0.0171 | 0.9198 | +| 0.0223 | 1.86 | 288000 | 0.0169 | 0.9198 | +| 0.0285 | 1.87 | 289000 | 0.0168 | 0.9198 | +| 0.0223 | 1.87 | 290000 | 0.0169 | 0.9198 | +| 0.0231 | 1.88 | 291000 | 0.0169 | 0.9198 | +| 0.0192 | 1.88 | 292000 | 0.0169 | 0.9198 | +| 0.0234 | 1.89 | 293000 | 0.0168 | 0.9198 | +| 0.0223 | 1.9 | 294000 | 0.0168 | 0.9198 | +| 0.0255 | 1.9 | 295000 | 0.0168 | 0.9198 | +| 0.0248 | 1.91 | 296000 | 0.0166 | 0.9198 | +| 0.0216 | 1.92 | 297000 | 0.0166 | 0.9198 | +| 0.0219 | 1.92 | 298000 | 0.0167 | 0.9198 | +| 0.0196 | 1.93 | 299000 | 0.0167 | 0.9198 | +| 0.0175 | 1.94 | 300000 | 0.0166 | 0.9198 | +| 0.0228 | 1.94 | 301000 | 0.0165 | 0.9198 | +| 0.019 | 1.95 | 302000 | 0.0165 | 0.9198 | +| 0.0191 | 1.96 | 303000 | 0.0165 | 0.9198 | +| 0.0249 | 1.96 | 304000 | 0.0165 | 0.9198 | +| 0.0233 | 1.97 | 305000 | 0.0164 | 0.9198 | +| 0.0211 | 1.97 | 306000 | 0.0164 | 0.9198 | +| 0.02 | 1.98 | 307000 | 0.0164 | 0.9198 | +| 0.0191 | 1.99 | 308000 | 0.0164 | 0.9198 | +| 0.0214 | 1.99 | 309000 | 0.0164 | 0.9198 | ### Framework versions diff --git a/all_results.json b/all_results.json index 82b52e74b780ac54963a415ba1767aa2cb18e5b7..797c700636d5558b0546c06ec5ed75d366f53c6e 100644 --- a/all_results.json +++ b/all_results.json @@ -1,14 +1,14 @@ { "epoch": 2.0, - "eval_cer": 0.014513880422164147, - "eval_loss": 0.02208337001502514, - "eval_runtime": 1920.0198, + "eval_cer": 0.013285730425940572, + "eval_loss": 0.024751625955104828, + "eval_runtime": 1869.7345, "eval_samples": 2000, - "eval_samples_per_second": 1.042, - "eval_steps_per_second": 0.26, - "train_loss": 0.05150384478483596, - "train_runtime": 204639.736, - "train_samples": 2958558, - "train_samples_per_second": 28.915, - "train_steps_per_second": 0.904 + "eval_samples_per_second": 1.07, + "eval_steps_per_second": 0.267, + "train_loss": 0.047053869794253175, + "train_runtime": 343177.6492, + "train_samples": 4957999, + "train_samples_per_second": 28.895, + "train_steps_per_second": 0.903 } \ No newline at end of file diff --git a/eval_results.json b/eval_results.json index 1815db9f36fc2f7a88f6b742065098414f797bbb..d08ad2508fbacef4efa44a4bd53b3205b5da031b 100644 --- a/eval_results.json +++ b/eval_results.json @@ -1,9 +1,9 @@ { "epoch": 2.0, - "eval_cer": 0.014513880422164147, - "eval_loss": 0.02208337001502514, - "eval_runtime": 1920.0198, + "eval_cer": 0.013285730425940572, + "eval_loss": 0.024751625955104828, + "eval_runtime": 1869.7345, "eval_samples": 2000, - "eval_samples_per_second": 1.042, - "eval_steps_per_second": 0.26 + "eval_samples_per_second": 1.07, + "eval_steps_per_second": 0.267 } \ No newline at end of file diff --git a/pytorch_model.bin b/pytorch_model.bin index d2d56fffd0a54ab59e461bdb7c6fd272cdc38997..307619fb0e688bdc0e9daa838429874ed07d2458 100644 --- a/pytorch_model.bin +++ b/pytorch_model.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:fb2eb6470de7d689abff2f06ce460c17539f1dcffe05da3ff6a91b4cf6c353dd +oid sha256:a88fc7ded935df70dcafe67db7bc7214334bab70e42a315c9785ebdf7cd750a9 size 557971229 diff --git a/train_results.json b/train_results.json index d2409a95a34a77b109bc15e135a4123615379b45..27de7a906d2c0a7371ba20c71673767fa931cf33 100644 --- a/train_results.json +++ b/train_results.json @@ -1,8 +1,8 @@ { "epoch": 2.0, - "train_loss": 0.05150384478483596, - "train_runtime": 204639.736, - "train_samples": 2958558, - "train_samples_per_second": 28.915, - "train_steps_per_second": 0.904 + "train_loss": 0.047053869794253175, + "train_runtime": 343177.6492, + "train_samples": 4957999, + "train_samples_per_second": 28.895, + "train_steps_per_second": 0.903 } \ No newline at end of file diff --git a/trainer_state.json b/trainer_state.json index ed08d651f83a9d1bfb3972fe5441558fa9cca387..8a77e14816e6d4016ea4a87ee57055445d26629d 100644 --- a/trainer_state.json +++ b/trainer_state.json @@ -1,112621 +1,188728 @@ { - "best_metric": 0.9210173852044647, - "best_model_checkpoint": "./models/bart-base-spelling-nl-1m/checkpoint-155000", - "epoch": 1.999979719850008, - "global_step": 184908, + "best_metric": 0.9197731329793244, + "best_model_checkpoint": "./models/bart-base-spelling-nl-2m/checkpoint-158000", + "epoch": 1.9999935457845905, + "global_step": 309874, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, - "learning_rate": 0.00029998377571549095, - "loss": 2.8408, + "learning_rate": 0.00029999031864564305, + "loss": 4.6156, "step": 10 }, { "epoch": 0.0, - "learning_rate": 0.0002999675514309819, - "loss": 1.2018, + "learning_rate": 0.00029998063729128613, + "loss": 1.343, "step": 20 }, { "epoch": 0.0, - "learning_rate": 0.00029995132714647285, - "loss": 0.9944, + "learning_rate": 0.0002999709559369292, + "loss": 1.0206, "step": 30 }, { "epoch": 0.0, - "learning_rate": 0.00029993510286196377, - "loss": 0.8851, + "learning_rate": 0.00029996127458257224, + "loss": 0.9534, "step": 40 }, { "epoch": 0.0, - "learning_rate": 0.00029991887857745475, - "loss": 0.8278, + "learning_rate": 0.0002999515932282153, + "loss": 0.8341, "step": 50 }, { "epoch": 0.0, - "learning_rate": 0.00029990265429294567, - "loss": 0.7606, + "learning_rate": 0.0002999419118738584, + "loss": 0.7678, "step": 60 }, { "epoch": 0.0, - "learning_rate": 0.0002998864300084366, - "loss": 0.7213, + "learning_rate": 0.0002999322305195014, + "loss": 0.7105, "step": 70 }, { "epoch": 0.0, - "learning_rate": 0.00029987020572392757, - "loss": 0.7086, + "learning_rate": 0.0002999225491651445, + "loss": 0.699, "step": 80 }, { "epoch": 0.0, - "learning_rate": 0.0002998539814394185, - "loss": 0.6504, + "learning_rate": 0.0002999128678107876, + "loss": 0.6662, "step": 90 }, { "epoch": 0.0, - "learning_rate": 0.0002998377571549094, - "loss": 0.6291, + "learning_rate": 0.00029990318645643066, + "loss": 0.6317, "step": 100 }, { "epoch": 0.0, - "learning_rate": 0.0002998215328704004, - "loss": 0.6259, + "learning_rate": 0.0002998935051020737, + "loss": 0.622, "step": 110 }, { "epoch": 0.0, - "learning_rate": 0.0002998053085858913, - "loss": 0.5982, + "learning_rate": 0.00029988382374771677, + "loss": 0.6266, "step": 120 }, { "epoch": 0.0, - "learning_rate": 0.0002997890843013823, - "loss": 0.615, + "learning_rate": 0.00029987414239335985, + "loss": 0.5759, "step": 130 }, { "epoch": 0.0, - "learning_rate": 0.0002997728600168732, - "loss": 0.5648, + "learning_rate": 0.00029986446103900293, + "loss": 0.5915, "step": 140 }, { "epoch": 0.0, - "learning_rate": 0.0002997566357323642, - "loss": 0.5603, + "learning_rate": 0.000299854779684646, + "loss": 0.5852, "step": 150 }, { "epoch": 0.0, - "learning_rate": 0.0002997404114478551, - "loss": 0.5628, + "learning_rate": 0.0002998450983302891, + "loss": 0.5174, "step": 160 }, { "epoch": 0.0, - "learning_rate": 0.0002997241871633461, - "loss": 0.5692, + "learning_rate": 0.00029983541697593217, + "loss": 0.5193, "step": 170 }, { "epoch": 0.0, - "learning_rate": 0.000299707962878837, - "loss": 0.5216, + "learning_rate": 0.0002998257356215752, + "loss": 0.5252, "step": 180 }, { "epoch": 0.0, - "learning_rate": 0.000299691738594328, - "loss": 0.5384, + "learning_rate": 0.0002998160542672183, + "loss": 0.5231, "step": 190 }, { "epoch": 0.0, - "learning_rate": 0.0002996755143098189, - "loss": 0.5085, + "learning_rate": 0.00029980637291286135, + "loss": 0.5039, "step": 200 }, { "epoch": 0.0, - "learning_rate": 0.0002996592900253099, - "loss": 0.5185, + "learning_rate": 0.0002997966915585044, + "loss": 0.5046, "step": 210 }, { "epoch": 0.0, - "learning_rate": 0.0002996430657408008, - "loss": 0.4803, + "learning_rate": 0.00029978701020414746, + "loss": 0.4904, "step": 220 }, { "epoch": 0.0, - "learning_rate": 0.0002996268414562918, - "loss": 0.5168, + "learning_rate": 0.00029977732884979054, + "loss": 0.4778, "step": 230 }, { "epoch": 0.0, - "learning_rate": 0.0002996106171717827, - "loss": 0.4688, + "learning_rate": 0.0002997676474954336, + "loss": 0.4769, "step": 240 }, { "epoch": 0.0, - "learning_rate": 0.00029959439288727364, - "loss": 0.4961, + "learning_rate": 0.00029975796614107664, + "loss": 0.4826, "step": 250 }, { "epoch": 0.0, - "learning_rate": 0.0002995781686027646, - "loss": 0.4728, + "learning_rate": 0.0002997482847867197, + "loss": 0.4792, "step": 260 }, { "epoch": 0.0, - "learning_rate": 0.00029956194431825554, - "loss": 0.5015, + "learning_rate": 0.0002997386034323628, + "loss": 0.4771, "step": 270 }, { "epoch": 0.0, - "learning_rate": 0.00029954572003374646, - "loss": 0.4669, + "learning_rate": 0.0002997289220780059, + "loss": 0.4732, "step": 280 }, { "epoch": 0.0, - "learning_rate": 0.00029952949574923744, - "loss": 0.4554, + "learning_rate": 0.00029971924072364896, + "loss": 0.4576, "step": 290 }, { "epoch": 0.0, - "learning_rate": 0.00029951327146472836, - "loss": 0.4611, + "learning_rate": 0.00029970955936929204, + "loss": 0.4423, "step": 300 }, { "epoch": 0.0, - "learning_rate": 0.00029949704718021934, - "loss": 0.4607, + "learning_rate": 0.00029969987801493507, + "loss": 0.4416, "step": 310 }, { "epoch": 0.0, - "learning_rate": 0.00029948082289571026, - "loss": 0.4341, + "learning_rate": 0.00029969019666057815, + "loss": 0.448, "step": 320 }, { "epoch": 0.0, - "learning_rate": 0.00029946459861120123, - "loss": 0.437, + "learning_rate": 0.00029968051530622123, + "loss": 0.4101, "step": 330 }, { "epoch": 0.0, - "learning_rate": 0.00029944837432669216, - "loss": 0.4209, + "learning_rate": 0.00029967083395186425, + "loss": 0.4048, "step": 340 }, { "epoch": 0.0, - "learning_rate": 0.00029943215004218313, - "loss": 0.4182, + "learning_rate": 0.00029966115259750733, + "loss": 0.4128, "step": 350 }, { "epoch": 0.0, - "learning_rate": 0.00029941592575767406, - "loss": 0.4199, + "learning_rate": 0.0002996514712431504, + "loss": 0.4237, "step": 360 }, { "epoch": 0.0, - "learning_rate": 0.00029939970147316503, - "loss": 0.4053, + "learning_rate": 0.0002996417898887935, + "loss": 0.3986, "step": 370 }, { "epoch": 0.0, - "learning_rate": 0.00029938347718865596, - "loss": 0.4079, + "learning_rate": 0.00029963210853443657, + "loss": 0.433, "step": 380 }, { "epoch": 0.0, - "learning_rate": 0.00029936725290414693, - "loss": 0.3965, + "learning_rate": 0.0002996224271800796, + "loss": 0.3928, "step": 390 }, { "epoch": 0.0, - "learning_rate": 0.00029935102861963786, - "loss": 0.3927, + "learning_rate": 0.0002996127458257227, + "loss": 0.3997, "step": 400 }, { "epoch": 0.0, - "learning_rate": 0.00029933480433512883, - "loss": 0.4119, + "learning_rate": 0.00029960306447136576, + "loss": 0.3833, "step": 410 }, { "epoch": 0.0, - "learning_rate": 0.00029931858005061976, - "loss": 0.3889, + "learning_rate": 0.00029959338311700884, + "loss": 0.3819, "step": 420 }, { "epoch": 0.0, - "learning_rate": 0.0002993023557661107, - "loss": 0.4037, + "learning_rate": 0.0002995837017626519, + "loss": 0.3894, "step": 430 }, { "epoch": 0.0, - "learning_rate": 0.00029928613148160166, - "loss": 0.4049, + "learning_rate": 0.00029957402040829494, + "loss": 0.3804, "step": 440 }, { "epoch": 0.0, - "learning_rate": 0.0002992699071970926, - "loss": 0.3675, + "learning_rate": 0.000299564339053938, + "loss": 0.3933, "step": 450 }, { "epoch": 0.0, - "learning_rate": 0.0002992536829125835, - "loss": 0.3822, + "learning_rate": 0.0002995546576995811, + "loss": 0.3748, "step": 460 }, { - "epoch": 0.01, - "learning_rate": 0.0002992374586280745, - "loss": 0.3995, + "epoch": 0.0, + "learning_rate": 0.00029954497634522413, + "loss": 0.3799, "step": 470 }, { - "epoch": 0.01, - "learning_rate": 0.0002992212343435654, - "loss": 0.3483, + "epoch": 0.0, + "learning_rate": 0.0002995352949908672, + "loss": 0.3612, "step": 480 }, { - "epoch": 0.01, - "learning_rate": 0.0002992050100590564, - "loss": 0.3611, + "epoch": 0.0, + "learning_rate": 0.0002995256136365103, + "loss": 0.392, "step": 490 }, { - "epoch": 0.01, - "learning_rate": 0.0002991887857745473, - "loss": 0.369, + "epoch": 0.0, + "learning_rate": 0.00029951593228215337, + "loss": 0.3791, "step": 500 }, { - "epoch": 0.01, - "learning_rate": 0.0002991725614900383, - "loss": 0.3761, + "epoch": 0.0, + "learning_rate": 0.00029950625092779645, + "loss": 0.3663, "step": 510 }, { - "epoch": 0.01, - "learning_rate": 0.0002991563372055292, - "loss": 0.3702, + "epoch": 0.0, + "learning_rate": 0.0002994965695734395, + "loss": 0.3514, "step": 520 }, { - "epoch": 0.01, - "learning_rate": 0.0002991401129210202, - "loss": 0.3446, + "epoch": 0.0, + "learning_rate": 0.00029948688821908255, + "loss": 0.3595, "step": 530 }, { - "epoch": 0.01, - "learning_rate": 0.0002991238886365111, - "loss": 0.3519, + "epoch": 0.0, + "learning_rate": 0.00029947720686472563, + "loss": 0.3605, "step": 540 }, { - "epoch": 0.01, - "learning_rate": 0.0002991076643520021, - "loss": 0.3677, + "epoch": 0.0, + "learning_rate": 0.0002994675255103687, + "loss": 0.3555, "step": 550 }, { - "epoch": 0.01, - "learning_rate": 0.000299091440067493, - "loss": 0.354, + "epoch": 0.0, + "learning_rate": 0.0002994578441560118, + "loss": 0.3563, "step": 560 }, { - "epoch": 0.01, - "learning_rate": 0.000299075215782984, - "loss": 0.3367, + "epoch": 0.0, + "learning_rate": 0.00029944816280165487, + "loss": 0.3481, "step": 570 }, { - "epoch": 0.01, - "learning_rate": 0.0002990589914984749, - "loss": 0.3339, + "epoch": 0.0, + "learning_rate": 0.0002994384814472979, + "loss": 0.3557, "step": 580 }, { - "epoch": 0.01, - "learning_rate": 0.0002990427672139659, - "loss": 0.3365, + "epoch": 0.0, + "learning_rate": 0.000299428800092941, + "loss": 0.3522, "step": 590 }, { - "epoch": 0.01, - "learning_rate": 0.0002990265429294568, - "loss": 0.3377, + "epoch": 0.0, + "learning_rate": 0.00029941911873858406, + "loss": 0.3563, "step": 600 }, { - "epoch": 0.01, - "learning_rate": 0.0002990103186449477, - "loss": 0.3298, + "epoch": 0.0, + "learning_rate": 0.0002994094373842271, + "loss": 0.3507, "step": 610 }, { - "epoch": 0.01, - "learning_rate": 0.0002989940943604387, - "loss": 0.3438, + "epoch": 0.0, + "learning_rate": 0.00029939975602987016, + "loss": 0.3356, "step": 620 }, { - "epoch": 0.01, - "learning_rate": 0.0002989778700759296, - "loss": 0.3472, + "epoch": 0.0, + "learning_rate": 0.00029939007467551324, + "loss": 0.3457, "step": 630 }, { - "epoch": 0.01, - "learning_rate": 0.00029896164579142054, - "loss": 0.3314, + "epoch": 0.0, + "learning_rate": 0.0002993803933211563, + "loss": 0.3522, "step": 640 }, { - "epoch": 0.01, - "learning_rate": 0.0002989454215069115, - "loss": 0.3316, + "epoch": 0.0, + "learning_rate": 0.0002993707119667994, + "loss": 0.3329, "step": 650 }, { - "epoch": 0.01, - "learning_rate": 0.00029892919722240244, - "loss": 0.3287, + "epoch": 0.0, + "learning_rate": 0.0002993610306124425, + "loss": 0.3286, "step": 660 }, { - "epoch": 0.01, - "learning_rate": 0.0002989129729378934, - "loss": 0.3246, + "epoch": 0.0, + "learning_rate": 0.0002993513492580855, + "loss": 0.3394, "step": 670 }, { - "epoch": 0.01, - "learning_rate": 0.00029889674865338434, - "loss": 0.3346, + "epoch": 0.0, + "learning_rate": 0.0002993416679037286, + "loss": 0.3201, "step": 680 }, { - "epoch": 0.01, - "learning_rate": 0.0002988805243688753, - "loss": 0.317, + "epoch": 0.0, + "learning_rate": 0.00029933198654937167, + "loss": 0.3277, "step": 690 }, { - "epoch": 0.01, - "learning_rate": 0.00029886430008436624, - "loss": 0.321, + "epoch": 0.0, + "learning_rate": 0.00029932230519501475, + "loss": 0.3332, "step": 700 }, { - "epoch": 0.01, - "learning_rate": 0.0002988480757998572, - "loss": 0.3322, + "epoch": 0.0, + "learning_rate": 0.00029931262384065777, + "loss": 0.314, "step": 710 }, { - "epoch": 0.01, - "learning_rate": 0.00029883185151534814, - "loss": 0.3345, + "epoch": 0.0, + "learning_rate": 0.00029930294248630085, + "loss": 0.3204, "step": 720 }, { - "epoch": 0.01, - "learning_rate": 0.0002988156272308391, - "loss": 0.3156, + "epoch": 0.0, + "learning_rate": 0.00029929326113194393, + "loss": 0.3157, "step": 730 }, { - "epoch": 0.01, - "learning_rate": 0.00029879940294633004, - "loss": 0.3147, + "epoch": 0.0, + "learning_rate": 0.00029928357977758696, + "loss": 0.313, "step": 740 }, { - "epoch": 0.01, - "learning_rate": 0.000298783178661821, - "loss": 0.3208, + "epoch": 0.0, + "learning_rate": 0.00029927389842323004, + "loss": 0.3161, "step": 750 }, { - "epoch": 0.01, - "learning_rate": 0.00029876695437731194, - "loss": 0.3181, + "epoch": 0.0, + "learning_rate": 0.0002992642170688731, + "loss": 0.3139, "step": 760 }, { - "epoch": 0.01, - "learning_rate": 0.0002987507300928029, - "loss": 0.305, + "epoch": 0.0, + "learning_rate": 0.0002992545357145162, + "loss": 0.3181, "step": 770 }, { "epoch": 0.01, - "learning_rate": 0.00029873450580829384, - "loss": 0.3123, + "learning_rate": 0.0002992448543601593, + "loss": 0.3069, "step": 780 }, { "epoch": 0.01, - "learning_rate": 0.00029871828152378476, - "loss": 0.3033, + "learning_rate": 0.00029923517300580236, + "loss": 0.3001, "step": 790 }, { "epoch": 0.01, - "learning_rate": 0.00029870205723927574, - "loss": 0.3271, + "learning_rate": 0.00029922549165144544, + "loss": 0.3222, "step": 800 }, { "epoch": 0.01, - "learning_rate": 0.00029868583295476666, - "loss": 0.3036, + "learning_rate": 0.00029921581029708846, + "loss": 0.3097, "step": 810 }, { "epoch": 0.01, - "learning_rate": 0.0002986696086702576, - "loss": 0.3059, + "learning_rate": 0.00029920612894273154, + "loss": 0.3168, "step": 820 }, { "epoch": 0.01, - "learning_rate": 0.00029865338438574856, - "loss": 0.2873, + "learning_rate": 0.0002991964475883746, + "loss": 0.3012, "step": 830 }, { "epoch": 0.01, - "learning_rate": 0.0002986371601012395, - "loss": 0.3101, + "learning_rate": 0.00029918676623401765, + "loss": 0.2954, "step": 840 }, { "epoch": 0.01, - "learning_rate": 0.00029862093581673046, - "loss": 0.2923, + "learning_rate": 0.0002991770848796607, + "loss": 0.305, "step": 850 }, { "epoch": 0.01, - "learning_rate": 0.0002986047115322214, - "loss": 0.3072, + "learning_rate": 0.0002991674035253038, + "loss": 0.3022, "step": 860 }, { "epoch": 0.01, - "learning_rate": 0.00029858848724771236, - "loss": 0.2983, + "learning_rate": 0.0002991577221709469, + "loss": 0.2964, "step": 870 }, { "epoch": 0.01, - "learning_rate": 0.0002985722629632033, - "loss": 0.29, + "learning_rate": 0.0002991480408165899, + "loss": 0.287, "step": 880 }, { "epoch": 0.01, - "learning_rate": 0.00029855603867869426, - "loss": 0.2973, + "learning_rate": 0.000299138359462233, + "loss": 0.3079, "step": 890 }, { "epoch": 0.01, - "learning_rate": 0.0002985398143941852, - "loss": 0.2995, + "learning_rate": 0.00029912867810787607, + "loss": 0.2928, "step": 900 }, { "epoch": 0.01, - "learning_rate": 0.00029852359010967616, - "loss": 0.2967, + "learning_rate": 0.00029911899675351915, + "loss": 0.301, "step": 910 }, { "epoch": 0.01, - "learning_rate": 0.0002985073658251671, - "loss": 0.2794, + "learning_rate": 0.00029910931539916223, + "loss": 0.2889, "step": 920 }, { "epoch": 0.01, - "learning_rate": 0.00029849114154065806, - "loss": 0.2759, + "learning_rate": 0.0002990996340448053, + "loss": 0.2932, "step": 930 }, { "epoch": 0.01, - "learning_rate": 0.000298474917256149, - "loss": 0.2869, + "learning_rate": 0.0002990899526904484, + "loss": 0.3026, "step": 940 }, { "epoch": 0.01, - "learning_rate": 0.00029845869297163996, - "loss": 0.283, + "learning_rate": 0.0002990802713360914, + "loss": 0.2827, "step": 950 }, { "epoch": 0.01, - "learning_rate": 0.0002984424686871309, - "loss": 0.2965, + "learning_rate": 0.0002990705899817345, + "loss": 0.2945, "step": 960 }, { "epoch": 0.01, - "learning_rate": 0.0002984262444026218, - "loss": 0.2629, + "learning_rate": 0.0002990609086273776, + "loss": 0.2753, "step": 970 }, { "epoch": 0.01, - "learning_rate": 0.0002984100201181128, - "loss": 0.285, + "learning_rate": 0.0002990512272730206, + "loss": 0.2733, "step": 980 }, { "epoch": 0.01, - "learning_rate": 0.0002983937958336037, - "loss": 0.2759, + "learning_rate": 0.0002990415459186637, + "loss": 0.2932, "step": 990 }, { "epoch": 0.01, - "learning_rate": 0.0002983775715490946, - "loss": 0.2824, + "learning_rate": 0.00029903186456430676, + "loss": 0.277, "step": 1000 }, { "epoch": 0.01, - "eval_cer": 0.9219238401176094, - "eval_loss": 0.21292299032211304, - "eval_runtime": 119.3045, - "eval_samples_per_second": 16.764, - "eval_steps_per_second": 4.191, + "eval_cer": 0.9206128121116258, + "eval_loss": 0.2336636185646057, + "eval_runtime": 119.7068, + "eval_samples_per_second": 16.707, + "eval_steps_per_second": 4.177, "step": 1000 }, { "epoch": 0.01, - "learning_rate": 0.0002983613472645856, - "loss": 0.2942, + "learning_rate": 0.00029902218320994984, + "loss": 0.2856, "step": 1010 }, { "epoch": 0.01, - "learning_rate": 0.0002983451229800765, - "loss": 0.267, + "learning_rate": 0.00029901250185559287, + "loss": 0.2949, "step": 1020 }, { "epoch": 0.01, - "learning_rate": 0.0002983288986955675, - "loss": 0.2817, + "learning_rate": 0.00029900282050123595, + "loss": 0.295, "step": 1030 }, { "epoch": 0.01, - "learning_rate": 0.0002983126744110584, - "loss": 0.2744, + "learning_rate": 0.000298993139146879, + "loss": 0.2615, "step": 1040 }, { "epoch": 0.01, - "learning_rate": 0.0002982964501265494, - "loss": 0.2597, + "learning_rate": 0.0002989834577925221, + "loss": 0.2862, "step": 1050 }, { "epoch": 0.01, - "learning_rate": 0.0002982802258420403, - "loss": 0.2715, + "learning_rate": 0.0002989737764381652, + "loss": 0.2766, "step": 1060 }, { "epoch": 0.01, - "learning_rate": 0.0002982640015575313, - "loss": 0.263, + "learning_rate": 0.00029896409508380826, + "loss": 0.2733, "step": 1070 }, { "epoch": 0.01, - "learning_rate": 0.0002982477772730222, - "loss": 0.2787, + "learning_rate": 0.0002989544137294513, + "loss": 0.2808, "step": 1080 }, { "epoch": 0.01, - "learning_rate": 0.0002982315529885132, - "loss": 0.2777, + "learning_rate": 0.00029894473237509437, + "loss": 0.2812, "step": 1090 }, { "epoch": 0.01, - "learning_rate": 0.0002982153287040041, - "loss": 0.2697, + "learning_rate": 0.00029893505102073745, + "loss": 0.2724, "step": 1100 }, { "epoch": 0.01, - "learning_rate": 0.0002981991044194951, - "loss": 0.266, + "learning_rate": 0.0002989253696663805, + "loss": 0.2764, "step": 1110 }, { "epoch": 0.01, - "learning_rate": 0.000298182880134986, - "loss": 0.2762, + "learning_rate": 0.00029891568831202356, + "loss": 0.2796, "step": 1120 }, { "epoch": 0.01, - "learning_rate": 0.000298166655850477, + "learning_rate": 0.00029890600695766663, "loss": 0.2724, "step": 1130 }, { "epoch": 0.01, - "learning_rate": 0.0002981504315659679, - "loss": 0.2825, + "learning_rate": 0.0002988963256033097, + "loss": 0.2541, "step": 1140 }, { "epoch": 0.01, - "learning_rate": 0.00029813420728145884, - "loss": 0.2645, + "learning_rate": 0.0002988866442489528, + "loss": 0.2541, "step": 1150 }, { "epoch": 0.01, - "learning_rate": 0.0002981179829969498, - "loss": 0.2687, + "learning_rate": 0.0002988769628945958, + "loss": 0.2694, "step": 1160 }, { "epoch": 0.01, - "learning_rate": 0.00029810175871244074, - "loss": 0.249, + "learning_rate": 0.0002988672815402389, + "loss": 0.2667, "step": 1170 }, { "epoch": 0.01, - "learning_rate": 0.00029808553442793167, - "loss": 0.2527, + "learning_rate": 0.000298857600185882, + "loss": 0.2663, "step": 1180 }, { "epoch": 0.01, - "learning_rate": 0.00029806931014342264, - "loss": 0.2484, + "learning_rate": 0.00029884791883152506, + "loss": 0.2622, "step": 1190 }, { "epoch": 0.01, - "learning_rate": 0.00029805308585891357, - "loss": 0.2693, + "learning_rate": 0.00029883823747716814, + "loss": 0.2689, "step": 1200 }, { "epoch": 0.01, - "learning_rate": 0.00029803686157440454, - "loss": 0.2569, + "learning_rate": 0.00029882855612281116, + "loss": 0.2575, "step": 1210 }, { "epoch": 0.01, - "learning_rate": 0.00029802063728989547, - "loss": 0.2584, + "learning_rate": 0.00029881887476845424, + "loss": 0.2625, "step": 1220 }, { "epoch": 0.01, - "learning_rate": 0.00029800441300538644, - "loss": 0.2718, + "learning_rate": 0.0002988091934140973, + "loss": 0.2727, "step": 1230 }, { "epoch": 0.01, - "learning_rate": 0.00029798818872087737, - "loss": 0.2575, + "learning_rate": 0.00029879951205974035, + "loss": 0.2649, "step": 1240 }, { "epoch": 0.01, - "learning_rate": 0.00029797196443636834, - "loss": 0.2677, + "learning_rate": 0.00029878983070538343, + "loss": 0.2687, "step": 1250 }, { "epoch": 0.01, - "learning_rate": 0.00029795574015185927, - "loss": 0.2708, + "learning_rate": 0.0002987801493510265, + "loss": 0.262, "step": 1260 }, { "epoch": 0.01, - "learning_rate": 0.00029793951586735024, - "loss": 0.2558, + "learning_rate": 0.0002987704679966696, + "loss": 0.2517, "step": 1270 }, { "epoch": 0.01, - "learning_rate": 0.00029792329158284116, - "loss": 0.2459, + "learning_rate": 0.00029876078664231267, + "loss": 0.2721, "step": 1280 }, { "epoch": 0.01, - "learning_rate": 0.00029790706729833214, - "loss": 0.2478, + "learning_rate": 0.00029875110528795575, + "loss": 0.2573, "step": 1290 }, { "epoch": 0.01, - "learning_rate": 0.00029789084301382306, - "loss": 0.2354, + "learning_rate": 0.0002987414239335988, + "loss": 0.2716, "step": 1300 }, { "epoch": 0.01, - "learning_rate": 0.00029787461872931404, - "loss": 0.2588, + "learning_rate": 0.00029873174257924185, + "loss": 0.2558, "step": 1310 }, { "epoch": 0.01, - "learning_rate": 0.00029785839444480496, - "loss": 0.2513, + "learning_rate": 0.00029872206122488493, + "loss": 0.2672, "step": 1320 }, { "epoch": 0.01, - "learning_rate": 0.0002978421701602959, - "loss": 0.2347, + "learning_rate": 0.000298712379870528, + "loss": 0.2624, "step": 1330 }, { "epoch": 0.01, - "learning_rate": 0.00029782594587578686, - "loss": 0.2536, + "learning_rate": 0.0002987026985161711, + "loss": 0.2629, "step": 1340 }, { "epoch": 0.01, - "learning_rate": 0.0002978097215912778, - "loss": 0.2344, + "learning_rate": 0.0002986930171618141, + "loss": 0.2537, "step": 1350 }, { "epoch": 0.01, - "learning_rate": 0.0002977934973067687, - "loss": 0.246, + "learning_rate": 0.0002986833358074572, + "loss": 0.2608, "step": 1360 }, { "epoch": 0.01, - "learning_rate": 0.0002977772730222597, - "loss": 0.2383, + "learning_rate": 0.0002986736544531003, + "loss": 0.2553, "step": 1370 }, { "epoch": 0.01, - "learning_rate": 0.0002977610487377506, - "loss": 0.2474, + "learning_rate": 0.0002986639730987433, + "loss": 0.2651, "step": 1380 }, { - "epoch": 0.02, - "learning_rate": 0.0002977448244532416, - "loss": 0.2333, + "epoch": 0.01, + "learning_rate": 0.0002986542917443864, + "loss": 0.2504, "step": 1390 }, { - "epoch": 0.02, - "learning_rate": 0.0002977286001687325, - "loss": 0.2574, + "epoch": 0.01, + "learning_rate": 0.00029864461039002946, + "loss": 0.2465, "step": 1400 }, { - "epoch": 0.02, - "learning_rate": 0.0002977123758842235, - "loss": 0.2434, + "epoch": 0.01, + "learning_rate": 0.00029863492903567254, + "loss": 0.2565, "step": 1410 }, { - "epoch": 0.02, - "learning_rate": 0.0002976961515997144, - "loss": 0.2417, + "epoch": 0.01, + "learning_rate": 0.0002986252476813156, + "loss": 0.2687, "step": 1420 }, { - "epoch": 0.02, - "learning_rate": 0.0002976799273152054, - "loss": 0.2419, + "epoch": 0.01, + "learning_rate": 0.0002986155663269587, + "loss": 0.2671, "step": 1430 }, { - "epoch": 0.02, - "learning_rate": 0.0002976637030306963, - "loss": 0.2287, + "epoch": 0.01, + "learning_rate": 0.00029860588497260173, + "loss": 0.2442, "step": 1440 }, { - "epoch": 0.02, - "learning_rate": 0.0002976474787461873, - "loss": 0.2223, + "epoch": 0.01, + "learning_rate": 0.0002985962036182448, + "loss": 0.2556, "step": 1450 }, { - "epoch": 0.02, - "learning_rate": 0.0002976312544616782, - "loss": 0.2413, + "epoch": 0.01, + "learning_rate": 0.0002985865222638879, + "loss": 0.2609, "step": 1460 }, { - "epoch": 0.02, - "learning_rate": 0.0002976150301771692, - "loss": 0.2437, + "epoch": 0.01, + "learning_rate": 0.00029857684090953097, + "loss": 0.2459, "step": 1470 }, { - "epoch": 0.02, - "learning_rate": 0.0002975988058926601, - "loss": 0.2312, + "epoch": 0.01, + "learning_rate": 0.000298567159555174, + "loss": 0.2409, "step": 1480 }, { - "epoch": 0.02, - "learning_rate": 0.0002975825816081511, - "loss": 0.2286, + "epoch": 0.01, + "learning_rate": 0.0002985574782008171, + "loss": 0.2457, "step": 1490 }, { - "epoch": 0.02, - "learning_rate": 0.000297566357323642, - "loss": 0.2402, + "epoch": 0.01, + "learning_rate": 0.00029854779684646015, + "loss": 0.2614, "step": 1500 }, { - "epoch": 0.02, - "learning_rate": 0.00029755013303913293, - "loss": 0.2251, + "epoch": 0.01, + "learning_rate": 0.0002985381154921032, + "loss": 0.2455, "step": 1510 }, { - "epoch": 0.02, - "learning_rate": 0.0002975339087546239, - "loss": 0.2216, + "epoch": 0.01, + "learning_rate": 0.00029852843413774626, + "loss": 0.2352, "step": 1520 }, { - "epoch": 0.02, - "learning_rate": 0.00029751768447011483, - "loss": 0.258, + "epoch": 0.01, + "learning_rate": 0.00029851875278338934, + "loss": 0.243, "step": 1530 }, { - "epoch": 0.02, - "learning_rate": 0.0002975014601856058, - "loss": 0.2358, + "epoch": 0.01, + "learning_rate": 0.0002985090714290324, + "loss": 0.2383, "step": 1540 }, { - "epoch": 0.02, - "learning_rate": 0.00029748523590109673, - "loss": 0.2496, + "epoch": 0.01, + "learning_rate": 0.0002984993900746755, + "loss": 0.2359, "step": 1550 }, { - "epoch": 0.02, - "learning_rate": 0.00029746901161658765, - "loss": 0.2237, + "epoch": 0.01, + "learning_rate": 0.0002984897087203186, + "loss": 0.2542, "step": 1560 }, { - "epoch": 0.02, - "learning_rate": 0.0002974527873320786, - "loss": 0.2386, + "epoch": 0.01, + "learning_rate": 0.00029848002736596166, + "loss": 0.2485, "step": 1570 }, { - "epoch": 0.02, - "learning_rate": 0.00029743656304756955, - "loss": 0.2381, + "epoch": 0.01, + "learning_rate": 0.0002984703460116047, + "loss": 0.2399, "step": 1580 }, { - "epoch": 0.02, - "learning_rate": 0.0002974203387630605, - "loss": 0.2374, + "epoch": 0.01, + "learning_rate": 0.00029846066465724776, + "loss": 0.2427, "step": 1590 }, { - "epoch": 0.02, - "learning_rate": 0.00029740411447855145, - "loss": 0.2425, + "epoch": 0.01, + "learning_rate": 0.00029845098330289084, + "loss": 0.2422, "step": 1600 }, { - "epoch": 0.02, - "learning_rate": 0.0002973878901940424, - "loss": 0.2353, + "epoch": 0.01, + "learning_rate": 0.00029844130194853387, + "loss": 0.2327, "step": 1610 }, { - "epoch": 0.02, - "learning_rate": 0.00029737166590953335, - "loss": 0.2423, + "epoch": 0.01, + "learning_rate": 0.00029843162059417695, + "loss": 0.24, "step": 1620 }, { - "epoch": 0.02, - "learning_rate": 0.0002973554416250243, - "loss": 0.2683, + "epoch": 0.01, + "learning_rate": 0.00029842193923982003, + "loss": 0.2288, "step": 1630 }, { - "epoch": 0.02, - "learning_rate": 0.00029733921734051525, - "loss": 0.2274, + "epoch": 0.01, + "learning_rate": 0.0002984122578854631, + "loss": 0.2422, "step": 1640 }, { - "epoch": 0.02, - "learning_rate": 0.0002973229930560062, - "loss": 0.2211, + "epoch": 0.01, + "learning_rate": 0.00029840257653110613, + "loss": 0.2256, "step": 1650 }, { - "epoch": 0.02, - "learning_rate": 0.00029730676877149715, - "loss": 0.2365, + "epoch": 0.01, + "learning_rate": 0.0002983928951767492, + "loss": 0.2395, "step": 1660 }, { - "epoch": 0.02, - "learning_rate": 0.0002972905444869881, - "loss": 0.233, + "epoch": 0.01, + "learning_rate": 0.0002983832138223923, + "loss": 0.2367, "step": 1670 }, { - "epoch": 0.02, - "learning_rate": 0.00029727432020247905, - "loss": 0.2353, + "epoch": 0.01, + "learning_rate": 0.0002983735324680354, + "loss": 0.2373, "step": 1680 }, { - "epoch": 0.02, - "learning_rate": 0.00029725809591796997, - "loss": 0.2331, + "epoch": 0.01, + "learning_rate": 0.00029836385111367845, + "loss": 0.2324, "step": 1690 }, { - "epoch": 0.02, - "learning_rate": 0.00029724187163346095, - "loss": 0.2185, + "epoch": 0.01, + "learning_rate": 0.00029835416975932153, + "loss": 0.2337, "step": 1700 }, { - "epoch": 0.02, - "learning_rate": 0.00029722564734895187, - "loss": 0.2196, + "epoch": 0.01, + "learning_rate": 0.0002983444884049646, + "loss": 0.2105, "step": 1710 }, { - "epoch": 0.02, - "learning_rate": 0.00029720942306444285, - "loss": 0.2433, + "epoch": 0.01, + "learning_rate": 0.00029833480705060764, + "loss": 0.2311, "step": 1720 }, { - "epoch": 0.02, - "learning_rate": 0.00029719319877993377, - "loss": 0.2152, + "epoch": 0.01, + "learning_rate": 0.0002983251256962507, + "loss": 0.2334, "step": 1730 }, { - "epoch": 0.02, - "learning_rate": 0.0002971769744954247, - "loss": 0.2256, + "epoch": 0.01, + "learning_rate": 0.0002983154443418938, + "loss": 0.2551, "step": 1740 }, { - "epoch": 0.02, - "learning_rate": 0.00029716075021091567, - "loss": 0.2267, + "epoch": 0.01, + "learning_rate": 0.0002983057629875368, + "loss": 0.2379, "step": 1750 }, { - "epoch": 0.02, - "learning_rate": 0.0002971445259264066, - "loss": 0.2201, + "epoch": 0.01, + "learning_rate": 0.0002982960816331799, + "loss": 0.2399, "step": 1760 }, { - "epoch": 0.02, - "learning_rate": 0.00029712830164189757, - "loss": 0.2292, + "epoch": 0.01, + "learning_rate": 0.000298286400278823, + "loss": 0.2271, "step": 1770 }, { - "epoch": 0.02, - "learning_rate": 0.0002971120773573885, - "loss": 0.237, + "epoch": 0.01, + "learning_rate": 0.00029827671892446606, + "loss": 0.2369, "step": 1780 }, { - "epoch": 0.02, - "learning_rate": 0.00029709585307287947, - "loss": 0.2236, + "epoch": 0.01, + "learning_rate": 0.0002982670375701091, + "loss": 0.2296, "step": 1790 }, { - "epoch": 0.02, - "learning_rate": 0.0002970796287883704, - "loss": 0.2134, + "epoch": 0.01, + "learning_rate": 0.00029825735621575217, + "loss": 0.2223, "step": 1800 }, { - "epoch": 0.02, - "learning_rate": 0.00029706340450386137, - "loss": 0.2331, + "epoch": 0.01, + "learning_rate": 0.00029824767486139525, + "loss": 0.2359, "step": 1810 }, { - "epoch": 0.02, - "learning_rate": 0.0002970471802193523, - "loss": 0.2178, + "epoch": 0.01, + "learning_rate": 0.00029823799350703833, + "loss": 0.2307, "step": 1820 }, { - "epoch": 0.02, - "learning_rate": 0.00029703095593484327, - "loss": 0.2242, + "epoch": 0.01, + "learning_rate": 0.0002982283121526814, + "loss": 0.2218, "step": 1830 }, { - "epoch": 0.02, - "learning_rate": 0.0002970147316503342, - "loss": 0.2079, + "epoch": 0.01, + "learning_rate": 0.0002982186307983245, + "loss": 0.2424, "step": 1840 }, { - "epoch": 0.02, - "learning_rate": 0.00029699850736582517, - "loss": 0.2277, + "epoch": 0.01, + "learning_rate": 0.0002982089494439675, + "loss": 0.2239, "step": 1850 }, { - "epoch": 0.02, - "learning_rate": 0.0002969822830813161, - "loss": 0.2155, + "epoch": 0.01, + "learning_rate": 0.0002981992680896106, + "loss": 0.224, "step": 1860 }, { - "epoch": 0.02, - "learning_rate": 0.000296966058796807, - "loss": 0.2278, + "epoch": 0.01, + "learning_rate": 0.00029818958673525367, + "loss": 0.2339, "step": 1870 }, { - "epoch": 0.02, - "learning_rate": 0.000296949834512298, - "loss": 0.2052, + "epoch": 0.01, + "learning_rate": 0.0002981799053808967, + "loss": 0.2185, "step": 1880 }, { - "epoch": 0.02, - "learning_rate": 0.0002969336102277889, - "loss": 0.217, + "epoch": 0.01, + "learning_rate": 0.0002981702240265398, + "loss": 0.2397, "step": 1890 }, { - "epoch": 0.02, - "learning_rate": 0.0002969173859432799, - "loss": 0.2337, + "epoch": 0.01, + "learning_rate": 0.00029816054267218286, + "loss": 0.2466, "step": 1900 }, { - "epoch": 0.02, - "learning_rate": 0.0002969011616587708, - "loss": 0.2158, + "epoch": 0.01, + "learning_rate": 0.00029815086131782594, + "loss": 0.2206, "step": 1910 }, { - "epoch": 0.02, - "learning_rate": 0.00029688493737426173, - "loss": 0.2174, + "epoch": 0.01, + "learning_rate": 0.000298141179963469, + "loss": 0.2361, "step": 1920 }, { - "epoch": 0.02, - "learning_rate": 0.0002968687130897527, - "loss": 0.2155, + "epoch": 0.01, + "learning_rate": 0.00029813149860911204, + "loss": 0.221, "step": 1930 }, { - "epoch": 0.02, - "learning_rate": 0.00029685248880524363, - "loss": 0.2143, + "epoch": 0.01, + "learning_rate": 0.0002981218172547551, + "loss": 0.205, "step": 1940 }, { - "epoch": 0.02, - "learning_rate": 0.0002968362645207346, - "loss": 0.2047, + "epoch": 0.01, + "learning_rate": 0.0002981121359003982, + "loss": 0.2301, "step": 1950 }, { - "epoch": 0.02, - "learning_rate": 0.00029682004023622553, - "loss": 0.2133, + "epoch": 0.01, + "learning_rate": 0.0002981024545460413, + "loss": 0.2227, "step": 1960 }, { - "epoch": 0.02, - "learning_rate": 0.0002968038159517165, - "loss": 0.2255, + "epoch": 0.01, + "learning_rate": 0.00029809277319168436, + "loss": 0.2191, "step": 1970 }, { - "epoch": 0.02, - "learning_rate": 0.00029678759166720743, - "loss": 0.2277, + "epoch": 0.01, + "learning_rate": 0.00029808309183732744, + "loss": 0.217, "step": 1980 }, { - "epoch": 0.02, - "learning_rate": 0.0002967713673826984, - "loss": 0.2118, + "epoch": 0.01, + "learning_rate": 0.00029807341048297047, + "loss": 0.2146, "step": 1990 }, { - "epoch": 0.02, - "learning_rate": 0.00029675514309818933, - "loss": 0.1971, + "epoch": 0.01, + "learning_rate": 0.00029806372912861355, + "loss": 0.2349, "step": 2000 }, { - "epoch": 0.02, - "eval_cer": 0.9216720470861803, - "eval_loss": 0.1600009799003601, - "eval_runtime": 119.1546, - "eval_samples_per_second": 16.785, - "eval_steps_per_second": 4.196, + "epoch": 0.01, + "eval_cer": 0.9204428878092871, + "eval_loss": 0.1756814867258072, + "eval_runtime": 120.0499, + "eval_samples_per_second": 16.66, + "eval_steps_per_second": 4.165, "step": 2000 }, { - "epoch": 0.02, - "learning_rate": 0.0002967389188136803, - "loss": 0.2216, + "epoch": 0.01, + "learning_rate": 0.00029805404777425657, + "loss": 0.2146, "step": 2010 }, { - "epoch": 0.02, - "learning_rate": 0.00029672269452917123, - "loss": 0.203, + "epoch": 0.01, + "learning_rate": 0.00029804436641989965, + "loss": 0.2262, "step": 2020 }, { - "epoch": 0.02, - "learning_rate": 0.0002967064702446622, - "loss": 0.2086, + "epoch": 0.01, + "learning_rate": 0.00029803468506554273, + "loss": 0.2296, "step": 2030 }, { - "epoch": 0.02, - "learning_rate": 0.00029669024596015313, - "loss": 0.1961, + "epoch": 0.01, + "learning_rate": 0.0002980250037111858, + "loss": 0.2168, "step": 2040 }, { - "epoch": 0.02, - "learning_rate": 0.00029667402167564405, - "loss": 0.2146, + "epoch": 0.01, + "learning_rate": 0.0002980153223568289, + "loss": 0.2247, "step": 2050 }, { - "epoch": 0.02, - "learning_rate": 0.00029665779739113503, - "loss": 0.2089, + "epoch": 0.01, + "learning_rate": 0.00029800564100247197, + "loss": 0.2219, "step": 2060 }, { - "epoch": 0.02, - "learning_rate": 0.00029664157310662595, - "loss": 0.1928, + "epoch": 0.01, + "learning_rate": 0.000297995959648115, + "loss": 0.2259, "step": 2070 }, { - "epoch": 0.02, - "learning_rate": 0.00029662534882211693, - "loss": 0.1947, + "epoch": 0.01, + "learning_rate": 0.0002979862782937581, + "loss": 0.2176, "step": 2080 }, { - "epoch": 0.02, - "learning_rate": 0.00029660912453760785, - "loss": 0.2021, + "epoch": 0.01, + "learning_rate": 0.00029797659693940116, + "loss": 0.22, "step": 2090 }, { - "epoch": 0.02, - "learning_rate": 0.0002965929002530988, - "loss": 0.1977, + "epoch": 0.01, + "learning_rate": 0.00029796691558504424, + "loss": 0.2176, "step": 2100 }, { - "epoch": 0.02, - "learning_rate": 0.00029657667596858975, - "loss": 0.2073, + "epoch": 0.01, + "learning_rate": 0.0002979572342306873, + "loss": 0.2179, "step": 2110 }, { - "epoch": 0.02, - "learning_rate": 0.0002965604516840807, - "loss": 0.2137, + "epoch": 0.01, + "learning_rate": 0.00029794755287633034, + "loss": 0.2146, "step": 2120 }, { - "epoch": 0.02, - "learning_rate": 0.00029654422739957165, - "loss": 0.2106, + "epoch": 0.01, + "learning_rate": 0.0002979378715219734, + "loss": 0.2029, "step": 2130 }, { - "epoch": 0.02, - "learning_rate": 0.0002965280031150626, - "loss": 0.1959, + "epoch": 0.01, + "learning_rate": 0.0002979281901676165, + "loss": 0.2322, "step": 2140 }, { - "epoch": 0.02, - "learning_rate": 0.00029651177883055355, - "loss": 0.2013, + "epoch": 0.01, + "learning_rate": 0.0002979185088132595, + "loss": 0.2138, "step": 2150 }, { - "epoch": 0.02, - "learning_rate": 0.0002964955545460445, - "loss": 0.1952, + "epoch": 0.01, + "learning_rate": 0.0002979088274589026, + "loss": 0.2083, "step": 2160 }, { - "epoch": 0.02, - "learning_rate": 0.00029647933026153545, - "loss": 0.2103, + "epoch": 0.01, + "learning_rate": 0.0002978991461045457, + "loss": 0.2172, "step": 2170 }, { - "epoch": 0.02, - "learning_rate": 0.0002964631059770264, - "loss": 0.2022, + "epoch": 0.01, + "learning_rate": 0.00029788946475018877, + "loss": 0.2299, "step": 2180 }, { - "epoch": 0.02, - "learning_rate": 0.00029644688169251735, - "loss": 0.1931, + "epoch": 0.01, + "learning_rate": 0.00029787978339583185, + "loss": 0.2178, "step": 2190 }, { - "epoch": 0.02, - "learning_rate": 0.00029643065740800827, - "loss": 0.2075, + "epoch": 0.01, + "learning_rate": 0.0002978701020414749, + "loss": 0.2136, "step": 2200 }, { - "epoch": 0.02, - "learning_rate": 0.00029641443312349925, - "loss": 0.1933, + "epoch": 0.01, + "learning_rate": 0.00029786042068711795, + "loss": 0.2081, "step": 2210 }, { - "epoch": 0.02, - "learning_rate": 0.00029639820883899017, - "loss": 0.1968, + "epoch": 0.01, + "learning_rate": 0.00029785073933276103, + "loss": 0.2113, "step": 2220 }, { - "epoch": 0.02, - "learning_rate": 0.00029638198455448115, - "loss": 0.1934, + "epoch": 0.01, + "learning_rate": 0.0002978410579784041, + "loss": 0.2195, "step": 2230 }, { - "epoch": 0.02, - "learning_rate": 0.00029636576026997207, - "loss": 0.2004, + "epoch": 0.01, + "learning_rate": 0.0002978313766240472, + "loss": 0.2239, "step": 2240 }, { - "epoch": 0.02, - "learning_rate": 0.000296349535985463, - "loss": 0.1861, + "epoch": 0.01, + "learning_rate": 0.0002978216952696902, + "loss": 0.2077, "step": 2250 }, { - "epoch": 0.02, - "learning_rate": 0.00029633331170095397, - "loss": 0.1867, + "epoch": 0.01, + "learning_rate": 0.0002978120139153333, + "loss": 0.2167, "step": 2260 }, { - "epoch": 0.02, - "learning_rate": 0.0002963170874164449, - "loss": 0.1855, + "epoch": 0.01, + "learning_rate": 0.0002978023325609764, + "loss": 0.2048, "step": 2270 }, { - "epoch": 0.02, - "learning_rate": 0.0002963008631319358, - "loss": 0.1826, + "epoch": 0.01, + "learning_rate": 0.0002977926512066194, + "loss": 0.2235, "step": 2280 }, { - "epoch": 0.02, - "learning_rate": 0.0002962846388474268, - "loss": 0.1958, + "epoch": 0.01, + "learning_rate": 0.0002977829698522625, + "loss": 0.2353, "step": 2290 }, { - "epoch": 0.02, - "learning_rate": 0.0002962684145629177, - "loss": 0.1922, + "epoch": 0.01, + "learning_rate": 0.00029777328849790556, + "loss": 0.2184, "step": 2300 }, { - "epoch": 0.02, - "learning_rate": 0.0002962521902784087, - "loss": 0.2032, + "epoch": 0.01, + "learning_rate": 0.00029776360714354864, + "loss": 0.2137, "step": 2310 }, { - "epoch": 0.03, - "learning_rate": 0.0002962359659938996, - "loss": 0.1878, + "epoch": 0.01, + "learning_rate": 0.0002977539257891917, + "loss": 0.2075, "step": 2320 }, { - "epoch": 0.03, - "learning_rate": 0.0002962197417093906, - "loss": 0.1884, + "epoch": 0.02, + "learning_rate": 0.0002977442444348348, + "loss": 0.1974, "step": 2330 }, { - "epoch": 0.03, - "learning_rate": 0.0002962035174248815, - "loss": 0.1922, + "epoch": 0.02, + "learning_rate": 0.0002977345630804779, + "loss": 0.1973, "step": 2340 }, { - "epoch": 0.03, - "learning_rate": 0.0002961872931403725, - "loss": 0.2, + "epoch": 0.02, + "learning_rate": 0.0002977248817261209, + "loss": 0.2029, "step": 2350 }, { - "epoch": 0.03, - "learning_rate": 0.00029617106885586347, - "loss": 0.1915, + "epoch": 0.02, + "learning_rate": 0.000297715200371764, + "loss": 0.2081, "step": 2360 }, { - "epoch": 0.03, - "learning_rate": 0.0002961548445713544, - "loss": 0.1799, + "epoch": 0.02, + "learning_rate": 0.00029770551901740707, + "loss": 0.217, "step": 2370 }, { - "epoch": 0.03, - "learning_rate": 0.0002961386202868453, - "loss": 0.1947, + "epoch": 0.02, + "learning_rate": 0.00029769583766305015, + "loss": 0.1976, "step": 2380 }, { - "epoch": 0.03, - "learning_rate": 0.0002961223960023363, - "loss": 0.1913, + "epoch": 0.02, + "learning_rate": 0.00029768615630869317, + "loss": 0.2072, "step": 2390 }, { - "epoch": 0.03, - "learning_rate": 0.0002961061717178272, - "loss": 0.1899, + "epoch": 0.02, + "learning_rate": 0.00029767647495433625, + "loss": 0.204, "step": 2400 }, { - "epoch": 0.03, - "learning_rate": 0.0002960899474333182, - "loss": 0.1886, + "epoch": 0.02, + "learning_rate": 0.00029766679359997933, + "loss": 0.2068, "step": 2410 }, { - "epoch": 0.03, - "learning_rate": 0.0002960737231488091, - "loss": 0.1916, + "epoch": 0.02, + "learning_rate": 0.00029765711224562236, + "loss": 0.1977, "step": 2420 }, { - "epoch": 0.03, - "learning_rate": 0.00029605749886430004, - "loss": 0.1766, + "epoch": 0.02, + "learning_rate": 0.00029764743089126544, + "loss": 0.2093, "step": 2430 }, { - "epoch": 0.03, - "learning_rate": 0.000296041274579791, - "loss": 0.1862, + "epoch": 0.02, + "learning_rate": 0.0002976377495369085, + "loss": 0.2053, "step": 2440 }, { - "epoch": 0.03, - "learning_rate": 0.00029602505029528194, - "loss": 0.1891, + "epoch": 0.02, + "learning_rate": 0.0002976280681825516, + "loss": 0.2134, "step": 2450 }, { - "epoch": 0.03, - "learning_rate": 0.0002960088260107729, - "loss": 0.1748, + "epoch": 0.02, + "learning_rate": 0.0002976183868281947, + "loss": 0.2036, "step": 2460 }, { - "epoch": 0.03, - "learning_rate": 0.00029599260172626384, - "loss": 0.1955, + "epoch": 0.02, + "learning_rate": 0.00029760870547383775, + "loss": 0.2059, "step": 2470 }, { - "epoch": 0.03, - "learning_rate": 0.0002959763774417548, - "loss": 0.1953, + "epoch": 0.02, + "learning_rate": 0.00029759902411948083, + "loss": 0.202, "step": 2480 }, { - "epoch": 0.03, - "learning_rate": 0.00029596015315724573, - "loss": 0.1923, + "epoch": 0.02, + "learning_rate": 0.00029758934276512386, + "loss": 0.1888, "step": 2490 }, { - "epoch": 0.03, - "learning_rate": 0.0002959439288727367, - "loss": 0.2023, + "epoch": 0.02, + "learning_rate": 0.00029757966141076694, + "loss": 0.2163, "step": 2500 }, { - "epoch": 0.03, - "learning_rate": 0.00029592770458822763, - "loss": 0.1891, + "epoch": 0.02, + "learning_rate": 0.00029756998005641, + "loss": 0.2155, "step": 2510 }, { - "epoch": 0.03, - "learning_rate": 0.0002959114803037186, - "loss": 0.1932, + "epoch": 0.02, + "learning_rate": 0.00029756029870205305, + "loss": 0.1994, "step": 2520 }, { - "epoch": 0.03, - "learning_rate": 0.00029589525601920953, - "loss": 0.1976, + "epoch": 0.02, + "learning_rate": 0.0002975506173476961, + "loss": 0.2103, "step": 2530 }, { - "epoch": 0.03, - "learning_rate": 0.0002958790317347005, - "loss": 0.1918, + "epoch": 0.02, + "learning_rate": 0.0002975409359933392, + "loss": 0.2211, "step": 2540 }, { - "epoch": 0.03, - "learning_rate": 0.00029586280745019143, - "loss": 0.1831, + "epoch": 0.02, + "learning_rate": 0.0002975312546389823, + "loss": 0.2132, "step": 2550 }, { - "epoch": 0.03, - "learning_rate": 0.00029584658316568236, - "loss": 0.18, + "epoch": 0.02, + "learning_rate": 0.0002975215732846253, + "loss": 0.2035, "step": 2560 }, { - "epoch": 0.03, - "learning_rate": 0.00029583035888117333, - "loss": 0.1834, + "epoch": 0.02, + "learning_rate": 0.0002975118919302684, + "loss": 0.2082, "step": 2570 }, { - "epoch": 0.03, - "learning_rate": 0.00029581413459666426, - "loss": 0.1782, + "epoch": 0.02, + "learning_rate": 0.00029750221057591147, + "loss": 0.2018, "step": 2580 }, { - "epoch": 0.03, - "learning_rate": 0.00029579791031215523, - "loss": 0.1796, + "epoch": 0.02, + "learning_rate": 0.00029749252922155455, + "loss": 0.197, "step": 2590 }, { - "epoch": 0.03, - "learning_rate": 0.00029578168602764616, - "loss": 0.1826, + "epoch": 0.02, + "learning_rate": 0.00029748284786719763, + "loss": 0.1911, "step": 2600 }, { - "epoch": 0.03, - "learning_rate": 0.0002957654617431371, - "loss": 0.1834, + "epoch": 0.02, + "learning_rate": 0.0002974731665128407, + "loss": 0.1997, "step": 2610 }, { - "epoch": 0.03, - "learning_rate": 0.00029574923745862805, - "loss": 0.1868, + "epoch": 0.02, + "learning_rate": 0.00029746348515848373, + "loss": 0.203, "step": 2620 }, { - "epoch": 0.03, - "learning_rate": 0.000295733013174119, - "loss": 0.1914, + "epoch": 0.02, + "learning_rate": 0.0002974538038041268, + "loss": 0.2004, "step": 2630 }, { - "epoch": 0.03, - "learning_rate": 0.00029571678888960995, - "loss": 0.1823, + "epoch": 0.02, + "learning_rate": 0.0002974441224497699, + "loss": 0.1991, "step": 2640 }, { - "epoch": 0.03, - "learning_rate": 0.0002957005646051009, - "loss": 0.1904, + "epoch": 0.02, + "learning_rate": 0.0002974344410954129, + "loss": 0.1913, "step": 2650 }, { - "epoch": 0.03, - "learning_rate": 0.00029568434032059185, - "loss": 0.1919, + "epoch": 0.02, + "learning_rate": 0.000297424759741056, + "loss": 0.1939, "step": 2660 }, { - "epoch": 0.03, - "learning_rate": 0.0002956681160360828, - "loss": 0.1829, + "epoch": 0.02, + "learning_rate": 0.0002974150783866991, + "loss": 0.2052, "step": 2670 }, { - "epoch": 0.03, - "learning_rate": 0.00029565189175157375, - "loss": 0.178, + "epoch": 0.02, + "learning_rate": 0.00029740539703234216, + "loss": 0.1933, "step": 2680 }, { - "epoch": 0.03, - "learning_rate": 0.0002956356674670647, - "loss": 0.179, + "epoch": 0.02, + "learning_rate": 0.00029739571567798524, + "loss": 0.2108, "step": 2690 }, { - "epoch": 0.03, - "learning_rate": 0.00029561944318255565, - "loss": 0.1911, + "epoch": 0.02, + "learning_rate": 0.00029738603432362826, + "loss": 0.2009, "step": 2700 }, { - "epoch": 0.03, - "learning_rate": 0.0002956032188980466, - "loss": 0.1788, + "epoch": 0.02, + "learning_rate": 0.00029737635296927134, + "loss": 0.1924, "step": 2710 }, { - "epoch": 0.03, - "learning_rate": 0.00029558699461353755, - "loss": 0.1838, + "epoch": 0.02, + "learning_rate": 0.0002973666716149144, + "loss": 0.1862, "step": 2720 }, { - "epoch": 0.03, - "learning_rate": 0.0002955707703290285, - "loss": 0.1755, + "epoch": 0.02, + "learning_rate": 0.0002973569902605575, + "loss": 0.1983, "step": 2730 }, { - "epoch": 0.03, - "learning_rate": 0.0002955545460445194, - "loss": 0.1816, + "epoch": 0.02, + "learning_rate": 0.0002973473089062006, + "loss": 0.1993, "step": 2740 }, { - "epoch": 0.03, - "learning_rate": 0.0002955383217600104, - "loss": 0.1721, + "epoch": 0.02, + "learning_rate": 0.00029733762755184366, + "loss": 0.1986, "step": 2750 }, { - "epoch": 0.03, - "learning_rate": 0.0002955220974755013, - "loss": 0.1712, + "epoch": 0.02, + "learning_rate": 0.0002973279461974867, + "loss": 0.2015, "step": 2760 }, { - "epoch": 0.03, - "learning_rate": 0.0002955058731909923, - "loss": 0.1711, + "epoch": 0.02, + "learning_rate": 0.00029731826484312977, + "loss": 0.2058, "step": 2770 }, { - "epoch": 0.03, - "learning_rate": 0.0002954896489064832, - "loss": 0.1705, + "epoch": 0.02, + "learning_rate": 0.00029730858348877285, + "loss": 0.2012, "step": 2780 }, { - "epoch": 0.03, - "learning_rate": 0.0002954734246219741, - "loss": 0.1892, + "epoch": 0.02, + "learning_rate": 0.0002972989021344159, + "loss": 0.2021, "step": 2790 }, { - "epoch": 0.03, - "learning_rate": 0.0002954572003374651, - "loss": 0.1811, + "epoch": 0.02, + "learning_rate": 0.00029728922078005895, + "loss": 0.1987, "step": 2800 }, { - "epoch": 0.03, - "learning_rate": 0.000295440976052956, - "loss": 0.1793, + "epoch": 0.02, + "learning_rate": 0.00029727953942570203, + "loss": 0.1999, "step": 2810 }, { - "epoch": 0.03, - "learning_rate": 0.000295424751768447, - "loss": 0.1837, + "epoch": 0.02, + "learning_rate": 0.0002972698580713451, + "loss": 0.1976, "step": 2820 }, { - "epoch": 0.03, - "learning_rate": 0.0002954085274839379, - "loss": 0.166, + "epoch": 0.02, + "learning_rate": 0.0002972601767169882, + "loss": 0.2014, "step": 2830 }, { - "epoch": 0.03, - "learning_rate": 0.0002953923031994289, - "loss": 0.186, + "epoch": 0.02, + "learning_rate": 0.0002972504953626312, + "loss": 0.1955, "step": 2840 }, { - "epoch": 0.03, - "learning_rate": 0.0002953760789149198, - "loss": 0.1791, + "epoch": 0.02, + "learning_rate": 0.0002972408140082743, + "loss": 0.216, "step": 2850 }, { - "epoch": 0.03, - "learning_rate": 0.0002953598546304108, - "loss": 0.1692, + "epoch": 0.02, + "learning_rate": 0.0002972311326539174, + "loss": 0.2178, "step": 2860 }, { - "epoch": 0.03, - "learning_rate": 0.0002953436303459017, - "loss": 0.1828, + "epoch": 0.02, + "learning_rate": 0.00029722145129956046, + "loss": 0.1887, "step": 2870 }, { - "epoch": 0.03, - "learning_rate": 0.0002953274060613927, - "loss": 0.1965, + "epoch": 0.02, + "learning_rate": 0.00029721176994520354, + "loss": 0.1936, "step": 2880 }, { - "epoch": 0.03, - "learning_rate": 0.0002953111817768836, - "loss": 0.1773, + "epoch": 0.02, + "learning_rate": 0.00029720208859084656, + "loss": 0.1834, "step": 2890 }, { - "epoch": 0.03, - "learning_rate": 0.0002952949574923746, - "loss": 0.1762, + "epoch": 0.02, + "learning_rate": 0.00029719240723648964, + "loss": 0.1873, "step": 2900 }, { - "epoch": 0.03, - "learning_rate": 0.0002952787332078655, - "loss": 0.1918, + "epoch": 0.02, + "learning_rate": 0.0002971827258821327, + "loss": 0.2133, "step": 2910 }, { - "epoch": 0.03, - "learning_rate": 0.0002952625089233565, - "loss": 0.1681, + "epoch": 0.02, + "learning_rate": 0.00029717304452777575, + "loss": 0.1958, "step": 2920 }, { - "epoch": 0.03, - "learning_rate": 0.0002952462846388474, - "loss": 0.1789, + "epoch": 0.02, + "learning_rate": 0.00029716336317341883, + "loss": 0.1991, "step": 2930 }, { - "epoch": 0.03, - "learning_rate": 0.00029523006035433834, - "loss": 0.1761, + "epoch": 0.02, + "learning_rate": 0.0002971536818190619, + "loss": 0.188, "step": 2940 }, { - "epoch": 0.03, - "learning_rate": 0.0002952138360698293, - "loss": 0.1701, + "epoch": 0.02, + "learning_rate": 0.000297144000464705, + "loss": 0.1802, "step": 2950 }, { - "epoch": 0.03, - "learning_rate": 0.00029519761178532024, - "loss": 0.1794, + "epoch": 0.02, + "learning_rate": 0.00029713431911034807, + "loss": 0.1936, "step": 2960 }, { - "epoch": 0.03, - "learning_rate": 0.00029518138750081116, - "loss": 0.1743, + "epoch": 0.02, + "learning_rate": 0.00029712463775599115, + "loss": 0.1866, "step": 2970 }, { - "epoch": 0.03, - "learning_rate": 0.00029516516321630214, - "loss": 0.1711, + "epoch": 0.02, + "learning_rate": 0.0002971149564016342, + "loss": 0.1826, "step": 2980 }, { - "epoch": 0.03, - "learning_rate": 0.00029514893893179306, - "loss": 0.1774, + "epoch": 0.02, + "learning_rate": 0.00029710527504727725, + "loss": 0.196, "step": 2990 }, { - "epoch": 0.03, - "learning_rate": 0.00029513271464728404, - "loss": 0.171, + "epoch": 0.02, + "learning_rate": 0.00029709559369292033, + "loss": 0.1929, "step": 3000 }, { - "epoch": 0.03, - "eval_cer": 0.9216702801175387, - "eval_loss": 0.12727852165699005, - "eval_runtime": 119.2199, - "eval_samples_per_second": 16.776, - "eval_steps_per_second": 4.194, + "epoch": 0.02, + "eval_cer": 0.9204690995367755, + "eval_loss": 0.14816394448280334, + "eval_runtime": 120.365, + "eval_samples_per_second": 16.616, + "eval_steps_per_second": 4.154, "step": 3000 }, { - "epoch": 0.03, - "learning_rate": 0.00029511649036277496, - "loss": 0.1785, + "epoch": 0.02, + "learning_rate": 0.0002970859123385634, + "loss": 0.1944, "step": 3010 }, { - "epoch": 0.03, - "learning_rate": 0.00029510026607826594, - "loss": 0.166, + "epoch": 0.02, + "learning_rate": 0.00029707623098420644, + "loss": 0.1924, "step": 3020 }, { - "epoch": 0.03, - "learning_rate": 0.00029508404179375686, - "loss": 0.163, + "epoch": 0.02, + "learning_rate": 0.0002970665496298495, + "loss": 0.1789, "step": 3030 }, { - "epoch": 0.03, - "learning_rate": 0.00029506781750924784, - "loss": 0.1605, + "epoch": 0.02, + "learning_rate": 0.0002970568682754926, + "loss": 0.1865, "step": 3040 }, { - "epoch": 0.03, - "learning_rate": 0.00029505159322473876, - "loss": 0.1705, + "epoch": 0.02, + "learning_rate": 0.0002970471869211356, + "loss": 0.1836, "step": 3050 }, { - "epoch": 0.03, - "learning_rate": 0.00029503536894022974, - "loss": 0.1834, + "epoch": 0.02, + "learning_rate": 0.0002970375055667787, + "loss": 0.2035, "step": 3060 }, { - "epoch": 0.03, - "learning_rate": 0.00029501914465572066, - "loss": 0.1673, + "epoch": 0.02, + "learning_rate": 0.0002970278242124218, + "loss": 0.1871, "step": 3070 }, { - "epoch": 0.03, - "learning_rate": 0.00029500292037121164, - "loss": 0.1631, + "epoch": 0.02, + "learning_rate": 0.00029701814285806486, + "loss": 0.1853, "step": 3080 }, { - "epoch": 0.03, - "learning_rate": 0.00029498669608670256, - "loss": 0.159, + "epoch": 0.02, + "learning_rate": 0.00029700846150370794, + "loss": 0.1796, "step": 3090 }, { - "epoch": 0.03, - "learning_rate": 0.00029497047180219354, - "loss": 0.1694, + "epoch": 0.02, + "learning_rate": 0.000296998780149351, + "loss": 0.1727, "step": 3100 }, { - "epoch": 0.03, - "learning_rate": 0.00029495424751768446, - "loss": 0.1719, + "epoch": 0.02, + "learning_rate": 0.0002969890987949941, + "loss": 0.1846, "step": 3110 }, { - "epoch": 0.03, - "learning_rate": 0.0002949380232331754, - "loss": 0.1762, + "epoch": 0.02, + "learning_rate": 0.00029697941744063713, + "loss": 0.1907, "step": 3120 }, { - "epoch": 0.03, - "learning_rate": 0.00029492179894866636, - "loss": 0.1703, + "epoch": 0.02, + "learning_rate": 0.0002969697360862802, + "loss": 0.189, "step": 3130 }, { - "epoch": 0.03, - "learning_rate": 0.0002949055746641573, - "loss": 0.1693, + "epoch": 0.02, + "learning_rate": 0.0002969600547319233, + "loss": 0.185, "step": 3140 }, { - "epoch": 0.03, - "learning_rate": 0.0002948893503796482, - "loss": 0.1753, + "epoch": 0.02, + "learning_rate": 0.00029695037337756637, + "loss": 0.192, "step": 3150 }, { - "epoch": 0.03, - "learning_rate": 0.0002948731260951392, - "loss": 0.1697, + "epoch": 0.02, + "learning_rate": 0.0002969406920232094, + "loss": 0.1885, "step": 3160 }, { - "epoch": 0.03, - "learning_rate": 0.0002948569018106301, - "loss": 0.17, + "epoch": 0.02, + "learning_rate": 0.0002969310106688525, + "loss": 0.1976, "step": 3170 }, { - "epoch": 0.03, - "learning_rate": 0.0002948406775261211, - "loss": 0.1839, + "epoch": 0.02, + "learning_rate": 0.00029692132931449555, + "loss": 0.194, "step": 3180 }, { - "epoch": 0.03, - "learning_rate": 0.000294824453241612, - "loss": 0.1913, + "epoch": 0.02, + "learning_rate": 0.0002969116479601386, + "loss": 0.1877, "step": 3190 }, { - "epoch": 0.03, - "learning_rate": 0.000294808228957103, - "loss": 0.1606, + "epoch": 0.02, + "learning_rate": 0.00029690196660578166, + "loss": 0.1863, "step": 3200 }, { - "epoch": 0.03, - "learning_rate": 0.0002947920046725939, - "loss": 0.1748, + "epoch": 0.02, + "learning_rate": 0.00029689228525142474, + "loss": 0.192, "step": 3210 }, { - "epoch": 0.03, - "learning_rate": 0.0002947757803880849, - "loss": 0.1757, + "epoch": 0.02, + "learning_rate": 0.0002968826038970678, + "loss": 0.1788, "step": 3220 }, { - "epoch": 0.03, - "learning_rate": 0.0002947595561035758, - "loss": 0.1719, + "epoch": 0.02, + "learning_rate": 0.0002968729225427109, + "loss": 0.174, "step": 3230 }, { - "epoch": 0.04, - "learning_rate": 0.0002947433318190668, - "loss": 0.1708, + "epoch": 0.02, + "learning_rate": 0.000296863241188354, + "loss": 0.1919, "step": 3240 }, { - "epoch": 0.04, - "learning_rate": 0.0002947271075345577, - "loss": 0.1648, + "epoch": 0.02, + "learning_rate": 0.00029685355983399706, + "loss": 0.181, "step": 3250 }, { - "epoch": 0.04, - "learning_rate": 0.0002947108832500487, - "loss": 0.1737, + "epoch": 0.02, + "learning_rate": 0.0002968438784796401, + "loss": 0.1869, "step": 3260 }, { - "epoch": 0.04, - "learning_rate": 0.0002946946589655396, - "loss": 0.1641, + "epoch": 0.02, + "learning_rate": 0.00029683419712528316, + "loss": 0.1874, "step": 3270 }, { - "epoch": 0.04, - "learning_rate": 0.0002946784346810306, - "loss": 0.1863, + "epoch": 0.02, + "learning_rate": 0.00029682451577092624, + "loss": 0.1993, "step": 3280 }, { - "epoch": 0.04, - "learning_rate": 0.0002946622103965215, - "loss": 0.1666, + "epoch": 0.02, + "learning_rate": 0.00029681483441656927, + "loss": 0.1709, "step": 3290 }, { - "epoch": 0.04, - "learning_rate": 0.0002946459861120124, - "loss": 0.1733, + "epoch": 0.02, + "learning_rate": 0.00029680515306221235, + "loss": 0.1963, "step": 3300 }, { - "epoch": 0.04, - "learning_rate": 0.0002946297618275034, - "loss": 0.1621, + "epoch": 0.02, + "learning_rate": 0.00029679547170785543, + "loss": 0.1749, "step": 3310 }, { - "epoch": 0.04, - "learning_rate": 0.0002946135375429943, - "loss": 0.1624, + "epoch": 0.02, + "learning_rate": 0.0002967857903534985, + "loss": 0.1753, "step": 3320 }, { - "epoch": 0.04, - "learning_rate": 0.00029459731325848524, - "loss": 0.1572, + "epoch": 0.02, + "learning_rate": 0.00029677610899914153, + "loss": 0.1761, "step": 3330 }, { - "epoch": 0.04, - "learning_rate": 0.0002945810889739762, - "loss": 0.1768, + "epoch": 0.02, + "learning_rate": 0.0002967664276447846, + "loss": 0.174, "step": 3340 }, { - "epoch": 0.04, - "learning_rate": 0.00029456486468946714, - "loss": 0.1717, + "epoch": 0.02, + "learning_rate": 0.0002967567462904277, + "loss": 0.1839, "step": 3350 }, { - "epoch": 0.04, - "learning_rate": 0.0002945486404049581, - "loss": 0.1659, + "epoch": 0.02, + "learning_rate": 0.00029674706493607077, + "loss": 0.187, "step": 3360 }, { - "epoch": 0.04, - "learning_rate": 0.00029453241612044904, - "loss": 0.1695, + "epoch": 0.02, + "learning_rate": 0.00029673738358171385, + "loss": 0.1938, "step": 3370 }, { - "epoch": 0.04, - "learning_rate": 0.00029451619183594, - "loss": 0.1708, + "epoch": 0.02, + "learning_rate": 0.00029672770222735693, + "loss": 0.1758, "step": 3380 }, { - "epoch": 0.04, - "learning_rate": 0.00029449996755143094, - "loss": 0.166, + "epoch": 0.02, + "learning_rate": 0.00029671802087299996, + "loss": 0.1819, "step": 3390 }, { - "epoch": 0.04, - "learning_rate": 0.0002944837432669219, - "loss": 0.1563, + "epoch": 0.02, + "learning_rate": 0.00029670833951864304, + "loss": 0.1855, "step": 3400 }, { - "epoch": 0.04, - "learning_rate": 0.00029446751898241284, - "loss": 0.1631, + "epoch": 0.02, + "learning_rate": 0.0002966986581642861, + "loss": 0.1851, "step": 3410 }, { - "epoch": 0.04, - "learning_rate": 0.0002944512946979038, - "loss": 0.1601, + "epoch": 0.02, + "learning_rate": 0.00029668897680992914, + "loss": 0.1934, "step": 3420 }, { - "epoch": 0.04, - "learning_rate": 0.00029443507041339474, - "loss": 0.1669, + "epoch": 0.02, + "learning_rate": 0.0002966792954555722, + "loss": 0.1875, "step": 3430 }, { - "epoch": 0.04, - "learning_rate": 0.0002944188461288857, - "loss": 0.1585, + "epoch": 0.02, + "learning_rate": 0.0002966696141012153, + "loss": 0.1727, "step": 3440 }, { - "epoch": 0.04, - "learning_rate": 0.00029440262184437664, - "loss": 0.1516, + "epoch": 0.02, + "learning_rate": 0.0002966599327468584, + "loss": 0.1789, "step": 3450 }, { - "epoch": 0.04, - "learning_rate": 0.0002943863975598676, - "loss": 0.169, + "epoch": 0.02, + "learning_rate": 0.0002966502513925014, + "loss": 0.1786, "step": 3460 }, { - "epoch": 0.04, - "learning_rate": 0.00029437017327535854, - "loss": 0.1698, + "epoch": 0.02, + "learning_rate": 0.0002966405700381445, + "loss": 0.1708, "step": 3470 }, { - "epoch": 0.04, - "learning_rate": 0.00029435394899084946, - "loss": 0.171, + "epoch": 0.02, + "learning_rate": 0.00029663088868378757, + "loss": 0.1784, "step": 3480 }, { - "epoch": 0.04, - "learning_rate": 0.00029433772470634044, - "loss": 0.1603, + "epoch": 0.02, + "learning_rate": 0.00029662120732943065, + "loss": 0.1866, "step": 3490 }, { - "epoch": 0.04, - "learning_rate": 0.00029432150042183136, - "loss": 0.1782, + "epoch": 0.02, + "learning_rate": 0.0002966115259750737, + "loss": 0.1944, "step": 3500 }, { - "epoch": 0.04, - "learning_rate": 0.0002943052761373223, - "loss": 0.1563, + "epoch": 0.02, + "learning_rate": 0.0002966018446207168, + "loss": 0.1765, "step": 3510 }, { - "epoch": 0.04, - "learning_rate": 0.00029428905185281326, - "loss": 0.1579, + "epoch": 0.02, + "learning_rate": 0.0002965921632663599, + "loss": 0.1748, "step": 3520 }, { - "epoch": 0.04, - "learning_rate": 0.0002942728275683042, - "loss": 0.1681, + "epoch": 0.02, + "learning_rate": 0.0002965824819120029, + "loss": 0.1763, "step": 3530 }, { - "epoch": 0.04, - "learning_rate": 0.00029425660328379516, - "loss": 0.1658, + "epoch": 0.02, + "learning_rate": 0.000296572800557646, + "loss": 0.1897, "step": 3540 }, { - "epoch": 0.04, - "learning_rate": 0.0002942403789992861, - "loss": 0.1671, + "epoch": 0.02, + "learning_rate": 0.00029656311920328907, + "loss": 0.1747, "step": 3550 }, { - "epoch": 0.04, - "learning_rate": 0.00029422415471477706, - "loss": 0.1589, + "epoch": 0.02, + "learning_rate": 0.0002965534378489321, + "loss": 0.1931, "step": 3560 }, { - "epoch": 0.04, - "learning_rate": 0.000294207930430268, - "loss": 0.1624, + "epoch": 0.02, + "learning_rate": 0.0002965437564945752, + "loss": 0.1789, "step": 3570 }, { - "epoch": 0.04, - "learning_rate": 0.00029419170614575896, - "loss": 0.1705, + "epoch": 0.02, + "learning_rate": 0.00029653407514021826, + "loss": 0.186, "step": 3580 }, { - "epoch": 0.04, - "learning_rate": 0.0002941754818612499, - "loss": 0.1586, + "epoch": 0.02, + "learning_rate": 0.00029652439378586134, + "loss": 0.1809, "step": 3590 }, { - "epoch": 0.04, - "learning_rate": 0.00029415925757674086, - "loss": 0.1525, + "epoch": 0.02, + "learning_rate": 0.00029651471243150436, + "loss": 0.1753, "step": 3600 }, { - "epoch": 0.04, - "learning_rate": 0.0002941430332922318, - "loss": 0.1637, + "epoch": 0.02, + "learning_rate": 0.00029650503107714744, + "loss": 0.1699, "step": 3610 }, { - "epoch": 0.04, - "learning_rate": 0.00029412680900772276, - "loss": 0.1619, + "epoch": 0.02, + "learning_rate": 0.0002964953497227905, + "loss": 0.1679, "step": 3620 }, { - "epoch": 0.04, - "learning_rate": 0.0002941105847232137, - "loss": 0.1533, + "epoch": 0.02, + "learning_rate": 0.0002964856683684336, + "loss": 0.1782, "step": 3630 }, { - "epoch": 0.04, - "learning_rate": 0.00029409436043870466, - "loss": 0.1549, + "epoch": 0.02, + "learning_rate": 0.0002964759870140767, + "loss": 0.1892, "step": 3640 }, { - "epoch": 0.04, - "learning_rate": 0.0002940781361541956, - "loss": 0.1531, + "epoch": 0.02, + "learning_rate": 0.00029646630565971976, + "loss": 0.1684, "step": 3650 }, { - "epoch": 0.04, - "learning_rate": 0.0002940619118696865, - "loss": 0.1524, + "epoch": 0.02, + "learning_rate": 0.0002964566243053628, + "loss": 0.1747, "step": 3660 }, { - "epoch": 0.04, - "learning_rate": 0.0002940456875851775, - "loss": 0.1554, + "epoch": 0.02, + "learning_rate": 0.00029644694295100587, + "loss": 0.1767, "step": 3670 }, { - "epoch": 0.04, - "learning_rate": 0.0002940294633006684, - "loss": 0.1508, + "epoch": 0.02, + "learning_rate": 0.00029643726159664895, + "loss": 0.1824, "step": 3680 }, { - "epoch": 0.04, - "learning_rate": 0.00029401323901615933, - "loss": 0.1555, + "epoch": 0.02, + "learning_rate": 0.00029642758024229197, + "loss": 0.1768, "step": 3690 }, { - "epoch": 0.04, - "learning_rate": 0.0002939970147316503, - "loss": 0.1608, + "epoch": 0.02, + "learning_rate": 0.00029641789888793505, + "loss": 0.1783, "step": 3700 }, { - "epoch": 0.04, - "learning_rate": 0.00029398079044714123, - "loss": 0.1555, + "epoch": 0.02, + "learning_rate": 0.00029640821753357813, + "loss": 0.1656, "step": 3710 }, { - "epoch": 0.04, - "learning_rate": 0.0002939645661626322, - "loss": 0.1636, + "epoch": 0.02, + "learning_rate": 0.0002963985361792212, + "loss": 0.1845, "step": 3720 }, { - "epoch": 0.04, - "learning_rate": 0.0002939483418781231, - "loss": 0.1571, + "epoch": 0.02, + "learning_rate": 0.0002963888548248643, + "loss": 0.1875, "step": 3730 }, { - "epoch": 0.04, - "learning_rate": 0.0002939321175936141, - "loss": 0.1531, + "epoch": 0.02, + "learning_rate": 0.0002963791734705073, + "loss": 0.1781, "step": 3740 }, { - "epoch": 0.04, - "learning_rate": 0.000293915893309105, - "loss": 0.1533, + "epoch": 0.02, + "learning_rate": 0.0002963694921161504, + "loss": 0.1837, "step": 3750 }, { - "epoch": 0.04, - "learning_rate": 0.000293899669024596, - "loss": 0.1546, + "epoch": 0.02, + "learning_rate": 0.0002963598107617935, + "loss": 0.1742, "step": 3760 }, { - "epoch": 0.04, - "learning_rate": 0.0002938834447400869, - "loss": 0.1473, + "epoch": 0.02, + "learning_rate": 0.00029635012940743656, + "loss": 0.175, "step": 3770 }, { - "epoch": 0.04, - "learning_rate": 0.0002938672204555779, - "loss": 0.1682, + "epoch": 0.02, + "learning_rate": 0.00029634044805307964, + "loss": 0.1749, "step": 3780 }, { - "epoch": 0.04, - "learning_rate": 0.0002938509961710688, - "loss": 0.1609, + "epoch": 0.02, + "learning_rate": 0.00029633076669872266, + "loss": 0.1729, "step": 3790 }, { - "epoch": 0.04, - "learning_rate": 0.0002938347718865598, - "loss": 0.1581, + "epoch": 0.02, + "learning_rate": 0.00029632108534436574, + "loss": 0.1797, "step": 3800 }, { - "epoch": 0.04, - "learning_rate": 0.0002938185476020507, - "loss": 0.1504, + "epoch": 0.02, + "learning_rate": 0.0002963114039900088, + "loss": 0.1908, "step": 3810 }, { - "epoch": 0.04, - "learning_rate": 0.0002938023233175417, - "loss": 0.1515, + "epoch": 0.02, + "learning_rate": 0.00029630172263565185, + "loss": 0.1965, "step": 3820 }, { - "epoch": 0.04, - "learning_rate": 0.0002937860990330326, - "loss": 0.153, + "epoch": 0.02, + "learning_rate": 0.0002962920412812949, + "loss": 0.1661, "step": 3830 }, { - "epoch": 0.04, - "learning_rate": 0.00029376987474852355, - "loss": 0.1567, + "epoch": 0.02, + "learning_rate": 0.000296282359926938, + "loss": 0.1709, "step": 3840 }, { - "epoch": 0.04, - "learning_rate": 0.0002937536504640145, - "loss": 0.1674, + "epoch": 0.02, + "learning_rate": 0.0002962726785725811, + "loss": 0.1792, "step": 3850 }, { - "epoch": 0.04, - "learning_rate": 0.00029373742617950545, - "loss": 0.1508, + "epoch": 0.02, + "learning_rate": 0.00029626299721822417, + "loss": 0.1721, "step": 3860 }, { - "epoch": 0.04, - "learning_rate": 0.00029372120189499637, - "loss": 0.1526, + "epoch": 0.02, + "learning_rate": 0.00029625331586386725, + "loss": 0.1671, "step": 3870 }, { - "epoch": 0.04, - "learning_rate": 0.00029370497761048735, - "loss": 0.1456, + "epoch": 0.03, + "learning_rate": 0.00029624363450951027, + "loss": 0.1652, "step": 3880 }, { - "epoch": 0.04, - "learning_rate": 0.00029368875332597827, - "loss": 0.1595, + "epoch": 0.03, + "learning_rate": 0.00029623395315515335, + "loss": 0.1718, "step": 3890 }, { - "epoch": 0.04, - "learning_rate": 0.00029367252904146925, - "loss": 0.1468, + "epoch": 0.03, + "learning_rate": 0.00029622427180079643, + "loss": 0.1702, "step": 3900 }, { - "epoch": 0.04, - "learning_rate": 0.00029365630475696017, - "loss": 0.1524, + "epoch": 0.03, + "learning_rate": 0.0002962145904464395, + "loss": 0.1709, "step": 3910 }, { - "epoch": 0.04, - "learning_rate": 0.00029364008047245115, - "loss": 0.1503, + "epoch": 0.03, + "learning_rate": 0.0002962049090920826, + "loss": 0.1673, "step": 3920 }, { - "epoch": 0.04, - "learning_rate": 0.00029362385618794207, - "loss": 0.1522, + "epoch": 0.03, + "learning_rate": 0.0002961952277377256, + "loss": 0.1748, "step": 3930 }, { - "epoch": 0.04, - "learning_rate": 0.00029360763190343304, - "loss": 0.1531, + "epoch": 0.03, + "learning_rate": 0.0002961855463833687, + "loss": 0.1646, "step": 3940 }, { - "epoch": 0.04, - "learning_rate": 0.00029359140761892397, - "loss": 0.1572, + "epoch": 0.03, + "learning_rate": 0.0002961758650290118, + "loss": 0.1815, "step": 3950 }, { - "epoch": 0.04, - "learning_rate": 0.00029357518333441494, - "loss": 0.163, + "epoch": 0.03, + "learning_rate": 0.0002961661836746548, + "loss": 0.1857, "step": 3960 }, { - "epoch": 0.04, - "learning_rate": 0.00029355895904990587, - "loss": 0.1553, + "epoch": 0.03, + "learning_rate": 0.0002961565023202979, + "loss": 0.1643, "step": 3970 }, { - "epoch": 0.04, - "learning_rate": 0.00029354273476539684, - "loss": 0.1557, + "epoch": 0.03, + "learning_rate": 0.00029614682096594096, + "loss": 0.1717, "step": 3980 }, { - "epoch": 0.04, - "learning_rate": 0.00029352651048088777, - "loss": 0.1667, + "epoch": 0.03, + "learning_rate": 0.00029613713961158404, + "loss": 0.1698, "step": 3990 }, { - "epoch": 0.04, - "learning_rate": 0.00029351028619637874, - "loss": 0.1586, + "epoch": 0.03, + "learning_rate": 0.0002961274582572271, + "loss": 0.1686, "step": 4000 }, { - "epoch": 0.04, - "eval_cer": 0.9215642619990423, - "eval_loss": 0.11099084466695786, - "eval_runtime": 119.2379, - "eval_samples_per_second": 16.773, - "eval_steps_per_second": 4.193, + "epoch": 0.03, + "eval_cer": 0.9202214439046436, + "eval_loss": 0.13143764436244965, + "eval_runtime": 120.5794, + "eval_samples_per_second": 16.587, + "eval_steps_per_second": 4.147, "step": 4000 }, { - "epoch": 0.04, - "learning_rate": 0.00029349406191186967, - "loss": 0.1511, + "epoch": 0.03, + "learning_rate": 0.0002961177769028702, + "loss": 0.1757, "step": 4010 }, { - "epoch": 0.04, - "learning_rate": 0.0002934778376273606, - "loss": 0.1578, + "epoch": 0.03, + "learning_rate": 0.0002961080955485132, + "loss": 0.1865, "step": 4020 }, { - "epoch": 0.04, - "learning_rate": 0.00029346161334285157, - "loss": 0.1567, + "epoch": 0.03, + "learning_rate": 0.0002960984141941563, + "loss": 0.1712, "step": 4030 }, { - "epoch": 0.04, - "learning_rate": 0.0002934453890583425, - "loss": 0.1457, + "epoch": 0.03, + "learning_rate": 0.0002960887328397994, + "loss": 0.1643, "step": 4040 }, { - "epoch": 0.04, - "learning_rate": 0.0002934291647738334, - "loss": 0.1553, + "epoch": 0.03, + "learning_rate": 0.00029607905148544246, + "loss": 0.1675, "step": 4050 }, { - "epoch": 0.04, - "learning_rate": 0.0002934129404893244, - "loss": 0.1615, + "epoch": 0.03, + "learning_rate": 0.0002960693701310855, + "loss": 0.1717, "step": 4060 }, { - "epoch": 0.04, - "learning_rate": 0.0002933967162048153, - "loss": 0.1486, + "epoch": 0.03, + "learning_rate": 0.00029605968877672857, + "loss": 0.1708, "step": 4070 }, { - "epoch": 0.04, - "learning_rate": 0.0002933804919203063, - "loss": 0.1624, + "epoch": 0.03, + "learning_rate": 0.00029605000742237165, + "loss": 0.1727, "step": 4080 }, { - "epoch": 0.04, - "learning_rate": 0.0002933642676357972, - "loss": 0.1493, + "epoch": 0.03, + "learning_rate": 0.0002960403260680147, + "loss": 0.1726, "step": 4090 }, { - "epoch": 0.04, - "learning_rate": 0.0002933480433512882, - "loss": 0.152, + "epoch": 0.03, + "learning_rate": 0.00029603064471365776, + "loss": 0.1588, "step": 4100 }, { - "epoch": 0.04, - "learning_rate": 0.0002933318190667791, - "loss": 0.1416, + "epoch": 0.03, + "learning_rate": 0.00029602096335930083, + "loss": 0.168, "step": 4110 }, { - "epoch": 0.04, - "learning_rate": 0.0002933155947822701, - "loss": 0.158, + "epoch": 0.03, + "learning_rate": 0.0002960112820049439, + "loss": 0.1642, "step": 4120 }, { - "epoch": 0.04, - "learning_rate": 0.000293299370497761, - "loss": 0.1511, + "epoch": 0.03, + "learning_rate": 0.000296001600650587, + "loss": 0.1704, "step": 4130 }, { - "epoch": 0.04, - "learning_rate": 0.000293283146213252, - "loss": 0.1563, + "epoch": 0.03, + "learning_rate": 0.0002959919192962301, + "loss": 0.163, "step": 4140 }, { - "epoch": 0.04, - "learning_rate": 0.0002932669219287429, - "loss": 0.1531, + "epoch": 0.03, + "learning_rate": 0.00029598223794187315, + "loss": 0.1668, "step": 4150 }, { - "epoch": 0.04, - "learning_rate": 0.0002932506976442339, - "loss": 0.1378, + "epoch": 0.03, + "learning_rate": 0.0002959725565875162, + "loss": 0.1732, "step": 4160 }, { - "epoch": 0.05, - "learning_rate": 0.0002932344733597248, - "loss": 0.1406, + "epoch": 0.03, + "learning_rate": 0.00029596287523315926, + "loss": 0.1665, "step": 4170 }, { - "epoch": 0.05, - "learning_rate": 0.0002932182490752158, - "loss": 0.1485, + "epoch": 0.03, + "learning_rate": 0.00029595319387880234, + "loss": 0.1528, "step": 4180 }, { - "epoch": 0.05, - "learning_rate": 0.0002932020247907067, - "loss": 0.1451, + "epoch": 0.03, + "learning_rate": 0.00029594351252444536, + "loss": 0.1749, "step": 4190 }, { - "epoch": 0.05, - "learning_rate": 0.00029318580050619763, - "loss": 0.1501, + "epoch": 0.03, + "learning_rate": 0.00029593383117008844, + "loss": 0.1748, "step": 4200 }, { - "epoch": 0.05, - "learning_rate": 0.0002931695762216886, - "loss": 0.1463, + "epoch": 0.03, + "learning_rate": 0.0002959241498157315, + "loss": 0.1636, "step": 4210 }, { - "epoch": 0.05, - "learning_rate": 0.00029315335193717953, - "loss": 0.154, + "epoch": 0.03, + "learning_rate": 0.0002959144684613746, + "loss": 0.1548, "step": 4220 }, { - "epoch": 0.05, - "learning_rate": 0.00029313712765267045, - "loss": 0.1575, + "epoch": 0.03, + "learning_rate": 0.00029590478710701763, + "loss": 0.1783, "step": 4230 }, { - "epoch": 0.05, - "learning_rate": 0.00029312090336816143, - "loss": 0.1424, + "epoch": 0.03, + "learning_rate": 0.0002958951057526607, + "loss": 0.1676, "step": 4240 }, { - "epoch": 0.05, - "learning_rate": 0.00029310467908365235, - "loss": 0.143, + "epoch": 0.03, + "learning_rate": 0.0002958854243983038, + "loss": 0.1716, "step": 4250 }, { - "epoch": 0.05, - "learning_rate": 0.00029308845479914333, - "loss": 0.1451, + "epoch": 0.03, + "learning_rate": 0.00029587574304394687, + "loss": 0.1813, "step": 4260 }, { - "epoch": 0.05, - "learning_rate": 0.00029307223051463425, - "loss": 0.1514, + "epoch": 0.03, + "learning_rate": 0.00029586606168958995, + "loss": 0.177, "step": 4270 }, { - "epoch": 0.05, - "learning_rate": 0.00029305600623012523, - "loss": 0.1468, + "epoch": 0.03, + "learning_rate": 0.00029585638033523303, + "loss": 0.1679, "step": 4280 }, { - "epoch": 0.05, - "learning_rate": 0.00029303978194561615, - "loss": 0.1588, + "epoch": 0.03, + "learning_rate": 0.0002958466989808761, + "loss": 0.1675, "step": 4290 }, { - "epoch": 0.05, - "learning_rate": 0.00029302355766110713, - "loss": 0.1573, + "epoch": 0.03, + "learning_rate": 0.00029583701762651913, + "loss": 0.1704, "step": 4300 }, { - "epoch": 0.05, - "learning_rate": 0.00029300733337659805, - "loss": 0.1447, + "epoch": 0.03, + "learning_rate": 0.0002958273362721622, + "loss": 0.1601, "step": 4310 }, { - "epoch": 0.05, - "learning_rate": 0.00029299110909208903, - "loss": 0.1515, + "epoch": 0.03, + "learning_rate": 0.0002958176549178053, + "loss": 0.1704, "step": 4320 }, { - "epoch": 0.05, - "learning_rate": 0.00029297488480757995, - "loss": 0.1573, + "epoch": 0.03, + "learning_rate": 0.0002958079735634483, + "loss": 0.1524, "step": 4330 }, { - "epoch": 0.05, - "learning_rate": 0.00029295866052307093, - "loss": 0.1429, + "epoch": 0.03, + "learning_rate": 0.0002957982922090914, + "loss": 0.1649, "step": 4340 }, { - "epoch": 0.05, - "learning_rate": 0.00029294243623856185, - "loss": 0.1429, + "epoch": 0.03, + "learning_rate": 0.0002957886108547345, + "loss": 0.1678, "step": 4350 }, { - "epoch": 0.05, - "learning_rate": 0.0002929262119540528, - "loss": 0.1497, + "epoch": 0.03, + "learning_rate": 0.00029577892950037756, + "loss": 0.165, "step": 4360 }, { - "epoch": 0.05, - "learning_rate": 0.00029290998766954375, - "loss": 0.1399, + "epoch": 0.03, + "learning_rate": 0.0002957692481460206, + "loss": 0.1678, "step": 4370 }, { - "epoch": 0.05, - "learning_rate": 0.00029289376338503467, - "loss": 0.1526, + "epoch": 0.03, + "learning_rate": 0.00029575956679166366, + "loss": 0.1698, "step": 4380 }, { - "epoch": 0.05, - "learning_rate": 0.00029287753910052565, - "loss": 0.156, + "epoch": 0.03, + "learning_rate": 0.00029574988543730674, + "loss": 0.1609, "step": 4390 }, { - "epoch": 0.05, - "learning_rate": 0.00029286131481601657, - "loss": 0.1367, + "epoch": 0.03, + "learning_rate": 0.0002957402040829498, + "loss": 0.1747, "step": 4400 }, { - "epoch": 0.05, - "learning_rate": 0.0002928450905315075, - "loss": 0.1368, + "epoch": 0.03, + "learning_rate": 0.0002957305227285929, + "loss": 0.1796, "step": 4410 }, { - "epoch": 0.05, - "learning_rate": 0.00029282886624699847, - "loss": 0.153, + "epoch": 0.03, + "learning_rate": 0.000295720841374236, + "loss": 0.1647, "step": 4420 }, { - "epoch": 0.05, - "learning_rate": 0.0002928126419624894, - "loss": 0.1457, + "epoch": 0.03, + "learning_rate": 0.000295711160019879, + "loss": 0.1547, "step": 4430 }, { - "epoch": 0.05, - "learning_rate": 0.00029279641767798037, - "loss": 0.1431, + "epoch": 0.03, + "learning_rate": 0.0002957014786655221, + "loss": 0.1632, "step": 4440 }, { - "epoch": 0.05, - "learning_rate": 0.0002927801933934713, - "loss": 0.1368, + "epoch": 0.03, + "learning_rate": 0.00029569179731116517, + "loss": 0.1606, "step": 4450 }, { - "epoch": 0.05, - "learning_rate": 0.00029276396910896227, - "loss": 0.1505, + "epoch": 0.03, + "learning_rate": 0.0002956821159568082, + "loss": 0.1676, "step": 4460 }, { - "epoch": 0.05, - "learning_rate": 0.0002927477448244532, - "loss": 0.1455, + "epoch": 0.03, + "learning_rate": 0.0002956724346024513, + "loss": 0.1658, "step": 4470 }, { - "epoch": 0.05, - "learning_rate": 0.00029273152053994417, - "loss": 0.1596, + "epoch": 0.03, + "learning_rate": 0.00029566275324809435, + "loss": 0.1724, "step": 4480 }, { - "epoch": 0.05, - "learning_rate": 0.0002927152962554351, - "loss": 0.1443, + "epoch": 0.03, + "learning_rate": 0.00029565307189373743, + "loss": 0.165, "step": 4490 }, { - "epoch": 0.05, - "learning_rate": 0.00029269907197092607, - "loss": 0.1393, + "epoch": 0.03, + "learning_rate": 0.0002956433905393805, + "loss": 0.1719, "step": 4500 }, { - "epoch": 0.05, - "learning_rate": 0.000292682847686417, - "loss": 0.1399, + "epoch": 0.03, + "learning_rate": 0.00029563370918502354, + "loss": 0.166, "step": 4510 }, { - "epoch": 0.05, - "learning_rate": 0.00029266662340190797, - "loss": 0.1492, + "epoch": 0.03, + "learning_rate": 0.0002956240278306666, + "loss": 0.1635, "step": 4520 }, { - "epoch": 0.05, - "learning_rate": 0.0002926503991173989, - "loss": 0.1391, + "epoch": 0.03, + "learning_rate": 0.0002956143464763097, + "loss": 0.1696, "step": 4530 }, { - "epoch": 0.05, - "learning_rate": 0.00029263417483288987, - "loss": 0.1409, + "epoch": 0.03, + "learning_rate": 0.0002956046651219528, + "loss": 0.1781, "step": 4540 }, { - "epoch": 0.05, - "learning_rate": 0.0002926179505483808, - "loss": 0.1442, + "epoch": 0.03, + "learning_rate": 0.00029559498376759586, + "loss": 0.1605, "step": 4550 }, { - "epoch": 0.05, - "learning_rate": 0.0002926017262638717, - "loss": 0.1423, + "epoch": 0.03, + "learning_rate": 0.00029558530241323894, + "loss": 0.1701, "step": 4560 }, { - "epoch": 0.05, - "learning_rate": 0.0002925855019793627, - "loss": 0.1387, + "epoch": 0.03, + "learning_rate": 0.00029557562105888196, + "loss": 0.1613, "step": 4570 }, { - "epoch": 0.05, - "learning_rate": 0.0002925692776948536, - "loss": 0.1346, + "epoch": 0.03, + "learning_rate": 0.00029556593970452504, + "loss": 0.1563, "step": 4580 }, { - "epoch": 0.05, - "learning_rate": 0.00029255305341034454, - "loss": 0.1365, + "epoch": 0.03, + "learning_rate": 0.0002955562583501681, + "loss": 0.1591, "step": 4590 }, { - "epoch": 0.05, - "learning_rate": 0.0002925368291258355, - "loss": 0.1439, + "epoch": 0.03, + "learning_rate": 0.00029554657699581115, + "loss": 0.1609, "step": 4600 }, { - "epoch": 0.05, - "learning_rate": 0.00029252060484132644, - "loss": 0.147, + "epoch": 0.03, + "learning_rate": 0.00029553689564145423, + "loss": 0.1613, "step": 4610 }, { - "epoch": 0.05, - "learning_rate": 0.0002925043805568174, - "loss": 0.1396, + "epoch": 0.03, + "learning_rate": 0.0002955272142870973, + "loss": 0.1668, "step": 4620 }, { - "epoch": 0.05, - "learning_rate": 0.00029248815627230834, - "loss": 0.134, + "epoch": 0.03, + "learning_rate": 0.0002955175329327404, + "loss": 0.168, "step": 4630 }, { - "epoch": 0.05, - "learning_rate": 0.0002924719319877993, - "loss": 0.1396, + "epoch": 0.03, + "learning_rate": 0.00029550785157838347, + "loss": 0.1668, "step": 4640 }, { - "epoch": 0.05, - "learning_rate": 0.00029245570770329023, - "loss": 0.147, + "epoch": 0.03, + "learning_rate": 0.0002954981702240265, + "loss": 0.1656, "step": 4650 }, { - "epoch": 0.05, - "learning_rate": 0.0002924394834187812, - "loss": 0.1358, + "epoch": 0.03, + "learning_rate": 0.0002954884888696696, + "loss": 0.1467, "step": 4660 }, { - "epoch": 0.05, - "learning_rate": 0.00029242325913427213, - "loss": 0.1389, + "epoch": 0.03, + "learning_rate": 0.00029547880751531265, + "loss": 0.1548, "step": 4670 }, { - "epoch": 0.05, - "learning_rate": 0.0002924070348497631, - "loss": 0.1312, + "epoch": 0.03, + "learning_rate": 0.00029546912616095573, + "loss": 0.1574, "step": 4680 }, { - "epoch": 0.05, - "learning_rate": 0.00029239081056525403, - "loss": 0.14, + "epoch": 0.03, + "learning_rate": 0.0002954594448065988, + "loss": 0.1495, "step": 4690 }, { - "epoch": 0.05, - "learning_rate": 0.000292374586280745, - "loss": 0.1494, + "epoch": 0.03, + "learning_rate": 0.00029544976345224184, + "loss": 0.1575, "step": 4700 }, { - "epoch": 0.05, - "learning_rate": 0.00029235836199623593, - "loss": 0.144, + "epoch": 0.03, + "learning_rate": 0.0002954400820978849, + "loss": 0.1592, "step": 4710 }, { - "epoch": 0.05, - "learning_rate": 0.0002923421377117269, - "loss": 0.14, + "epoch": 0.03, + "learning_rate": 0.000295430400743528, + "loss": 0.1645, "step": 4720 }, { - "epoch": 0.05, - "learning_rate": 0.00029232591342721783, - "loss": 0.1567, + "epoch": 0.03, + "learning_rate": 0.000295420719389171, + "loss": 0.1587, "step": 4730 }, { - "epoch": 0.05, - "learning_rate": 0.00029230968914270876, - "loss": 0.136, + "epoch": 0.03, + "learning_rate": 0.0002954110380348141, + "loss": 0.1636, "step": 4740 }, { - "epoch": 0.05, - "learning_rate": 0.00029229346485819973, - "loss": 0.1347, + "epoch": 0.03, + "learning_rate": 0.0002954013566804572, + "loss": 0.1643, "step": 4750 }, { - "epoch": 0.05, - "learning_rate": 0.00029227724057369066, - "loss": 0.1401, + "epoch": 0.03, + "learning_rate": 0.00029539167532610026, + "loss": 0.1487, "step": 4760 }, { - "epoch": 0.05, - "learning_rate": 0.00029226101628918163, - "loss": 0.1421, + "epoch": 0.03, + "learning_rate": 0.00029538199397174334, + "loss": 0.1581, "step": 4770 }, { - "epoch": 0.05, - "learning_rate": 0.00029224479200467255, - "loss": 0.1373, + "epoch": 0.03, + "learning_rate": 0.0002953723126173864, + "loss": 0.1535, "step": 4780 }, { - "epoch": 0.05, - "learning_rate": 0.00029222856772016353, - "loss": 0.1348, + "epoch": 0.03, + "learning_rate": 0.00029536263126302945, + "loss": 0.1745, "step": 4790 }, { - "epoch": 0.05, - "learning_rate": 0.00029221234343565445, - "loss": 0.1272, + "epoch": 0.03, + "learning_rate": 0.00029535294990867253, + "loss": 0.1581, "step": 4800 }, { - "epoch": 0.05, - "learning_rate": 0.00029219611915114543, - "loss": 0.1391, + "epoch": 0.03, + "learning_rate": 0.0002953432685543156, + "loss": 0.1652, "step": 4810 }, { - "epoch": 0.05, - "learning_rate": 0.00029217989486663635, - "loss": 0.1392, + "epoch": 0.03, + "learning_rate": 0.0002953335871999587, + "loss": 0.1545, "step": 4820 }, { - "epoch": 0.05, - "learning_rate": 0.00029216367058212733, - "loss": 0.1447, + "epoch": 0.03, + "learning_rate": 0.0002953239058456017, + "loss": 0.1679, "step": 4830 }, { - "epoch": 0.05, - "learning_rate": 0.00029214744629761825, - "loss": 0.1349, + "epoch": 0.03, + "learning_rate": 0.0002953142244912448, + "loss": 0.1594, "step": 4840 }, { - "epoch": 0.05, - "learning_rate": 0.00029213122201310923, - "loss": 0.1868, + "epoch": 0.03, + "learning_rate": 0.00029530454313688787, + "loss": 0.1421, "step": 4850 }, { - "epoch": 0.05, - "learning_rate": 0.00029211499772860015, - "loss": 0.1502, + "epoch": 0.03, + "learning_rate": 0.0002952948617825309, + "loss": 0.1492, "step": 4860 }, { - "epoch": 0.05, - "learning_rate": 0.00029209877344409113, - "loss": 0.1409, + "epoch": 0.03, + "learning_rate": 0.000295285180428174, + "loss": 0.1579, "step": 4870 }, { - "epoch": 0.05, - "learning_rate": 0.00029208254915958205, - "loss": 0.1425, + "epoch": 0.03, + "learning_rate": 0.00029527549907381706, + "loss": 0.1519, "step": 4880 }, { - "epoch": 0.05, - "learning_rate": 0.000292066324875073, - "loss": 0.1322, + "epoch": 0.03, + "learning_rate": 0.00029526581771946014, + "loss": 0.1515, "step": 4890 }, { - "epoch": 0.05, - "learning_rate": 0.00029205010059056395, - "loss": 0.1263, + "epoch": 0.03, + "learning_rate": 0.0002952561363651032, + "loss": 0.1607, "step": 4900 }, { - "epoch": 0.05, - "learning_rate": 0.0002920338763060549, - "loss": 0.1406, + "epoch": 0.03, + "learning_rate": 0.0002952464550107463, + "loss": 0.165, "step": 4910 }, { - "epoch": 0.05, - "learning_rate": 0.0002920176520215458, - "loss": 0.142, + "epoch": 0.03, + "learning_rate": 0.0002952367736563894, + "loss": 0.1546, "step": 4920 }, { - "epoch": 0.05, - "learning_rate": 0.0002920014277370368, - "loss": 0.1412, + "epoch": 0.03, + "learning_rate": 0.0002952270923020324, + "loss": 0.1613, "step": 4930 }, { - "epoch": 0.05, - "learning_rate": 0.0002919852034525277, - "loss": 0.1325, + "epoch": 0.03, + "learning_rate": 0.0002952174109476755, + "loss": 0.1442, "step": 4940 }, { - "epoch": 0.05, - "learning_rate": 0.0002919689791680187, - "loss": 0.1442, + "epoch": 0.03, + "learning_rate": 0.00029520772959331856, + "loss": 0.1547, "step": 4950 }, { - "epoch": 0.05, - "learning_rate": 0.0002919527548835096, - "loss": 0.1586, + "epoch": 0.03, + "learning_rate": 0.00029519804823896164, + "loss": 0.1483, "step": 4960 }, { - "epoch": 0.05, - "learning_rate": 0.0002919365305990006, - "loss": 0.1381, + "epoch": 0.03, + "learning_rate": 0.00029518836688460467, + "loss": 0.1528, "step": 4970 }, { - "epoch": 0.05, - "learning_rate": 0.0002919203063144915, - "loss": 0.129, + "epoch": 0.03, + "learning_rate": 0.00029517868553024775, + "loss": 0.1709, "step": 4980 }, { - "epoch": 0.05, - "learning_rate": 0.00029190408202998247, - "loss": 0.1383, + "epoch": 0.03, + "learning_rate": 0.0002951690041758908, + "loss": 0.1527, "step": 4990 }, { - "epoch": 0.05, - "learning_rate": 0.0002918878577454734, - "loss": 0.1288, + "epoch": 0.03, + "learning_rate": 0.00029515932282153385, + "loss": 0.1435, "step": 5000 }, { - "epoch": 0.05, - "eval_cer": 0.9214405741941297, - "eval_loss": 0.09906036406755447, - "eval_runtime": 119.4172, - "eval_samples_per_second": 16.748, - "eval_steps_per_second": 4.187, + "epoch": 0.03, + "eval_cer": 0.9202720596542764, + "eval_loss": 0.11752115935087204, + "eval_runtime": 120.5405, + "eval_samples_per_second": 16.592, + "eval_steps_per_second": 4.148, "step": 5000 }, { - "epoch": 0.05, - "learning_rate": 0.00029187163346096437, - "loss": 0.128, + "epoch": 0.03, + "learning_rate": 0.00029514964146717693, + "loss": 0.1587, "step": 5010 }, { - "epoch": 0.05, - "learning_rate": 0.0002918554091764553, - "loss": 0.1511, + "epoch": 0.03, + "learning_rate": 0.00029513996011282, + "loss": 0.1598, "step": 5020 }, { - "epoch": 0.05, - "learning_rate": 0.00029183918489194627, - "loss": 0.1456, + "epoch": 0.03, + "learning_rate": 0.0002951302787584631, + "loss": 0.1555, "step": 5030 }, { - "epoch": 0.05, - "learning_rate": 0.0002918229606074372, - "loss": 0.1352, + "epoch": 0.03, + "learning_rate": 0.00029512059740410617, + "loss": 0.1445, "step": 5040 }, { - "epoch": 0.05, - "learning_rate": 0.00029180673632292817, - "loss": 0.1503, + "epoch": 0.03, + "learning_rate": 0.00029511091604974925, + "loss": 0.1461, "step": 5050 }, { - "epoch": 0.05, - "learning_rate": 0.0002917905120384191, - "loss": 0.1408, + "epoch": 0.03, + "learning_rate": 0.00029510123469539233, + "loss": 0.1512, "step": 5060 }, { - "epoch": 0.05, - "learning_rate": 0.00029177428775391, - "loss": 0.1347, + "epoch": 0.03, + "learning_rate": 0.00029509155334103536, + "loss": 0.1567, "step": 5070 }, { - "epoch": 0.05, - "learning_rate": 0.000291758063469401, - "loss": 0.1358, + "epoch": 0.03, + "learning_rate": 0.00029508187198667844, + "loss": 0.1444, "step": 5080 }, { - "epoch": 0.06, - "learning_rate": 0.0002917418391848919, - "loss": 0.1389, + "epoch": 0.03, + "learning_rate": 0.0002950721906323215, + "loss": 0.1479, "step": 5090 }, { - "epoch": 0.06, - "learning_rate": 0.00029172561490038284, - "loss": 0.1555, + "epoch": 0.03, + "learning_rate": 0.00029506250927796454, + "loss": 0.1521, "step": 5100 }, { - "epoch": 0.06, - "learning_rate": 0.0002917093906158738, - "loss": 0.1525, + "epoch": 0.03, + "learning_rate": 0.0002950528279236076, + "loss": 0.1399, "step": 5110 }, { - "epoch": 0.06, - "learning_rate": 0.00029169316633136474, - "loss": 0.153, + "epoch": 0.03, + "learning_rate": 0.0002950431465692507, + "loss": 0.1568, "step": 5120 }, { - "epoch": 0.06, - "learning_rate": 0.0002916769420468557, - "loss": 0.1478, + "epoch": 0.03, + "learning_rate": 0.0002950334652148938, + "loss": 0.1437, "step": 5130 }, { - "epoch": 0.06, - "learning_rate": 0.00029166071776234664, - "loss": 0.1365, + "epoch": 0.03, + "learning_rate": 0.0002950237838605368, + "loss": 0.1578, "step": 5140 }, { - "epoch": 0.06, - "learning_rate": 0.0002916444934778376, - "loss": 0.1396, + "epoch": 0.03, + "learning_rate": 0.0002950141025061799, + "loss": 0.1373, "step": 5150 }, { - "epoch": 0.06, - "learning_rate": 0.00029162826919332854, - "loss": 0.1386, + "epoch": 0.03, + "learning_rate": 0.00029500442115182297, + "loss": 0.1526, "step": 5160 }, { - "epoch": 0.06, - "learning_rate": 0.0002916120449088195, - "loss": 0.133, + "epoch": 0.03, + "learning_rate": 0.00029499473979746605, + "loss": 0.1635, "step": 5170 }, { - "epoch": 0.06, - "learning_rate": 0.00029159582062431044, - "loss": 0.1403, + "epoch": 0.03, + "learning_rate": 0.0002949850584431091, + "loss": 0.1476, "step": 5180 }, { - "epoch": 0.06, - "learning_rate": 0.0002915795963398014, - "loss": 0.135, + "epoch": 0.03, + "learning_rate": 0.0002949753770887522, + "loss": 0.1721, "step": 5190 }, { - "epoch": 0.06, - "learning_rate": 0.00029156337205529234, - "loss": 0.1389, + "epoch": 0.03, + "learning_rate": 0.00029496569573439523, + "loss": 0.1519, "step": 5200 }, { - "epoch": 0.06, - "learning_rate": 0.0002915471477707833, - "loss": 0.136, + "epoch": 0.03, + "learning_rate": 0.0002949560143800383, + "loss": 0.1522, "step": 5210 }, { - "epoch": 0.06, - "learning_rate": 0.00029153092348627424, - "loss": 0.1329, + "epoch": 0.03, + "learning_rate": 0.0002949463330256814, + "loss": 0.1545, "step": 5220 }, { - "epoch": 0.06, - "learning_rate": 0.0002915146992017652, - "loss": 0.132, + "epoch": 0.03, + "learning_rate": 0.0002949366516713244, + "loss": 0.1531, "step": 5230 }, { - "epoch": 0.06, - "learning_rate": 0.00029149847491725614, - "loss": 0.1432, + "epoch": 0.03, + "learning_rate": 0.0002949269703169675, + "loss": 0.1531, "step": 5240 }, { - "epoch": 0.06, - "learning_rate": 0.00029148225063274706, - "loss": 0.1297, + "epoch": 0.03, + "learning_rate": 0.0002949172889626106, + "loss": 0.1446, "step": 5250 }, { - "epoch": 0.06, - "learning_rate": 0.00029146602634823804, - "loss": 0.1317, + "epoch": 0.03, + "learning_rate": 0.00029490760760825366, + "loss": 0.1454, "step": 5260 }, { - "epoch": 0.06, - "learning_rate": 0.00029144980206372896, - "loss": 0.1353, + "epoch": 0.03, + "learning_rate": 0.00029489792625389674, + "loss": 0.1457, "step": 5270 }, { - "epoch": 0.06, - "learning_rate": 0.0002914335777792199, - "loss": 0.1417, + "epoch": 0.03, + "learning_rate": 0.00029488824489953976, + "loss": 0.1523, "step": 5280 }, { - "epoch": 0.06, - "learning_rate": 0.00029141735349471086, - "loss": 0.1398, + "epoch": 0.03, + "learning_rate": 0.00029487856354518284, + "loss": 0.1594, "step": 5290 }, { - "epoch": 0.06, - "learning_rate": 0.0002914011292102018, - "loss": 0.1376, + "epoch": 0.03, + "learning_rate": 0.0002948688821908259, + "loss": 0.1423, "step": 5300 }, { - "epoch": 0.06, - "learning_rate": 0.00029138490492569276, - "loss": 0.13, + "epoch": 0.03, + "learning_rate": 0.000294859200836469, + "loss": 0.1493, "step": 5310 }, { - "epoch": 0.06, - "learning_rate": 0.0002913686806411837, - "loss": 0.1448, + "epoch": 0.03, + "learning_rate": 0.0002948495194821121, + "loss": 0.1573, "step": 5320 }, { - "epoch": 0.06, - "learning_rate": 0.00029135245635667466, - "loss": 0.1401, + "epoch": 0.03, + "learning_rate": 0.00029483983812775516, + "loss": 0.1592, "step": 5330 }, { - "epoch": 0.06, - "learning_rate": 0.0002913362320721656, - "loss": 0.1402, + "epoch": 0.03, + "learning_rate": 0.0002948301567733982, + "loss": 0.1715, "step": 5340 }, { - "epoch": 0.06, - "learning_rate": 0.00029132000778765656, - "loss": 0.1411, + "epoch": 0.03, + "learning_rate": 0.00029482047541904127, + "loss": 0.138, "step": 5350 }, { - "epoch": 0.06, - "learning_rate": 0.0002913037835031475, - "loss": 0.1274, + "epoch": 0.03, + "learning_rate": 0.00029481079406468435, + "loss": 0.1524, "step": 5360 }, { - "epoch": 0.06, - "learning_rate": 0.00029128755921863846, - "loss": 0.1372, + "epoch": 0.03, + "learning_rate": 0.00029480111271032737, + "loss": 0.1443, "step": 5370 }, { - "epoch": 0.06, - "learning_rate": 0.0002912713349341294, - "loss": 0.1362, + "epoch": 0.03, + "learning_rate": 0.00029479143135597045, + "loss": 0.1384, "step": 5380 }, { - "epoch": 0.06, - "learning_rate": 0.00029125511064962036, - "loss": 0.1357, + "epoch": 0.03, + "learning_rate": 0.00029478175000161353, + "loss": 0.1533, "step": 5390 }, { - "epoch": 0.06, - "learning_rate": 0.0002912388863651113, - "loss": 0.1325, + "epoch": 0.03, + "learning_rate": 0.0002947720686472566, + "loss": 0.1419, "step": 5400 }, { - "epoch": 0.06, - "learning_rate": 0.00029122266208060225, - "loss": 0.138, + "epoch": 0.03, + "learning_rate": 0.0002947623872928997, + "loss": 0.1362, "step": 5410 }, { - "epoch": 0.06, - "learning_rate": 0.0002912064377960932, - "loss": 0.1309, + "epoch": 0.03, + "learning_rate": 0.0002947527059385427, + "loss": 0.1451, "step": 5420 }, { - "epoch": 0.06, - "learning_rate": 0.0002911902135115841, - "loss": 0.1452, + "epoch": 0.04, + "learning_rate": 0.0002947430245841858, + "loss": 0.1496, "step": 5430 }, { - "epoch": 0.06, - "learning_rate": 0.0002911739892270751, - "loss": 0.1371, + "epoch": 0.04, + "learning_rate": 0.0002947333432298289, + "loss": 0.1457, "step": 5440 }, { - "epoch": 0.06, - "learning_rate": 0.000291157764942566, - "loss": 0.133, + "epoch": 0.04, + "learning_rate": 0.00029472366187547195, + "loss": 0.1553, "step": 5450 }, { - "epoch": 0.06, - "learning_rate": 0.0002911415406580569, - "loss": 0.1354, + "epoch": 0.04, + "learning_rate": 0.00029471398052111503, + "loss": 0.1477, "step": 5460 }, { - "epoch": 0.06, - "learning_rate": 0.0002911253163735479, - "loss": 0.1233, + "epoch": 0.04, + "learning_rate": 0.00029470429916675806, + "loss": 0.1456, "step": 5470 }, { - "epoch": 0.06, - "learning_rate": 0.0002911090920890388, - "loss": 0.131, + "epoch": 0.04, + "learning_rate": 0.00029469461781240114, + "loss": 0.1504, "step": 5480 }, { - "epoch": 0.06, - "learning_rate": 0.0002910928678045298, - "loss": 0.1545, + "epoch": 0.04, + "learning_rate": 0.0002946849364580442, + "loss": 0.144, "step": 5490 }, { - "epoch": 0.06, - "learning_rate": 0.0002910766435200207, - "loss": 0.1374, + "epoch": 0.04, + "learning_rate": 0.00029467525510368725, + "loss": 0.1527, "step": 5500 }, { - "epoch": 0.06, - "learning_rate": 0.0002910604192355117, - "loss": 0.1313, + "epoch": 0.04, + "learning_rate": 0.0002946655737493303, + "loss": 0.1424, "step": 5510 }, { - "epoch": 0.06, - "learning_rate": 0.0002910441949510026, - "loss": 0.1244, + "epoch": 0.04, + "learning_rate": 0.0002946558923949734, + "loss": 0.1421, "step": 5520 }, { - "epoch": 0.06, - "learning_rate": 0.0002910279706664936, - "loss": 0.1247, + "epoch": 0.04, + "learning_rate": 0.0002946462110406165, + "loss": 0.1441, "step": 5530 }, { - "epoch": 0.06, - "learning_rate": 0.0002910117463819845, - "loss": 0.1355, + "epoch": 0.04, + "learning_rate": 0.00029463652968625956, + "loss": 0.1489, "step": 5540 }, { - "epoch": 0.06, - "learning_rate": 0.0002909955220974755, - "loss": 0.1336, + "epoch": 0.04, + "learning_rate": 0.00029462684833190264, + "loss": 0.143, "step": 5550 }, { - "epoch": 0.06, - "learning_rate": 0.0002909792978129664, - "loss": 0.1368, + "epoch": 0.04, + "learning_rate": 0.00029461716697754567, + "loss": 0.1462, "step": 5560 }, { - "epoch": 0.06, - "learning_rate": 0.0002909630735284574, - "loss": 0.1348, + "epoch": 0.04, + "learning_rate": 0.00029460748562318875, + "loss": 0.1505, "step": 5570 }, { - "epoch": 0.06, - "learning_rate": 0.0002909468492439483, - "loss": 0.1383, + "epoch": 0.04, + "learning_rate": 0.00029459780426883183, + "loss": 0.1619, "step": 5580 }, { - "epoch": 0.06, - "learning_rate": 0.0002909306249594393, - "loss": 0.1282, + "epoch": 0.04, + "learning_rate": 0.0002945881229144749, + "loss": 0.1587, "step": 5590 }, { - "epoch": 0.06, - "learning_rate": 0.0002909144006749302, - "loss": 0.1278, + "epoch": 0.04, + "learning_rate": 0.00029457844156011794, + "loss": 0.1495, "step": 5600 }, { - "epoch": 0.06, - "learning_rate": 0.00029089817639042114, - "loss": 0.1272, + "epoch": 0.04, + "learning_rate": 0.000294568760205761, + "loss": 0.1498, "step": 5610 }, { - "epoch": 0.06, - "learning_rate": 0.0002908819521059121, - "loss": 0.1335, + "epoch": 0.04, + "learning_rate": 0.0002945590788514041, + "loss": 0.1476, "step": 5620 }, { - "epoch": 0.06, - "learning_rate": 0.00029086572782140304, - "loss": 0.1348, + "epoch": 0.04, + "learning_rate": 0.0002945493974970471, + "loss": 0.1599, "step": 5630 }, { - "epoch": 0.06, - "learning_rate": 0.00029084950353689396, - "loss": 0.1387, + "epoch": 0.04, + "learning_rate": 0.0002945397161426902, + "loss": 0.1463, "step": 5640 }, { - "epoch": 0.06, - "learning_rate": 0.00029083327925238494, - "loss": 0.1367, + "epoch": 0.04, + "learning_rate": 0.0002945300347883333, + "loss": 0.1478, "step": 5650 }, { - "epoch": 0.06, - "learning_rate": 0.00029081705496787586, - "loss": 0.1468, + "epoch": 0.04, + "learning_rate": 0.00029452035343397636, + "loss": 0.1506, "step": 5660 }, { - "epoch": 0.06, - "learning_rate": 0.00029080083068336684, - "loss": 0.1306, + "epoch": 0.04, + "learning_rate": 0.00029451067207961944, + "loss": 0.1525, "step": 5670 }, { - "epoch": 0.06, - "learning_rate": 0.00029078460639885776, - "loss": 0.145, + "epoch": 0.04, + "learning_rate": 0.0002945009907252625, + "loss": 0.1511, "step": 5680 }, { - "epoch": 0.06, - "learning_rate": 0.00029076838211434874, - "loss": 0.141, + "epoch": 0.04, + "learning_rate": 0.0002944913093709056, + "loss": 0.1454, "step": 5690 }, { - "epoch": 0.06, - "learning_rate": 0.00029075215782983966, - "loss": 0.1261, + "epoch": 0.04, + "learning_rate": 0.0002944816280165486, + "loss": 0.158, "step": 5700 }, { - "epoch": 0.06, - "learning_rate": 0.00029073593354533064, - "loss": 0.1361, + "epoch": 0.04, + "learning_rate": 0.0002944719466621917, + "loss": 0.1532, "step": 5710 }, { - "epoch": 0.06, - "learning_rate": 0.00029071970926082156, - "loss": 0.1385, + "epoch": 0.04, + "learning_rate": 0.0002944622653078348, + "loss": 0.1466, "step": 5720 }, { - "epoch": 0.06, - "learning_rate": 0.00029070348497631254, - "loss": 0.1294, + "epoch": 0.04, + "learning_rate": 0.00029445258395347786, + "loss": 0.1484, "step": 5730 }, { - "epoch": 0.06, - "learning_rate": 0.00029068726069180346, - "loss": 0.1286, + "epoch": 0.04, + "learning_rate": 0.0002944429025991209, + "loss": 0.1447, "step": 5740 }, { - "epoch": 0.06, - "learning_rate": 0.00029067103640729444, - "loss": 0.1454, + "epoch": 0.04, + "learning_rate": 0.00029443322124476397, + "loss": 0.1752, "step": 5750 }, { - "epoch": 0.06, - "learning_rate": 0.00029065481212278536, - "loss": 0.1253, + "epoch": 0.04, + "learning_rate": 0.00029442353989040705, + "loss": 0.154, "step": 5760 }, { - "epoch": 0.06, - "learning_rate": 0.00029063858783827634, - "loss": 0.1316, + "epoch": 0.04, + "learning_rate": 0.0002944138585360501, + "loss": 0.1467, "step": 5770 }, { - "epoch": 0.06, - "learning_rate": 0.00029062236355376726, - "loss": 0.1319, + "epoch": 0.04, + "learning_rate": 0.00029440417718169315, + "loss": 0.1485, "step": 5780 }, { - "epoch": 0.06, - "learning_rate": 0.0002906061392692582, - "loss": 0.1247, + "epoch": 0.04, + "learning_rate": 0.00029439449582733623, + "loss": 0.1538, "step": 5790 }, { - "epoch": 0.06, - "learning_rate": 0.00029058991498474916, - "loss": 0.1451, + "epoch": 0.04, + "learning_rate": 0.0002943848144729793, + "loss": 0.1539, "step": 5800 }, { - "epoch": 0.06, - "learning_rate": 0.0002905736907002401, - "loss": 0.1398, + "epoch": 0.04, + "learning_rate": 0.0002943751331186224, + "loss": 0.15, "step": 5810 }, { - "epoch": 0.06, - "learning_rate": 0.00029055746641573106, - "loss": 0.1298, + "epoch": 0.04, + "learning_rate": 0.0002943654517642655, + "loss": 0.1469, "step": 5820 }, { - "epoch": 0.06, - "learning_rate": 0.000290541242131222, - "loss": 0.123, + "epoch": 0.04, + "learning_rate": 0.00029435577040990855, + "loss": 0.1423, "step": 5830 }, { - "epoch": 0.06, - "learning_rate": 0.0002905250178467129, - "loss": 0.1342, + "epoch": 0.04, + "learning_rate": 0.0002943460890555516, + "loss": 0.1426, "step": 5840 }, { - "epoch": 0.06, - "learning_rate": 0.0002905087935622039, - "loss": 0.1303, + "epoch": 0.04, + "learning_rate": 0.00029433640770119466, + "loss": 0.1513, "step": 5850 }, { - "epoch": 0.06, - "learning_rate": 0.0002904925692776948, - "loss": 0.1299, + "epoch": 0.04, + "learning_rate": 0.00029432672634683774, + "loss": 0.1474, "step": 5860 }, { - "epoch": 0.06, - "learning_rate": 0.0002904763449931858, - "loss": 0.1395, + "epoch": 0.04, + "learning_rate": 0.00029431704499248076, + "loss": 0.1476, "step": 5870 }, { - "epoch": 0.06, - "learning_rate": 0.0002904601207086767, - "loss": 0.13, + "epoch": 0.04, + "learning_rate": 0.00029430736363812384, + "loss": 0.1538, "step": 5880 }, { - "epoch": 0.06, - "learning_rate": 0.0002904438964241677, - "loss": 0.1409, + "epoch": 0.04, + "learning_rate": 0.0002942976822837669, + "loss": 0.1421, "step": 5890 }, { - "epoch": 0.06, - "learning_rate": 0.0002904276721396586, - "loss": 0.1451, + "epoch": 0.04, + "learning_rate": 0.00029428800092941, + "loss": 0.1368, "step": 5900 }, { - "epoch": 0.06, - "learning_rate": 0.0002904114478551496, - "loss": 0.139, + "epoch": 0.04, + "learning_rate": 0.00029427831957505303, + "loss": 0.1442, "step": 5910 }, { - "epoch": 0.06, - "learning_rate": 0.0002903952235706405, - "loss": 0.1381, + "epoch": 0.04, + "learning_rate": 0.0002942686382206961, + "loss": 0.1365, "step": 5920 }, { - "epoch": 0.06, - "learning_rate": 0.0002903789992861315, - "loss": 0.1276, + "epoch": 0.04, + "learning_rate": 0.0002942589568663392, + "loss": 0.1462, "step": 5930 }, { - "epoch": 0.06, - "learning_rate": 0.0002903627750016224, - "loss": 0.1415, + "epoch": 0.04, + "learning_rate": 0.00029424927551198227, + "loss": 0.1438, "step": 5940 }, { - "epoch": 0.06, - "learning_rate": 0.0002903465507171134, - "loss": 0.1416, + "epoch": 0.04, + "learning_rate": 0.00029423959415762535, + "loss": 0.1495, "step": 5950 }, { - "epoch": 0.06, - "learning_rate": 0.0002903303264326043, - "loss": 0.1318, + "epoch": 0.04, + "learning_rate": 0.00029422991280326843, + "loss": 0.1427, "step": 5960 }, { - "epoch": 0.06, - "learning_rate": 0.0002903141021480952, - "loss": 0.1215, + "epoch": 0.04, + "learning_rate": 0.0002942202314489115, + "loss": 0.1476, "step": 5970 }, { - "epoch": 0.06, - "learning_rate": 0.0002902978778635862, - "loss": 0.1336, + "epoch": 0.04, + "learning_rate": 0.00029421055009455453, + "loss": 0.1562, "step": 5980 }, { - "epoch": 0.06, - "learning_rate": 0.0002902816535790771, - "loss": 0.1293, + "epoch": 0.04, + "learning_rate": 0.0002942008687401976, + "loss": 0.1451, "step": 5990 }, { - "epoch": 0.06, - "learning_rate": 0.0002902654292945681, - "loss": 0.1338, + "epoch": 0.04, + "learning_rate": 0.00029419118738584064, + "loss": 0.1505, "step": 6000 }, { - "epoch": 0.06, - "eval_cer": 0.921543058375343, - "eval_loss": 0.09102348238229752, - "eval_runtime": 119.7739, - "eval_samples_per_second": 16.698, - "eval_steps_per_second": 4.175, + "epoch": 0.04, + "eval_cer": 0.9203606372161338, + "eval_loss": 0.1086047813296318, + "eval_runtime": 120.5193, + "eval_samples_per_second": 16.595, + "eval_steps_per_second": 4.149, "step": 6000 }, { - "epoch": 0.07, - "learning_rate": 0.000290249205010059, - "loss": 0.1346, + "epoch": 0.04, + "learning_rate": 0.0002941815060314837, + "loss": 0.1335, "step": 6010 }, { - "epoch": 0.07, - "learning_rate": 0.00029023298072554995, - "loss": 0.13, + "epoch": 0.04, + "learning_rate": 0.0002941718246771268, + "loss": 0.1449, "step": 6020 }, { - "epoch": 0.07, - "learning_rate": 0.0002902167564410409, - "loss": 0.1322, + "epoch": 0.04, + "learning_rate": 0.0002941621433227699, + "loss": 0.1478, "step": 6030 }, { - "epoch": 0.07, - "learning_rate": 0.00029020053215653185, - "loss": 0.1275, + "epoch": 0.04, + "learning_rate": 0.00029415246196841296, + "loss": 0.159, "step": 6040 }, { - "epoch": 0.07, - "learning_rate": 0.0002901843078720228, - "loss": 0.1379, + "epoch": 0.04, + "learning_rate": 0.000294142780614056, + "loss": 0.1473, "step": 6050 }, { - "epoch": 0.07, - "learning_rate": 0.00029016808358751375, - "loss": 0.1326, + "epoch": 0.04, + "learning_rate": 0.00029413309925969906, + "loss": 0.1431, "step": 6060 }, { - "epoch": 0.07, - "learning_rate": 0.0002901518593030047, - "loss": 0.1202, + "epoch": 0.04, + "learning_rate": 0.00029412341790534214, + "loss": 0.1511, "step": 6070 }, { - "epoch": 0.07, - "learning_rate": 0.00029013563501849565, - "loss": 0.1233, + "epoch": 0.04, + "learning_rate": 0.0002941137365509852, + "loss": 0.1466, "step": 6080 }, { - "epoch": 0.07, - "learning_rate": 0.0002901194107339866, - "loss": 0.1486, + "epoch": 0.04, + "learning_rate": 0.0002941040551966283, + "loss": 0.1526, "step": 6090 }, { - "epoch": 0.07, - "learning_rate": 0.00029010318644947754, - "loss": 0.1317, + "epoch": 0.04, + "learning_rate": 0.0002940943738422714, + "loss": 0.1464, "step": 6100 }, { - "epoch": 0.07, - "learning_rate": 0.0002900869621649685, - "loss": 0.1278, + "epoch": 0.04, + "learning_rate": 0.0002940846924879144, + "loss": 0.155, "step": 6110 }, { - "epoch": 0.07, - "learning_rate": 0.00029007073788045944, - "loss": 0.1427, + "epoch": 0.04, + "learning_rate": 0.0002940750111335575, + "loss": 0.1405, "step": 6120 }, { - "epoch": 0.07, - "learning_rate": 0.0002900545135959504, - "loss": 0.1348, + "epoch": 0.04, + "learning_rate": 0.00029406532977920057, + "loss": 0.1549, "step": 6130 }, { - "epoch": 0.07, - "learning_rate": 0.00029003828931144134, - "loss": 0.1195, + "epoch": 0.04, + "learning_rate": 0.0002940556484248436, + "loss": 0.1439, "step": 6140 }, { - "epoch": 0.07, - "learning_rate": 0.00029002206502693227, - "loss": 0.1203, + "epoch": 0.04, + "learning_rate": 0.0002940459670704867, + "loss": 0.1446, "step": 6150 }, { - "epoch": 0.07, - "learning_rate": 0.00029000584074242324, - "loss": 0.1311, + "epoch": 0.04, + "learning_rate": 0.00029403628571612975, + "loss": 0.1538, "step": 6160 }, { - "epoch": 0.07, - "learning_rate": 0.00028998961645791417, - "loss": 0.1335, + "epoch": 0.04, + "learning_rate": 0.00029402660436177283, + "loss": 0.1401, "step": 6170 }, { - "epoch": 0.07, - "learning_rate": 0.00028997339217340514, - "loss": 0.1284, + "epoch": 0.04, + "learning_rate": 0.0002940169230074159, + "loss": 0.1451, "step": 6180 }, { - "epoch": 0.07, - "learning_rate": 0.00028995716788889607, - "loss": 0.1286, + "epoch": 0.04, + "learning_rate": 0.00029400724165305894, + "loss": 0.1303, "step": 6190 }, { - "epoch": 0.07, - "learning_rate": 0.000289940943604387, - "loss": 0.1289, + "epoch": 0.04, + "learning_rate": 0.000293997560298702, + "loss": 0.1395, "step": 6200 }, { - "epoch": 0.07, - "learning_rate": 0.00028992471931987797, - "loss": 0.1301, + "epoch": 0.04, + "learning_rate": 0.0002939878789443451, + "loss": 0.1384, "step": 6210 }, { - "epoch": 0.07, - "learning_rate": 0.0002899084950353689, - "loss": 0.1272, + "epoch": 0.04, + "learning_rate": 0.0002939781975899882, + "loss": 0.1402, "step": 6220 }, { - "epoch": 0.07, - "learning_rate": 0.00028989227075085986, - "loss": 0.1329, + "epoch": 0.04, + "learning_rate": 0.00029396851623563126, + "loss": 0.1452, "step": 6230 }, { - "epoch": 0.07, - "learning_rate": 0.0002898760464663508, - "loss": 0.1332, + "epoch": 0.04, + "learning_rate": 0.0002939588348812743, + "loss": 0.1342, "step": 6240 }, { - "epoch": 0.07, - "learning_rate": 0.00028985982218184176, - "loss": 0.1293, + "epoch": 0.04, + "learning_rate": 0.00029394915352691736, + "loss": 0.1362, "step": 6250 }, { - "epoch": 0.07, - "learning_rate": 0.0002898435978973327, - "loss": 0.1207, + "epoch": 0.04, + "learning_rate": 0.00029393947217256044, + "loss": 0.1499, "step": 6260 }, { - "epoch": 0.07, - "learning_rate": 0.00028982737361282366, - "loss": 0.1405, + "epoch": 0.04, + "learning_rate": 0.00029392979081820347, + "loss": 0.1445, "step": 6270 }, { - "epoch": 0.07, - "learning_rate": 0.0002898111493283146, - "loss": 0.1211, + "epoch": 0.04, + "learning_rate": 0.00029392010946384655, + "loss": 0.1339, "step": 6280 }, { - "epoch": 0.07, - "learning_rate": 0.00028979492504380556, - "loss": 0.1315, + "epoch": 0.04, + "learning_rate": 0.00029391042810948963, + "loss": 0.1372, "step": 6290 }, { - "epoch": 0.07, - "learning_rate": 0.0002897787007592965, - "loss": 0.1317, + "epoch": 0.04, + "learning_rate": 0.0002939007467551327, + "loss": 0.1323, "step": 6300 }, { - "epoch": 0.07, - "learning_rate": 0.00028976247647478746, - "loss": 0.1211, + "epoch": 0.04, + "learning_rate": 0.0002938910654007758, + "loss": 0.1459, "step": 6310 }, { - "epoch": 0.07, - "learning_rate": 0.0002897462521902784, - "loss": 0.1283, + "epoch": 0.04, + "learning_rate": 0.00029388138404641887, + "loss": 0.1472, "step": 6320 }, { - "epoch": 0.07, - "learning_rate": 0.0002897300279057693, - "loss": 0.142, + "epoch": 0.04, + "learning_rate": 0.0002938717026920619, + "loss": 0.144, "step": 6330 }, { - "epoch": 0.07, - "learning_rate": 0.0002897138036212603, - "loss": 0.1284, + "epoch": 0.04, + "learning_rate": 0.00029386202133770497, + "loss": 0.1399, "step": 6340 }, { - "epoch": 0.07, - "learning_rate": 0.0002896975793367512, - "loss": 0.1266, + "epoch": 0.04, + "learning_rate": 0.00029385233998334805, + "loss": 0.1411, "step": 6350 }, { - "epoch": 0.07, - "learning_rate": 0.0002896813550522422, - "loss": 0.135, + "epoch": 0.04, + "learning_rate": 0.00029384265862899113, + "loss": 0.1462, "step": 6360 }, { - "epoch": 0.07, - "learning_rate": 0.0002896651307677331, - "loss": 0.1346, + "epoch": 0.04, + "learning_rate": 0.0002938329772746342, + "loss": 0.1461, "step": 6370 }, { - "epoch": 0.07, - "learning_rate": 0.00028964890648322403, - "loss": 0.132, + "epoch": 0.04, + "learning_rate": 0.00029382329592027724, + "loss": 0.1473, "step": 6380 }, { - "epoch": 0.07, - "learning_rate": 0.000289632682198715, - "loss": 0.1221, + "epoch": 0.04, + "learning_rate": 0.0002938136145659203, + "loss": 0.1478, "step": 6390 }, { - "epoch": 0.07, - "learning_rate": 0.00028961645791420593, - "loss": 0.142, + "epoch": 0.04, + "learning_rate": 0.00029380393321156334, + "loss": 0.1348, "step": 6400 }, { - "epoch": 0.07, - "learning_rate": 0.0002896002336296969, - "loss": 0.1257, + "epoch": 0.04, + "learning_rate": 0.0002937942518572064, + "loss": 0.1443, "step": 6410 }, { - "epoch": 0.07, - "learning_rate": 0.00028958400934518783, - "loss": 0.1231, + "epoch": 0.04, + "learning_rate": 0.0002937845705028495, + "loss": 0.148, "step": 6420 }, { - "epoch": 0.07, - "learning_rate": 0.0002895677850606788, - "loss": 0.1177, + "epoch": 0.04, + "learning_rate": 0.0002937748891484926, + "loss": 0.1411, "step": 6430 }, { - "epoch": 0.07, - "learning_rate": 0.00028955156077616973, - "loss": 0.1264, + "epoch": 0.04, + "learning_rate": 0.00029376520779413566, + "loss": 0.1418, "step": 6440 }, { - "epoch": 0.07, - "learning_rate": 0.0002895353364916607, - "loss": 0.1353, + "epoch": 0.04, + "learning_rate": 0.00029375552643977874, + "loss": 0.1392, "step": 6450 }, { - "epoch": 0.07, - "learning_rate": 0.00028951911220715163, - "loss": 0.125, + "epoch": 0.04, + "learning_rate": 0.0002937458450854218, + "loss": 0.1498, "step": 6460 }, { - "epoch": 0.07, - "learning_rate": 0.0002895028879226426, - "loss": 0.1241, + "epoch": 0.04, + "learning_rate": 0.00029373616373106485, + "loss": 0.1484, "step": 6470 }, { - "epoch": 0.07, - "learning_rate": 0.00028948666363813353, - "loss": 0.1258, + "epoch": 0.04, + "learning_rate": 0.0002937264823767079, + "loss": 0.1362, "step": 6480 }, { - "epoch": 0.07, - "learning_rate": 0.0002894704393536245, - "loss": 0.1227, + "epoch": 0.04, + "learning_rate": 0.000293716801022351, + "loss": 0.1456, "step": 6490 }, { - "epoch": 0.07, - "learning_rate": 0.00028945421506911543, - "loss": 0.122, + "epoch": 0.04, + "learning_rate": 0.0002937071196679941, + "loss": 0.1453, "step": 6500 }, { - "epoch": 0.07, - "learning_rate": 0.0002894379907846064, - "loss": 0.1283, + "epoch": 0.04, + "learning_rate": 0.0002936974383136371, + "loss": 0.1413, "step": 6510 }, { - "epoch": 0.07, - "learning_rate": 0.0002894217665000973, - "loss": 0.1242, + "epoch": 0.04, + "learning_rate": 0.0002936877569592802, + "loss": 0.1515, "step": 6520 }, { - "epoch": 0.07, - "learning_rate": 0.00028940554221558825, - "loss": 0.1202, + "epoch": 0.04, + "learning_rate": 0.00029367807560492327, + "loss": 0.143, "step": 6530 }, { - "epoch": 0.07, - "learning_rate": 0.0002893893179310792, - "loss": 0.1391, + "epoch": 0.04, + "learning_rate": 0.0002936683942505663, + "loss": 0.1395, "step": 6540 }, { - "epoch": 0.07, - "learning_rate": 0.00028937309364657015, - "loss": 0.1221, + "epoch": 0.04, + "learning_rate": 0.0002936587128962094, + "loss": 0.1388, "step": 6550 }, { - "epoch": 0.07, - "learning_rate": 0.00028935686936206107, - "loss": 0.1273, + "epoch": 0.04, + "learning_rate": 0.00029364903154185246, + "loss": 0.1405, "step": 6560 }, { - "epoch": 0.07, - "learning_rate": 0.00028934064507755205, - "loss": 0.1261, + "epoch": 0.04, + "learning_rate": 0.00029363935018749554, + "loss": 0.1428, "step": 6570 }, { - "epoch": 0.07, - "learning_rate": 0.00028932442079304297, - "loss": 0.1184, + "epoch": 0.04, + "learning_rate": 0.0002936296688331386, + "loss": 0.1373, "step": 6580 }, { - "epoch": 0.07, - "learning_rate": 0.00028930819650853395, - "loss": 0.1249, + "epoch": 0.04, + "learning_rate": 0.0002936199874787817, + "loss": 0.1329, "step": 6590 }, { - "epoch": 0.07, - "learning_rate": 0.00028929197222402487, - "loss": 0.1201, + "epoch": 0.04, + "learning_rate": 0.0002936103061244248, + "loss": 0.1354, "step": 6600 }, { - "epoch": 0.07, - "learning_rate": 0.00028927574793951585, - "loss": 0.123, + "epoch": 0.04, + "learning_rate": 0.0002936006247700678, + "loss": 0.1373, "step": 6610 }, { - "epoch": 0.07, - "learning_rate": 0.00028925952365500677, - "loss": 0.1265, + "epoch": 0.04, + "learning_rate": 0.0002935909434157109, + "loss": 0.1326, "step": 6620 }, { - "epoch": 0.07, - "learning_rate": 0.00028924329937049775, - "loss": 0.1253, + "epoch": 0.04, + "learning_rate": 0.00029358126206135396, + "loss": 0.1493, "step": 6630 }, { - "epoch": 0.07, - "learning_rate": 0.00028922707508598867, - "loss": 0.1209, + "epoch": 0.04, + "learning_rate": 0.000293571580706997, + "loss": 0.1384, "step": 6640 }, { - "epoch": 0.07, - "learning_rate": 0.00028921085080147965, - "loss": 0.1268, + "epoch": 0.04, + "learning_rate": 0.00029356189935264007, + "loss": 0.134, "step": 6650 }, { - "epoch": 0.07, - "learning_rate": 0.00028919462651697057, - "loss": 0.1238, + "epoch": 0.04, + "learning_rate": 0.00029355221799828315, + "loss": 0.1398, "step": 6660 }, { - "epoch": 0.07, - "learning_rate": 0.00028917840223246155, - "loss": 0.1186, + "epoch": 0.04, + "learning_rate": 0.0002935425366439262, + "loss": 0.1439, "step": 6670 }, { - "epoch": 0.07, - "learning_rate": 0.00028916217794795247, - "loss": 0.1252, + "epoch": 0.04, + "learning_rate": 0.00029353285528956925, + "loss": 0.1395, "step": 6680 }, { - "epoch": 0.07, - "learning_rate": 0.00028914595366344345, - "loss": 0.1234, + "epoch": 0.04, + "learning_rate": 0.00029352317393521233, + "loss": 0.1417, "step": 6690 }, { - "epoch": 0.07, - "learning_rate": 0.00028912972937893437, - "loss": 0.1147, + "epoch": 0.04, + "learning_rate": 0.0002935134925808554, + "loss": 0.14, "step": 6700 }, { - "epoch": 0.07, - "learning_rate": 0.0002891135050944253, - "loss": 0.1238, + "epoch": 0.04, + "learning_rate": 0.0002935038112264985, + "loss": 0.148, "step": 6710 }, { - "epoch": 0.07, - "learning_rate": 0.00028909728080991627, - "loss": 0.1231, + "epoch": 0.04, + "learning_rate": 0.00029349412987214157, + "loss": 0.1517, "step": 6720 }, { - "epoch": 0.07, - "learning_rate": 0.0002890810565254072, - "loss": 0.1242, + "epoch": 0.04, + "learning_rate": 0.00029348444851778465, + "loss": 0.1478, "step": 6730 }, { - "epoch": 0.07, - "learning_rate": 0.0002890648322408981, - "loss": 0.1145, + "epoch": 0.04, + "learning_rate": 0.00029347476716342773, + "loss": 0.1413, "step": 6740 }, { - "epoch": 0.07, - "learning_rate": 0.0002890486079563891, - "loss": 0.1202, + "epoch": 0.04, + "learning_rate": 0.00029346508580907076, + "loss": 0.1348, "step": 6750 }, { - "epoch": 0.07, - "learning_rate": 0.00028903238367188, - "loss": 0.1109, + "epoch": 0.04, + "learning_rate": 0.00029345540445471384, + "loss": 0.128, "step": 6760 }, { - "epoch": 0.07, - "learning_rate": 0.000289016159387371, - "loss": 0.1177, + "epoch": 0.04, + "learning_rate": 0.0002934457231003569, + "loss": 0.1242, "step": 6770 }, { - "epoch": 0.07, - "learning_rate": 0.0002889999351028619, - "loss": 0.1124, + "epoch": 0.04, + "learning_rate": 0.00029343604174599994, + "loss": 0.1384, "step": 6780 }, { - "epoch": 0.07, - "learning_rate": 0.0002889837108183529, - "loss": 0.1215, + "epoch": 0.04, + "learning_rate": 0.000293426360391643, + "loss": 0.1522, "step": 6790 }, { - "epoch": 0.07, - "learning_rate": 0.0002889674865338438, - "loss": 0.1277, + "epoch": 0.04, + "learning_rate": 0.0002934166790372861, + "loss": 0.1375, "step": 6800 }, { - "epoch": 0.07, - "learning_rate": 0.0002889512622493348, - "loss": 0.1248, + "epoch": 0.04, + "learning_rate": 0.0002934069976829292, + "loss": 0.1435, "step": 6810 }, { - "epoch": 0.07, - "learning_rate": 0.0002889350379648257, - "loss": 0.109, + "epoch": 0.04, + "learning_rate": 0.0002933973163285722, + "loss": 0.1282, "step": 6820 }, { - "epoch": 0.07, - "learning_rate": 0.0002889188136803167, - "loss": 0.1191, + "epoch": 0.04, + "learning_rate": 0.0002933876349742153, + "loss": 0.1349, "step": 6830 }, { - "epoch": 0.07, - "learning_rate": 0.0002889025893958076, - "loss": 0.1284, + "epoch": 0.04, + "learning_rate": 0.00029337795361985837, + "loss": 0.1427, "step": 6840 }, { - "epoch": 0.07, - "learning_rate": 0.0002888863651112986, - "loss": 0.1247, + "epoch": 0.04, + "learning_rate": 0.00029336827226550145, + "loss": 0.1346, "step": 6850 }, { - "epoch": 0.07, - "learning_rate": 0.0002888701408267895, - "loss": 0.1157, + "epoch": 0.04, + "learning_rate": 0.0002933585909111445, + "loss": 0.1294, "step": 6860 }, { - "epoch": 0.07, - "learning_rate": 0.0002888539165422805, - "loss": 0.127, + "epoch": 0.04, + "learning_rate": 0.0002933489095567876, + "loss": 0.1475, "step": 6870 }, { - "epoch": 0.07, - "learning_rate": 0.0002888376922577714, - "loss": 0.1161, + "epoch": 0.04, + "learning_rate": 0.00029333922820243063, + "loss": 0.1376, "step": 6880 }, { - "epoch": 0.07, - "learning_rate": 0.00028882146797326233, - "loss": 0.1162, + "epoch": 0.04, + "learning_rate": 0.0002933295468480737, + "loss": 0.1389, "step": 6890 }, { - "epoch": 0.07, - "learning_rate": 0.0002888052436887533, - "loss": 0.113, + "epoch": 0.04, + "learning_rate": 0.0002933198654937168, + "loss": 0.1385, "step": 6900 }, { - "epoch": 0.07, - "learning_rate": 0.00028878901940424423, - "loss": 0.1135, + "epoch": 0.04, + "learning_rate": 0.0002933101841393598, + "loss": 0.132, "step": 6910 }, { - "epoch": 0.07, - "learning_rate": 0.00028877279511973516, - "loss": 0.1152, + "epoch": 0.04, + "learning_rate": 0.0002933005027850029, + "loss": 0.1271, "step": 6920 }, { - "epoch": 0.07, - "learning_rate": 0.00028875657083522613, - "loss": 0.1077, + "epoch": 0.04, + "learning_rate": 0.000293290821430646, + "loss": 0.1367, "step": 6930 }, { - "epoch": 0.08, - "learning_rate": 0.00028874034655071705, - "loss": 0.1186, + "epoch": 0.04, + "learning_rate": 0.00029328114007628905, + "loss": 0.149, "step": 6940 }, { - "epoch": 0.08, - "learning_rate": 0.00028872412226620803, - "loss": 0.1136, + "epoch": 0.04, + "learning_rate": 0.00029327145872193213, + "loss": 0.1377, "step": 6950 }, { - "epoch": 0.08, - "learning_rate": 0.00028870789798169895, - "loss": 0.1168, + "epoch": 0.04, + "learning_rate": 0.00029326177736757516, + "loss": 0.1376, "step": 6960 }, { - "epoch": 0.08, - "learning_rate": 0.00028869167369718993, - "loss": 0.1265, + "epoch": 0.04, + "learning_rate": 0.00029325209601321824, + "loss": 0.1402, "step": 6970 }, { - "epoch": 0.08, - "learning_rate": 0.00028867544941268085, - "loss": 0.1165, + "epoch": 0.05, + "learning_rate": 0.0002932424146588613, + "loss": 0.1444, "step": 6980 }, { - "epoch": 0.08, - "learning_rate": 0.00028865922512817183, - "loss": 0.1229, + "epoch": 0.05, + "learning_rate": 0.0002932327333045044, + "loss": 0.1421, "step": 6990 }, { - "epoch": 0.08, - "learning_rate": 0.00028864300084366275, - "loss": 0.1279, + "epoch": 0.05, + "learning_rate": 0.0002932230519501475, + "loss": 0.1438, "step": 7000 }, { - "epoch": 0.08, - "eval_cer": 0.921452942974621, - "eval_loss": 0.0831136554479599, - "eval_runtime": 119.574, - "eval_samples_per_second": 16.726, - "eval_steps_per_second": 4.182, + "epoch": 0.05, + "eval_cer": 0.9203208676985651, + "eval_loss": 0.09841650724411011, + "eval_runtime": 120.3287, + "eval_samples_per_second": 16.621, + "eval_steps_per_second": 4.155, "step": 7000 }, { - "epoch": 0.08, - "learning_rate": 0.00028862677655915373, - "loss": 0.1185, + "epoch": 0.05, + "learning_rate": 0.0002932133705957905, + "loss": 0.1261, "step": 7010 }, { - "epoch": 0.08, - "learning_rate": 0.00028861055227464465, - "loss": 0.1192, + "epoch": 0.05, + "learning_rate": 0.0002932036892414336, + "loss": 0.1343, "step": 7020 }, { - "epoch": 0.08, - "learning_rate": 0.00028859432799013563, - "loss": 0.1238, + "epoch": 0.05, + "learning_rate": 0.00029319400788707666, + "loss": 0.1392, "step": 7030 }, { - "epoch": 0.08, - "learning_rate": 0.00028857810370562655, - "loss": 0.1241, + "epoch": 0.05, + "learning_rate": 0.0002931843265327197, + "loss": 0.1348, "step": 7040 }, { - "epoch": 0.08, - "learning_rate": 0.00028856187942111753, - "loss": 0.1138, + "epoch": 0.05, + "learning_rate": 0.00029317464517836277, + "loss": 0.1412, "step": 7050 }, { - "epoch": 0.08, - "learning_rate": 0.00028854565513660845, - "loss": 0.1182, + "epoch": 0.05, + "learning_rate": 0.00029316496382400585, + "loss": 0.1379, "step": 7060 }, { - "epoch": 0.08, - "learning_rate": 0.0002885294308520994, - "loss": 0.1194, + "epoch": 0.05, + "learning_rate": 0.00029315528246964893, + "loss": 0.1321, "step": 7070 }, { - "epoch": 0.08, - "learning_rate": 0.00028851320656759035, - "loss": 0.1303, + "epoch": 0.05, + "learning_rate": 0.000293145601115292, + "loss": 0.1372, "step": 7080 }, { - "epoch": 0.08, - "learning_rate": 0.0002884969822830813, - "loss": 0.1358, + "epoch": 0.05, + "learning_rate": 0.0002931359197609351, + "loss": 0.1428, "step": 7090 }, { - "epoch": 0.08, - "learning_rate": 0.00028848075799857225, - "loss": 0.1262, + "epoch": 0.05, + "learning_rate": 0.0002931262384065781, + "loss": 0.1326, "step": 7100 }, { - "epoch": 0.08, - "learning_rate": 0.0002884645337140632, - "loss": 0.1248, + "epoch": 0.05, + "learning_rate": 0.0002931165570522212, + "loss": 0.1317, "step": 7110 }, { - "epoch": 0.08, - "learning_rate": 0.00028844830942955415, - "loss": 0.1215, + "epoch": 0.05, + "learning_rate": 0.0002931068756978643, + "loss": 0.1363, "step": 7120 }, { - "epoch": 0.08, - "learning_rate": 0.0002884320851450451, - "loss": 0.1323, + "epoch": 0.05, + "learning_rate": 0.00029309719434350735, + "loss": 0.1345, "step": 7130 }, { - "epoch": 0.08, - "learning_rate": 0.00028841586086053605, - "loss": 0.1175, + "epoch": 0.05, + "learning_rate": 0.00029308751298915043, + "loss": 0.1292, "step": 7140 }, { - "epoch": 0.08, - "learning_rate": 0.00028839963657602697, - "loss": 0.1205, + "epoch": 0.05, + "learning_rate": 0.00029307783163479346, + "loss": 0.1308, "step": 7150 }, { - "epoch": 0.08, - "learning_rate": 0.00028838341229151795, - "loss": 0.1139, + "epoch": 0.05, + "learning_rate": 0.00029306815028043654, + "loss": 0.1367, "step": 7160 }, { - "epoch": 0.08, - "learning_rate": 0.00028836718800700887, - "loss": 0.1184, + "epoch": 0.05, + "learning_rate": 0.0002930584689260796, + "loss": 0.1389, "step": 7170 }, { - "epoch": 0.08, - "learning_rate": 0.00028835096372249985, - "loss": 0.115, + "epoch": 0.05, + "learning_rate": 0.00029304878757172264, + "loss": 0.1341, "step": 7180 }, { - "epoch": 0.08, - "learning_rate": 0.00028833473943799077, - "loss": 0.117, + "epoch": 0.05, + "learning_rate": 0.0002930391062173657, + "loss": 0.1278, "step": 7190 }, { - "epoch": 0.08, - "learning_rate": 0.00028831851515348175, - "loss": 0.1201, + "epoch": 0.05, + "learning_rate": 0.0002930294248630088, + "loss": 0.1542, "step": 7200 }, { - "epoch": 0.08, - "learning_rate": 0.00028830229086897267, - "loss": 0.1133, + "epoch": 0.05, + "learning_rate": 0.0002930197435086519, + "loss": 0.1322, "step": 7210 }, { - "epoch": 0.08, - "learning_rate": 0.0002882860665844636, - "loss": 0.1316, + "epoch": 0.05, + "learning_rate": 0.00029301006215429496, + "loss": 0.1383, "step": 7220 }, { - "epoch": 0.08, - "learning_rate": 0.00028826984229995457, - "loss": 0.1196, + "epoch": 0.05, + "learning_rate": 0.00029300038079993804, + "loss": 0.1471, "step": 7230 }, { - "epoch": 0.08, - "learning_rate": 0.0002882536180154455, - "loss": 0.1137, + "epoch": 0.05, + "learning_rate": 0.00029299069944558107, + "loss": 0.142, "step": 7240 }, { - "epoch": 0.08, - "learning_rate": 0.0002882373937309364, - "loss": 0.128, + "epoch": 0.05, + "learning_rate": 0.00029298101809122415, + "loss": 0.1319, "step": 7250 }, { - "epoch": 0.08, - "learning_rate": 0.0002882211694464274, - "loss": 0.1314, + "epoch": 0.05, + "learning_rate": 0.00029297133673686723, + "loss": 0.1375, "step": 7260 }, { - "epoch": 0.08, - "learning_rate": 0.0002882049451619183, - "loss": 0.1218, + "epoch": 0.05, + "learning_rate": 0.0002929616553825103, + "loss": 0.1252, "step": 7270 }, { - "epoch": 0.08, - "learning_rate": 0.0002881887208774093, - "loss": 0.1072, + "epoch": 0.05, + "learning_rate": 0.00029295197402815333, + "loss": 0.1299, "step": 7280 }, { - "epoch": 0.08, - "learning_rate": 0.0002881724965929002, - "loss": 0.1161, + "epoch": 0.05, + "learning_rate": 0.0002929422926737964, + "loss": 0.1458, "step": 7290 }, { - "epoch": 0.08, - "learning_rate": 0.0002881562723083912, - "loss": 0.1276, + "epoch": 0.05, + "learning_rate": 0.0002929326113194395, + "loss": 0.1378, "step": 7300 }, { - "epoch": 0.08, - "learning_rate": 0.0002881400480238821, - "loss": 0.1186, + "epoch": 0.05, + "learning_rate": 0.0002929229299650825, + "loss": 0.139, "step": 7310 }, { - "epoch": 0.08, - "learning_rate": 0.0002881238237393731, - "loss": 0.1299, + "epoch": 0.05, + "learning_rate": 0.0002929132486107256, + "loss": 0.1283, "step": 7320 }, { - "epoch": 0.08, - "learning_rate": 0.000288107599454864, - "loss": 0.1154, + "epoch": 0.05, + "learning_rate": 0.0002929035672563687, + "loss": 0.1338, "step": 7330 }, { - "epoch": 0.08, - "learning_rate": 0.000288091375170355, - "loss": 0.1202, + "epoch": 0.05, + "learning_rate": 0.00029289388590201176, + "loss": 0.1248, "step": 7340 }, { - "epoch": 0.08, - "learning_rate": 0.0002880751508858459, - "loss": 0.1296, + "epoch": 0.05, + "learning_rate": 0.00029288420454765484, + "loss": 0.1316, "step": 7350 }, { - "epoch": 0.08, - "learning_rate": 0.0002880589266013369, - "loss": 0.123, + "epoch": 0.05, + "learning_rate": 0.0002928745231932979, + "loss": 0.1321, "step": 7360 }, { - "epoch": 0.08, - "learning_rate": 0.0002880427023168278, - "loss": 0.1149, + "epoch": 0.05, + "learning_rate": 0.000292864841838941, + "loss": 0.131, "step": 7370 }, { - "epoch": 0.08, - "learning_rate": 0.0002880264780323188, - "loss": 0.1254, + "epoch": 0.05, + "learning_rate": 0.000292855160484584, + "loss": 0.1313, "step": 7380 }, { - "epoch": 0.08, - "learning_rate": 0.0002880102537478097, - "loss": 0.1189, + "epoch": 0.05, + "learning_rate": 0.0002928454791302271, + "loss": 0.1424, "step": 7390 }, { - "epoch": 0.08, - "learning_rate": 0.00028799402946330064, - "loss": 0.1229, + "epoch": 0.05, + "learning_rate": 0.0002928357977758702, + "loss": 0.1266, "step": 7400 }, { - "epoch": 0.08, - "learning_rate": 0.0002879778051787916, - "loss": 0.116, + "epoch": 0.05, + "learning_rate": 0.0002928261164215132, + "loss": 0.1284, "step": 7410 }, { - "epoch": 0.08, - "learning_rate": 0.00028796158089428254, - "loss": 0.115, + "epoch": 0.05, + "learning_rate": 0.0002928164350671563, + "loss": 0.1332, "step": 7420 }, { - "epoch": 0.08, - "learning_rate": 0.00028794535660977346, - "loss": 0.123, + "epoch": 0.05, + "learning_rate": 0.00029280675371279937, + "loss": 0.1358, "step": 7430 }, { - "epoch": 0.08, - "learning_rate": 0.00028792913232526443, - "loss": 0.1188, + "epoch": 0.05, + "learning_rate": 0.00029279707235844245, + "loss": 0.122, "step": 7440 }, { - "epoch": 0.08, - "learning_rate": 0.00028791290804075536, - "loss": 0.1172, + "epoch": 0.05, + "learning_rate": 0.0002927873910040855, + "loss": 0.1325, "step": 7450 }, { - "epoch": 0.08, - "learning_rate": 0.00028789668375624633, - "loss": 0.1156, + "epoch": 0.05, + "learning_rate": 0.00029277770964972855, + "loss": 0.1434, "step": 7460 }, { - "epoch": 0.08, - "learning_rate": 0.00028788045947173726, - "loss": 0.1142, + "epoch": 0.05, + "learning_rate": 0.00029276802829537163, + "loss": 0.1273, "step": 7470 }, { - "epoch": 0.08, - "learning_rate": 0.00028786423518722823, - "loss": 0.1208, + "epoch": 0.05, + "learning_rate": 0.0002927583469410147, + "loss": 0.1311, "step": 7480 }, { - "epoch": 0.08, - "learning_rate": 0.00028784801090271916, - "loss": 0.1257, + "epoch": 0.05, + "learning_rate": 0.0002927486655866578, + "loss": 0.1464, "step": 7490 }, { - "epoch": 0.08, - "learning_rate": 0.00028783178661821013, - "loss": 0.1139, + "epoch": 0.05, + "learning_rate": 0.00029273898423230087, + "loss": 0.1308, "step": 7500 }, { - "epoch": 0.08, - "learning_rate": 0.00028781556233370106, - "loss": 0.1199, + "epoch": 0.05, + "learning_rate": 0.00029272930287794395, + "loss": 0.1379, "step": 7510 }, { - "epoch": 0.08, - "learning_rate": 0.00028779933804919203, - "loss": 0.1149, + "epoch": 0.05, + "learning_rate": 0.000292719621523587, + "loss": 0.1346, "step": 7520 }, { - "epoch": 0.08, - "learning_rate": 0.00028778311376468296, - "loss": 0.1076, + "epoch": 0.05, + "learning_rate": 0.00029270994016923006, + "loss": 0.1377, "step": 7530 }, { - "epoch": 0.08, - "learning_rate": 0.00028776688948017393, - "loss": 0.1148, + "epoch": 0.05, + "learning_rate": 0.00029270025881487314, + "loss": 0.1296, "step": 7540 }, { - "epoch": 0.08, - "learning_rate": 0.00028775066519566486, - "loss": 0.1246, + "epoch": 0.05, + "learning_rate": 0.00029269057746051616, + "loss": 0.1384, "step": 7550 }, { - "epoch": 0.08, - "learning_rate": 0.00028773444091115583, - "loss": 0.1186, + "epoch": 0.05, + "learning_rate": 0.00029268089610615924, + "loss": 0.1259, "step": 7560 }, { - "epoch": 0.08, - "learning_rate": 0.00028771821662664675, - "loss": 0.1242, + "epoch": 0.05, + "learning_rate": 0.0002926712147518023, + "loss": 0.1289, "step": 7570 }, { - "epoch": 0.08, - "learning_rate": 0.0002877019923421377, - "loss": 0.114, + "epoch": 0.05, + "learning_rate": 0.0002926615333974454, + "loss": 0.1312, "step": 7580 }, { - "epoch": 0.08, - "learning_rate": 0.00028768576805762865, - "loss": 0.1179, + "epoch": 0.05, + "learning_rate": 0.00029265185204308843, + "loss": 0.1331, "step": 7590 }, { - "epoch": 0.08, - "learning_rate": 0.0002876695437731196, - "loss": 0.1254, + "epoch": 0.05, + "learning_rate": 0.0002926421706887315, + "loss": 0.1336, "step": 7600 }, { - "epoch": 0.08, - "learning_rate": 0.0002876533194886105, - "loss": 0.1205, + "epoch": 0.05, + "learning_rate": 0.0002926324893343746, + "loss": 0.136, "step": 7610 }, { - "epoch": 0.08, - "learning_rate": 0.0002876370952041015, - "loss": 0.1218, + "epoch": 0.05, + "learning_rate": 0.00029262280798001767, + "loss": 0.1287, "step": 7620 }, { - "epoch": 0.08, - "learning_rate": 0.0002876208709195924, - "loss": 0.1113, + "epoch": 0.05, + "learning_rate": 0.00029261312662566075, + "loss": 0.1359, "step": 7630 }, { - "epoch": 0.08, - "learning_rate": 0.0002876046466350834, - "loss": 0.1354, + "epoch": 0.05, + "learning_rate": 0.00029260344527130383, + "loss": 0.1299, "step": 7640 }, { - "epoch": 0.08, - "learning_rate": 0.0002875884223505743, - "loss": 0.1374, + "epoch": 0.05, + "learning_rate": 0.00029259376391694685, + "loss": 0.1235, "step": 7650 }, { - "epoch": 0.08, - "learning_rate": 0.0002875721980660653, - "loss": 0.1217, + "epoch": 0.05, + "learning_rate": 0.00029258408256258993, + "loss": 0.1242, "step": 7660 }, { - "epoch": 0.08, - "learning_rate": 0.0002875559737815562, - "loss": 0.1097, + "epoch": 0.05, + "learning_rate": 0.000292574401208233, + "loss": 0.1304, "step": 7670 }, { - "epoch": 0.08, - "learning_rate": 0.0002875397494970472, - "loss": 0.1222, + "epoch": 0.05, + "learning_rate": 0.00029256471985387604, + "loss": 0.1341, "step": 7680 }, { - "epoch": 0.08, - "learning_rate": 0.0002875235252125381, - "loss": 0.1363, + "epoch": 0.05, + "learning_rate": 0.0002925550384995191, + "loss": 0.1333, "step": 7690 }, { - "epoch": 0.08, - "learning_rate": 0.0002875073009280291, - "loss": 0.1267, + "epoch": 0.05, + "learning_rate": 0.0002925453571451622, + "loss": 0.1355, "step": 7700 }, { - "epoch": 0.08, - "learning_rate": 0.00028749107664352, - "loss": 0.1217, + "epoch": 0.05, + "learning_rate": 0.0002925356757908053, + "loss": 0.1384, "step": 7710 }, { - "epoch": 0.08, - "learning_rate": 0.000287474852359011, - "loss": 0.1178, + "epoch": 0.05, + "learning_rate": 0.00029252599443644836, + "loss": 0.1281, "step": 7720 }, { - "epoch": 0.08, - "learning_rate": 0.0002874586280745019, - "loss": 0.1254, + "epoch": 0.05, + "learning_rate": 0.0002925163130820914, + "loss": 0.1317, "step": 7730 }, { - "epoch": 0.08, - "learning_rate": 0.0002874424037899929, - "loss": 0.1305, + "epoch": 0.05, + "learning_rate": 0.00029250663172773446, + "loss": 0.1337, "step": 7740 }, { - "epoch": 0.08, - "learning_rate": 0.0002874261795054838, - "loss": 0.1097, + "epoch": 0.05, + "learning_rate": 0.00029249695037337754, + "loss": 0.1392, "step": 7750 }, { - "epoch": 0.08, - "learning_rate": 0.0002874099552209747, - "loss": 0.1116, + "epoch": 0.05, + "learning_rate": 0.0002924872690190206, + "loss": 0.1284, "step": 7760 }, { - "epoch": 0.08, - "learning_rate": 0.0002873937309364657, - "loss": 0.1104, + "epoch": 0.05, + "learning_rate": 0.0002924775876646637, + "loss": 0.1259, "step": 7770 }, { - "epoch": 0.08, - "learning_rate": 0.0002873775066519566, - "loss": 0.1208, + "epoch": 0.05, + "learning_rate": 0.00029246790631030673, + "loss": 0.1305, "step": 7780 }, { - "epoch": 0.08, - "learning_rate": 0.00028736128236744754, - "loss": 0.1144, + "epoch": 0.05, + "learning_rate": 0.0002924582249559498, + "loss": 0.1325, "step": 7790 }, { - "epoch": 0.08, - "learning_rate": 0.0002873450580829385, - "loss": 0.1207, + "epoch": 0.05, + "learning_rate": 0.0002924485436015929, + "loss": 0.1327, "step": 7800 }, { - "epoch": 0.08, - "learning_rate": 0.00028732883379842944, - "loss": 0.115, + "epoch": 0.05, + "learning_rate": 0.0002924388622472359, + "loss": 0.1305, "step": 7810 }, { - "epoch": 0.08, - "learning_rate": 0.0002873126095139204, - "loss": 0.12, + "epoch": 0.05, + "learning_rate": 0.000292429180892879, + "loss": 0.1284, "step": 7820 }, { - "epoch": 0.08, - "learning_rate": 0.00028729638522941134, - "loss": 0.1122, + "epoch": 0.05, + "learning_rate": 0.00029241949953852207, + "loss": 0.131, "step": 7830 }, { - "epoch": 0.08, - "learning_rate": 0.0002872801609449023, - "loss": 0.1203, + "epoch": 0.05, + "learning_rate": 0.00029240981818416515, + "loss": 0.1227, "step": 7840 }, { - "epoch": 0.08, - "learning_rate": 0.00028726393666039324, - "loss": 0.1189, - "step": 7850 + "epoch": 0.05, + "learning_rate": 0.00029240013682980823, + "loss": 0.1229, + "step": 7850 }, { - "epoch": 0.09, - "learning_rate": 0.0002872477123758842, - "loss": 0.1176, + "epoch": 0.05, + "learning_rate": 0.0002923904554754513, + "loss": 0.139, "step": 7860 }, { - "epoch": 0.09, - "learning_rate": 0.00028723148809137514, - "loss": 0.1142, + "epoch": 0.05, + "learning_rate": 0.00029238077412109434, + "loss": 0.137, "step": 7870 }, { - "epoch": 0.09, - "learning_rate": 0.0002872152638068661, - "loss": 0.1177, + "epoch": 0.05, + "learning_rate": 0.0002923710927667374, + "loss": 0.1292, "step": 7880 }, { - "epoch": 0.09, - "learning_rate": 0.00028719903952235704, - "loss": 0.1166, + "epoch": 0.05, + "learning_rate": 0.0002923614114123805, + "loss": 0.1209, "step": 7890 }, { - "epoch": 0.09, - "learning_rate": 0.000287182815237848, - "loss": 0.1095, + "epoch": 0.05, + "learning_rate": 0.0002923517300580236, + "loss": 0.1206, "step": 7900 }, { - "epoch": 0.09, - "learning_rate": 0.00028716659095333894, - "loss": 0.1064, + "epoch": 0.05, + "learning_rate": 0.00029234204870366666, + "loss": 0.1245, "step": 7910 }, { - "epoch": 0.09, - "learning_rate": 0.0002871503666688299, - "loss": 0.1134, + "epoch": 0.05, + "learning_rate": 0.0002923323673493097, + "loss": 0.1208, "step": 7920 }, { - "epoch": 0.09, - "learning_rate": 0.00028713414238432084, - "loss": 0.1142, + "epoch": 0.05, + "learning_rate": 0.00029232268599495276, + "loss": 0.1367, "step": 7930 }, { - "epoch": 0.09, - "learning_rate": 0.00028711791809981176, - "loss": 0.1209, + "epoch": 0.05, + "learning_rate": 0.00029231300464059584, + "loss": 0.1284, "step": 7940 }, { - "epoch": 0.09, - "learning_rate": 0.00028710169381530274, - "loss": 0.1073, + "epoch": 0.05, + "learning_rate": 0.00029230332328623887, + "loss": 0.1203, "step": 7950 }, { - "epoch": 0.09, - "learning_rate": 0.00028708546953079366, - "loss": 0.1179, + "epoch": 0.05, + "learning_rate": 0.00029229364193188195, + "loss": 0.1426, "step": 7960 }, { - "epoch": 0.09, - "learning_rate": 0.0002870692452462846, - "loss": 0.1076, + "epoch": 0.05, + "learning_rate": 0.000292283960577525, + "loss": 0.1313, "step": 7970 }, { - "epoch": 0.09, - "learning_rate": 0.00028705302096177556, - "loss": 0.1142, + "epoch": 0.05, + "learning_rate": 0.0002922742792231681, + "loss": 0.1297, "step": 7980 }, { - "epoch": 0.09, - "learning_rate": 0.0002870367966772665, - "loss": 0.1047, + "epoch": 0.05, + "learning_rate": 0.0002922645978688112, + "loss": 0.1345, "step": 7990 }, { - "epoch": 0.09, - "learning_rate": 0.00028702057239275746, - "loss": 0.1147, + "epoch": 0.05, + "learning_rate": 0.00029225491651445427, + "loss": 0.1362, "step": 8000 }, { - "epoch": 0.09, - "eval_cer": 0.9214838649258491, - "eval_loss": 0.07892972975969315, - "eval_runtime": 119.8333, - "eval_samples_per_second": 16.69, - "eval_steps_per_second": 4.172, + "epoch": 0.05, + "eval_cer": 0.9203235792565811, + "eval_loss": 0.09412429481744766, + "eval_runtime": 120.4163, + "eval_samples_per_second": 16.609, + "eval_steps_per_second": 4.152, "step": 8000 }, { - "epoch": 0.09, - "learning_rate": 0.0002870043481082484, - "loss": 0.1164, + "epoch": 0.05, + "learning_rate": 0.0002922452351600973, + "loss": 0.1282, "step": 8010 }, { - "epoch": 0.09, - "learning_rate": 0.00028698812382373936, - "loss": 0.1024, + "epoch": 0.05, + "learning_rate": 0.00029223555380574037, + "loss": 0.1346, "step": 8020 }, { - "epoch": 0.09, - "learning_rate": 0.0002869718995392303, - "loss": 0.1255, + "epoch": 0.05, + "learning_rate": 0.00029222587245138345, + "loss": 0.1372, "step": 8030 }, { - "epoch": 0.09, - "learning_rate": 0.00028695567525472126, - "loss": 0.1093, + "epoch": 0.05, + "learning_rate": 0.00029221619109702653, + "loss": 0.1296, "step": 8040 }, { - "epoch": 0.09, - "learning_rate": 0.0002869394509702122, - "loss": 0.1093, + "epoch": 0.05, + "learning_rate": 0.00029220650974266956, + "loss": 0.1306, "step": 8050 }, { - "epoch": 0.09, - "learning_rate": 0.00028692322668570316, - "loss": 0.1086, + "epoch": 0.05, + "learning_rate": 0.00029219682838831264, + "loss": 0.1472, "step": 8060 }, { - "epoch": 0.09, - "learning_rate": 0.0002869070024011941, - "loss": 0.1254, + "epoch": 0.05, + "learning_rate": 0.0002921871470339557, + "loss": 0.1274, "step": 8070 }, { - "epoch": 0.09, - "learning_rate": 0.00028689077811668506, - "loss": 0.1386, + "epoch": 0.05, + "learning_rate": 0.00029217746567959874, + "loss": 0.1247, "step": 8080 }, { - "epoch": 0.09, - "learning_rate": 0.000286874553832176, - "loss": 0.1147, + "epoch": 0.05, + "learning_rate": 0.0002921677843252418, + "loss": 0.1447, "step": 8090 }, { - "epoch": 0.09, - "learning_rate": 0.00028685832954766696, - "loss": 0.114, + "epoch": 0.05, + "learning_rate": 0.0002921581029708849, + "loss": 0.1404, "step": 8100 }, { - "epoch": 0.09, - "learning_rate": 0.0002868421052631579, - "loss": 0.1222, + "epoch": 0.05, + "learning_rate": 0.000292148421616528, + "loss": 0.126, "step": 8110 }, { - "epoch": 0.09, - "learning_rate": 0.0002868258809786488, - "loss": 0.1074, + "epoch": 0.05, + "learning_rate": 0.00029213874026217106, + "loss": 0.1356, "step": 8120 }, { - "epoch": 0.09, - "learning_rate": 0.0002868096566941398, - "loss": 0.12, + "epoch": 0.05, + "learning_rate": 0.00029212905890781414, + "loss": 0.1206, "step": 8130 }, { - "epoch": 0.09, - "learning_rate": 0.0002867934324096307, - "loss": 0.1091, + "epoch": 0.05, + "learning_rate": 0.0002921193775534572, + "loss": 0.132, "step": 8140 }, { - "epoch": 0.09, - "learning_rate": 0.0002867772081251216, - "loss": 0.1147, + "epoch": 0.05, + "learning_rate": 0.00029210969619910025, + "loss": 0.1217, "step": 8150 }, { - "epoch": 0.09, - "learning_rate": 0.0002867609838406126, - "loss": 0.1153, + "epoch": 0.05, + "learning_rate": 0.0002921000148447433, + "loss": 0.1342, "step": 8160 }, { - "epoch": 0.09, - "learning_rate": 0.0002867447595561035, - "loss": 0.1097, + "epoch": 0.05, + "learning_rate": 0.0002920903334903864, + "loss": 0.1156, "step": 8170 }, { - "epoch": 0.09, - "learning_rate": 0.0002867285352715945, - "loss": 0.107, + "epoch": 0.05, + "learning_rate": 0.00029208065213602943, + "loss": 0.1298, "step": 8180 }, { - "epoch": 0.09, - "learning_rate": 0.0002867123109870854, - "loss": 0.1204, + "epoch": 0.05, + "learning_rate": 0.0002920709707816725, + "loss": 0.1287, "step": 8190 }, { - "epoch": 0.09, - "learning_rate": 0.0002866960867025764, - "loss": 0.1244, + "epoch": 0.05, + "learning_rate": 0.0002920612894273156, + "loss": 0.1279, "step": 8200 }, { - "epoch": 0.09, - "learning_rate": 0.0002866798624180673, - "loss": 0.11, + "epoch": 0.05, + "learning_rate": 0.00029205160807295867, + "loss": 0.1285, "step": 8210 }, { - "epoch": 0.09, - "learning_rate": 0.0002866636381335583, - "loss": 0.1081, + "epoch": 0.05, + "learning_rate": 0.0002920419267186017, + "loss": 0.1315, "step": 8220 }, { - "epoch": 0.09, - "learning_rate": 0.0002866474138490492, - "loss": 0.1055, + "epoch": 0.05, + "learning_rate": 0.0002920322453642448, + "loss": 0.1204, "step": 8230 }, { - "epoch": 0.09, - "learning_rate": 0.0002866311895645402, - "loss": 0.1167, + "epoch": 0.05, + "learning_rate": 0.00029202256400988786, + "loss": 0.125, "step": 8240 }, { - "epoch": 0.09, - "learning_rate": 0.0002866149652800311, - "loss": 0.1107, + "epoch": 0.05, + "learning_rate": 0.00029201288265553094, + "loss": 0.1237, "step": 8250 }, { - "epoch": 0.09, - "learning_rate": 0.0002865987409955221, - "loss": 0.1058, + "epoch": 0.05, + "learning_rate": 0.000292003201301174, + "loss": 0.1432, "step": 8260 }, { - "epoch": 0.09, - "learning_rate": 0.000286582516711013, - "loss": 0.1101, + "epoch": 0.05, + "learning_rate": 0.0002919935199468171, + "loss": 0.1284, "step": 8270 }, { - "epoch": 0.09, - "learning_rate": 0.000286566292426504, - "loss": 0.1065, + "epoch": 0.05, + "learning_rate": 0.0002919838385924602, + "loss": 0.13, "step": 8280 }, { - "epoch": 0.09, - "learning_rate": 0.0002865500681419949, - "loss": 0.108, + "epoch": 0.05, + "learning_rate": 0.0002919741572381032, + "loss": 0.1318, "step": 8290 }, { - "epoch": 0.09, - "learning_rate": 0.00028653384385748584, - "loss": 0.1025, + "epoch": 0.05, + "learning_rate": 0.0002919644758837463, + "loss": 0.128, "step": 8300 }, { - "epoch": 0.09, - "learning_rate": 0.0002865176195729768, - "loss": 0.123, + "epoch": 0.05, + "learning_rate": 0.00029195479452938936, + "loss": 0.1307, "step": 8310 }, { - "epoch": 0.09, - "learning_rate": 0.00028650139528846774, - "loss": 0.1112, + "epoch": 0.05, + "learning_rate": 0.0002919451131750324, + "loss": 0.1311, "step": 8320 }, { - "epoch": 0.09, - "learning_rate": 0.00028648517100395867, - "loss": 0.1043, + "epoch": 0.05, + "learning_rate": 0.00029193543182067547, + "loss": 0.1209, "step": 8330 }, { - "epoch": 0.09, - "learning_rate": 0.00028646894671944964, - "loss": 0.1235, + "epoch": 0.05, + "learning_rate": 0.00029192575046631855, + "loss": 0.1346, "step": 8340 }, { - "epoch": 0.09, - "learning_rate": 0.00028645272243494057, - "loss": 0.1194, + "epoch": 0.05, + "learning_rate": 0.0002919160691119616, + "loss": 0.1222, "step": 8350 }, { - "epoch": 0.09, - "learning_rate": 0.00028643649815043154, - "loss": 0.1048, + "epoch": 0.05, + "learning_rate": 0.00029190638775760465, + "loss": 0.1243, "step": 8360 }, { - "epoch": 0.09, - "learning_rate": 0.00028642027386592247, - "loss": 0.1095, + "epoch": 0.05, + "learning_rate": 0.00029189670640324773, + "loss": 0.1249, "step": 8370 }, { - "epoch": 0.09, - "learning_rate": 0.00028640404958141344, - "loss": 0.1066, + "epoch": 0.05, + "learning_rate": 0.0002918870250488908, + "loss": 0.1351, "step": 8380 }, { - "epoch": 0.09, - "learning_rate": 0.00028638782529690436, - "loss": 0.1044, + "epoch": 0.05, + "learning_rate": 0.0002918773436945339, + "loss": 0.1447, "step": 8390 }, { - "epoch": 0.09, - "learning_rate": 0.00028637160101239534, - "loss": 0.106, + "epoch": 0.05, + "learning_rate": 0.00029186766234017697, + "loss": 0.143, "step": 8400 }, { - "epoch": 0.09, - "learning_rate": 0.00028635537672788626, - "loss": 0.1109, + "epoch": 0.05, + "learning_rate": 0.00029185798098582005, + "loss": 0.1344, "step": 8410 }, { - "epoch": 0.09, - "learning_rate": 0.00028633915244337724, - "loss": 0.1125, + "epoch": 0.05, + "learning_rate": 0.0002918482996314631, + "loss": 0.117, "step": 8420 }, { - "epoch": 0.09, - "learning_rate": 0.00028632292815886816, - "loss": 0.1088, + "epoch": 0.05, + "learning_rate": 0.00029183861827710616, + "loss": 0.1292, "step": 8430 }, { - "epoch": 0.09, - "learning_rate": 0.00028630670387435914, - "loss": 0.127, + "epoch": 0.05, + "learning_rate": 0.00029182893692274923, + "loss": 0.1385, "step": 8440 }, { - "epoch": 0.09, - "learning_rate": 0.00028629047958985006, - "loss": 0.1128, + "epoch": 0.05, + "learning_rate": 0.00029181925556839226, + "loss": 0.1363, "step": 8450 }, { - "epoch": 0.09, - "learning_rate": 0.00028627425530534104, - "loss": 0.1098, + "epoch": 0.05, + "learning_rate": 0.00029180957421403534, + "loss": 0.1302, "step": 8460 }, { - "epoch": 0.09, - "learning_rate": 0.00028625803102083196, - "loss": 0.1152, + "epoch": 0.05, + "learning_rate": 0.0002917998928596784, + "loss": 0.1254, "step": 8470 }, { - "epoch": 0.09, - "learning_rate": 0.0002862418067363229, - "loss": 0.1003, + "epoch": 0.05, + "learning_rate": 0.0002917902115053215, + "loss": 0.129, "step": 8480 }, { - "epoch": 0.09, - "learning_rate": 0.00028622558245181386, - "loss": 0.1096, + "epoch": 0.05, + "learning_rate": 0.0002917805301509646, + "loss": 0.1159, "step": 8490 }, { - "epoch": 0.09, - "learning_rate": 0.0002862093581673048, - "loss": 0.1068, + "epoch": 0.05, + "learning_rate": 0.0002917708487966076, + "loss": 0.1278, "step": 8500 }, { - "epoch": 0.09, - "learning_rate": 0.0002861931338827957, - "loss": 0.1088, + "epoch": 0.05, + "learning_rate": 0.0002917611674422507, + "loss": 0.1308, "step": 8510 }, { - "epoch": 0.09, - "learning_rate": 0.0002861769095982867, - "loss": 0.1215, + "epoch": 0.05, + "learning_rate": 0.00029175148608789376, + "loss": 0.1204, "step": 8520 }, { - "epoch": 0.09, - "learning_rate": 0.0002861606853137776, - "loss": 0.1076, + "epoch": 0.06, + "learning_rate": 0.00029174180473353684, + "loss": 0.1307, "step": 8530 }, { - "epoch": 0.09, - "learning_rate": 0.0002861444610292686, - "loss": 0.1144, + "epoch": 0.06, + "learning_rate": 0.0002917321233791799, + "loss": 0.1383, "step": 8540 }, { - "epoch": 0.09, - "learning_rate": 0.0002861282367447595, - "loss": 0.1205, + "epoch": 0.06, + "learning_rate": 0.000291722442024823, + "loss": 0.1287, "step": 8550 }, { - "epoch": 0.09, - "learning_rate": 0.0002861120124602505, - "loss": 0.1111, + "epoch": 0.06, + "learning_rate": 0.00029171276067046603, + "loss": 0.1343, "step": 8560 }, { - "epoch": 0.09, - "learning_rate": 0.0002860957881757414, - "loss": 0.1116, + "epoch": 0.06, + "learning_rate": 0.0002917030793161091, + "loss": 0.1179, "step": 8570 }, { - "epoch": 0.09, - "learning_rate": 0.0002860795638912324, - "loss": 0.1151, + "epoch": 0.06, + "learning_rate": 0.00029169339796175214, + "loss": 0.124, "step": 8580 }, { - "epoch": 0.09, - "learning_rate": 0.0002860633396067233, - "loss": 0.1128, + "epoch": 0.06, + "learning_rate": 0.0002916837166073952, + "loss": 0.1261, "step": 8590 }, { - "epoch": 0.09, - "learning_rate": 0.0002860471153222143, - "loss": 0.1058, + "epoch": 0.06, + "learning_rate": 0.0002916740352530383, + "loss": 0.1152, "step": 8600 }, { - "epoch": 0.09, - "learning_rate": 0.0002860308910377052, - "loss": 0.1157, + "epoch": 0.06, + "learning_rate": 0.0002916643538986814, + "loss": 0.1229, "step": 8610 }, { - "epoch": 0.09, - "learning_rate": 0.0002860146667531962, - "loss": 0.1057, + "epoch": 0.06, + "learning_rate": 0.00029165467254432445, + "loss": 0.1166, "step": 8620 }, { - "epoch": 0.09, - "learning_rate": 0.0002859984424686871, - "loss": 0.0962, + "epoch": 0.06, + "learning_rate": 0.00029164499118996753, + "loss": 0.1296, "step": 8630 }, { - "epoch": 0.09, - "learning_rate": 0.0002859822181841781, - "loss": 0.1077, + "epoch": 0.06, + "learning_rate": 0.00029163530983561056, + "loss": 0.1257, "step": 8640 }, { - "epoch": 0.09, - "learning_rate": 0.000285965993899669, - "loss": 0.1187, + "epoch": 0.06, + "learning_rate": 0.00029162562848125364, + "loss": 0.138, "step": 8650 }, { - "epoch": 0.09, - "learning_rate": 0.00028594976961515993, - "loss": 0.1142, + "epoch": 0.06, + "learning_rate": 0.0002916159471268967, + "loss": 0.1365, "step": 8660 }, { - "epoch": 0.09, - "learning_rate": 0.0002859335453306509, - "loss": 0.1132, + "epoch": 0.06, + "learning_rate": 0.0002916062657725398, + "loss": 0.1164, "step": 8670 }, { - "epoch": 0.09, - "learning_rate": 0.0002859173210461418, - "loss": 0.1068, + "epoch": 0.06, + "learning_rate": 0.0002915965844181829, + "loss": 0.1351, "step": 8680 }, { - "epoch": 0.09, - "learning_rate": 0.00028590109676163275, - "loss": 0.1165, + "epoch": 0.06, + "learning_rate": 0.0002915869030638259, + "loss": 0.1285, "step": 8690 }, { - "epoch": 0.09, - "learning_rate": 0.0002858848724771237, - "loss": 0.1093, + "epoch": 0.06, + "learning_rate": 0.000291577221709469, + "loss": 0.1225, "step": 8700 }, { - "epoch": 0.09, - "learning_rate": 0.00028586864819261465, - "loss": 0.1184, + "epoch": 0.06, + "learning_rate": 0.00029156754035511206, + "loss": 0.1274, "step": 8710 }, { - "epoch": 0.09, - "learning_rate": 0.0002858524239081056, - "loss": 0.1123, + "epoch": 0.06, + "learning_rate": 0.0002915578590007551, + "loss": 0.1229, "step": 8720 }, { - "epoch": 0.09, - "learning_rate": 0.00028583619962359655, - "loss": 0.1108, + "epoch": 0.06, + "learning_rate": 0.00029154817764639817, + "loss": 0.1333, "step": 8730 }, { - "epoch": 0.09, - "learning_rate": 0.0002858199753390875, - "loss": 0.1044, + "epoch": 0.06, + "learning_rate": 0.00029153849629204125, + "loss": 0.1284, "step": 8740 }, { - "epoch": 0.09, - "learning_rate": 0.00028580375105457845, - "loss": 0.1077, + "epoch": 0.06, + "learning_rate": 0.00029152881493768433, + "loss": 0.1239, "step": 8750 }, { - "epoch": 0.09, - "learning_rate": 0.0002857875267700694, - "loss": 0.1204, + "epoch": 0.06, + "learning_rate": 0.0002915191335833274, + "loss": 0.1329, "step": 8760 }, { - "epoch": 0.09, - "learning_rate": 0.00028577130248556035, - "loss": 0.1126, + "epoch": 0.06, + "learning_rate": 0.0002915094522289705, + "loss": 0.1271, "step": 8770 }, { - "epoch": 0.09, - "learning_rate": 0.0002857550782010513, - "loss": 0.1024, + "epoch": 0.06, + "learning_rate": 0.0002914997708746135, + "loss": 0.122, "step": 8780 }, { - "epoch": 0.1, - "learning_rate": 0.00028573885391654225, - "loss": 0.1104, + "epoch": 0.06, + "learning_rate": 0.0002914900895202566, + "loss": 0.1344, "step": 8790 }, { - "epoch": 0.1, - "learning_rate": 0.0002857226296320332, - "loss": 0.1063, + "epoch": 0.06, + "learning_rate": 0.0002914804081658997, + "loss": 0.12, "step": 8800 }, { - "epoch": 0.1, - "learning_rate": 0.00028570640534752415, - "loss": 0.1092, + "epoch": 0.06, + "learning_rate": 0.00029147072681154275, + "loss": 0.1229, "step": 8810 }, { - "epoch": 0.1, - "learning_rate": 0.0002856901810630151, - "loss": 0.0945, + "epoch": 0.06, + "learning_rate": 0.0002914610454571858, + "loss": 0.1309, "step": 8820 }, { - "epoch": 0.1, - "learning_rate": 0.00028567395677850605, - "loss": 0.1241, + "epoch": 0.06, + "learning_rate": 0.00029145136410282886, + "loss": 0.1243, "step": 8830 }, { - "epoch": 0.1, - "learning_rate": 0.00028565773249399697, - "loss": 0.1164, + "epoch": 0.06, + "learning_rate": 0.00029144168274847194, + "loss": 0.1253, "step": 8840 }, { - "epoch": 0.1, - "learning_rate": 0.00028564150820948795, - "loss": 0.1069, + "epoch": 0.06, + "learning_rate": 0.00029143200139411496, + "loss": 0.1226, "step": 8850 }, { - "epoch": 0.1, - "learning_rate": 0.00028562528392497887, - "loss": 0.1099, + "epoch": 0.06, + "learning_rate": 0.00029142232003975804, + "loss": 0.1384, "step": 8860 }, { - "epoch": 0.1, - "learning_rate": 0.0002856090596404698, - "loss": 0.1102, + "epoch": 0.06, + "learning_rate": 0.0002914126386854011, + "loss": 0.1259, "step": 8870 }, { - "epoch": 0.1, - "learning_rate": 0.00028559283535596077, - "loss": 0.1125, + "epoch": 0.06, + "learning_rate": 0.0002914029573310442, + "loss": 0.119, "step": 8880 }, { - "epoch": 0.1, - "learning_rate": 0.0002855766110714517, - "loss": 0.1021, + "epoch": 0.06, + "learning_rate": 0.0002913932759766873, + "loss": 0.1297, "step": 8890 }, { - "epoch": 0.1, - "learning_rate": 0.00028556038678694267, - "loss": 0.1178, + "epoch": 0.06, + "learning_rate": 0.00029138359462233036, + "loss": 0.1283, "step": 8900 }, { - "epoch": 0.1, - "learning_rate": 0.0002855441625024336, - "loss": 0.1221, + "epoch": 0.06, + "learning_rate": 0.00029137391326797344, + "loss": 0.1276, "step": 8910 }, { - "epoch": 0.1, - "learning_rate": 0.00028552793821792457, - "loss": 0.1061, + "epoch": 0.06, + "learning_rate": 0.00029136423191361647, + "loss": 0.1265, "step": 8920 }, { - "epoch": 0.1, - "learning_rate": 0.0002855117139334155, - "loss": 0.1006, + "epoch": 0.06, + "learning_rate": 0.00029135455055925955, + "loss": 0.1229, "step": 8930 }, { - "epoch": 0.1, - "learning_rate": 0.00028549548964890647, - "loss": 0.1199, + "epoch": 0.06, + "learning_rate": 0.00029134486920490263, + "loss": 0.1367, "step": 8940 }, { - "epoch": 0.1, - "learning_rate": 0.0002854792653643974, - "loss": 0.1207, + "epoch": 0.06, + "learning_rate": 0.0002913351878505457, + "loss": 0.1156, "step": 8950 }, { - "epoch": 0.1, - "learning_rate": 0.00028546304107988837, - "loss": 0.1136, + "epoch": 0.06, + "learning_rate": 0.00029132550649618873, + "loss": 0.1181, "step": 8960 }, { - "epoch": 0.1, - "learning_rate": 0.0002854468167953793, - "loss": 0.1118, + "epoch": 0.06, + "learning_rate": 0.0002913158251418318, + "loss": 0.1173, "step": 8970 }, { - "epoch": 0.1, - "learning_rate": 0.00028543059251087027, - "loss": 0.1192, + "epoch": 0.06, + "learning_rate": 0.0002913061437874749, + "loss": 0.1178, "step": 8980 }, { - "epoch": 0.1, - "learning_rate": 0.0002854143682263612, - "loss": 0.1235, + "epoch": 0.06, + "learning_rate": 0.0002912964624331179, + "loss": 0.1138, "step": 8990 }, { - "epoch": 0.1, - "learning_rate": 0.00028539814394185217, - "loss": 0.1091, + "epoch": 0.06, + "learning_rate": 0.000291286781078761, + "loss": 0.1207, "step": 9000 }, { - "epoch": 0.1, - "eval_cer": 0.9215925334973081, - "eval_loss": 0.07693669945001602, - "eval_runtime": 119.5218, - "eval_samples_per_second": 16.733, - "eval_steps_per_second": 4.183, + "epoch": 0.06, + "eval_cer": 0.9200921929725455, + "eval_loss": 0.08904129266738892, + "eval_runtime": 120.7527, + "eval_samples_per_second": 16.563, + "eval_steps_per_second": 4.141, "step": 9000 }, { - "epoch": 0.1, - "learning_rate": 0.0002853819196573431, - "loss": 0.1211, + "epoch": 0.06, + "learning_rate": 0.0002912770997244041, + "loss": 0.1224, "step": 9010 }, { - "epoch": 0.1, - "learning_rate": 0.000285365695372834, - "loss": 0.1222, + "epoch": 0.06, + "learning_rate": 0.00029126741837004716, + "loss": 0.1263, "step": 9020 }, { - "epoch": 0.1, - "learning_rate": 0.000285349471088325, - "loss": 0.1071, + "epoch": 0.06, + "learning_rate": 0.00029125773701569024, + "loss": 0.1122, "step": 9030 }, { - "epoch": 0.1, - "learning_rate": 0.0002853332468038159, - "loss": 0.1145, + "epoch": 0.06, + "learning_rate": 0.0002912480556613333, + "loss": 0.1397, "step": 9040 }, { - "epoch": 0.1, - "learning_rate": 0.00028531702251930683, - "loss": 0.1123, + "epoch": 0.06, + "learning_rate": 0.0002912383743069764, + "loss": 0.1378, "step": 9050 }, { - "epoch": 0.1, - "learning_rate": 0.0002853007982347978, - "loss": 0.1209, + "epoch": 0.06, + "learning_rate": 0.0002912286929526194, + "loss": 0.13, "step": 9060 }, { - "epoch": 0.1, - "learning_rate": 0.00028528457395028873, - "loss": 0.1103, + "epoch": 0.06, + "learning_rate": 0.0002912190115982625, + "loss": 0.1289, "step": 9070 }, { - "epoch": 0.1, - "learning_rate": 0.0002852683496657797, - "loss": 0.1048, + "epoch": 0.06, + "learning_rate": 0.0002912093302439056, + "loss": 0.1193, "step": 9080 }, { - "epoch": 0.1, - "learning_rate": 0.00028525212538127063, - "loss": 0.1054, + "epoch": 0.06, + "learning_rate": 0.0002911996488895486, + "loss": 0.121, "step": 9090 }, { - "epoch": 0.1, - "learning_rate": 0.0002852359010967616, - "loss": 0.1125, + "epoch": 0.06, + "learning_rate": 0.0002911899675351917, + "loss": 0.1117, "step": 9100 }, { - "epoch": 0.1, - "learning_rate": 0.00028521967681225253, - "loss": 0.1202, + "epoch": 0.06, + "learning_rate": 0.00029118028618083477, + "loss": 0.1257, "step": 9110 }, { - "epoch": 0.1, - "learning_rate": 0.0002852034525277435, - "loss": 0.1137, + "epoch": 0.06, + "learning_rate": 0.00029117060482647785, + "loss": 0.1286, "step": 9120 }, { - "epoch": 0.1, - "learning_rate": 0.00028518722824323443, - "loss": 0.1047, + "epoch": 0.06, + "learning_rate": 0.0002911609234721209, + "loss": 0.1253, "step": 9130 }, { - "epoch": 0.1, - "learning_rate": 0.0002851710039587254, - "loss": 0.1019, + "epoch": 0.06, + "learning_rate": 0.00029115124211776395, + "loss": 0.1231, "step": 9140 }, { - "epoch": 0.1, - "learning_rate": 0.00028515477967421633, - "loss": 0.1066, + "epoch": 0.06, + "learning_rate": 0.00029114156076340703, + "loss": 0.1191, "step": 9150 }, { - "epoch": 0.1, - "learning_rate": 0.0002851385553897073, - "loss": 0.1212, + "epoch": 0.06, + "learning_rate": 0.0002911318794090501, + "loss": 0.1254, "step": 9160 }, { - "epoch": 0.1, - "learning_rate": 0.00028512233110519823, - "loss": 0.0986, + "epoch": 0.06, + "learning_rate": 0.0002911221980546932, + "loss": 0.1206, "step": 9170 }, { - "epoch": 0.1, - "learning_rate": 0.0002851061068206892, - "loss": 0.1006, + "epoch": 0.06, + "learning_rate": 0.00029111251670033627, + "loss": 0.1197, "step": 9180 }, { - "epoch": 0.1, - "learning_rate": 0.00028508988253618013, - "loss": 0.1098, + "epoch": 0.06, + "learning_rate": 0.0002911028353459793, + "loss": 0.1212, "step": 9190 }, { - "epoch": 0.1, - "learning_rate": 0.00028507365825167105, - "loss": 0.1098, + "epoch": 0.06, + "learning_rate": 0.0002910931539916224, + "loss": 0.1221, "step": 9200 }, { - "epoch": 0.1, - "learning_rate": 0.00028505743396716203, - "loss": 0.1189, + "epoch": 0.06, + "learning_rate": 0.00029108347263726546, + "loss": 0.1264, "step": 9210 }, { - "epoch": 0.1, - "learning_rate": 0.00028504120968265295, - "loss": 0.1087, + "epoch": 0.06, + "learning_rate": 0.0002910737912829085, + "loss": 0.1127, "step": 9220 }, { - "epoch": 0.1, - "learning_rate": 0.0002850249853981439, - "loss": 0.1163, + "epoch": 0.06, + "learning_rate": 0.00029106410992855156, + "loss": 0.1353, "step": 9230 }, { - "epoch": 0.1, - "learning_rate": 0.00028500876111363485, - "loss": 0.1028, + "epoch": 0.06, + "learning_rate": 0.00029105442857419464, + "loss": 0.118, "step": 9240 }, { - "epoch": 0.1, - "learning_rate": 0.0002849925368291258, - "loss": 0.1086, + "epoch": 0.06, + "learning_rate": 0.0002910447472198377, + "loss": 0.1233, "step": 9250 }, { - "epoch": 0.1, - "learning_rate": 0.00028497631254461675, - "loss": 0.1094, + "epoch": 0.06, + "learning_rate": 0.0002910350658654808, + "loss": 0.1133, "step": 9260 }, { - "epoch": 0.1, - "learning_rate": 0.0002849600882601077, - "loss": 0.0985, + "epoch": 0.06, + "learning_rate": 0.00029102538451112383, + "loss": 0.1122, "step": 9270 }, { - "epoch": 0.1, - "learning_rate": 0.00028494386397559865, - "loss": 0.1095, + "epoch": 0.06, + "learning_rate": 0.0002910157031567669, + "loss": 0.1188, "step": 9280 }, { - "epoch": 0.1, - "learning_rate": 0.0002849276396910896, - "loss": 0.1119, + "epoch": 0.06, + "learning_rate": 0.00029100602180241, + "loss": 0.1215, "step": 9290 }, { - "epoch": 0.1, - "learning_rate": 0.00028491141540658055, - "loss": 0.0963, + "epoch": 0.06, + "learning_rate": 0.00029099634044805307, + "loss": 0.1203, "step": 9300 }, { - "epoch": 0.1, - "learning_rate": 0.00028489519112207147, - "loss": 0.0963, + "epoch": 0.06, + "learning_rate": 0.00029098665909369615, + "loss": 0.1171, "step": 9310 }, { - "epoch": 0.1, - "learning_rate": 0.00028487896683756245, - "loss": 0.104, + "epoch": 0.06, + "learning_rate": 0.0002909769777393392, + "loss": 0.1298, "step": 9320 }, { - "epoch": 0.1, - "learning_rate": 0.00028486274255305337, - "loss": 0.0979, + "epoch": 0.06, + "learning_rate": 0.00029096729638498225, + "loss": 0.1149, "step": 9330 }, { - "epoch": 0.1, - "learning_rate": 0.00028484651826854435, - "loss": 0.1092, + "epoch": 0.06, + "learning_rate": 0.00029095761503062533, + "loss": 0.1204, "step": 9340 }, { - "epoch": 0.1, - "learning_rate": 0.00028483029398403527, - "loss": 0.0961, + "epoch": 0.06, + "learning_rate": 0.0002909479336762684, + "loss": 0.1112, "step": 9350 }, { - "epoch": 0.1, - "learning_rate": 0.00028481406969952625, - "loss": 0.1008, + "epoch": 0.06, + "learning_rate": 0.00029093825232191144, + "loss": 0.1196, "step": 9360 }, { - "epoch": 0.1, - "learning_rate": 0.00028479784541501717, - "loss": 0.1129, + "epoch": 0.06, + "learning_rate": 0.0002909285709675545, + "loss": 0.1193, "step": 9370 }, { - "epoch": 0.1, - "learning_rate": 0.0002847816211305081, - "loss": 0.0995, + "epoch": 0.06, + "learning_rate": 0.0002909188896131976, + "loss": 0.1165, "step": 9380 }, { - "epoch": 0.1, - "learning_rate": 0.00028476539684599907, - "loss": 0.1149, + "epoch": 0.06, + "learning_rate": 0.0002909092082588407, + "loss": 0.1229, "step": 9390 }, { - "epoch": 0.1, - "learning_rate": 0.00028474917256149, - "loss": 0.102, + "epoch": 0.06, + "learning_rate": 0.00029089952690448376, + "loss": 0.1221, "step": 9400 }, { - "epoch": 0.1, - "learning_rate": 0.00028473294827698097, - "loss": 0.1029, + "epoch": 0.06, + "learning_rate": 0.0002908898455501268, + "loss": 0.1232, "step": 9410 }, { - "epoch": 0.1, - "learning_rate": 0.0002847167239924719, - "loss": 0.1057, + "epoch": 0.06, + "learning_rate": 0.00029088016419576986, + "loss": 0.113, "step": 9420 }, { - "epoch": 0.1, - "learning_rate": 0.00028470049970796287, - "loss": 0.1133, + "epoch": 0.06, + "learning_rate": 0.00029087048284141294, + "loss": 0.1181, "step": 9430 }, { - "epoch": 0.1, - "learning_rate": 0.0002846842754234538, - "loss": 0.1063, + "epoch": 0.06, + "learning_rate": 0.000290860801487056, + "loss": 0.1147, "step": 9440 }, { - "epoch": 0.1, - "learning_rate": 0.00028466805113894477, - "loss": 0.1068, + "epoch": 0.06, + "learning_rate": 0.0002908511201326991, + "loss": 0.1206, "step": 9450 }, { - "epoch": 0.1, - "learning_rate": 0.0002846518268544357, - "loss": 0.1102, + "epoch": 0.06, + "learning_rate": 0.0002908414387783421, + "loss": 0.1307, "step": 9460 }, { - "epoch": 0.1, - "learning_rate": 0.00028463560256992667, - "loss": 0.1117, + "epoch": 0.06, + "learning_rate": 0.0002908317574239852, + "loss": 0.1103, "step": 9470 }, { - "epoch": 0.1, - "learning_rate": 0.0002846193782854176, - "loss": 0.102, + "epoch": 0.06, + "learning_rate": 0.0002908220760696283, + "loss": 0.1193, "step": 9480 }, { - "epoch": 0.1, - "learning_rate": 0.00028460315400090857, - "loss": 0.1106, + "epoch": 0.06, + "learning_rate": 0.0002908123947152713, + "loss": 0.112, "step": 9490 }, { - "epoch": 0.1, - "learning_rate": 0.0002845869297163995, - "loss": 0.0974, + "epoch": 0.06, + "learning_rate": 0.0002908027133609144, + "loss": 0.1163, "step": 9500 }, { - "epoch": 0.1, - "learning_rate": 0.00028457070543189047, - "loss": 0.1049, + "epoch": 0.06, + "learning_rate": 0.00029079303200655747, + "loss": 0.112, "step": 9510 }, { - "epoch": 0.1, - "learning_rate": 0.0002845544811473814, - "loss": 0.1143, + "epoch": 0.06, + "learning_rate": 0.00029078335065220055, + "loss": 0.1215, "step": 9520 }, { - "epoch": 0.1, - "learning_rate": 0.0002845382568628723, - "loss": 0.1028, + "epoch": 0.06, + "learning_rate": 0.00029077366929784363, + "loss": 0.1113, "step": 9530 }, { - "epoch": 0.1, - "learning_rate": 0.0002845220325783633, - "loss": 0.1086, + "epoch": 0.06, + "learning_rate": 0.0002907639879434867, + "loss": 0.1199, "step": 9540 }, { - "epoch": 0.1, - "learning_rate": 0.0002845058082938542, - "loss": 0.102, + "epoch": 0.06, + "learning_rate": 0.00029075430658912974, + "loss": 0.1195, "step": 9550 }, { - "epoch": 0.1, - "learning_rate": 0.00028448958400934514, - "loss": 0.0954, + "epoch": 0.06, + "learning_rate": 0.0002907446252347728, + "loss": 0.1104, "step": 9560 }, { - "epoch": 0.1, - "learning_rate": 0.0002844733597248361, - "loss": 0.101, + "epoch": 0.06, + "learning_rate": 0.0002907349438804159, + "loss": 0.1064, "step": 9570 }, { - "epoch": 0.1, - "learning_rate": 0.00028445713544032704, - "loss": 0.105, + "epoch": 0.06, + "learning_rate": 0.000290725262526059, + "loss": 0.1188, "step": 9580 }, { - "epoch": 0.1, - "learning_rate": 0.000284440911155818, - "loss": 0.1084, + "epoch": 0.06, + "learning_rate": 0.000290715581171702, + "loss": 0.1191, "step": 9590 }, { - "epoch": 0.1, - "learning_rate": 0.00028442468687130893, - "loss": 0.1114, + "epoch": 0.06, + "learning_rate": 0.0002907058998173451, + "loss": 0.1127, "step": 9600 }, { - "epoch": 0.1, - "learning_rate": 0.0002844084625867999, - "loss": 0.1004, + "epoch": 0.06, + "learning_rate": 0.00029069621846298816, + "loss": 0.1081, "step": 9610 }, { - "epoch": 0.1, - "learning_rate": 0.00028439223830229083, - "loss": 0.1189, + "epoch": 0.06, + "learning_rate": 0.0002906865371086312, + "loss": 0.1121, "step": 9620 }, { - "epoch": 0.1, - "learning_rate": 0.0002843760140177818, - "loss": 0.1078, + "epoch": 0.06, + "learning_rate": 0.00029067685575427427, + "loss": 0.1163, "step": 9630 }, { - "epoch": 0.1, - "learning_rate": 0.00028435978973327273, - "loss": 0.0992, + "epoch": 0.06, + "learning_rate": 0.00029066717439991735, + "loss": 0.1198, "step": 9640 }, { - "epoch": 0.1, - "learning_rate": 0.0002843435654487637, - "loss": 0.1045, + "epoch": 0.06, + "learning_rate": 0.0002906574930455604, + "loss": 0.1142, "step": 9650 }, { - "epoch": 0.1, - "learning_rate": 0.00028432734116425463, - "loss": 0.122, + "epoch": 0.06, + "learning_rate": 0.0002906478116912035, + "loss": 0.1139, "step": 9660 }, { - "epoch": 0.1, - "learning_rate": 0.0002843111168797456, - "loss": 0.0945, + "epoch": 0.06, + "learning_rate": 0.0002906381303368466, + "loss": 0.1096, "step": 9670 }, { - "epoch": 0.1, - "learning_rate": 0.00028429489259523653, - "loss": 0.1106, + "epoch": 0.06, + "learning_rate": 0.00029062844898248967, + "loss": 0.1076, "step": 9680 }, { - "epoch": 0.1, - "learning_rate": 0.0002842786683107275, - "loss": 0.0978, + "epoch": 0.06, + "learning_rate": 0.0002906187676281327, + "loss": 0.1236, "step": 9690 }, { - "epoch": 0.1, - "learning_rate": 0.00028426244402621843, - "loss": 0.1033, + "epoch": 0.06, + "learning_rate": 0.00029060908627377577, + "loss": 0.1202, "step": 9700 }, { - "epoch": 0.11, - "learning_rate": 0.00028424621974170936, - "loss": 0.1088, + "epoch": 0.06, + "learning_rate": 0.00029059940491941885, + "loss": 0.1304, "step": 9710 }, { - "epoch": 0.11, - "learning_rate": 0.00028422999545720033, - "loss": 0.0911, + "epoch": 0.06, + "learning_rate": 0.00029058972356506193, + "loss": 0.115, "step": 9720 }, { - "epoch": 0.11, - "learning_rate": 0.00028421377117269125, - "loss": 0.1039, + "epoch": 0.06, + "learning_rate": 0.00029058004221070496, + "loss": 0.1073, "step": 9730 }, { - "epoch": 0.11, - "learning_rate": 0.0002841975468881822, - "loss": 0.1029, + "epoch": 0.06, + "learning_rate": 0.00029057036085634804, + "loss": 0.1184, "step": 9740 }, { - "epoch": 0.11, - "learning_rate": 0.00028418132260367315, - "loss": 0.0984, + "epoch": 0.06, + "learning_rate": 0.0002905606795019911, + "loss": 0.1168, "step": 9750 }, { - "epoch": 0.11, - "learning_rate": 0.0002841650983191641, - "loss": 0.1087, + "epoch": 0.06, + "learning_rate": 0.00029055099814763414, + "loss": 0.1299, "step": 9760 }, { - "epoch": 0.11, - "learning_rate": 0.00028414887403465505, - "loss": 0.1012, + "epoch": 0.06, + "learning_rate": 0.0002905413167932772, + "loss": 0.1141, "step": 9770 }, { - "epoch": 0.11, - "learning_rate": 0.000284132649750146, - "loss": 0.1072, + "epoch": 0.06, + "learning_rate": 0.0002905316354389203, + "loss": 0.1167, "step": 9780 }, { - "epoch": 0.11, - "learning_rate": 0.00028411642546563695, - "loss": 0.0967, + "epoch": 0.06, + "learning_rate": 0.0002905219540845634, + "loss": 0.1216, "step": 9790 }, { - "epoch": 0.11, - "learning_rate": 0.0002841002011811279, - "loss": 0.1093, + "epoch": 0.06, + "learning_rate": 0.00029051227273020646, + "loss": 0.1187, "step": 9800 }, { - "epoch": 0.11, - "learning_rate": 0.00028408397689661885, - "loss": 0.1048, + "epoch": 0.06, + "learning_rate": 0.00029050259137584954, + "loss": 0.129, "step": 9810 }, { - "epoch": 0.11, - "learning_rate": 0.0002840677526121098, - "loss": 0.1094, + "epoch": 0.06, + "learning_rate": 0.0002904929100214926, + "loss": 0.1273, "step": 9820 }, { - "epoch": 0.11, - "learning_rate": 0.00028405152832760075, - "loss": 0.1049, + "epoch": 0.06, + "learning_rate": 0.00029048322866713565, + "loss": 0.1172, "step": 9830 }, { - "epoch": 0.11, - "learning_rate": 0.0002840353040430917, - "loss": 0.1031, + "epoch": 0.06, + "learning_rate": 0.0002904735473127787, + "loss": 0.1277, "step": 9840 }, { - "epoch": 0.11, - "learning_rate": 0.00028401907975858265, - "loss": 0.1044, + "epoch": 0.06, + "learning_rate": 0.0002904638659584218, + "loss": 0.121, "step": 9850 }, { - "epoch": 0.11, - "learning_rate": 0.0002840028554740736, - "loss": 0.101, + "epoch": 0.06, + "learning_rate": 0.00029045418460406483, + "loss": 0.1226, "step": 9860 }, { - "epoch": 0.11, - "learning_rate": 0.00028398663118956455, - "loss": 0.1065, + "epoch": 0.06, + "learning_rate": 0.0002904445032497079, + "loss": 0.1169, "step": 9870 }, { - "epoch": 0.11, - "learning_rate": 0.0002839704069050555, - "loss": 0.099, + "epoch": 0.06, + "learning_rate": 0.000290434821895351, + "loss": 0.1157, "step": 9880 }, { - "epoch": 0.11, - "learning_rate": 0.0002839541826205464, - "loss": 0.1066, + "epoch": 0.06, + "learning_rate": 0.00029042514054099407, + "loss": 0.1224, "step": 9890 }, { - "epoch": 0.11, - "learning_rate": 0.0002839379583360374, - "loss": 0.104, + "epoch": 0.06, + "learning_rate": 0.0002904154591866371, + "loss": 0.1175, "step": 9900 }, { - "epoch": 0.11, - "learning_rate": 0.0002839217340515283, - "loss": 0.1003, + "epoch": 0.06, + "learning_rate": 0.0002904057778322802, + "loss": 0.1297, "step": 9910 }, { - "epoch": 0.11, - "learning_rate": 0.0002839055097670192, - "loss": 0.1034, + "epoch": 0.06, + "learning_rate": 0.00029039609647792326, + "loss": 0.1127, "step": 9920 }, { - "epoch": 0.11, - "learning_rate": 0.0002838892854825102, - "loss": 0.1119, + "epoch": 0.06, + "learning_rate": 0.00029038641512356633, + "loss": 0.1217, "step": 9930 }, { - "epoch": 0.11, - "learning_rate": 0.0002838730611980011, - "loss": 0.1158, + "epoch": 0.06, + "learning_rate": 0.0002903767337692094, + "loss": 0.1264, "step": 9940 }, { - "epoch": 0.11, - "learning_rate": 0.0002838568369134921, - "loss": 0.1124, + "epoch": 0.06, + "learning_rate": 0.0002903670524148525, + "loss": 0.1153, "step": 9950 }, { - "epoch": 0.11, - "learning_rate": 0.000283840612628983, - "loss": 0.1072, + "epoch": 0.06, + "learning_rate": 0.0002903573710604956, + "loss": 0.1199, "step": 9960 }, { - "epoch": 0.11, - "learning_rate": 0.000283824388344474, - "loss": 0.1058, + "epoch": 0.06, + "learning_rate": 0.0002903476897061386, + "loss": 0.1229, "step": 9970 }, { - "epoch": 0.11, - "learning_rate": 0.0002838081640599649, - "loss": 0.1102, + "epoch": 0.06, + "learning_rate": 0.0002903380083517817, + "loss": 0.1257, "step": 9980 }, { - "epoch": 0.11, - "learning_rate": 0.0002837919397754559, - "loss": 0.1007, + "epoch": 0.06, + "learning_rate": 0.0002903283269974247, + "loss": 0.1215, "step": 9990 }, { - "epoch": 0.11, - "learning_rate": 0.0002837757154909468, - "loss": 0.0935, + "epoch": 0.06, + "learning_rate": 0.0002903186456430678, + "loss": 0.108, "step": 10000 }, { - "epoch": 0.11, - "eval_cer": 0.9213963999780896, - "eval_loss": 0.06996258348226547, - "eval_runtime": 119.4757, - "eval_samples_per_second": 16.74, - "eval_steps_per_second": 4.185, + "epoch": 0.06, + "eval_cer": 0.9202810981809965, + "eval_loss": 0.08496131747961044, + "eval_runtime": 120.7005, + "eval_samples_per_second": 16.57, + "eval_steps_per_second": 4.142, "step": 10000 }, { - "epoch": 0.11, - "learning_rate": 0.0002837594912064378, - "loss": 0.1024, + "epoch": 0.06, + "learning_rate": 0.00029030896428871086, + "loss": 0.1288, "step": 10010 }, { - "epoch": 0.11, - "learning_rate": 0.0002837432669219287, - "loss": 0.1001, + "epoch": 0.06, + "learning_rate": 0.00029029928293435394, + "loss": 0.1277, "step": 10020 }, { - "epoch": 0.11, - "learning_rate": 0.0002837270426374197, - "loss": 0.1021, + "epoch": 0.06, + "learning_rate": 0.000290289601579997, + "loss": 0.1249, "step": 10030 }, { - "epoch": 0.11, - "learning_rate": 0.0002837108183529106, - "loss": 0.0967, + "epoch": 0.06, + "learning_rate": 0.00029027992022564005, + "loss": 0.1236, "step": 10040 }, { - "epoch": 0.11, - "learning_rate": 0.0002836945940684016, - "loss": 0.0974, + "epoch": 0.06, + "learning_rate": 0.00029027023887128313, + "loss": 0.1177, "step": 10050 }, { - "epoch": 0.11, - "learning_rate": 0.0002836783697838925, - "loss": 0.1106, + "epoch": 0.06, + "learning_rate": 0.0002902605575169262, + "loss": 0.1177, "step": 10060 }, { - "epoch": 0.11, - "learning_rate": 0.00028366214549938344, - "loss": 0.0999, + "epoch": 0.06, + "learning_rate": 0.0002902508761625693, + "loss": 0.1067, "step": 10070 }, { - "epoch": 0.11, - "learning_rate": 0.0002836459212148744, - "loss": 0.1062, + "epoch": 0.07, + "learning_rate": 0.00029024119480821237, + "loss": 0.1173, "step": 10080 }, { - "epoch": 0.11, - "learning_rate": 0.00028362969693036534, - "loss": 0.1109, + "epoch": 0.07, + "learning_rate": 0.00029023151345385545, + "loss": 0.1194, "step": 10090 }, { - "epoch": 0.11, - "learning_rate": 0.0002836134726458563, - "loss": 0.1064, + "epoch": 0.07, + "learning_rate": 0.0002902218320994985, + "loss": 0.1133, "step": 10100 }, { - "epoch": 0.11, - "learning_rate": 0.00028359724836134724, - "loss": 0.0995, + "epoch": 0.07, + "learning_rate": 0.00029021215074514155, + "loss": 0.1167, "step": 10110 }, { - "epoch": 0.11, - "learning_rate": 0.00028358102407683816, - "loss": 0.1122, + "epoch": 0.07, + "learning_rate": 0.00029020246939078463, + "loss": 0.119, "step": 10120 }, { - "epoch": 0.11, - "learning_rate": 0.00028356479979232914, - "loss": 0.0955, + "epoch": 0.07, + "learning_rate": 0.00029019278803642766, + "loss": 0.1302, "step": 10130 }, { - "epoch": 0.11, - "learning_rate": 0.00028354857550782006, - "loss": 0.0956, + "epoch": 0.07, + "learning_rate": 0.00029018310668207074, + "loss": 0.117, "step": 10140 }, { - "epoch": 0.11, - "learning_rate": 0.00028353235122331104, - "loss": 0.1052, + "epoch": 0.07, + "learning_rate": 0.0002901734253277138, + "loss": 0.1096, "step": 10150 }, { - "epoch": 0.11, - "learning_rate": 0.00028351612693880196, - "loss": 0.1107, + "epoch": 0.07, + "learning_rate": 0.0002901637439733569, + "loss": 0.1137, "step": 10160 }, { - "epoch": 0.11, - "learning_rate": 0.00028349990265429294, - "loss": 0.112, + "epoch": 0.07, + "learning_rate": 0.000290154062619, + "loss": 0.1066, "step": 10170 }, { - "epoch": 0.11, - "learning_rate": 0.00028348367836978386, - "loss": 0.1185, + "epoch": 0.07, + "learning_rate": 0.000290144381264643, + "loss": 0.1131, "step": 10180 }, { - "epoch": 0.11, - "learning_rate": 0.00028346745408527484, - "loss": 0.1036, + "epoch": 0.07, + "learning_rate": 0.0002901346999102861, + "loss": 0.1181, "step": 10190 }, { - "epoch": 0.11, - "learning_rate": 0.00028345122980076576, - "loss": 0.1033, + "epoch": 0.07, + "learning_rate": 0.00029012501855592916, + "loss": 0.1111, "step": 10200 }, { - "epoch": 0.11, - "learning_rate": 0.00028343500551625674, - "loss": 0.1077, + "epoch": 0.07, + "learning_rate": 0.00029011533720157224, + "loss": 0.1074, "step": 10210 }, { - "epoch": 0.11, - "learning_rate": 0.00028341878123174766, - "loss": 0.1082, + "epoch": 0.07, + "learning_rate": 0.0002901056558472153, + "loss": 0.1192, "step": 10220 }, { - "epoch": 0.11, - "learning_rate": 0.00028340255694723863, - "loss": 0.1053, + "epoch": 0.07, + "learning_rate": 0.00029009597449285835, + "loss": 0.123, "step": 10230 }, { - "epoch": 0.11, - "learning_rate": 0.00028338633266272956, - "loss": 0.1074, + "epoch": 0.07, + "learning_rate": 0.00029008629313850143, + "loss": 0.1196, "step": 10240 }, { - "epoch": 0.11, - "learning_rate": 0.0002833701083782205, - "loss": 0.1003, + "epoch": 0.07, + "learning_rate": 0.0002900766117841445, + "loss": 0.1151, "step": 10250 }, { - "epoch": 0.11, - "learning_rate": 0.00028335388409371146, - "loss": 0.1075, + "epoch": 0.07, + "learning_rate": 0.00029006693042978753, + "loss": 0.1218, "step": 10260 }, { - "epoch": 0.11, - "learning_rate": 0.0002833376598092024, - "loss": 0.0988, + "epoch": 0.07, + "learning_rate": 0.0002900572490754306, + "loss": 0.1234, "step": 10270 }, { - "epoch": 0.11, - "learning_rate": 0.00028332143552469336, - "loss": 0.1048, + "epoch": 0.07, + "learning_rate": 0.0002900475677210737, + "loss": 0.1194, "step": 10280 }, { - "epoch": 0.11, - "learning_rate": 0.0002833052112401843, - "loss": 0.1001, + "epoch": 0.07, + "learning_rate": 0.0002900378863667168, + "loss": 0.1171, "step": 10290 }, { - "epoch": 0.11, - "learning_rate": 0.0002832889869556752, - "loss": 0.0907, + "epoch": 0.07, + "learning_rate": 0.00029002820501235985, + "loss": 0.122, "step": 10300 }, { - "epoch": 0.11, - "learning_rate": 0.0002832727626711662, - "loss": 0.1003, + "epoch": 0.07, + "learning_rate": 0.00029001852365800293, + "loss": 0.1293, "step": 10310 }, { - "epoch": 0.11, - "learning_rate": 0.0002832565383866571, - "loss": 0.1047, + "epoch": 0.07, + "learning_rate": 0.00029000884230364596, + "loss": 0.1249, "step": 10320 }, { - "epoch": 0.11, - "learning_rate": 0.0002832403141021481, - "loss": 0.1092, + "epoch": 0.07, + "learning_rate": 0.00028999916094928904, + "loss": 0.1106, "step": 10330 }, { - "epoch": 0.11, - "learning_rate": 0.000283224089817639, - "loss": 0.0985, + "epoch": 0.07, + "learning_rate": 0.0002899894795949321, + "loss": 0.111, "step": 10340 }, { - "epoch": 0.11, - "learning_rate": 0.00028320786553313, - "loss": 0.0957, + "epoch": 0.07, + "learning_rate": 0.0002899797982405752, + "loss": 0.1155, "step": 10350 }, { - "epoch": 0.11, - "learning_rate": 0.0002831916412486209, - "loss": 0.0962, + "epoch": 0.07, + "learning_rate": 0.0002899701168862183, + "loss": 0.1093, "step": 10360 }, { - "epoch": 0.11, - "learning_rate": 0.0002831754169641119, - "loss": 0.0989, + "epoch": 0.07, + "learning_rate": 0.0002899604355318613, + "loss": 0.1148, "step": 10370 }, { - "epoch": 0.11, - "learning_rate": 0.0002831591926796028, - "loss": 0.0934, + "epoch": 0.07, + "learning_rate": 0.0002899507541775044, + "loss": 0.1198, "step": 10380 }, { - "epoch": 0.11, - "learning_rate": 0.0002831429683950938, - "loss": 0.1004, + "epoch": 0.07, + "learning_rate": 0.0002899410728231474, + "loss": 0.1193, "step": 10390 }, { - "epoch": 0.11, - "learning_rate": 0.0002831267441105847, - "loss": 0.0972, + "epoch": 0.07, + "learning_rate": 0.0002899313914687905, + "loss": 0.1049, "step": 10400 }, { - "epoch": 0.11, - "learning_rate": 0.0002831105198260757, - "loss": 0.1068, + "epoch": 0.07, + "learning_rate": 0.00028992171011443357, + "loss": 0.1124, "step": 10410 }, { - "epoch": 0.11, - "learning_rate": 0.0002830942955415666, - "loss": 0.0989, + "epoch": 0.07, + "learning_rate": 0.00028991202876007665, + "loss": 0.1122, "step": 10420 }, { - "epoch": 0.11, - "learning_rate": 0.0002830780712570575, - "loss": 0.098, + "epoch": 0.07, + "learning_rate": 0.00028990234740571973, + "loss": 0.1122, "step": 10430 }, { - "epoch": 0.11, - "learning_rate": 0.0002830618469725485, - "loss": 0.1016, + "epoch": 0.07, + "learning_rate": 0.0002898926660513628, + "loss": 0.114, "step": 10440 }, { - "epoch": 0.11, - "learning_rate": 0.0002830456226880394, - "loss": 0.1041, + "epoch": 0.07, + "learning_rate": 0.00028988298469700583, + "loss": 0.1279, "step": 10450 }, { - "epoch": 0.11, - "learning_rate": 0.0002830293984035304, - "loss": 0.1038, + "epoch": 0.07, + "learning_rate": 0.0002898733033426489, + "loss": 0.1215, "step": 10460 }, { - "epoch": 0.11, - "learning_rate": 0.0002830131741190213, - "loss": 0.1167, + "epoch": 0.07, + "learning_rate": 0.000289863621988292, + "loss": 0.1143, "step": 10470 }, { - "epoch": 0.11, - "learning_rate": 0.00028299694983451224, - "loss": 0.1067, + "epoch": 0.07, + "learning_rate": 0.00028985394063393507, + "loss": 0.1178, "step": 10480 }, { - "epoch": 0.11, - "learning_rate": 0.0002829807255500032, - "loss": 0.0931, + "epoch": 0.07, + "learning_rate": 0.00028984425927957815, + "loss": 0.1145, "step": 10490 }, { - "epoch": 0.11, - "learning_rate": 0.00028296450126549414, - "loss": 0.0998, + "epoch": 0.07, + "learning_rate": 0.0002898345779252212, + "loss": 0.1103, "step": 10500 }, { - "epoch": 0.11, - "learning_rate": 0.0002829482769809851, - "loss": 0.0965, + "epoch": 0.07, + "learning_rate": 0.00028982489657086426, + "loss": 0.1113, "step": 10510 }, { - "epoch": 0.11, - "learning_rate": 0.00028293205269647604, - "loss": 0.1071, + "epoch": 0.07, + "learning_rate": 0.00028981521521650734, + "loss": 0.1196, "step": 10520 }, { - "epoch": 0.11, - "learning_rate": 0.000282915828411967, - "loss": 0.1023, + "epoch": 0.07, + "learning_rate": 0.00028980553386215036, + "loss": 0.1134, "step": 10530 }, { - "epoch": 0.11, - "learning_rate": 0.00028289960412745794, - "loss": 0.1127, + "epoch": 0.07, + "learning_rate": 0.00028979585250779344, + "loss": 0.1102, "step": 10540 }, { - "epoch": 0.11, - "learning_rate": 0.0002828833798429489, - "loss": 0.0975, + "epoch": 0.07, + "learning_rate": 0.0002897861711534365, + "loss": 0.1164, "step": 10550 }, { - "epoch": 0.11, - "learning_rate": 0.00028286715555843984, - "loss": 0.1011, + "epoch": 0.07, + "learning_rate": 0.0002897764897990796, + "loss": 0.1105, "step": 10560 }, { - "epoch": 0.11, - "learning_rate": 0.0002828509312739308, - "loss": 0.1101, + "epoch": 0.07, + "learning_rate": 0.0002897668084447227, + "loss": 0.117, "step": 10570 }, { - "epoch": 0.11, - "learning_rate": 0.00028283470698942174, - "loss": 0.1124, + "epoch": 0.07, + "learning_rate": 0.00028975712709036576, + "loss": 0.1184, "step": 10580 }, { - "epoch": 0.11, - "learning_rate": 0.0002828184827049127, - "loss": 0.098, + "epoch": 0.07, + "learning_rate": 0.0002897474457360088, + "loss": 0.106, "step": 10590 }, { - "epoch": 0.11, - "learning_rate": 0.00028280225842040364, - "loss": 0.1024, + "epoch": 0.07, + "learning_rate": 0.00028973776438165187, + "loss": 0.1166, "step": 10600 }, { - "epoch": 0.11, - "learning_rate": 0.00028278603413589456, - "loss": 0.1028, + "epoch": 0.07, + "learning_rate": 0.00028972808302729495, + "loss": 0.1231, "step": 10610 }, { - "epoch": 0.11, - "learning_rate": 0.00028276980985138554, - "loss": 0.107, + "epoch": 0.07, + "learning_rate": 0.00028971840167293803, + "loss": 0.1099, "step": 10620 }, { - "epoch": 0.11, - "learning_rate": 0.00028275358556687646, - "loss": 0.1051, + "epoch": 0.07, + "learning_rate": 0.00028970872031858105, + "loss": 0.1197, "step": 10630 }, { - "epoch": 0.12, - "learning_rate": 0.00028273736128236744, - "loss": 0.0993, + "epoch": 0.07, + "learning_rate": 0.00028969903896422413, + "loss": 0.1077, "step": 10640 }, { - "epoch": 0.12, - "learning_rate": 0.00028272113699785836, - "loss": 0.1063, + "epoch": 0.07, + "learning_rate": 0.0002896893576098672, + "loss": 0.1333, "step": 10650 }, { - "epoch": 0.12, - "learning_rate": 0.0002827049127133493, - "loss": 0.1104, + "epoch": 0.07, + "learning_rate": 0.00028967967625551024, + "loss": 0.1157, "step": 10660 }, { - "epoch": 0.12, - "learning_rate": 0.00028268868842884026, - "loss": 0.0975, + "epoch": 0.07, + "learning_rate": 0.0002896699949011533, + "loss": 0.1154, "step": 10670 }, { - "epoch": 0.12, - "learning_rate": 0.0002826724641443312, - "loss": 0.1101, + "epoch": 0.07, + "learning_rate": 0.0002896603135467964, + "loss": 0.1191, "step": 10680 }, { - "epoch": 0.12, - "learning_rate": 0.00028265623985982216, - "loss": 0.1053, + "epoch": 0.07, + "learning_rate": 0.0002896506321924395, + "loss": 0.1076, "step": 10690 }, { - "epoch": 0.12, - "learning_rate": 0.0002826400155753131, - "loss": 0.1012, + "epoch": 0.07, + "learning_rate": 0.00028964095083808256, + "loss": 0.1175, "step": 10700 }, { - "epoch": 0.12, - "learning_rate": 0.00028262379129080406, - "loss": 0.104, + "epoch": 0.07, + "learning_rate": 0.00028963126948372564, + "loss": 0.1108, "step": 10710 }, { - "epoch": 0.12, - "learning_rate": 0.000282607567006295, - "loss": 0.0979, + "epoch": 0.07, + "learning_rate": 0.0002896215881293687, + "loss": 0.1103, "step": 10720 }, { - "epoch": 0.12, - "learning_rate": 0.00028259134272178596, - "loss": 0.103, + "epoch": 0.07, + "learning_rate": 0.00028961190677501174, + "loss": 0.1112, "step": 10730 }, { - "epoch": 0.12, - "learning_rate": 0.0002825751184372769, - "loss": 0.104, + "epoch": 0.07, + "learning_rate": 0.0002896022254206548, + "loss": 0.1196, "step": 10740 }, { - "epoch": 0.12, - "learning_rate": 0.00028255889415276786, - "loss": 0.0937, + "epoch": 0.07, + "learning_rate": 0.0002895925440662979, + "loss": 0.1198, "step": 10750 }, { - "epoch": 0.12, - "learning_rate": 0.0002825426698682588, - "loss": 0.0917, + "epoch": 0.07, + "learning_rate": 0.000289582862711941, + "loss": 0.1203, "step": 10760 }, { - "epoch": 0.12, - "learning_rate": 0.00028252644558374976, - "loss": 0.0985, + "epoch": 0.07, + "learning_rate": 0.000289573181357584, + "loss": 0.1255, "step": 10770 }, { - "epoch": 0.12, - "learning_rate": 0.0002825102212992407, - "loss": 0.0966, + "epoch": 0.07, + "learning_rate": 0.0002895635000032271, + "loss": 0.1105, "step": 10780 }, { - "epoch": 0.12, - "learning_rate": 0.00028249399701473166, - "loss": 0.1004, + "epoch": 0.07, + "learning_rate": 0.00028955381864887017, + "loss": 0.1034, "step": 10790 }, { - "epoch": 0.12, - "learning_rate": 0.0002824777727302226, - "loss": 0.0914, + "epoch": 0.07, + "learning_rate": 0.0002895441372945132, + "loss": 0.1062, "step": 10800 }, { - "epoch": 0.12, - "learning_rate": 0.0002824615484457135, - "loss": 0.114, + "epoch": 0.07, + "learning_rate": 0.00028953445594015627, + "loss": 0.1156, "step": 10810 }, { - "epoch": 0.12, - "learning_rate": 0.0002824453241612045, - "loss": 0.109, + "epoch": 0.07, + "learning_rate": 0.00028952477458579935, + "loss": 0.1167, "step": 10820 }, { - "epoch": 0.12, - "learning_rate": 0.0002824290998766954, - "loss": 0.1022, + "epoch": 0.07, + "learning_rate": 0.00028951509323144243, + "loss": 0.1108, "step": 10830 }, { - "epoch": 0.12, - "learning_rate": 0.0002824128755921863, - "loss": 0.1053, + "epoch": 0.07, + "learning_rate": 0.0002895054118770855, + "loss": 0.1143, "step": 10840 }, { - "epoch": 0.12, - "learning_rate": 0.0002823966513076773, - "loss": 0.1018, + "epoch": 0.07, + "learning_rate": 0.0002894957305227286, + "loss": 0.1137, "step": 10850 }, { - "epoch": 0.12, - "learning_rate": 0.0002823804270231682, - "loss": 0.0953, + "epoch": 0.07, + "learning_rate": 0.00028948604916837167, + "loss": 0.1101, "step": 10860 }, { - "epoch": 0.12, - "learning_rate": 0.0002823642027386592, - "loss": 0.1034, + "epoch": 0.07, + "learning_rate": 0.0002894763678140147, + "loss": 0.11, "step": 10870 }, { - "epoch": 0.12, - "learning_rate": 0.0002823479784541501, - "loss": 0.0978, + "epoch": 0.07, + "learning_rate": 0.0002894666864596578, + "loss": 0.1036, "step": 10880 }, { - "epoch": 0.12, - "learning_rate": 0.0002823317541696411, - "loss": 0.1051, + "epoch": 0.07, + "learning_rate": 0.00028945700510530086, + "loss": 0.1133, "step": 10890 }, { - "epoch": 0.12, - "learning_rate": 0.000282315529885132, - "loss": 0.0957, + "epoch": 0.07, + "learning_rate": 0.0002894473237509439, + "loss": 0.1183, "step": 10900 }, { - "epoch": 0.12, - "learning_rate": 0.000282299305600623, - "loss": 0.1073, + "epoch": 0.07, + "learning_rate": 0.00028943764239658696, + "loss": 0.111, "step": 10910 }, { - "epoch": 0.12, - "learning_rate": 0.0002822830813161139, - "loss": 0.0977, + "epoch": 0.07, + "learning_rate": 0.00028942796104223004, + "loss": 0.1195, "step": 10920 }, { - "epoch": 0.12, - "learning_rate": 0.0002822668570316049, - "loss": 0.0946, + "epoch": 0.07, + "learning_rate": 0.0002894182796878731, + "loss": 0.1145, "step": 10930 }, { - "epoch": 0.12, - "learning_rate": 0.0002822506327470958, - "loss": 0.0938, + "epoch": 0.07, + "learning_rate": 0.00028940859833351615, + "loss": 0.1164, "step": 10940 }, { - "epoch": 0.12, - "learning_rate": 0.0002822344084625868, - "loss": 0.0944, + "epoch": 0.07, + "learning_rate": 0.0002893989169791592, + "loss": 0.1166, "step": 10950 }, { - "epoch": 0.12, - "learning_rate": 0.0002822181841780777, - "loss": 0.1044, + "epoch": 0.07, + "learning_rate": 0.0002893892356248023, + "loss": 0.1019, "step": 10960 }, { - "epoch": 0.12, - "learning_rate": 0.0002822019598935687, - "loss": 0.0956, + "epoch": 0.07, + "learning_rate": 0.0002893795542704454, + "loss": 0.1066, "step": 10970 }, { - "epoch": 0.12, - "learning_rate": 0.0002821857356090596, - "loss": 0.0984, + "epoch": 0.07, + "learning_rate": 0.00028936987291608847, + "loss": 0.1175, "step": 10980 }, { - "epoch": 0.12, - "learning_rate": 0.00028216951132455055, - "loss": 0.0991, + "epoch": 0.07, + "learning_rate": 0.00028936019156173155, + "loss": 0.1139, "step": 10990 }, { - "epoch": 0.12, - "learning_rate": 0.0002821532870400415, - "loss": 0.0963, + "epoch": 0.07, + "learning_rate": 0.00028935051020737457, + "loss": 0.1142, "step": 11000 }, { - "epoch": 0.12, - "eval_cer": 0.9214661952394331, - "eval_loss": 0.06781847774982452, - "eval_runtime": 119.2974, - "eval_samples_per_second": 16.765, - "eval_steps_per_second": 4.191, + "epoch": 0.07, + "eval_cer": 0.920128347079426, + "eval_loss": 0.07976210117340088, + "eval_runtime": 120.34, + "eval_samples_per_second": 16.62, + "eval_steps_per_second": 4.155, "step": 11000 }, { - "epoch": 0.12, - "learning_rate": 0.00028213706275553245, - "loss": 0.0994, + "epoch": 0.07, + "learning_rate": 0.00028934082885301765, + "loss": 0.1083, "step": 11010 }, { - "epoch": 0.12, - "learning_rate": 0.00028212083847102337, - "loss": 0.0998, + "epoch": 0.07, + "learning_rate": 0.00028933114749866073, + "loss": 0.1146, "step": 11020 }, { - "epoch": 0.12, - "learning_rate": 0.00028210461418651435, - "loss": 0.1019, + "epoch": 0.07, + "learning_rate": 0.00028932146614430376, + "loss": 0.1131, "step": 11030 }, { - "epoch": 0.12, - "learning_rate": 0.00028208838990200527, - "loss": 0.1003, + "epoch": 0.07, + "learning_rate": 0.00028931178478994684, + "loss": 0.1171, "step": 11040 }, { - "epoch": 0.12, - "learning_rate": 0.00028207216561749624, - "loss": 0.0943, + "epoch": 0.07, + "learning_rate": 0.0002893021034355899, + "loss": 0.1049, "step": 11050 }, { - "epoch": 0.12, - "learning_rate": 0.00028205594133298717, - "loss": 0.1088, + "epoch": 0.07, + "learning_rate": 0.000289292422081233, + "loss": 0.1213, "step": 11060 }, { - "epoch": 0.12, - "learning_rate": 0.00028203971704847814, - "loss": 0.104, + "epoch": 0.07, + "learning_rate": 0.0002892827407268761, + "loss": 0.1202, "step": 11070 }, { - "epoch": 0.12, - "learning_rate": 0.00028202349276396907, - "loss": 0.1064, + "epoch": 0.07, + "learning_rate": 0.0002892730593725191, + "loss": 0.1142, "step": 11080 }, { - "epoch": 0.12, - "learning_rate": 0.00028200726847946004, - "loss": 0.0923, + "epoch": 0.07, + "learning_rate": 0.0002892633780181622, + "loss": 0.1154, "step": 11090 }, { - "epoch": 0.12, - "learning_rate": 0.00028199104419495097, - "loss": 0.0942, + "epoch": 0.07, + "learning_rate": 0.00028925369666380526, + "loss": 0.1266, "step": 11100 }, { - "epoch": 0.12, - "learning_rate": 0.00028197481991044194, - "loss": 0.1042, + "epoch": 0.07, + "learning_rate": 0.00028924401530944834, + "loss": 0.1064, "step": 11110 }, { - "epoch": 0.12, - "learning_rate": 0.00028195859562593287, - "loss": 0.1065, + "epoch": 0.07, + "learning_rate": 0.0002892343339550914, + "loss": 0.1048, "step": 11120 }, { - "epoch": 0.12, - "learning_rate": 0.00028194237134142384, - "loss": 0.0944, + "epoch": 0.07, + "learning_rate": 0.0002892246526007345, + "loss": 0.1167, "step": 11130 }, { - "epoch": 0.12, - "learning_rate": 0.00028192614705691477, - "loss": 0.0981, + "epoch": 0.07, + "learning_rate": 0.0002892149712463775, + "loss": 0.1051, "step": 11140 }, { - "epoch": 0.12, - "learning_rate": 0.00028190992277240574, - "loss": 0.1063, + "epoch": 0.07, + "learning_rate": 0.0002892052898920206, + "loss": 0.1121, "step": 11150 }, { - "epoch": 0.12, - "learning_rate": 0.00028189369848789667, - "loss": 0.0996, + "epoch": 0.07, + "learning_rate": 0.0002891956085376637, + "loss": 0.1068, "step": 11160 }, { - "epoch": 0.12, - "learning_rate": 0.0002818774742033876, - "loss": 0.095, + "epoch": 0.07, + "learning_rate": 0.0002891859271833067, + "loss": 0.1137, "step": 11170 }, { - "epoch": 0.12, - "learning_rate": 0.00028186124991887856, - "loss": 0.0984, + "epoch": 0.07, + "learning_rate": 0.0002891762458289498, + "loss": 0.1107, "step": 11180 }, { - "epoch": 0.12, - "learning_rate": 0.0002818450256343695, - "loss": 0.0981, + "epoch": 0.07, + "learning_rate": 0.00028916656447459287, + "loss": 0.1118, "step": 11190 }, { - "epoch": 0.12, - "learning_rate": 0.0002818288013498604, - "loss": 0.0924, + "epoch": 0.07, + "learning_rate": 0.00028915688312023595, + "loss": 0.1275, "step": 11200 }, { - "epoch": 0.12, - "learning_rate": 0.0002818125770653514, - "loss": 0.1067, + "epoch": 0.07, + "learning_rate": 0.00028914720176587903, + "loss": 0.1006, "step": 11210 }, { - "epoch": 0.12, - "learning_rate": 0.0002817963527808423, - "loss": 0.1034, + "epoch": 0.07, + "learning_rate": 0.00028913752041152206, + "loss": 0.1065, "step": 11220 }, { - "epoch": 0.12, - "learning_rate": 0.0002817801284963333, - "loss": 0.1002, + "epoch": 0.07, + "learning_rate": 0.00028912783905716514, + "loss": 0.1061, "step": 11230 }, { - "epoch": 0.12, - "learning_rate": 0.0002817639042118242, - "loss": 0.0915, + "epoch": 0.07, + "learning_rate": 0.0002891181577028082, + "loss": 0.1058, "step": 11240 }, { - "epoch": 0.12, - "learning_rate": 0.0002817476799273152, - "loss": 0.109, + "epoch": 0.07, + "learning_rate": 0.0002891084763484513, + "loss": 0.1008, "step": 11250 }, { - "epoch": 0.12, - "learning_rate": 0.0002817314556428061, - "loss": 0.1033, + "epoch": 0.07, + "learning_rate": 0.0002890987949940944, + "loss": 0.1071, "step": 11260 }, { - "epoch": 0.12, - "learning_rate": 0.0002817152313582971, - "loss": 0.0966, + "epoch": 0.07, + "learning_rate": 0.0002890891136397374, + "loss": 0.1137, "step": 11270 }, { - "epoch": 0.12, - "learning_rate": 0.000281699007073788, - "loss": 0.1002, + "epoch": 0.07, + "learning_rate": 0.0002890794322853805, + "loss": 0.1134, "step": 11280 }, { - "epoch": 0.12, - "learning_rate": 0.000281682782789279, - "loss": 0.1009, + "epoch": 0.07, + "learning_rate": 0.00028906975093102356, + "loss": 0.1041, "step": 11290 }, { - "epoch": 0.12, - "learning_rate": 0.0002816665585047699, - "loss": 0.1017, + "epoch": 0.07, + "learning_rate": 0.0002890600695766666, + "loss": 0.1209, "step": 11300 }, { - "epoch": 0.12, - "learning_rate": 0.0002816503342202609, - "loss": 0.0967, + "epoch": 0.07, + "learning_rate": 0.00028905038822230967, + "loss": 0.1086, "step": 11310 }, { - "epoch": 0.12, - "learning_rate": 0.0002816341099357518, - "loss": 0.0945, + "epoch": 0.07, + "learning_rate": 0.00028904070686795275, + "loss": 0.1082, "step": 11320 }, { - "epoch": 0.12, - "learning_rate": 0.0002816178856512428, - "loss": 0.0935, + "epoch": 0.07, + "learning_rate": 0.0002890310255135958, + "loss": 0.1062, "step": 11330 }, { - "epoch": 0.12, - "learning_rate": 0.0002816016613667337, - "loss": 0.0939, + "epoch": 0.07, + "learning_rate": 0.0002890213441592389, + "loss": 0.111, "step": 11340 }, { - "epoch": 0.12, - "learning_rate": 0.00028158543708222463, - "loss": 0.0963, + "epoch": 0.07, + "learning_rate": 0.000289011662804882, + "loss": 0.1112, "step": 11350 }, { - "epoch": 0.12, - "learning_rate": 0.0002815692127977156, - "loss": 0.0959, + "epoch": 0.07, + "learning_rate": 0.000289001981450525, + "loss": 0.1177, "step": 11360 }, { - "epoch": 0.12, - "learning_rate": 0.00028155298851320653, - "loss": 0.0963, + "epoch": 0.07, + "learning_rate": 0.0002889923000961681, + "loss": 0.1056, "step": 11370 }, { - "epoch": 0.12, - "learning_rate": 0.00028153676422869745, - "loss": 0.104, + "epoch": 0.07, + "learning_rate": 0.00028898261874181117, + "loss": 0.1022, "step": 11380 }, { - "epoch": 0.12, - "learning_rate": 0.00028152053994418843, - "loss": 0.1027, + "epoch": 0.07, + "learning_rate": 0.00028897293738745425, + "loss": 0.1045, "step": 11390 }, { - "epoch": 0.12, - "learning_rate": 0.00028150431565967935, - "loss": 0.0981, + "epoch": 0.07, + "learning_rate": 0.0002889632560330973, + "loss": 0.1075, "step": 11400 }, { - "epoch": 0.12, - "learning_rate": 0.00028148809137517033, - "loss": 0.0978, + "epoch": 0.07, + "learning_rate": 0.00028895357467874036, + "loss": 0.1036, "step": 11410 }, { - "epoch": 0.12, - "learning_rate": 0.00028147186709066125, - "loss": 0.1097, + "epoch": 0.07, + "learning_rate": 0.00028894389332438343, + "loss": 0.1022, "step": 11420 }, { - "epoch": 0.12, - "learning_rate": 0.00028145564280615223, - "loss": 0.099, + "epoch": 0.07, + "learning_rate": 0.00028893421197002646, + "loss": 0.1255, "step": 11430 }, { - "epoch": 0.12, - "learning_rate": 0.00028143941852164315, - "loss": 0.1052, + "epoch": 0.07, + "learning_rate": 0.00028892453061566954, + "loss": 0.1036, "step": 11440 }, { - "epoch": 0.12, - "learning_rate": 0.00028142319423713413, - "loss": 0.1009, + "epoch": 0.07, + "learning_rate": 0.0002889148492613126, + "loss": 0.1194, "step": 11450 }, { - "epoch": 0.12, - "learning_rate": 0.00028140696995262505, - "loss": 0.0964, + "epoch": 0.07, + "learning_rate": 0.0002889051679069557, + "loss": 0.1103, "step": 11460 }, { - "epoch": 0.12, - "learning_rate": 0.000281390745668116, - "loss": 0.0966, + "epoch": 0.07, + "learning_rate": 0.0002888954865525988, + "loss": 0.1209, "step": 11470 }, { - "epoch": 0.12, - "learning_rate": 0.00028137452138360695, - "loss": 0.0981, + "epoch": 0.07, + "learning_rate": 0.00028888580519824186, + "loss": 0.114, "step": 11480 }, { - "epoch": 0.12, - "learning_rate": 0.0002813582970990979, - "loss": 0.1012, + "epoch": 0.07, + "learning_rate": 0.00028887612384388494, + "loss": 0.1153, "step": 11490 }, { - "epoch": 0.12, - "learning_rate": 0.00028134207281458885, - "loss": 0.0976, + "epoch": 0.07, + "learning_rate": 0.00028886644248952796, + "loss": 0.1126, "step": 11500 }, { - "epoch": 0.12, - "learning_rate": 0.0002813258485300798, - "loss": 0.1002, + "epoch": 0.07, + "learning_rate": 0.00028885676113517104, + "loss": 0.1131, "step": 11510 }, { - "epoch": 0.12, - "learning_rate": 0.00028130962424557075, - "loss": 0.0932, + "epoch": 0.07, + "learning_rate": 0.0002888470797808141, + "loss": 0.1094, "step": 11520 }, { - "epoch": 0.12, - "learning_rate": 0.00028129339996106167, - "loss": 0.0993, + "epoch": 0.07, + "learning_rate": 0.0002888373984264572, + "loss": 0.1006, "step": 11530 }, { - "epoch": 0.12, - "learning_rate": 0.00028127717567655265, - "loss": 0.0977, + "epoch": 0.07, + "learning_rate": 0.00028882771707210023, + "loss": 0.1115, "step": 11540 }, { - "epoch": 0.12, - "learning_rate": 0.00028126095139204357, - "loss": 0.1063, + "epoch": 0.07, + "learning_rate": 0.0002888180357177433, + "loss": 0.1005, "step": 11550 }, { - "epoch": 0.13, - "learning_rate": 0.0002812447271075345, - "loss": 0.0902, + "epoch": 0.07, + "learning_rate": 0.0002888083543633864, + "loss": 0.1102, "step": 11560 }, { - "epoch": 0.13, - "learning_rate": 0.00028122850282302547, - "loss": 0.0902, + "epoch": 0.07, + "learning_rate": 0.0002887986730090294, + "loss": 0.0981, "step": 11570 }, { - "epoch": 0.13, - "learning_rate": 0.0002812122785385164, - "loss": 0.0981, + "epoch": 0.07, + "learning_rate": 0.0002887889916546725, + "loss": 0.1029, "step": 11580 }, { - "epoch": 0.13, - "learning_rate": 0.00028119605425400737, - "loss": 0.1027, + "epoch": 0.07, + "learning_rate": 0.0002887793103003156, + "loss": 0.1115, "step": 11590 }, { - "epoch": 0.13, - "learning_rate": 0.0002811798299694983, - "loss": 0.0953, + "epoch": 0.07, + "learning_rate": 0.00028876962894595865, + "loss": 0.1028, "step": 11600 }, { - "epoch": 0.13, - "learning_rate": 0.00028116360568498927, - "loss": 0.0897, + "epoch": 0.07, + "learning_rate": 0.00028875994759160173, + "loss": 0.1053, "step": 11610 }, { - "epoch": 0.13, - "learning_rate": 0.0002811473814004802, - "loss": 0.0976, + "epoch": 0.07, + "learning_rate": 0.0002887502662372448, + "loss": 0.1137, "step": 11620 }, { - "epoch": 0.13, - "learning_rate": 0.00028113115711597117, - "loss": 0.0914, + "epoch": 0.08, + "learning_rate": 0.0002887405848828879, + "loss": 0.1059, "step": 11630 }, { - "epoch": 0.13, - "learning_rate": 0.0002811149328314621, - "loss": 0.0903, + "epoch": 0.08, + "learning_rate": 0.0002887309035285309, + "loss": 0.1125, "step": 11640 }, { - "epoch": 0.13, - "learning_rate": 0.00028109870854695307, - "loss": 0.0907, + "epoch": 0.08, + "learning_rate": 0.000288721222174174, + "loss": 0.1039, "step": 11650 }, { - "epoch": 0.13, - "learning_rate": 0.000281082484262444, - "loss": 0.1059, + "epoch": 0.08, + "learning_rate": 0.0002887115408198171, + "loss": 0.1143, "step": 11660 }, { - "epoch": 0.13, - "learning_rate": 0.00028106625997793497, - "loss": 0.0884, + "epoch": 0.08, + "learning_rate": 0.0002887018594654601, + "loss": 0.1081, "step": 11670 }, { - "epoch": 0.13, - "learning_rate": 0.0002810500356934259, - "loss": 0.0975, + "epoch": 0.08, + "learning_rate": 0.0002886921781111032, + "loss": 0.1031, "step": 11680 }, { - "epoch": 0.13, - "learning_rate": 0.00028103381140891687, - "loss": 0.0968, + "epoch": 0.08, + "learning_rate": 0.00028868249675674626, + "loss": 0.0974, "step": 11690 }, { - "epoch": 0.13, - "learning_rate": 0.0002810175871244078, - "loss": 0.0988, + "epoch": 0.08, + "learning_rate": 0.00028867281540238934, + "loss": 0.1086, "step": 11700 }, { - "epoch": 0.13, - "learning_rate": 0.0002810013628398987, - "loss": 0.0966, + "epoch": 0.08, + "learning_rate": 0.00028866313404803237, + "loss": 0.1157, "step": 11710 }, { - "epoch": 0.13, - "learning_rate": 0.0002809851385553897, - "loss": 0.1044, + "epoch": 0.08, + "learning_rate": 0.00028865345269367545, + "loss": 0.104, "step": 11720 }, { - "epoch": 0.13, - "learning_rate": 0.0002809689142708806, - "loss": 0.0962, + "epoch": 0.08, + "learning_rate": 0.00028864377133931853, + "loss": 0.1155, "step": 11730 }, { - "epoch": 0.13, - "learning_rate": 0.0002809526899863716, - "loss": 0.0923, + "epoch": 0.08, + "learning_rate": 0.0002886340899849616, + "loss": 0.1152, "step": 11740 }, { - "epoch": 0.13, - "learning_rate": 0.0002809364657018625, - "loss": 0.1074, + "epoch": 0.08, + "learning_rate": 0.0002886244086306047, + "loss": 0.1047, "step": 11750 }, { - "epoch": 0.13, - "learning_rate": 0.0002809202414173535, - "loss": 0.0948, + "epoch": 0.08, + "learning_rate": 0.00028861472727624777, + "loss": 0.107, "step": 11760 }, { - "epoch": 0.13, - "learning_rate": 0.0002809040171328444, - "loss": 0.0994, + "epoch": 0.08, + "learning_rate": 0.0002886050459218908, + "loss": 0.1107, "step": 11770 }, { - "epoch": 0.13, - "learning_rate": 0.0002808877928483354, - "loss": 0.0997, + "epoch": 0.08, + "learning_rate": 0.0002885953645675339, + "loss": 0.1163, "step": 11780 }, { - "epoch": 0.13, - "learning_rate": 0.0002808715685638263, - "loss": 0.102, + "epoch": 0.08, + "learning_rate": 0.00028858568321317695, + "loss": 0.1133, "step": 11790 }, { - "epoch": 0.13, - "learning_rate": 0.0002808553442793173, - "loss": 0.0933, + "epoch": 0.08, + "learning_rate": 0.00028857600185882, + "loss": 0.1188, "step": 11800 }, { - "epoch": 0.13, - "learning_rate": 0.0002808391199948082, - "loss": 0.0978, + "epoch": 0.08, + "learning_rate": 0.00028856632050446306, + "loss": 0.1077, "step": 11810 }, { - "epoch": 0.13, - "learning_rate": 0.0002808228957102992, - "loss": 0.1094, + "epoch": 0.08, + "learning_rate": 0.00028855663915010614, + "loss": 0.1058, "step": 11820 }, { - "epoch": 0.13, - "learning_rate": 0.0002808066714257901, - "loss": 0.0969, + "epoch": 0.08, + "learning_rate": 0.0002885469577957492, + "loss": 0.11, "step": 11830 }, { - "epoch": 0.13, - "learning_rate": 0.0002807904471412811, - "loss": 0.0997, + "epoch": 0.08, + "learning_rate": 0.0002885372764413923, + "loss": 0.1238, "step": 11840 }, { - "epoch": 0.13, - "learning_rate": 0.000280774222856772, - "loss": 0.0954, + "epoch": 0.08, + "learning_rate": 0.0002885275950870353, + "loss": 0.1099, "step": 11850 }, { - "epoch": 0.13, - "learning_rate": 0.00028075799857226293, - "loss": 0.0969, + "epoch": 0.08, + "learning_rate": 0.0002885179137326784, + "loss": 0.108, "step": 11860 }, { - "epoch": 0.13, - "learning_rate": 0.0002807417742877539, - "loss": 0.0951, + "epoch": 0.08, + "learning_rate": 0.0002885082323783215, + "loss": 0.113, "step": 11870 }, { - "epoch": 0.13, - "learning_rate": 0.00028072555000324483, - "loss": 0.1154, + "epoch": 0.08, + "learning_rate": 0.00028849855102396456, + "loss": 0.1078, "step": 11880 }, { - "epoch": 0.13, - "learning_rate": 0.00028070932571873575, - "loss": 0.099, + "epoch": 0.08, + "learning_rate": 0.00028848886966960764, + "loss": 0.109, "step": 11890 }, { - "epoch": 0.13, - "learning_rate": 0.00028069310143422673, - "loss": 0.1068, + "epoch": 0.08, + "learning_rate": 0.0002884791883152507, + "loss": 0.1145, "step": 11900 }, { - "epoch": 0.13, - "learning_rate": 0.00028067687714971765, - "loss": 0.0981, + "epoch": 0.08, + "learning_rate": 0.00028846950696089375, + "loss": 0.1139, "step": 11910 }, { - "epoch": 0.13, - "learning_rate": 0.00028066065286520863, - "loss": 0.12, + "epoch": 0.08, + "learning_rate": 0.00028845982560653683, + "loss": 0.1083, "step": 11920 }, { - "epoch": 0.13, - "learning_rate": 0.00028064442858069955, - "loss": 0.0987, + "epoch": 0.08, + "learning_rate": 0.0002884501442521799, + "loss": 0.1032, "step": 11930 }, { - "epoch": 0.13, - "learning_rate": 0.00028062820429619053, - "loss": 0.0977, + "epoch": 0.08, + "learning_rate": 0.00028844046289782293, + "loss": 0.0933, "step": 11940 }, { - "epoch": 0.13, - "learning_rate": 0.00028061198001168145, - "loss": 0.0918, + "epoch": 0.08, + "learning_rate": 0.000288430781543466, + "loss": 0.1059, "step": 11950 }, { - "epoch": 0.13, - "learning_rate": 0.00028059575572717243, - "loss": 0.0954, + "epoch": 0.08, + "learning_rate": 0.0002884211001891091, + "loss": 0.1007, "step": 11960 }, { - "epoch": 0.13, - "learning_rate": 0.00028057953144266335, - "loss": 0.1047, + "epoch": 0.08, + "learning_rate": 0.00028841141883475217, + "loss": 0.1074, "step": 11970 }, { - "epoch": 0.13, - "learning_rate": 0.00028056330715815433, - "loss": 0.0993, + "epoch": 0.08, + "learning_rate": 0.00028840173748039525, + "loss": 0.1127, "step": 11980 }, { - "epoch": 0.13, - "learning_rate": 0.00028054708287364525, - "loss": 0.0886, + "epoch": 0.08, + "learning_rate": 0.0002883920561260383, + "loss": 0.1007, "step": 11990 }, { - "epoch": 0.13, - "learning_rate": 0.00028053085858913623, - "loss": 0.0969, + "epoch": 0.08, + "learning_rate": 0.00028838237477168136, + "loss": 0.1081, "step": 12000 }, { - "epoch": 0.13, - "eval_cer": 0.9214017008840144, - "eval_loss": 0.06535026431083679, - "eval_runtime": 119.7432, - "eval_samples_per_second": 16.702, - "eval_steps_per_second": 4.176, + "epoch": 0.08, + "eval_cer": 0.920316348435205, + "eval_loss": 0.07571277767419815, + "eval_runtime": 120.2448, + "eval_samples_per_second": 16.633, + "eval_steps_per_second": 4.158, "step": 12000 }, { - "epoch": 0.13, - "learning_rate": 0.00028051463430462715, - "loss": 0.0961, + "epoch": 0.08, + "learning_rate": 0.00028837269341732444, + "loss": 0.1088, "step": 12010 }, { - "epoch": 0.13, - "learning_rate": 0.00028049841002011813, - "loss": 0.0948, + "epoch": 0.08, + "learning_rate": 0.0002883630120629675, + "loss": 0.111, "step": 12020 }, { - "epoch": 0.13, - "learning_rate": 0.00028048218573560905, - "loss": 0.1013, + "epoch": 0.08, + "learning_rate": 0.0002883533307086106, + "loss": 0.1104, "step": 12030 }, { - "epoch": 0.13, - "learning_rate": 0.0002804659614511, - "loss": 0.1052, + "epoch": 0.08, + "learning_rate": 0.0002883436493542536, + "loss": 0.1104, "step": 12040 }, { - "epoch": 0.13, - "learning_rate": 0.00028044973716659095, - "loss": 0.0965, + "epoch": 0.08, + "learning_rate": 0.0002883339679998967, + "loss": 0.1076, "step": 12050 }, { - "epoch": 0.13, - "learning_rate": 0.0002804335128820819, - "loss": 0.1053, + "epoch": 0.08, + "learning_rate": 0.0002883242866455398, + "loss": 0.1234, "step": 12060 }, { - "epoch": 0.13, - "learning_rate": 0.0002804172885975728, - "loss": 0.094, + "epoch": 0.08, + "learning_rate": 0.0002883146052911828, + "loss": 0.1044, "step": 12070 }, { - "epoch": 0.13, - "learning_rate": 0.0002804010643130638, - "loss": 0.0907, + "epoch": 0.08, + "learning_rate": 0.0002883049239368259, + "loss": 0.1194, "step": 12080 }, { - "epoch": 0.13, - "learning_rate": 0.0002803848400285547, - "loss": 0.1052, + "epoch": 0.08, + "learning_rate": 0.00028829524258246897, + "loss": 0.1128, "step": 12090 }, { - "epoch": 0.13, - "learning_rate": 0.00028036861574404567, - "loss": 0.0983, + "epoch": 0.08, + "learning_rate": 0.00028828556122811205, + "loss": 0.1037, "step": 12100 }, { - "epoch": 0.13, - "learning_rate": 0.0002803523914595366, - "loss": 0.0967, + "epoch": 0.08, + "learning_rate": 0.00028827587987375513, + "loss": 0.1062, "step": 12110 }, { - "epoch": 0.13, - "learning_rate": 0.00028033616717502757, - "loss": 0.1051, + "epoch": 0.08, + "learning_rate": 0.0002882661985193982, + "loss": 0.1088, "step": 12120 }, { - "epoch": 0.13, - "learning_rate": 0.0002803199428905185, - "loss": 0.1058, + "epoch": 0.08, + "learning_rate": 0.00028825651716504123, + "loss": 0.1076, "step": 12130 }, { - "epoch": 0.13, - "learning_rate": 0.00028030371860600947, - "loss": 0.1048, + "epoch": 0.08, + "learning_rate": 0.0002882468358106843, + "loss": 0.116, "step": 12140 }, { - "epoch": 0.13, - "learning_rate": 0.0002802874943215004, - "loss": 0.1193, + "epoch": 0.08, + "learning_rate": 0.0002882371544563274, + "loss": 0.1093, "step": 12150 }, { - "epoch": 0.13, - "learning_rate": 0.00028027127003699137, - "loss": 0.0992, + "epoch": 0.08, + "learning_rate": 0.00028822747310197047, + "loss": 0.1039, "step": 12160 }, { - "epoch": 0.13, - "learning_rate": 0.0002802550457524823, - "loss": 0.1056, + "epoch": 0.08, + "learning_rate": 0.0002882177917476135, + "loss": 0.1146, "step": 12170 }, { - "epoch": 0.13, - "learning_rate": 0.00028023882146797327, - "loss": 0.0924, + "epoch": 0.08, + "learning_rate": 0.0002882081103932566, + "loss": 0.1074, "step": 12180 }, { - "epoch": 0.13, - "learning_rate": 0.0002802225971834642, - "loss": 0.0996, + "epoch": 0.08, + "learning_rate": 0.00028819842903889966, + "loss": 0.1046, "step": 12190 }, { - "epoch": 0.13, - "learning_rate": 0.00028020637289895517, - "loss": 0.0855, + "epoch": 0.08, + "learning_rate": 0.0002881887476845427, + "loss": 0.1088, "step": 12200 }, { - "epoch": 0.13, - "learning_rate": 0.0002801901486144461, - "loss": 0.0992, + "epoch": 0.08, + "learning_rate": 0.00028817906633018576, + "loss": 0.11, "step": 12210 }, { - "epoch": 0.13, - "learning_rate": 0.000280173924329937, - "loss": 0.0962, + "epoch": 0.08, + "learning_rate": 0.00028816938497582884, + "loss": 0.1105, "step": 12220 }, { - "epoch": 0.13, - "learning_rate": 0.000280157700045428, - "loss": 0.1151, + "epoch": 0.08, + "learning_rate": 0.0002881597036214719, + "loss": 0.1048, "step": 12230 }, { - "epoch": 0.13, - "learning_rate": 0.0002801414757609189, - "loss": 0.0965, + "epoch": 0.08, + "learning_rate": 0.000288150022267115, + "loss": 0.1145, "step": 12240 }, { - "epoch": 0.13, - "learning_rate": 0.00028012525147640984, - "loss": 0.0954, + "epoch": 0.08, + "learning_rate": 0.0002881403409127581, + "loss": 0.1006, "step": 12250 }, { - "epoch": 0.13, - "learning_rate": 0.0002801090271919008, - "loss": 0.0906, + "epoch": 0.08, + "learning_rate": 0.00028813065955840116, + "loss": 0.0995, "step": 12260 }, { - "epoch": 0.13, - "learning_rate": 0.00028009280290739174, - "loss": 0.114, + "epoch": 0.08, + "learning_rate": 0.0002881209782040442, + "loss": 0.1108, "step": 12270 }, { - "epoch": 0.13, - "learning_rate": 0.0002800765786228827, - "loss": 0.1015, + "epoch": 0.08, + "learning_rate": 0.00028811129684968727, + "loss": 0.1227, "step": 12280 }, { - "epoch": 0.13, - "learning_rate": 0.00028006035433837364, - "loss": 0.0931, + "epoch": 0.08, + "learning_rate": 0.00028810161549533035, + "loss": 0.1099, "step": 12290 }, { - "epoch": 0.13, - "learning_rate": 0.0002800441300538646, - "loss": 0.0954, + "epoch": 0.08, + "learning_rate": 0.0002880919341409734, + "loss": 0.1059, "step": 12300 }, { - "epoch": 0.13, - "learning_rate": 0.00028002790576935554, - "loss": 0.1049, + "epoch": 0.08, + "learning_rate": 0.00028808225278661645, + "loss": 0.1061, "step": 12310 }, { - "epoch": 0.13, - "learning_rate": 0.0002800116814848465, - "loss": 0.0943, + "epoch": 0.08, + "learning_rate": 0.00028807257143225953, + "loss": 0.112, "step": 12320 }, { - "epoch": 0.13, - "learning_rate": 0.00027999545720033744, - "loss": 0.0909, + "epoch": 0.08, + "learning_rate": 0.0002880628900779026, + "loss": 0.1048, "step": 12330 }, { - "epoch": 0.13, - "learning_rate": 0.0002799792329158284, - "loss": 0.1034, + "epoch": 0.08, + "learning_rate": 0.00028805320872354564, + "loss": 0.1037, "step": 12340 }, { - "epoch": 0.13, - "learning_rate": 0.00027996300863131934, - "loss": 0.0931, + "epoch": 0.08, + "learning_rate": 0.0002880435273691887, + "loss": 0.1008, "step": 12350 }, { - "epoch": 0.13, - "learning_rate": 0.0002799467843468103, - "loss": 0.0913, + "epoch": 0.08, + "learning_rate": 0.0002880338460148318, + "loss": 0.0988, "step": 12360 }, { - "epoch": 0.13, - "learning_rate": 0.00027993056006230124, - "loss": 0.0804, + "epoch": 0.08, + "learning_rate": 0.0002880241646604749, + "loss": 0.11, "step": 12370 }, { - "epoch": 0.13, - "learning_rate": 0.0002799143357777922, - "loss": 0.0984, + "epoch": 0.08, + "learning_rate": 0.00028801448330611796, + "loss": 0.1127, "step": 12380 }, { - "epoch": 0.13, - "learning_rate": 0.00027989811149328313, - "loss": 0.0924, + "epoch": 0.08, + "learning_rate": 0.00028800480195176104, + "loss": 0.1076, "step": 12390 }, { - "epoch": 0.13, - "learning_rate": 0.00027988188720877406, - "loss": 0.093, + "epoch": 0.08, + "learning_rate": 0.0002879951205974041, + "loss": 0.1037, "step": 12400 }, { - "epoch": 0.13, - "learning_rate": 0.00027986566292426503, - "loss": 0.1012, + "epoch": 0.08, + "learning_rate": 0.00028798543924304714, + "loss": 0.1055, "step": 12410 }, { - "epoch": 0.13, - "learning_rate": 0.00027984943863975596, - "loss": 0.0914, + "epoch": 0.08, + "learning_rate": 0.0002879757578886902, + "loss": 0.1052, "step": 12420 }, { - "epoch": 0.13, - "learning_rate": 0.0002798332143552469, - "loss": 0.0984, + "epoch": 0.08, + "learning_rate": 0.0002879660765343333, + "loss": 0.0989, "step": 12430 }, { - "epoch": 0.13, - "learning_rate": 0.00027981699007073786, - "loss": 0.0973, + "epoch": 0.08, + "learning_rate": 0.0002879563951799763, + "loss": 0.1195, "step": 12440 }, { - "epoch": 0.13, - "learning_rate": 0.0002798007657862288, - "loss": 0.1051, + "epoch": 0.08, + "learning_rate": 0.0002879467138256194, + "loss": 0.1037, "step": 12450 }, { - "epoch": 0.13, - "learning_rate": 0.00027978454150171976, - "loss": 0.0996, + "epoch": 0.08, + "learning_rate": 0.0002879370324712625, + "loss": 0.1097, "step": 12460 }, { - "epoch": 0.13, - "learning_rate": 0.0002797683172172107, - "loss": 0.0902, + "epoch": 0.08, + "learning_rate": 0.00028792735111690557, + "loss": 0.1202, "step": 12470 }, { - "epoch": 0.13, - "learning_rate": 0.00027975209293270166, - "loss": 0.1008, + "epoch": 0.08, + "learning_rate": 0.0002879176697625486, + "loss": 0.1073, "step": 12480 }, { - "epoch": 0.14, - "learning_rate": 0.0002797358686481926, - "loss": 0.0881, + "epoch": 0.08, + "learning_rate": 0.00028790798840819167, + "loss": 0.1054, "step": 12490 }, { - "epoch": 0.14, - "learning_rate": 0.00027971964436368355, - "loss": 0.118, + "epoch": 0.08, + "learning_rate": 0.00028789830705383475, + "loss": 0.0992, "step": 12500 }, { - "epoch": 0.14, - "learning_rate": 0.0002797034200791745, - "loss": 0.0947, + "epoch": 0.08, + "learning_rate": 0.00028788862569947783, + "loss": 0.1095, "step": 12510 }, { - "epoch": 0.14, - "learning_rate": 0.00027968719579466545, - "loss": 0.0953, + "epoch": 0.08, + "learning_rate": 0.0002878789443451209, + "loss": 0.1057, "step": 12520 }, { - "epoch": 0.14, - "learning_rate": 0.0002796709715101564, - "loss": 0.0905, + "epoch": 0.08, + "learning_rate": 0.000287869262990764, + "loss": 0.1009, "step": 12530 }, { - "epoch": 0.14, - "learning_rate": 0.00027965474722564735, - "loss": 0.1052, + "epoch": 0.08, + "learning_rate": 0.00028785958163640707, + "loss": 0.1088, "step": 12540 }, { - "epoch": 0.14, - "learning_rate": 0.0002796385229411383, - "loss": 0.0961, + "epoch": 0.08, + "learning_rate": 0.0002878499002820501, + "loss": 0.1106, "step": 12550 }, { - "epoch": 0.14, - "learning_rate": 0.00027962229865662925, - "loss": 0.1071, + "epoch": 0.08, + "learning_rate": 0.0002878402189276932, + "loss": 0.1064, "step": 12560 }, { - "epoch": 0.14, - "learning_rate": 0.0002796060743721202, - "loss": 0.0917, + "epoch": 0.08, + "learning_rate": 0.0002878305375733362, + "loss": 0.1094, "step": 12570 }, { - "epoch": 0.14, - "learning_rate": 0.0002795898500876111, - "loss": 0.098, + "epoch": 0.08, + "learning_rate": 0.0002878208562189793, + "loss": 0.1145, "step": 12580 }, { - "epoch": 0.14, - "learning_rate": 0.0002795736258031021, - "loss": 0.0869, + "epoch": 0.08, + "learning_rate": 0.00028781117486462236, + "loss": 0.1088, "step": 12590 }, { - "epoch": 0.14, - "learning_rate": 0.000279557401518593, - "loss": 0.0996, + "epoch": 0.08, + "learning_rate": 0.00028780149351026544, + "loss": 0.1171, "step": 12600 }, { - "epoch": 0.14, - "learning_rate": 0.0002795411772340839, - "loss": 0.0908, + "epoch": 0.08, + "learning_rate": 0.0002877918121559085, + "loss": 0.101, "step": 12610 }, { - "epoch": 0.14, - "learning_rate": 0.0002795249529495749, - "loss": 0.0963, + "epoch": 0.08, + "learning_rate": 0.00028778213080155155, + "loss": 0.1133, "step": 12620 }, { - "epoch": 0.14, - "learning_rate": 0.0002795087286650658, - "loss": 0.0969, + "epoch": 0.08, + "learning_rate": 0.0002877724494471946, + "loss": 0.1089, "step": 12630 }, { - "epoch": 0.14, - "learning_rate": 0.0002794925043805568, - "loss": 0.0977, + "epoch": 0.08, + "learning_rate": 0.0002877627680928377, + "loss": 0.1027, "step": 12640 }, { - "epoch": 0.14, - "learning_rate": 0.0002794762800960477, - "loss": 0.101, + "epoch": 0.08, + "learning_rate": 0.0002877530867384808, + "loss": 0.1025, "step": 12650 }, { - "epoch": 0.14, - "learning_rate": 0.0002794600558115387, - "loss": 0.0879, + "epoch": 0.08, + "learning_rate": 0.00028774340538412387, + "loss": 0.1063, "step": 12660 }, { - "epoch": 0.14, - "learning_rate": 0.0002794438315270296, - "loss": 0.1024, + "epoch": 0.08, + "learning_rate": 0.00028773372402976695, + "loss": 0.1088, "step": 12670 }, { - "epoch": 0.14, - "learning_rate": 0.0002794276072425206, - "loss": 0.0902, + "epoch": 0.08, + "learning_rate": 0.00028772404267540997, + "loss": 0.1023, "step": 12680 }, { - "epoch": 0.14, - "learning_rate": 0.0002794113829580115, - "loss": 0.0901, + "epoch": 0.08, + "learning_rate": 0.00028771436132105305, + "loss": 0.1077, "step": 12690 }, { - "epoch": 0.14, - "learning_rate": 0.0002793951586735025, - "loss": 0.0964, + "epoch": 0.08, + "learning_rate": 0.00028770467996669613, + "loss": 0.1099, "step": 12700 }, { - "epoch": 0.14, - "learning_rate": 0.0002793789343889934, - "loss": 0.0897, + "epoch": 0.08, + "learning_rate": 0.00028769499861233916, + "loss": 0.1072, "step": 12710 }, { - "epoch": 0.14, - "learning_rate": 0.0002793627101044844, - "loss": 0.0989, + "epoch": 0.08, + "learning_rate": 0.00028768531725798224, + "loss": 0.106, "step": 12720 }, { - "epoch": 0.14, - "learning_rate": 0.0002793464858199753, - "loss": 0.0982, + "epoch": 0.08, + "learning_rate": 0.0002876756359036253, + "loss": 0.1086, "step": 12730 }, { - "epoch": 0.14, - "learning_rate": 0.0002793302615354663, - "loss": 0.0858, + "epoch": 0.08, + "learning_rate": 0.0002876659545492684, + "loss": 0.1094, "step": 12740 }, { - "epoch": 0.14, - "learning_rate": 0.0002793140372509572, - "loss": 0.0909, + "epoch": 0.08, + "learning_rate": 0.0002876562731949115, + "loss": 0.1035, "step": 12750 }, { - "epoch": 0.14, - "learning_rate": 0.00027929781296644814, - "loss": 0.1005, + "epoch": 0.08, + "learning_rate": 0.0002876465918405545, + "loss": 0.1051, "step": 12760 }, { - "epoch": 0.14, - "learning_rate": 0.0002792815886819391, - "loss": 0.095, + "epoch": 0.08, + "learning_rate": 0.0002876369104861976, + "loss": 0.1097, "step": 12770 }, { - "epoch": 0.14, - "learning_rate": 0.00027926536439743004, - "loss": 0.0894, + "epoch": 0.08, + "learning_rate": 0.00028762722913184066, + "loss": 0.1026, "step": 12780 }, { - "epoch": 0.14, - "learning_rate": 0.00027924914011292096, - "loss": 0.0868, + "epoch": 0.08, + "learning_rate": 0.00028761754777748374, + "loss": 0.1115, "step": 12790 }, { - "epoch": 0.14, - "learning_rate": 0.00027923291582841194, - "loss": 0.0896, + "epoch": 0.08, + "learning_rate": 0.0002876078664231268, + "loss": 0.1126, "step": 12800 }, { - "epoch": 0.14, - "learning_rate": 0.00027921669154390286, - "loss": 0.094, + "epoch": 0.08, + "learning_rate": 0.00028759818506876985, + "loss": 0.1075, "step": 12810 }, { - "epoch": 0.14, - "learning_rate": 0.00027920046725939384, - "loss": 0.0945, + "epoch": 0.08, + "learning_rate": 0.0002875885037144129, + "loss": 0.1071, "step": 12820 }, { - "epoch": 0.14, - "learning_rate": 0.00027918424297488476, - "loss": 0.0835, + "epoch": 0.08, + "learning_rate": 0.000287578822360056, + "loss": 0.1042, "step": 12830 }, { - "epoch": 0.14, - "learning_rate": 0.00027916801869037574, - "loss": 0.0945, + "epoch": 0.08, + "learning_rate": 0.00028756914100569903, + "loss": 0.1119, "step": 12840 }, { - "epoch": 0.14, - "learning_rate": 0.00027915179440586666, - "loss": 0.0914, + "epoch": 0.08, + "learning_rate": 0.0002875594596513421, + "loss": 0.1126, "step": 12850 }, { - "epoch": 0.14, - "learning_rate": 0.00027913557012135764, - "loss": 0.0824, + "epoch": 0.08, + "learning_rate": 0.0002875497782969852, + "loss": 0.1006, "step": 12860 }, { - "epoch": 0.14, - "learning_rate": 0.00027911934583684856, - "loss": 0.0904, + "epoch": 0.08, + "learning_rate": 0.00028754009694262827, + "loss": 0.1066, "step": 12870 }, { - "epoch": 0.14, - "learning_rate": 0.00027910312155233954, - "loss": 0.095, + "epoch": 0.08, + "learning_rate": 0.00028753041558827135, + "loss": 0.1041, "step": 12880 }, { - "epoch": 0.14, - "learning_rate": 0.00027908689726783046, - "loss": 0.0966, + "epoch": 0.08, + "learning_rate": 0.00028752073423391443, + "loss": 0.1031, "step": 12890 }, { - "epoch": 0.14, - "learning_rate": 0.00027907067298332144, - "loss": 0.0903, + "epoch": 0.08, + "learning_rate": 0.00028751105287955746, + "loss": 0.1085, "step": 12900 }, { - "epoch": 0.14, - "learning_rate": 0.00027905444869881236, - "loss": 0.0904, + "epoch": 0.08, + "learning_rate": 0.00028750137152520053, + "loss": 0.1102, "step": 12910 }, { - "epoch": 0.14, - "learning_rate": 0.00027903822441430334, - "loss": 0.0936, + "epoch": 0.08, + "learning_rate": 0.0002874916901708436, + "loss": 0.0984, "step": 12920 }, { - "epoch": 0.14, - "learning_rate": 0.00027902200012979426, - "loss": 0.0857, + "epoch": 0.08, + "learning_rate": 0.0002874820088164867, + "loss": 0.0965, "step": 12930 }, { - "epoch": 0.14, - "learning_rate": 0.0002790057758452852, - "loss": 0.0866, + "epoch": 0.08, + "learning_rate": 0.0002874723274621298, + "loss": 0.1145, "step": 12940 }, { - "epoch": 0.14, - "learning_rate": 0.00027898955156077616, - "loss": 0.0838, + "epoch": 0.08, + "learning_rate": 0.0002874626461077728, + "loss": 0.1155, "step": 12950 }, { - "epoch": 0.14, - "learning_rate": 0.0002789733272762671, - "loss": 0.0933, + "epoch": 0.08, + "learning_rate": 0.0002874529647534159, + "loss": 0.1136, "step": 12960 }, { - "epoch": 0.14, - "learning_rate": 0.000278957102991758, - "loss": 0.0837, + "epoch": 0.08, + "learning_rate": 0.00028744328339905896, + "loss": 0.1069, "step": 12970 }, { - "epoch": 0.14, - "learning_rate": 0.000278940878707249, - "loss": 0.0938, + "epoch": 0.08, + "learning_rate": 0.000287433602044702, + "loss": 0.1121, "step": 12980 }, { - "epoch": 0.14, - "learning_rate": 0.0002789246544227399, - "loss": 0.0889, + "epoch": 0.08, + "learning_rate": 0.00028742392069034506, + "loss": 0.1005, "step": 12990 }, { - "epoch": 0.14, - "learning_rate": 0.0002789084301382309, - "loss": 0.0957, + "epoch": 0.08, + "learning_rate": 0.00028741423933598814, + "loss": 0.0987, "step": 13000 }, { - "epoch": 0.14, - "eval_cer": 0.9214971171906612, - "eval_loss": 0.06272387504577637, - "eval_runtime": 119.4875, - "eval_samples_per_second": 16.738, - "eval_steps_per_second": 4.185, + "epoch": 0.08, + "eval_cer": 0.9200958083832336, + "eval_loss": 0.07392711937427521, + "eval_runtime": 120.3312, + "eval_samples_per_second": 16.621, + "eval_steps_per_second": 4.155, "step": 13000 }, { - "epoch": 0.14, - "learning_rate": 0.0002788922058537218, - "loss": 0.0954, + "epoch": 0.08, + "learning_rate": 0.0002874045579816312, + "loss": 0.1149, "step": 13010 }, { - "epoch": 0.14, - "learning_rate": 0.0002788759815692128, - "loss": 0.0972, + "epoch": 0.08, + "learning_rate": 0.0002873948766272743, + "loss": 0.1011, "step": 13020 }, { - "epoch": 0.14, - "learning_rate": 0.0002788597572847037, - "loss": 0.0898, + "epoch": 0.08, + "learning_rate": 0.0002873851952729174, + "loss": 0.1136, "step": 13030 }, { - "epoch": 0.14, - "learning_rate": 0.0002788435330001947, - "loss": 0.0877, + "epoch": 0.08, + "learning_rate": 0.0002873755139185604, + "loss": 0.1109, "step": 13040 }, { - "epoch": 0.14, - "learning_rate": 0.0002788273087156856, - "loss": 0.0902, + "epoch": 0.08, + "learning_rate": 0.0002873658325642035, + "loss": 0.1117, "step": 13050 }, { - "epoch": 0.14, - "learning_rate": 0.0002788110844311766, - "loss": 0.093, + "epoch": 0.08, + "learning_rate": 0.00028735615120984657, + "loss": 0.1051, "step": 13060 }, { - "epoch": 0.14, - "learning_rate": 0.0002787948601466675, - "loss": 0.0872, + "epoch": 0.08, + "learning_rate": 0.00028734646985548965, + "loss": 0.1075, "step": 13070 }, { - "epoch": 0.14, - "learning_rate": 0.0002787786358621585, - "loss": 0.0936, + "epoch": 0.08, + "learning_rate": 0.0002873367885011327, + "loss": 0.1025, "step": 13080 }, { - "epoch": 0.14, - "learning_rate": 0.0002787624115776494, - "loss": 0.0958, + "epoch": 0.08, + "learning_rate": 0.00028732710714677575, + "loss": 0.0982, "step": 13090 }, { - "epoch": 0.14, - "learning_rate": 0.0002787461872931404, - "loss": 0.0992, + "epoch": 0.08, + "learning_rate": 0.00028731742579241883, + "loss": 0.1047, "step": 13100 }, { - "epoch": 0.14, - "learning_rate": 0.0002787299630086313, - "loss": 0.0883, + "epoch": 0.08, + "learning_rate": 0.00028730774443806186, + "loss": 0.1087, "step": 13110 }, { - "epoch": 0.14, - "learning_rate": 0.0002787137387241222, - "loss": 0.0882, + "epoch": 0.08, + "learning_rate": 0.00028729806308370494, + "loss": 0.1004, "step": 13120 }, { - "epoch": 0.14, - "learning_rate": 0.0002786975144396132, - "loss": 0.0991, + "epoch": 0.08, + "learning_rate": 0.000287288381729348, + "loss": 0.1101, "step": 13130 }, { - "epoch": 0.14, - "learning_rate": 0.0002786812901551041, - "loss": 0.0987, + "epoch": 0.08, + "learning_rate": 0.0002872787003749911, + "loss": 0.1023, "step": 13140 }, { - "epoch": 0.14, - "learning_rate": 0.00027866506587059505, - "loss": 0.0913, + "epoch": 0.08, + "learning_rate": 0.0002872690190206342, + "loss": 0.111, "step": 13150 }, { - "epoch": 0.14, - "learning_rate": 0.000278648841586086, - "loss": 0.0919, + "epoch": 0.08, + "learning_rate": 0.00028725933766627726, + "loss": 0.1117, "step": 13160 }, { - "epoch": 0.14, - "learning_rate": 0.00027863261730157695, - "loss": 0.1029, + "epoch": 0.09, + "learning_rate": 0.00028724965631192034, + "loss": 0.1172, "step": 13170 }, { - "epoch": 0.14, - "learning_rate": 0.0002786163930170679, - "loss": 0.1001, + "epoch": 0.09, + "learning_rate": 0.00028723997495756336, + "loss": 0.1033, "step": 13180 }, { - "epoch": 0.14, - "learning_rate": 0.00027860016873255885, - "loss": 0.1008, + "epoch": 0.09, + "learning_rate": 0.00028723029360320644, + "loss": 0.1043, "step": 13190 }, { - "epoch": 0.14, - "learning_rate": 0.0002785839444480498, - "loss": 0.0954, + "epoch": 0.09, + "learning_rate": 0.0002872206122488495, + "loss": 0.1074, "step": 13200 }, { - "epoch": 0.14, - "learning_rate": 0.00027856772016354074, - "loss": 0.0915, + "epoch": 0.09, + "learning_rate": 0.00028721093089449255, + "loss": 0.1021, "step": 13210 }, { - "epoch": 0.14, - "learning_rate": 0.0002785514958790317, - "loss": 0.0923, + "epoch": 0.09, + "learning_rate": 0.00028720124954013563, + "loss": 0.0979, "step": 13220 }, { - "epoch": 0.14, - "learning_rate": 0.00027853527159452264, - "loss": 0.096, + "epoch": 0.09, + "learning_rate": 0.0002871915681857787, + "loss": 0.1012, "step": 13230 }, { - "epoch": 0.14, - "learning_rate": 0.0002785190473100136, - "loss": 0.093, + "epoch": 0.09, + "learning_rate": 0.0002871818868314218, + "loss": 0.0964, "step": 13240 }, { - "epoch": 0.14, - "learning_rate": 0.00027850282302550454, - "loss": 0.0876, + "epoch": 0.09, + "learning_rate": 0.0002871722054770648, + "loss": 0.1136, "step": 13250 }, { - "epoch": 0.14, - "learning_rate": 0.0002784865987409955, - "loss": 0.0932, - "step": 13260 + "epoch": 0.09, + "learning_rate": 0.0002871625241227079, + "loss": 0.1072, + "step": 13260 }, { - "epoch": 0.14, - "learning_rate": 0.00027847037445648644, - "loss": 0.0908, + "epoch": 0.09, + "learning_rate": 0.000287152842768351, + "loss": 0.1078, "step": 13270 }, { - "epoch": 0.14, - "learning_rate": 0.0002784541501719774, - "loss": 0.0926, + "epoch": 0.09, + "learning_rate": 0.00028714316141399405, + "loss": 0.1058, "step": 13280 }, { - "epoch": 0.14, - "learning_rate": 0.00027843792588746834, - "loss": 0.0954, + "epoch": 0.09, + "learning_rate": 0.00028713348005963713, + "loss": 0.0991, "step": 13290 }, { - "epoch": 0.14, - "learning_rate": 0.00027842170160295927, - "loss": 0.0944, + "epoch": 0.09, + "learning_rate": 0.0002871237987052802, + "loss": 0.1021, "step": 13300 }, { - "epoch": 0.14, - "learning_rate": 0.00027840547731845024, - "loss": 0.097, + "epoch": 0.09, + "learning_rate": 0.0002871141173509233, + "loss": 0.1068, "step": 13310 }, { - "epoch": 0.14, - "learning_rate": 0.00027838925303394117, - "loss": 0.0984, + "epoch": 0.09, + "learning_rate": 0.0002871044359965663, + "loss": 0.1028, "step": 13320 }, { - "epoch": 0.14, - "learning_rate": 0.0002783730287494321, - "loss": 0.0953, + "epoch": 0.09, + "learning_rate": 0.0002870947546422094, + "loss": 0.1019, "step": 13330 }, { - "epoch": 0.14, - "learning_rate": 0.00027835680446492306, - "loss": 0.1034, + "epoch": 0.09, + "learning_rate": 0.0002870850732878525, + "loss": 0.0967, "step": 13340 }, { - "epoch": 0.14, - "learning_rate": 0.000278340580180414, - "loss": 0.0965, + "epoch": 0.09, + "learning_rate": 0.0002870753919334955, + "loss": 0.1013, "step": 13350 }, { - "epoch": 0.14, - "learning_rate": 0.00027832435589590496, - "loss": 0.1001, + "epoch": 0.09, + "learning_rate": 0.0002870657105791386, + "loss": 0.1055, "step": 13360 }, { - "epoch": 0.14, - "learning_rate": 0.0002783081316113959, - "loss": 0.1089, + "epoch": 0.09, + "learning_rate": 0.00028705602922478166, + "loss": 0.0909, "step": 13370 }, { - "epoch": 0.14, - "learning_rate": 0.00027829190732688686, - "loss": 0.1111, + "epoch": 0.09, + "learning_rate": 0.00028704634787042474, + "loss": 0.1077, "step": 13380 }, { - "epoch": 0.14, - "learning_rate": 0.0002782756830423778, - "loss": 0.0912, + "epoch": 0.09, + "learning_rate": 0.00028703666651606777, + "loss": 0.1056, "step": 13390 }, { - "epoch": 0.14, - "learning_rate": 0.00027825945875786876, - "loss": 0.0981, + "epoch": 0.09, + "learning_rate": 0.00028702698516171085, + "loss": 0.0997, "step": 13400 }, { - "epoch": 0.15, - "learning_rate": 0.0002782432344733597, - "loss": 0.1012, + "epoch": 0.09, + "learning_rate": 0.00028701730380735393, + "loss": 0.0975, "step": 13410 }, { - "epoch": 0.15, - "learning_rate": 0.00027822701018885066, - "loss": 0.0897, + "epoch": 0.09, + "learning_rate": 0.000287007622452997, + "loss": 0.0976, "step": 13420 }, { - "epoch": 0.15, - "learning_rate": 0.0002782107859043416, - "loss": 0.0968, + "epoch": 0.09, + "learning_rate": 0.0002869979410986401, + "loss": 0.1058, "step": 13430 }, { - "epoch": 0.15, - "learning_rate": 0.00027819456161983256, - "loss": 0.1027, + "epoch": 0.09, + "learning_rate": 0.00028698825974428317, + "loss": 0.101, "step": 13440 }, { - "epoch": 0.15, - "learning_rate": 0.0002781783373353235, - "loss": 0.0907, + "epoch": 0.09, + "learning_rate": 0.0002869785783899262, + "loss": 0.1106, "step": 13450 }, { - "epoch": 0.15, - "learning_rate": 0.00027816211305081446, - "loss": 0.1063, + "epoch": 0.09, + "learning_rate": 0.0002869688970355693, + "loss": 0.0943, "step": 13460 }, { - "epoch": 0.15, - "learning_rate": 0.0002781458887663054, - "loss": 0.1095, + "epoch": 0.09, + "learning_rate": 0.00028695921568121235, + "loss": 0.1046, "step": 13470 }, { - "epoch": 0.15, - "learning_rate": 0.0002781296644817963, - "loss": 0.0861, + "epoch": 0.09, + "learning_rate": 0.0002869495343268554, + "loss": 0.1279, "step": 13480 }, { - "epoch": 0.15, - "learning_rate": 0.0002781134401972873, - "loss": 0.0987, + "epoch": 0.09, + "learning_rate": 0.00028693985297249846, + "loss": 0.1141, "step": 13490 }, { - "epoch": 0.15, - "learning_rate": 0.0002780972159127782, - "loss": 0.0899, + "epoch": 0.09, + "learning_rate": 0.00028693017161814154, + "loss": 0.1097, "step": 13500 }, { - "epoch": 0.15, - "learning_rate": 0.00027808099162826913, - "loss": 0.0959, + "epoch": 0.09, + "learning_rate": 0.0002869204902637846, + "loss": 0.1144, "step": 13510 }, { - "epoch": 0.15, - "learning_rate": 0.0002780647673437601, - "loss": 0.0928, + "epoch": 0.09, + "learning_rate": 0.0002869108089094277, + "loss": 0.1093, "step": 13520 }, { - "epoch": 0.15, - "learning_rate": 0.00027804854305925103, - "loss": 0.0975, + "epoch": 0.09, + "learning_rate": 0.0002869011275550707, + "loss": 0.1072, "step": 13530 }, { - "epoch": 0.15, - "learning_rate": 0.000278032318774742, - "loss": 0.0966, + "epoch": 0.09, + "learning_rate": 0.0002868914462007138, + "loss": 0.1045, "step": 13540 }, { - "epoch": 0.15, - "learning_rate": 0.00027801609449023293, - "loss": 0.0934, + "epoch": 0.09, + "learning_rate": 0.0002868817648463569, + "loss": 0.1038, "step": 13550 }, { - "epoch": 0.15, - "learning_rate": 0.0002779998702057239, - "loss": 0.0905, + "epoch": 0.09, + "learning_rate": 0.00028687208349199996, + "loss": 0.1176, "step": 13560 }, { - "epoch": 0.15, - "learning_rate": 0.00027798364592121483, - "loss": 0.0887, + "epoch": 0.09, + "learning_rate": 0.00028686240213764304, + "loss": 0.1019, "step": 13570 }, { - "epoch": 0.15, - "learning_rate": 0.0002779674216367058, - "loss": 0.0946, + "epoch": 0.09, + "learning_rate": 0.00028685272078328607, + "loss": 0.1171, "step": 13580 }, { - "epoch": 0.15, - "learning_rate": 0.00027795119735219673, - "loss": 0.0971, + "epoch": 0.09, + "learning_rate": 0.00028684303942892915, + "loss": 0.1281, "step": 13590 }, { - "epoch": 0.15, - "learning_rate": 0.0002779349730676877, - "loss": 0.081, + "epoch": 0.09, + "learning_rate": 0.00028683335807457223, + "loss": 0.1104, "step": 13600 }, { - "epoch": 0.15, - "learning_rate": 0.00027791874878317863, - "loss": 0.0848, + "epoch": 0.09, + "learning_rate": 0.00028682367672021525, + "loss": 0.1136, "step": 13610 }, { - "epoch": 0.15, - "learning_rate": 0.0002779025244986696, - "loss": 0.0933, + "epoch": 0.09, + "learning_rate": 0.00028681399536585833, + "loss": 0.1009, "step": 13620 }, { - "epoch": 0.15, - "learning_rate": 0.0002778863002141605, - "loss": 0.0921, + "epoch": 0.09, + "learning_rate": 0.0002868043140115014, + "loss": 0.1042, "step": 13630 }, { - "epoch": 0.15, - "learning_rate": 0.0002778700759296515, - "loss": 0.0883, + "epoch": 0.09, + "learning_rate": 0.0002867946326571445, + "loss": 0.1112, "step": 13640 }, { - "epoch": 0.15, - "learning_rate": 0.0002778538516451424, - "loss": 0.077, + "epoch": 0.09, + "learning_rate": 0.00028678495130278757, + "loss": 0.1037, "step": 13650 }, { - "epoch": 0.15, - "learning_rate": 0.00027783762736063335, - "loss": 0.0907, + "epoch": 0.09, + "learning_rate": 0.00028677526994843065, + "loss": 0.106, "step": 13660 }, { - "epoch": 0.15, - "learning_rate": 0.0002778214030761243, - "loss": 0.0832, + "epoch": 0.09, + "learning_rate": 0.0002867655885940737, + "loss": 0.1124, "step": 13670 }, { - "epoch": 0.15, - "learning_rate": 0.00027780517879161525, - "loss": 0.0916, + "epoch": 0.09, + "learning_rate": 0.00028675590723971676, + "loss": 0.1055, "step": 13680 }, { - "epoch": 0.15, - "learning_rate": 0.0002777889545071062, - "loss": 0.0848, + "epoch": 0.09, + "learning_rate": 0.00028674622588535984, + "loss": 0.1024, "step": 13690 }, { - "epoch": 0.15, - "learning_rate": 0.00027777273022259715, - "loss": 0.0874, + "epoch": 0.09, + "learning_rate": 0.0002867365445310029, + "loss": 0.1022, "step": 13700 }, { - "epoch": 0.15, - "learning_rate": 0.00027775650593808807, - "loss": 0.0793, + "epoch": 0.09, + "learning_rate": 0.000286726863176646, + "loss": 0.0967, "step": 13710 }, { - "epoch": 0.15, - "learning_rate": 0.00027774028165357905, - "loss": 0.0903, + "epoch": 0.09, + "learning_rate": 0.000286717181822289, + "loss": 0.1016, "step": 13720 }, { - "epoch": 0.15, - "learning_rate": 0.00027772405736906997, - "loss": 0.0911, + "epoch": 0.09, + "learning_rate": 0.0002867075004679321, + "loss": 0.0918, "step": 13730 }, { - "epoch": 0.15, - "learning_rate": 0.00027770783308456095, - "loss": 0.0928, + "epoch": 0.09, + "learning_rate": 0.0002866978191135752, + "loss": 0.0949, "step": 13740 }, { - "epoch": 0.15, - "learning_rate": 0.00027769160880005187, - "loss": 0.0982, + "epoch": 0.09, + "learning_rate": 0.0002866881377592182, + "loss": 0.1166, "step": 13750 }, { - "epoch": 0.15, - "learning_rate": 0.00027767538451554285, - "loss": 0.1, + "epoch": 0.09, + "learning_rate": 0.0002866784564048613, + "loss": 0.1115, "step": 13760 }, { - "epoch": 0.15, - "learning_rate": 0.00027765916023103377, - "loss": 0.0926, + "epoch": 0.09, + "learning_rate": 0.00028666877505050437, + "loss": 0.1073, "step": 13770 }, { - "epoch": 0.15, - "learning_rate": 0.00027764293594652475, - "loss": 0.1051, + "epoch": 0.09, + "learning_rate": 0.00028665909369614745, + "loss": 0.1031, "step": 13780 }, { - "epoch": 0.15, - "learning_rate": 0.00027762671166201567, - "loss": 0.0971, + "epoch": 0.09, + "learning_rate": 0.0002866494123417905, + "loss": 0.105, "step": 13790 }, { - "epoch": 0.15, - "learning_rate": 0.00027761048737750665, - "loss": 0.1014, + "epoch": 0.09, + "learning_rate": 0.0002866397309874336, + "loss": 0.1006, "step": 13800 }, { - "epoch": 0.15, - "learning_rate": 0.00027759426309299757, - "loss": 0.089, + "epoch": 0.09, + "learning_rate": 0.00028663004963307663, + "loss": 0.1089, "step": 13810 }, { - "epoch": 0.15, - "learning_rate": 0.00027757803880848855, - "loss": 0.1, + "epoch": 0.09, + "learning_rate": 0.0002866203682787197, + "loss": 0.1081, "step": 13820 }, { - "epoch": 0.15, - "learning_rate": 0.00027756181452397947, - "loss": 0.091, + "epoch": 0.09, + "learning_rate": 0.0002866106869243628, + "loss": 0.1045, "step": 13830 }, { - "epoch": 0.15, - "learning_rate": 0.0002775455902394704, - "loss": 0.0993, + "epoch": 0.09, + "learning_rate": 0.00028660100557000587, + "loss": 0.0947, "step": 13840 }, { - "epoch": 0.15, - "learning_rate": 0.00027752936595496137, - "loss": 0.0947, + "epoch": 0.09, + "learning_rate": 0.0002865913242156489, + "loss": 0.1136, "step": 13850 }, { - "epoch": 0.15, - "learning_rate": 0.0002775131416704523, - "loss": 0.0995, + "epoch": 0.09, + "learning_rate": 0.000286581642861292, + "loss": 0.1049, "step": 13860 }, { - "epoch": 0.15, - "learning_rate": 0.00027749691738594327, - "loss": 0.0935, + "epoch": 0.09, + "learning_rate": 0.00028657196150693506, + "loss": 0.1044, "step": 13870 }, { - "epoch": 0.15, - "learning_rate": 0.0002774806931014342, - "loss": 0.0893, + "epoch": 0.09, + "learning_rate": 0.0002865622801525781, + "loss": 0.111, "step": 13880 }, { - "epoch": 0.15, - "learning_rate": 0.0002774644688169251, - "loss": 0.1036, + "epoch": 0.09, + "learning_rate": 0.00028655259879822116, + "loss": 0.1042, "step": 13890 }, { - "epoch": 0.15, - "learning_rate": 0.0002774482445324161, - "loss": 0.096, + "epoch": 0.09, + "learning_rate": 0.00028654291744386424, + "loss": 0.106, "step": 13900 }, { - "epoch": 0.15, - "learning_rate": 0.000277432020247907, - "loss": 0.0934, + "epoch": 0.09, + "learning_rate": 0.0002865332360895073, + "loss": 0.1027, "step": 13910 }, { - "epoch": 0.15, - "learning_rate": 0.000277415795963398, - "loss": 0.0981, + "epoch": 0.09, + "learning_rate": 0.0002865235547351504, + "loss": 0.1079, "step": 13920 }, { - "epoch": 0.15, - "learning_rate": 0.0002773995716788889, - "loss": 0.0952, + "epoch": 0.09, + "learning_rate": 0.0002865138733807935, + "loss": 0.1066, "step": 13930 }, { - "epoch": 0.15, - "learning_rate": 0.0002773833473943799, - "loss": 0.0957, + "epoch": 0.09, + "learning_rate": 0.00028650419202643656, + "loss": 0.1073, "step": 13940 }, { - "epoch": 0.15, - "learning_rate": 0.0002773671231098708, - "loss": 0.0892, + "epoch": 0.09, + "learning_rate": 0.0002864945106720796, + "loss": 0.1035, "step": 13950 }, { - "epoch": 0.15, - "learning_rate": 0.0002773508988253618, - "loss": 0.0905, + "epoch": 0.09, + "learning_rate": 0.00028648482931772267, + "loss": 0.1221, "step": 13960 }, { - "epoch": 0.15, - "learning_rate": 0.0002773346745408527, - "loss": 0.0882, + "epoch": 0.09, + "learning_rate": 0.00028647514796336575, + "loss": 0.1062, "step": 13970 }, { - "epoch": 0.15, - "learning_rate": 0.0002773184502563437, - "loss": 0.0995, + "epoch": 0.09, + "learning_rate": 0.00028646546660900877, + "loss": 0.1043, "step": 13980 }, { - "epoch": 0.15, - "learning_rate": 0.0002773022259718346, - "loss": 0.0896, + "epoch": 0.09, + "learning_rate": 0.00028645578525465185, + "loss": 0.1011, "step": 13990 }, { - "epoch": 0.15, - "learning_rate": 0.0002772860016873256, - "loss": 0.0886, + "epoch": 0.09, + "learning_rate": 0.00028644610390029493, + "loss": 0.1103, "step": 14000 }, { - "epoch": 0.15, - "eval_cer": 0.9214635447864706, - "eval_loss": 0.06437470763921738, - "eval_runtime": 119.5472, - "eval_samples_per_second": 16.73, - "eval_steps_per_second": 4.182, + "epoch": 0.09, + "eval_cer": 0.9202286747260197, + "eval_loss": 0.07276194542646408, + "eval_runtime": 120.2789, + "eval_samples_per_second": 16.628, + "eval_steps_per_second": 4.157, "step": 14000 }, { - "epoch": 0.15, - "learning_rate": 0.0002772697774028165, - "loss": 0.0909, + "epoch": 0.09, + "learning_rate": 0.000286436422545938, + "loss": 0.1069, "step": 14010 }, { - "epoch": 0.15, - "learning_rate": 0.00027725355311830743, - "loss": 0.0954, + "epoch": 0.09, + "learning_rate": 0.00028642674119158104, + "loss": 0.1014, "step": 14020 }, { - "epoch": 0.15, - "learning_rate": 0.0002772373288337984, - "loss": 0.1053, + "epoch": 0.09, + "learning_rate": 0.0002864170598372241, + "loss": 0.1042, "step": 14030 }, { - "epoch": 0.15, - "learning_rate": 0.00027722110454928933, - "loss": 0.0889, + "epoch": 0.09, + "learning_rate": 0.0002864073784828672, + "loss": 0.1031, "step": 14040 }, { - "epoch": 0.15, - "learning_rate": 0.0002772048802647803, - "loss": 0.0901, + "epoch": 0.09, + "learning_rate": 0.0002863976971285103, + "loss": 0.1017, "step": 14050 }, { - "epoch": 0.15, - "learning_rate": 0.00027718865598027123, - "loss": 0.0892, + "epoch": 0.09, + "learning_rate": 0.00028638801577415336, + "loss": 0.1092, "step": 14060 }, { - "epoch": 0.15, - "learning_rate": 0.00027717243169576215, - "loss": 0.0894, + "epoch": 0.09, + "learning_rate": 0.00028637833441979644, + "loss": 0.139, "step": 14070 }, { - "epoch": 0.15, - "learning_rate": 0.00027715620741125313, - "loss": 0.0876, + "epoch": 0.09, + "learning_rate": 0.0002863686530654395, + "loss": 0.1212, "step": 14080 }, { - "epoch": 0.15, - "learning_rate": 0.0002771399831267441, - "loss": 0.0883, + "epoch": 0.09, + "learning_rate": 0.00028635897171108254, + "loss": 0.1001, "step": 14090 }, { - "epoch": 0.15, - "learning_rate": 0.00027712375884223503, - "loss": 0.0968, + "epoch": 0.09, + "learning_rate": 0.0002863492903567256, + "loss": 0.1005, "step": 14100 }, { - "epoch": 0.15, - "learning_rate": 0.000277107534557726, - "loss": 0.0847, + "epoch": 0.09, + "learning_rate": 0.0002863396090023687, + "loss": 0.0959, "step": 14110 }, { - "epoch": 0.15, - "learning_rate": 0.00027709131027321693, - "loss": 0.0836, + "epoch": 0.09, + "learning_rate": 0.0002863299276480117, + "loss": 0.1051, "step": 14120 }, { - "epoch": 0.15, - "learning_rate": 0.0002770750859887079, - "loss": 0.0908, + "epoch": 0.09, + "learning_rate": 0.0002863202462936548, + "loss": 0.101, "step": 14130 }, { - "epoch": 0.15, - "learning_rate": 0.00027705886170419883, - "loss": 0.082, + "epoch": 0.09, + "learning_rate": 0.0002863105649392979, + "loss": 0.0959, "step": 14140 }, { - "epoch": 0.15, - "learning_rate": 0.0002770426374196898, - "loss": 0.0848, + "epoch": 0.09, + "learning_rate": 0.00028630088358494097, + "loss": 0.1032, "step": 14150 }, { - "epoch": 0.15, - "learning_rate": 0.00027702641313518073, - "loss": 0.0904, + "epoch": 0.09, + "learning_rate": 0.000286291202230584, + "loss": 0.0946, "step": 14160 }, { - "epoch": 0.15, - "learning_rate": 0.00027701018885067165, - "loss": 0.0919, + "epoch": 0.09, + "learning_rate": 0.00028628152087622707, + "loss": 0.104, "step": 14170 }, { - "epoch": 0.15, - "learning_rate": 0.00027699396456616263, - "loss": 0.0955, + "epoch": 0.09, + "learning_rate": 0.00028627183952187015, + "loss": 0.1004, "step": 14180 }, { - "epoch": 0.15, - "learning_rate": 0.00027697774028165355, - "loss": 0.0847, + "epoch": 0.09, + "learning_rate": 0.00028626215816751323, + "loss": 0.1112, "step": 14190 }, { - "epoch": 0.15, - "learning_rate": 0.0002769615159971445, - "loss": 0.0886, + "epoch": 0.09, + "learning_rate": 0.0002862524768131563, + "loss": 0.1029, "step": 14200 }, { - "epoch": 0.15, - "learning_rate": 0.00027694529171263545, - "loss": 0.095, + "epoch": 0.09, + "learning_rate": 0.0002862427954587994, + "loss": 0.101, "step": 14210 }, { - "epoch": 0.15, - "learning_rate": 0.0002769290674281264, - "loss": 0.0864, + "epoch": 0.09, + "learning_rate": 0.0002862331141044424, + "loss": 0.1008, "step": 14220 }, { - "epoch": 0.15, - "learning_rate": 0.00027691284314361735, - "loss": 0.0972, + "epoch": 0.09, + "learning_rate": 0.0002862234327500855, + "loss": 0.0969, "step": 14230 }, { - "epoch": 0.15, - "learning_rate": 0.0002768966188591083, - "loss": 0.0822, + "epoch": 0.09, + "learning_rate": 0.0002862137513957286, + "loss": 0.1021, "step": 14240 }, { - "epoch": 0.15, - "learning_rate": 0.00027688039457459925, - "loss": 0.0812, + "epoch": 0.09, + "learning_rate": 0.0002862040700413716, + "loss": 0.1099, "step": 14250 }, { - "epoch": 0.15, - "learning_rate": 0.00027686417029009017, - "loss": 0.0778, + "epoch": 0.09, + "learning_rate": 0.0002861943886870147, + "loss": 0.1084, "step": 14260 }, { - "epoch": 0.15, - "learning_rate": 0.00027684794600558115, - "loss": 0.0912, + "epoch": 0.09, + "learning_rate": 0.00028618470733265776, + "loss": 0.1078, "step": 14270 }, { - "epoch": 0.15, - "learning_rate": 0.00027683172172107207, - "loss": 0.0923, + "epoch": 0.09, + "learning_rate": 0.00028617502597830084, + "loss": 0.1011, "step": 14280 }, { - "epoch": 0.15, - "learning_rate": 0.00027681549743656305, - "loss": 0.0866, + "epoch": 0.09, + "learning_rate": 0.0002861653446239439, + "loss": 0.1044, "step": 14290 }, { - "epoch": 0.15, - "learning_rate": 0.00027679927315205397, - "loss": 0.0802, + "epoch": 0.09, + "learning_rate": 0.00028615566326958695, + "loss": 0.1026, "step": 14300 }, { - "epoch": 0.15, - "learning_rate": 0.00027678304886754495, - "loss": 0.0866, + "epoch": 0.09, + "learning_rate": 0.00028614598191523, + "loss": 0.101, "step": 14310 }, { - "epoch": 0.15, - "learning_rate": 0.00027676682458303587, - "loss": 0.0843, + "epoch": 0.09, + "learning_rate": 0.0002861363005608731, + "loss": 0.1053, "step": 14320 }, { - "epoch": 0.15, - "learning_rate": 0.00027675060029852685, - "loss": 0.0875, + "epoch": 0.09, + "learning_rate": 0.0002861266192065162, + "loss": 0.0979, "step": 14330 }, { - "epoch": 0.16, - "learning_rate": 0.00027673437601401777, - "loss": 0.0984, + "epoch": 0.09, + "learning_rate": 0.00028611693785215926, + "loss": 0.1103, "step": 14340 }, { - "epoch": 0.16, - "learning_rate": 0.0002767181517295087, - "loss": 0.0879, + "epoch": 0.09, + "learning_rate": 0.00028610725649780234, + "loss": 0.1124, "step": 14350 }, { - "epoch": 0.16, - "learning_rate": 0.00027670192744499967, - "loss": 0.0877, + "epoch": 0.09, + "learning_rate": 0.00028609757514344537, + "loss": 0.1092, "step": 14360 }, { - "epoch": 0.16, - "learning_rate": 0.0002766857031604906, - "loss": 0.086, + "epoch": 0.09, + "learning_rate": 0.00028608789378908845, + "loss": 0.1079, "step": 14370 }, { - "epoch": 0.16, - "learning_rate": 0.00027666947887598157, - "loss": 0.0944, + "epoch": 0.09, + "learning_rate": 0.0002860782124347315, + "loss": 0.0947, "step": 14380 }, { - "epoch": 0.16, - "learning_rate": 0.0002766532545914725, - "loss": 0.0847, + "epoch": 0.09, + "learning_rate": 0.00028606853108037456, + "loss": 0.1024, "step": 14390 }, { - "epoch": 0.16, - "learning_rate": 0.0002766370303069634, - "loss": 0.0815, + "epoch": 0.09, + "learning_rate": 0.00028605884972601763, + "loss": 0.1067, "step": 14400 }, { - "epoch": 0.16, - "learning_rate": 0.0002766208060224544, - "loss": 0.0936, + "epoch": 0.09, + "learning_rate": 0.0002860491683716607, + "loss": 0.1036, "step": 14410 }, { - "epoch": 0.16, - "learning_rate": 0.0002766045817379453, - "loss": 0.0882, + "epoch": 0.09, + "learning_rate": 0.0002860394870173038, + "loss": 0.1066, "step": 14420 }, { - "epoch": 0.16, - "learning_rate": 0.0002765883574534363, - "loss": 0.0889, + "epoch": 0.09, + "learning_rate": 0.0002860298056629469, + "loss": 0.1053, "step": 14430 }, { - "epoch": 0.16, - "learning_rate": 0.0002765721331689272, - "loss": 0.0938, + "epoch": 0.09, + "learning_rate": 0.0002860201243085899, + "loss": 0.1058, "step": 14440 }, { - "epoch": 0.16, - "learning_rate": 0.0002765559088844182, - "loss": 0.0971, + "epoch": 0.09, + "learning_rate": 0.000286010442954233, + "loss": 0.1182, "step": 14450 }, { - "epoch": 0.16, - "learning_rate": 0.0002765396845999091, - "loss": 0.0902, + "epoch": 0.09, + "learning_rate": 0.00028600076159987606, + "loss": 0.1034, "step": 14460 }, { - "epoch": 0.16, - "learning_rate": 0.0002765234603154001, - "loss": 0.0842, + "epoch": 0.09, + "learning_rate": 0.00028599108024551914, + "loss": 0.1111, "step": 14470 }, { - "epoch": 0.16, - "learning_rate": 0.000276507236030891, - "loss": 0.0873, + "epoch": 0.09, + "learning_rate": 0.0002859813988911622, + "loss": 0.099, "step": 14480 }, { - "epoch": 0.16, - "learning_rate": 0.000276491011746382, - "loss": 0.0913, + "epoch": 0.09, + "learning_rate": 0.00028597171753680524, + "loss": 0.1009, "step": 14490 }, { - "epoch": 0.16, - "learning_rate": 0.0002764747874618729, - "loss": 0.091, + "epoch": 0.09, + "learning_rate": 0.0002859620361824483, + "loss": 0.0996, "step": 14500 }, { - "epoch": 0.16, - "learning_rate": 0.0002764585631773639, - "loss": 0.0955, + "epoch": 0.09, + "learning_rate": 0.0002859523548280914, + "loss": 0.0919, "step": 14510 }, { - "epoch": 0.16, - "learning_rate": 0.0002764423388928548, - "loss": 0.0896, + "epoch": 0.09, + "learning_rate": 0.00028594267347373443, + "loss": 0.099, "step": 14520 }, { - "epoch": 0.16, - "learning_rate": 0.00027642611460834574, - "loss": 0.0911, + "epoch": 0.09, + "learning_rate": 0.0002859329921193775, + "loss": 0.1008, "step": 14530 }, { - "epoch": 0.16, - "learning_rate": 0.0002764098903238367, - "loss": 0.1007, + "epoch": 0.09, + "learning_rate": 0.0002859233107650206, + "loss": 0.0936, "step": 14540 }, { - "epoch": 0.16, - "learning_rate": 0.00027639366603932763, - "loss": 0.1051, + "epoch": 0.09, + "learning_rate": 0.00028591362941066367, + "loss": 0.0996, "step": 14550 }, { - "epoch": 0.16, - "learning_rate": 0.0002763774417548186, - "loss": 0.0886, + "epoch": 0.09, + "learning_rate": 0.00028590394805630675, + "loss": 0.0957, "step": 14560 }, { - "epoch": 0.16, - "learning_rate": 0.00027636121747030953, - "loss": 0.0879, + "epoch": 0.09, + "learning_rate": 0.00028589426670194983, + "loss": 0.0986, "step": 14570 }, { - "epoch": 0.16, - "learning_rate": 0.00027634499318580046, - "loss": 0.0833, + "epoch": 0.09, + "learning_rate": 0.00028588458534759285, + "loss": 0.1045, "step": 14580 }, { - "epoch": 0.16, - "learning_rate": 0.00027632876890129143, - "loss": 0.0873, + "epoch": 0.09, + "learning_rate": 0.00028587490399323593, + "loss": 0.1011, "step": 14590 }, { - "epoch": 0.16, - "learning_rate": 0.00027631254461678236, - "loss": 0.0857, + "epoch": 0.09, + "learning_rate": 0.000285865222638879, + "loss": 0.0972, "step": 14600 }, { - "epoch": 0.16, - "learning_rate": 0.00027629632033227333, - "loss": 0.0853, + "epoch": 0.09, + "learning_rate": 0.0002858555412845221, + "loss": 0.1052, "step": 14610 }, { - "epoch": 0.16, - "learning_rate": 0.00027628009604776426, - "loss": 0.0898, + "epoch": 0.09, + "learning_rate": 0.0002858458599301651, + "loss": 0.1155, "step": 14620 }, { - "epoch": 0.16, - "learning_rate": 0.00027626387176325523, - "loss": 0.0815, + "epoch": 0.09, + "learning_rate": 0.0002858361785758082, + "loss": 0.0995, "step": 14630 }, { - "epoch": 0.16, - "learning_rate": 0.00027624764747874616, - "loss": 0.0858, + "epoch": 0.09, + "learning_rate": 0.0002858264972214513, + "loss": 0.1212, "step": 14640 }, { - "epoch": 0.16, - "learning_rate": 0.00027623142319423713, - "loss": 0.0953, + "epoch": 0.09, + "learning_rate": 0.0002858168158670943, + "loss": 0.1033, "step": 14650 }, { - "epoch": 0.16, - "learning_rate": 0.00027621519890972805, - "loss": 0.0823, + "epoch": 0.09, + "learning_rate": 0.0002858071345127374, + "loss": 0.1007, "step": 14660 }, { - "epoch": 0.16, - "learning_rate": 0.00027619897462521903, - "loss": 0.0971, + "epoch": 0.09, + "learning_rate": 0.00028579745315838046, + "loss": 0.0987, "step": 14670 }, { - "epoch": 0.16, - "learning_rate": 0.00027618275034070995, - "loss": 0.1007, + "epoch": 0.09, + "learning_rate": 0.00028578777180402354, + "loss": 0.1038, "step": 14680 }, { - "epoch": 0.16, - "learning_rate": 0.00027616652605620093, - "loss": 0.098, + "epoch": 0.09, + "learning_rate": 0.0002857780904496666, + "loss": 0.1036, "step": 14690 }, { - "epoch": 0.16, - "learning_rate": 0.00027615030177169185, - "loss": 0.0908, + "epoch": 0.09, + "learning_rate": 0.0002857684090953097, + "loss": 0.0976, "step": 14700 }, { - "epoch": 0.16, - "learning_rate": 0.0002761340774871828, - "loss": 0.0975, + "epoch": 0.09, + "learning_rate": 0.0002857587277409528, + "loss": 0.106, "step": 14710 }, { - "epoch": 0.16, - "learning_rate": 0.00027611785320267375, - "loss": 0.0949, + "epoch": 0.1, + "learning_rate": 0.0002857490463865958, + "loss": 0.1001, "step": 14720 }, { - "epoch": 0.16, - "learning_rate": 0.0002761016289181647, - "loss": 0.1008, + "epoch": 0.1, + "learning_rate": 0.0002857393650322389, + "loss": 0.0998, "step": 14730 }, { - "epoch": 0.16, - "learning_rate": 0.00027608540463365565, - "loss": 0.0952, + "epoch": 0.1, + "learning_rate": 0.00028572968367788197, + "loss": 0.0958, "step": 14740 }, { - "epoch": 0.16, - "learning_rate": 0.0002760691803491466, - "loss": 0.0924, + "epoch": 0.1, + "learning_rate": 0.00028572000232352505, + "loss": 0.1017, "step": 14750 }, { - "epoch": 0.16, - "learning_rate": 0.0002760529560646375, - "loss": 0.0887, + "epoch": 0.1, + "learning_rate": 0.0002857103209691681, + "loss": 0.0914, "step": 14760 }, { - "epoch": 0.16, - "learning_rate": 0.0002760367317801285, - "loss": 0.1009, + "epoch": 0.1, + "learning_rate": 0.00028570063961481115, + "loss": 0.0973, "step": 14770 }, { - "epoch": 0.16, - "learning_rate": 0.0002760205074956194, - "loss": 0.0833, + "epoch": 0.1, + "learning_rate": 0.00028569095826045423, + "loss": 0.1059, "step": 14780 }, { - "epoch": 0.16, - "learning_rate": 0.0002760042832111104, - "loss": 0.0973, + "epoch": 0.1, + "learning_rate": 0.00028568127690609726, + "loss": 0.087, "step": 14790 }, { - "epoch": 0.16, - "learning_rate": 0.0002759880589266013, - "loss": 0.0969, + "epoch": 0.1, + "learning_rate": 0.00028567159555174034, + "loss": 0.0975, "step": 14800 }, { - "epoch": 0.16, - "learning_rate": 0.0002759718346420923, - "loss": 0.0857, + "epoch": 0.1, + "learning_rate": 0.0002856619141973834, + "loss": 0.0959, "step": 14810 }, { - "epoch": 0.16, - "learning_rate": 0.0002759556103575832, - "loss": 0.087, + "epoch": 0.1, + "learning_rate": 0.0002856522328430265, + "loss": 0.1045, "step": 14820 }, { - "epoch": 0.16, - "learning_rate": 0.0002759393860730742, - "loss": 0.0939, + "epoch": 0.1, + "learning_rate": 0.0002856425514886696, + "loss": 0.1027, "step": 14830 }, { - "epoch": 0.16, - "learning_rate": 0.0002759231617885651, - "loss": 0.0885, + "epoch": 0.1, + "learning_rate": 0.00028563287013431266, + "loss": 0.1016, "step": 14840 }, { - "epoch": 0.16, - "learning_rate": 0.0002759069375040561, - "loss": 0.0903, + "epoch": 0.1, + "learning_rate": 0.00028562318877995574, + "loss": 0.1028, "step": 14850 }, { - "epoch": 0.16, - "learning_rate": 0.000275890713219547, - "loss": 0.0893, + "epoch": 0.1, + "learning_rate": 0.00028561350742559876, + "loss": 0.1035, "step": 14860 }, { - "epoch": 0.16, - "learning_rate": 0.000275874488935038, - "loss": 0.097, + "epoch": 0.1, + "learning_rate": 0.00028560382607124184, + "loss": 0.0938, "step": 14870 }, { - "epoch": 0.16, - "learning_rate": 0.0002758582646505289, - "loss": 0.0963, + "epoch": 0.1, + "learning_rate": 0.0002855941447168849, + "loss": 0.106, "step": 14880 }, { - "epoch": 0.16, - "learning_rate": 0.0002758420403660198, - "loss": 0.0869, + "epoch": 0.1, + "learning_rate": 0.00028558446336252795, + "loss": 0.1043, "step": 14890 }, { - "epoch": 0.16, - "learning_rate": 0.0002758258160815108, - "loss": 0.09, + "epoch": 0.1, + "learning_rate": 0.00028557478200817103, + "loss": 0.0851, "step": 14900 }, { - "epoch": 0.16, - "learning_rate": 0.0002758095917970017, - "loss": 0.0989, + "epoch": 0.1, + "learning_rate": 0.0002855651006538141, + "loss": 0.0939, "step": 14910 }, { - "epoch": 0.16, - "learning_rate": 0.0002757933675124927, - "loss": 0.0868, + "epoch": 0.1, + "learning_rate": 0.0002855554192994572, + "loss": 0.0974, "step": 14920 }, { - "epoch": 0.16, - "learning_rate": 0.0002757771432279836, - "loss": 0.0831, + "epoch": 0.1, + "learning_rate": 0.0002855457379451002, + "loss": 0.0912, "step": 14930 }, { - "epoch": 0.16, - "learning_rate": 0.00027576091894347454, - "loss": 0.0824, + "epoch": 0.1, + "learning_rate": 0.0002855360565907433, + "loss": 0.0976, "step": 14940 }, { - "epoch": 0.16, - "learning_rate": 0.0002757446946589655, - "loss": 0.0881, + "epoch": 0.1, + "learning_rate": 0.0002855263752363864, + "loss": 0.0929, "step": 14950 }, { - "epoch": 0.16, - "learning_rate": 0.00027572847037445644, - "loss": 0.0929, + "epoch": 0.1, + "learning_rate": 0.00028551669388202945, + "loss": 0.0936, "step": 14960 }, { - "epoch": 0.16, - "learning_rate": 0.0002757122460899474, - "loss": 0.0923, + "epoch": 0.1, + "learning_rate": 0.00028550701252767253, + "loss": 0.0907, "step": 14970 }, { - "epoch": 0.16, - "learning_rate": 0.00027569602180543834, - "loss": 0.0881, + "epoch": 0.1, + "learning_rate": 0.0002854973311733156, + "loss": 0.0955, "step": 14980 }, { - "epoch": 0.16, - "learning_rate": 0.0002756797975209293, - "loss": 0.0958, + "epoch": 0.1, + "learning_rate": 0.00028548764981895864, + "loss": 0.1038, "step": 14990 }, { - "epoch": 0.16, - "learning_rate": 0.00027566357323642024, - "loss": 0.0911, + "epoch": 0.1, + "learning_rate": 0.0002854779684646017, + "loss": 0.0961, "step": 15000 }, { - "epoch": 0.16, - "eval_cer": 0.9214812144728868, - "eval_loss": 0.06044168025255203, - "eval_runtime": 119.8479, - "eval_samples_per_second": 16.688, - "eval_steps_per_second": 4.172, + "epoch": 0.1, + "eval_cer": 0.920247655632132, + "eval_loss": 0.06776795536279678, + "eval_runtime": 120.3481, + "eval_samples_per_second": 16.618, + "eval_steps_per_second": 4.155, "step": 15000 }, { - "epoch": 0.16, - "learning_rate": 0.0002756473489519112, - "loss": 0.0954, + "epoch": 0.1, + "learning_rate": 0.0002854682871102448, + "loss": 0.0853, "step": 15010 }, { - "epoch": 0.16, - "learning_rate": 0.00027563112466740214, - "loss": 0.0879, + "epoch": 0.1, + "learning_rate": 0.0002854586057558878, + "loss": 0.0897, "step": 15020 }, { - "epoch": 0.16, - "learning_rate": 0.0002756149003828931, - "loss": 0.0972, + "epoch": 0.1, + "learning_rate": 0.0002854489244015309, + "loss": 0.0973, "step": 15030 }, { - "epoch": 0.16, - "learning_rate": 0.00027559867609838404, - "loss": 0.091, + "epoch": 0.1, + "learning_rate": 0.000285439243047174, + "loss": 0.1026, "step": 15040 }, { - "epoch": 0.16, - "learning_rate": 0.000275582451813875, - "loss": 0.0835, + "epoch": 0.1, + "learning_rate": 0.00028542956169281706, + "loss": 0.1108, "step": 15050 }, { - "epoch": 0.16, - "learning_rate": 0.00027556622752936594, - "loss": 0.0884, + "epoch": 0.1, + "learning_rate": 0.00028541988033846014, + "loss": 0.1114, "step": 15060 }, { - "epoch": 0.16, - "learning_rate": 0.0002755500032448569, - "loss": 0.0962, + "epoch": 0.1, + "learning_rate": 0.00028541019898410317, + "loss": 0.1023, "step": 15070 }, { - "epoch": 0.16, - "learning_rate": 0.00027553377896034784, - "loss": 0.0848, + "epoch": 0.1, + "learning_rate": 0.00028540051762974625, + "loss": 0.0959, "step": 15080 }, { - "epoch": 0.16, - "learning_rate": 0.00027551755467583876, - "loss": 0.0942, + "epoch": 0.1, + "learning_rate": 0.00028539083627538933, + "loss": 0.0984, "step": 15090 }, { - "epoch": 0.16, - "learning_rate": 0.00027550133039132974, - "loss": 0.09, + "epoch": 0.1, + "learning_rate": 0.0002853811549210324, + "loss": 0.0919, "step": 15100 }, { - "epoch": 0.16, - "learning_rate": 0.00027548510610682066, - "loss": 0.0853, + "epoch": 0.1, + "learning_rate": 0.0002853714735666755, + "loss": 0.1085, "step": 15110 }, { - "epoch": 0.16, - "learning_rate": 0.0002754688818223116, - "loss": 0.0895, + "epoch": 0.1, + "learning_rate": 0.00028536179221231857, + "loss": 0.1042, "step": 15120 }, { - "epoch": 0.16, - "learning_rate": 0.00027545265753780256, - "loss": 0.0821, + "epoch": 0.1, + "learning_rate": 0.0002853521108579616, + "loss": 0.1105, "step": 15130 }, { - "epoch": 0.16, - "learning_rate": 0.0002754364332532935, - "loss": 0.0891, + "epoch": 0.1, + "learning_rate": 0.00028534242950360467, + "loss": 0.0926, "step": 15140 }, { - "epoch": 0.16, - "learning_rate": 0.00027542020896878446, - "loss": 0.0927, + "epoch": 0.1, + "learning_rate": 0.00028533274814924775, + "loss": 0.0997, "step": 15150 }, { - "epoch": 0.16, - "learning_rate": 0.0002754039846842754, - "loss": 0.0904, + "epoch": 0.1, + "learning_rate": 0.0002853230667948908, + "loss": 0.0958, "step": 15160 }, { - "epoch": 0.16, - "learning_rate": 0.00027538776039976636, - "loss": 0.0901, + "epoch": 0.1, + "learning_rate": 0.00028531338544053386, + "loss": 0.101, "step": 15170 }, { - "epoch": 0.16, - "learning_rate": 0.0002753715361152573, - "loss": 0.0884, + "epoch": 0.1, + "learning_rate": 0.00028530370408617694, + "loss": 0.1052, "step": 15180 }, { - "epoch": 0.16, - "learning_rate": 0.00027535531183074826, - "loss": 0.0894, + "epoch": 0.1, + "learning_rate": 0.00028529402273182, + "loss": 0.0912, "step": 15190 }, { - "epoch": 0.16, - "learning_rate": 0.0002753390875462392, - "loss": 0.0913, + "epoch": 0.1, + "learning_rate": 0.0002852843413774631, + "loss": 0.1009, "step": 15200 }, { - "epoch": 0.16, - "learning_rate": 0.00027532286326173016, - "loss": 0.0953, + "epoch": 0.1, + "learning_rate": 0.0002852746600231061, + "loss": 0.0997, "step": 15210 }, { - "epoch": 0.16, - "learning_rate": 0.0002753066389772211, - "loss": 0.0818, + "epoch": 0.1, + "learning_rate": 0.0002852649786687492, + "loss": 0.0946, "step": 15220 }, { - "epoch": 0.16, - "learning_rate": 0.00027529041469271206, - "loss": 0.0934, + "epoch": 0.1, + "learning_rate": 0.0002852552973143923, + "loss": 0.0972, "step": 15230 }, { - "epoch": 0.16, - "learning_rate": 0.000275274190408203, - "loss": 0.0835, + "epoch": 0.1, + "learning_rate": 0.00028524561596003536, + "loss": 0.1068, "step": 15240 }, { - "epoch": 0.16, - "learning_rate": 0.00027525796612369396, - "loss": 0.0962, + "epoch": 0.1, + "learning_rate": 0.00028523593460567844, + "loss": 0.1036, "step": 15250 }, { - "epoch": 0.17, - "learning_rate": 0.0002752417418391849, - "loss": 0.0937, + "epoch": 0.1, + "learning_rate": 0.00028522625325132147, + "loss": 0.0936, "step": 15260 }, { - "epoch": 0.17, - "learning_rate": 0.0002752255175546758, - "loss": 0.1017, + "epoch": 0.1, + "learning_rate": 0.00028521657189696455, + "loss": 0.0935, "step": 15270 }, { - "epoch": 0.17, - "learning_rate": 0.0002752092932701668, - "loss": 0.0894, + "epoch": 0.1, + "learning_rate": 0.0002852068905426076, + "loss": 0.0956, "step": 15280 }, { - "epoch": 0.17, - "learning_rate": 0.0002751930689856577, - "loss": 0.0877, + "epoch": 0.1, + "learning_rate": 0.00028519720918825065, + "loss": 0.1018, "step": 15290 }, { - "epoch": 0.17, - "learning_rate": 0.0002751768447011486, - "loss": 0.0813, + "epoch": 0.1, + "learning_rate": 0.00028518752783389373, + "loss": 0.0972, "step": 15300 }, { - "epoch": 0.17, - "learning_rate": 0.0002751606204166396, - "loss": 0.0938, + "epoch": 0.1, + "learning_rate": 0.0002851778464795368, + "loss": 0.1001, "step": 15310 }, { - "epoch": 0.17, - "learning_rate": 0.0002751443961321305, - "loss": 0.0776, + "epoch": 0.1, + "learning_rate": 0.0002851681651251799, + "loss": 0.0963, "step": 15320 }, { - "epoch": 0.17, - "learning_rate": 0.0002751281718476215, - "loss": 0.0809, + "epoch": 0.1, + "learning_rate": 0.00028515848377082297, + "loss": 0.1074, "step": 15330 }, { - "epoch": 0.17, - "learning_rate": 0.0002751119475631124, - "loss": 0.0817, + "epoch": 0.1, + "learning_rate": 0.00028514880241646605, + "loss": 0.0972, "step": 15340 }, { - "epoch": 0.17, - "learning_rate": 0.0002750957232786034, - "loss": 0.0865, + "epoch": 0.1, + "learning_rate": 0.0002851391210621091, + "loss": 0.0921, "step": 15350 }, { - "epoch": 0.17, - "learning_rate": 0.0002750794989940943, - "loss": 0.0922, + "epoch": 0.1, + "learning_rate": 0.00028512943970775216, + "loss": 0.0981, "step": 15360 }, { - "epoch": 0.17, - "learning_rate": 0.0002750632747095853, - "loss": 0.0924, + "epoch": 0.1, + "learning_rate": 0.00028511975835339524, + "loss": 0.103, "step": 15370 }, { - "epoch": 0.17, - "learning_rate": 0.0002750470504250762, - "loss": 0.095, + "epoch": 0.1, + "learning_rate": 0.0002851100769990383, + "loss": 0.0917, "step": 15380 }, { - "epoch": 0.17, - "learning_rate": 0.0002750308261405672, - "loss": 0.1013, + "epoch": 0.1, + "learning_rate": 0.00028510039564468134, + "loss": 0.0997, "step": 15390 }, { - "epoch": 0.17, - "learning_rate": 0.0002750146018560581, - "loss": 0.0971, + "epoch": 0.1, + "learning_rate": 0.0002850907142903244, + "loss": 0.0978, "step": 15400 }, { - "epoch": 0.17, - "learning_rate": 0.0002749983775715491, - "loss": 0.0958, + "epoch": 0.1, + "learning_rate": 0.0002850810329359675, + "loss": 0.1009, "step": 15410 }, { - "epoch": 0.17, - "learning_rate": 0.00027498215328704, - "loss": 0.096, + "epoch": 0.1, + "learning_rate": 0.0002850713515816105, + "loss": 0.0993, "step": 15420 }, { - "epoch": 0.17, - "learning_rate": 0.000274965929002531, - "loss": 0.1043, + "epoch": 0.1, + "learning_rate": 0.0002850616702272536, + "loss": 0.1005, "step": 15430 }, { - "epoch": 0.17, - "learning_rate": 0.0002749497047180219, - "loss": 0.0855, + "epoch": 0.1, + "learning_rate": 0.0002850519888728967, + "loss": 0.0921, "step": 15440 }, { - "epoch": 0.17, - "learning_rate": 0.00027493348043351284, - "loss": 0.0932, + "epoch": 0.1, + "learning_rate": 0.00028504230751853977, + "loss": 0.0853, "step": 15450 }, { - "epoch": 0.17, - "learning_rate": 0.0002749172561490038, - "loss": 0.0868, + "epoch": 0.1, + "learning_rate": 0.00028503262616418285, + "loss": 0.1108, "step": 15460 }, { - "epoch": 0.17, - "learning_rate": 0.00027490103186449474, - "loss": 0.0947, + "epoch": 0.1, + "learning_rate": 0.0002850229448098259, + "loss": 0.1126, "step": 15470 }, { - "epoch": 0.17, - "learning_rate": 0.00027488480757998567, - "loss": 0.0881, + "epoch": 0.1, + "learning_rate": 0.000285013263455469, + "loss": 0.1089, "step": 15480 }, { - "epoch": 0.17, - "learning_rate": 0.00027486858329547664, - "loss": 0.0916, + "epoch": 0.1, + "learning_rate": 0.00028500358210111203, + "loss": 0.099, "step": 15490 }, { - "epoch": 0.17, - "learning_rate": 0.00027485235901096756, - "loss": 0.0855, + "epoch": 0.1, + "learning_rate": 0.0002849939007467551, + "loss": 0.0974, "step": 15500 }, { - "epoch": 0.17, - "learning_rate": 0.00027483613472645854, - "loss": 0.089, + "epoch": 0.1, + "learning_rate": 0.0002849842193923982, + "loss": 0.0993, "step": 15510 }, { - "epoch": 0.17, - "learning_rate": 0.00027481991044194946, - "loss": 0.0988, + "epoch": 0.1, + "learning_rate": 0.00028497453803804127, + "loss": 0.0981, "step": 15520 }, { - "epoch": 0.17, - "learning_rate": 0.00027480368615744044, - "loss": 0.0937, + "epoch": 0.1, + "learning_rate": 0.0002849648566836843, + "loss": 0.0908, "step": 15530 }, { - "epoch": 0.17, - "learning_rate": 0.00027478746187293136, - "loss": 0.0862, + "epoch": 0.1, + "learning_rate": 0.0002849551753293274, + "loss": 0.1029, "step": 15540 }, { - "epoch": 0.17, - "learning_rate": 0.00027477123758842234, - "loss": 0.0863, + "epoch": 0.1, + "learning_rate": 0.00028494549397497046, + "loss": 0.0925, "step": 15550 }, { - "epoch": 0.17, - "learning_rate": 0.00027475501330391326, - "loss": 0.1047, + "epoch": 0.1, + "learning_rate": 0.0002849358126206135, + "loss": 0.1004, "step": 15560 }, { - "epoch": 0.17, - "learning_rate": 0.00027473878901940424, - "loss": 0.0856, + "epoch": 0.1, + "learning_rate": 0.00028492613126625656, + "loss": 0.0998, "step": 15570 }, { - "epoch": 0.17, - "learning_rate": 0.00027472256473489516, - "loss": 0.0929, + "epoch": 0.1, + "learning_rate": 0.00028491644991189964, + "loss": 0.1028, "step": 15580 }, { - "epoch": 0.17, - "learning_rate": 0.00027470634045038614, - "loss": 0.0877, + "epoch": 0.1, + "learning_rate": 0.0002849067685575427, + "loss": 0.0997, "step": 15590 }, { - "epoch": 0.17, - "learning_rate": 0.00027469011616587706, - "loss": 0.0975, + "epoch": 0.1, + "learning_rate": 0.0002848970872031858, + "loss": 0.0942, "step": 15600 }, { - "epoch": 0.17, - "learning_rate": 0.00027467389188136804, - "loss": 0.0911, + "epoch": 0.1, + "learning_rate": 0.0002848874058488289, + "loss": 0.0996, "step": 15610 }, { - "epoch": 0.17, - "learning_rate": 0.00027465766759685896, - "loss": 0.089, + "epoch": 0.1, + "learning_rate": 0.00028487772449447196, + "loss": 0.0999, "step": 15620 }, { - "epoch": 0.17, - "learning_rate": 0.0002746414433123499, - "loss": 0.0878, + "epoch": 0.1, + "learning_rate": 0.000284868043140115, + "loss": 0.09, "step": 15630 }, { - "epoch": 0.17, - "learning_rate": 0.00027462521902784086, - "loss": 0.0853, + "epoch": 0.1, + "learning_rate": 0.00028485836178575807, + "loss": 0.0962, "step": 15640 }, { - "epoch": 0.17, - "learning_rate": 0.0002746089947433318, - "loss": 0.0846, + "epoch": 0.1, + "learning_rate": 0.00028484868043140115, + "loss": 0.0972, "step": 15650 }, { - "epoch": 0.17, - "learning_rate": 0.0002745927704588227, - "loss": 0.0783, + "epoch": 0.1, + "learning_rate": 0.00028483899907704417, + "loss": 0.0863, "step": 15660 }, { - "epoch": 0.17, - "learning_rate": 0.0002745765461743137, - "loss": 0.0989, + "epoch": 0.1, + "learning_rate": 0.00028482931772268725, + "loss": 0.0994, "step": 15670 }, { - "epoch": 0.17, - "learning_rate": 0.0002745603218898046, - "loss": 0.089, + "epoch": 0.1, + "learning_rate": 0.00028481963636833033, + "loss": 0.101, "step": 15680 }, { - "epoch": 0.17, - "learning_rate": 0.0002745440976052956, - "loss": 0.0923, + "epoch": 0.1, + "learning_rate": 0.0002848099550139734, + "loss": 0.0956, "step": 15690 }, { - "epoch": 0.17, - "learning_rate": 0.0002745278733207865, - "loss": 0.0868, + "epoch": 0.1, + "learning_rate": 0.00028480027365961644, + "loss": 0.0891, "step": 15700 }, { - "epoch": 0.17, - "learning_rate": 0.0002745116490362775, - "loss": 0.0876, + "epoch": 0.1, + "learning_rate": 0.0002847905923052595, + "loss": 0.0925, "step": 15710 }, { - "epoch": 0.17, - "learning_rate": 0.0002744954247517684, - "loss": 0.0838, + "epoch": 0.1, + "learning_rate": 0.0002847809109509026, + "loss": 0.0992, "step": 15720 }, { - "epoch": 0.17, - "learning_rate": 0.0002744792004672594, - "loss": 0.0957, + "epoch": 0.1, + "learning_rate": 0.0002847712295965457, + "loss": 0.0942, "step": 15730 }, { - "epoch": 0.17, - "learning_rate": 0.0002744629761827503, - "loss": 0.0894, + "epoch": 0.1, + "learning_rate": 0.00028476154824218875, + "loss": 0.1007, "step": 15740 }, { - "epoch": 0.17, - "learning_rate": 0.0002744467518982413, - "loss": 0.0945, + "epoch": 0.1, + "learning_rate": 0.00028475186688783183, + "loss": 0.0996, "step": 15750 }, { - "epoch": 0.17, - "learning_rate": 0.0002744305276137322, - "loss": 0.0971, + "epoch": 0.1, + "learning_rate": 0.00028474218553347486, + "loss": 0.1, "step": 15760 }, { - "epoch": 0.17, - "learning_rate": 0.0002744143033292232, - "loss": 0.0871, + "epoch": 0.1, + "learning_rate": 0.00028473250417911794, + "loss": 0.1066, "step": 15770 }, { - "epoch": 0.17, - "learning_rate": 0.0002743980790447141, - "loss": 0.0884, + "epoch": 0.1, + "learning_rate": 0.000284722822824761, + "loss": 0.107, "step": 15780 }, { - "epoch": 0.17, - "learning_rate": 0.0002743818547602051, - "loss": 0.0861, + "epoch": 0.1, + "learning_rate": 0.00028471314147040405, + "loss": 0.0939, "step": 15790 }, { - "epoch": 0.17, - "learning_rate": 0.000274365630475696, - "loss": 0.0829, + "epoch": 0.1, + "learning_rate": 0.0002847034601160471, + "loss": 0.1056, "step": 15800 }, { - "epoch": 0.17, - "learning_rate": 0.0002743494061911869, - "loss": 0.0895, + "epoch": 0.1, + "learning_rate": 0.0002846937787616902, + "loss": 0.099, "step": 15810 }, { - "epoch": 0.17, - "learning_rate": 0.0002743331819066779, - "loss": 0.0827, + "epoch": 0.1, + "learning_rate": 0.0002846840974073333, + "loss": 0.0986, "step": 15820 }, { - "epoch": 0.17, - "learning_rate": 0.0002743169576221688, - "loss": 0.0899, + "epoch": 0.1, + "learning_rate": 0.00028467441605297636, + "loss": 0.1002, "step": 15830 }, { - "epoch": 0.17, - "learning_rate": 0.00027430073333765975, - "loss": 0.0965, + "epoch": 0.1, + "learning_rate": 0.0002846647346986194, + "loss": 0.106, "step": 15840 }, { - "epoch": 0.17, - "learning_rate": 0.0002742845090531507, - "loss": 0.09, + "epoch": 0.1, + "learning_rate": 0.00028465505334426247, + "loss": 0.1035, "step": 15850 }, { - "epoch": 0.17, - "learning_rate": 0.00027426828476864165, - "loss": 0.0854, + "epoch": 0.1, + "learning_rate": 0.00028464537198990555, + "loss": 0.1059, "step": 15860 }, { - "epoch": 0.17, - "learning_rate": 0.0002742520604841326, - "loss": 0.0973, + "epoch": 0.1, + "learning_rate": 0.00028463569063554863, + "loss": 0.0931, "step": 15870 }, { - "epoch": 0.17, - "learning_rate": 0.00027423583619962355, - "loss": 0.103, + "epoch": 0.1, + "learning_rate": 0.0002846260092811917, + "loss": 0.0956, "step": 15880 }, { - "epoch": 0.17, - "learning_rate": 0.0002742196119151145, - "loss": 0.0963, + "epoch": 0.1, + "learning_rate": 0.0002846163279268348, + "loss": 0.1004, "step": 15890 }, { - "epoch": 0.17, - "learning_rate": 0.00027420338763060545, - "loss": 0.0896, + "epoch": 0.1, + "learning_rate": 0.0002846066465724778, + "loss": 0.0895, "step": 15900 }, { - "epoch": 0.17, - "learning_rate": 0.0002741871633460964, - "loss": 0.0876, + "epoch": 0.1, + "learning_rate": 0.0002845969652181209, + "loss": 0.0894, "step": 15910 }, { - "epoch": 0.17, - "learning_rate": 0.00027417093906158735, - "loss": 0.0921, + "epoch": 0.1, + "learning_rate": 0.000284587283863764, + "loss": 0.0906, "step": 15920 }, { - "epoch": 0.17, - "learning_rate": 0.0002741547147770783, - "loss": 0.0888, + "epoch": 0.1, + "learning_rate": 0.000284577602509407, + "loss": 0.0971, "step": 15930 }, { - "epoch": 0.17, - "learning_rate": 0.00027413849049256925, - "loss": 0.0865, + "epoch": 0.1, + "learning_rate": 0.0002845679211550501, + "loss": 0.0994, "step": 15940 }, { - "epoch": 0.17, - "learning_rate": 0.0002741222662080602, - "loss": 0.0831, + "epoch": 0.1, + "learning_rate": 0.00028455823980069316, + "loss": 0.0999, "step": 15950 }, { - "epoch": 0.17, - "learning_rate": 0.00027410604192355115, - "loss": 0.0939, + "epoch": 0.1, + "learning_rate": 0.00028454855844633624, + "loss": 0.1041, "step": 15960 }, { - "epoch": 0.17, - "learning_rate": 0.0002740898176390421, - "loss": 0.0862, + "epoch": 0.1, + "learning_rate": 0.0002845388770919793, + "loss": 0.1059, "step": 15970 }, { - "epoch": 0.17, - "learning_rate": 0.00027407359335453305, - "loss": 0.0933, + "epoch": 0.1, + "learning_rate": 0.00028452919573762234, + "loss": 0.106, "step": 15980 }, { - "epoch": 0.17, - "learning_rate": 0.00027405736907002397, - "loss": 0.0881, + "epoch": 0.1, + "learning_rate": 0.0002845195143832654, + "loss": 0.0953, "step": 15990 }, { - "epoch": 0.17, - "learning_rate": 0.00027404114478551494, - "loss": 0.0955, + "epoch": 0.1, + "learning_rate": 0.0002845098330289085, + "loss": 0.0976, "step": 16000 }, { - "epoch": 0.17, - "eval_cer": 0.9214582438805459, - "eval_loss": 0.05950654670596123, - "eval_runtime": 119.4029, - "eval_samples_per_second": 16.75, - "eval_steps_per_second": 4.188, + "epoch": 0.1, + "eval_cer": 0.9202431363687719, + "eval_loss": 0.06717900186777115, + "eval_runtime": 120.6812, + "eval_samples_per_second": 16.573, + "eval_steps_per_second": 4.143, "step": 16000 }, { - "epoch": 0.17, - "learning_rate": 0.00027402492050100587, - "loss": 0.0842, + "epoch": 0.1, + "learning_rate": 0.0002845001516745516, + "loss": 0.0971, "step": 16010 }, { - "epoch": 0.17, - "learning_rate": 0.0002740086962164968, - "loss": 0.0837, + "epoch": 0.1, + "learning_rate": 0.00028449047032019466, + "loss": 0.1026, "step": 16020 }, { - "epoch": 0.17, - "learning_rate": 0.00027399247193198777, - "loss": 0.0868, + "epoch": 0.1, + "learning_rate": 0.0002844807889658377, + "loss": 0.0891, "step": 16030 }, { - "epoch": 0.17, - "learning_rate": 0.0002739762476474787, - "loss": 0.0852, + "epoch": 0.1, + "learning_rate": 0.00028447110761148077, + "loss": 0.1018, "step": 16040 }, { - "epoch": 0.17, - "learning_rate": 0.00027396002336296967, - "loss": 0.0816, + "epoch": 0.1, + "learning_rate": 0.00028446142625712385, + "loss": 0.1035, "step": 16050 }, { - "epoch": 0.17, - "learning_rate": 0.0002739437990784606, - "loss": 0.0899, + "epoch": 0.1, + "learning_rate": 0.0002844517449027669, + "loss": 0.1053, "step": 16060 }, { - "epoch": 0.17, - "learning_rate": 0.00027392757479395157, - "loss": 0.0872, + "epoch": 0.1, + "learning_rate": 0.00028444206354840995, + "loss": 0.0942, "step": 16070 }, { - "epoch": 0.17, - "learning_rate": 0.0002739113505094425, - "loss": 0.0844, + "epoch": 0.1, + "learning_rate": 0.00028443238219405303, + "loss": 0.0926, "step": 16080 }, { - "epoch": 0.17, - "learning_rate": 0.00027389512622493347, - "loss": 0.082, + "epoch": 0.1, + "learning_rate": 0.0002844227008396961, + "loss": 0.1007, "step": 16090 }, { - "epoch": 0.17, - "learning_rate": 0.0002738789019404244, - "loss": 0.0878, + "epoch": 0.1, + "learning_rate": 0.0002844130194853392, + "loss": 0.102, "step": 16100 }, { - "epoch": 0.17, - "learning_rate": 0.00027386267765591537, - "loss": 0.0857, + "epoch": 0.1, + "learning_rate": 0.0002844033381309823, + "loss": 0.0927, "step": 16110 }, { - "epoch": 0.17, - "learning_rate": 0.0002738464533714063, - "loss": 0.0819, + "epoch": 0.1, + "learning_rate": 0.0002843936567766253, + "loss": 0.0997, "step": 16120 }, { - "epoch": 0.17, - "learning_rate": 0.00027383022908689726, - "loss": 0.0882, + "epoch": 0.1, + "learning_rate": 0.0002843839754222684, + "loss": 0.0954, "step": 16130 }, { - "epoch": 0.17, - "learning_rate": 0.0002738140048023882, - "loss": 0.0796, + "epoch": 0.1, + "learning_rate": 0.00028437429406791146, + "loss": 0.1012, "step": 16140 }, { - "epoch": 0.17, - "learning_rate": 0.00027379778051787916, - "loss": 0.0844, + "epoch": 0.1, + "learning_rate": 0.00028436461271355454, + "loss": 0.0955, "step": 16150 }, { - "epoch": 0.17, - "learning_rate": 0.0002737815562333701, - "loss": 0.0884, + "epoch": 0.1, + "learning_rate": 0.00028435493135919756, + "loss": 0.1029, "step": 16160 }, { - "epoch": 0.17, - "learning_rate": 0.000273765331948861, - "loss": 0.0858, + "epoch": 0.1, + "learning_rate": 0.00028434525000484064, + "loss": 0.0899, "step": 16170 }, { - "epoch": 0.18, - "learning_rate": 0.000273749107664352, - "loss": 0.0905, + "epoch": 0.1, + "learning_rate": 0.0002843355686504837, + "loss": 0.1038, "step": 16180 }, { - "epoch": 0.18, - "learning_rate": 0.0002737328833798429, - "loss": 0.0831, + "epoch": 0.1, + "learning_rate": 0.00028432588729612675, + "loss": 0.0971, "step": 16190 }, { - "epoch": 0.18, - "learning_rate": 0.00027371665909533383, - "loss": 0.098, + "epoch": 0.1, + "learning_rate": 0.00028431620594176983, + "loss": 0.111, "step": 16200 }, { - "epoch": 0.18, - "learning_rate": 0.0002737004348108248, - "loss": 0.088, + "epoch": 0.1, + "learning_rate": 0.0002843065245874129, + "loss": 0.0914, "step": 16210 }, { - "epoch": 0.18, - "learning_rate": 0.00027368421052631573, - "loss": 0.0832, + "epoch": 0.1, + "learning_rate": 0.000284296843233056, + "loss": 0.0933, "step": 16220 }, { - "epoch": 0.18, - "learning_rate": 0.0002736679862418067, - "loss": 0.0864, + "epoch": 0.1, + "learning_rate": 0.00028428716187869907, + "loss": 0.0908, "step": 16230 }, { - "epoch": 0.18, - "learning_rate": 0.00027365176195729763, - "loss": 0.0843, + "epoch": 0.1, + "learning_rate": 0.00028427748052434215, + "loss": 0.0858, "step": 16240 }, { - "epoch": 0.18, - "learning_rate": 0.0002736355376727886, - "loss": 0.0817, + "epoch": 0.1, + "learning_rate": 0.00028426779916998523, + "loss": 0.0952, "step": 16250 }, { - "epoch": 0.18, - "learning_rate": 0.00027361931338827953, - "loss": 0.0913, + "epoch": 0.1, + "learning_rate": 0.00028425811781562825, + "loss": 0.089, "step": 16260 }, { - "epoch": 0.18, - "learning_rate": 0.0002736030891037705, - "loss": 0.0863, + "epoch": 0.11, + "learning_rate": 0.00028424843646127133, + "loss": 0.0954, "step": 16270 }, { - "epoch": 0.18, - "learning_rate": 0.00027358686481926143, - "loss": 0.0874, + "epoch": 0.11, + "learning_rate": 0.0002842387551069144, + "loss": 0.0928, "step": 16280 }, { - "epoch": 0.18, - "learning_rate": 0.0002735706405347524, - "loss": 0.0858, + "epoch": 0.11, + "learning_rate": 0.0002842290737525575, + "loss": 0.0905, "step": 16290 }, { - "epoch": 0.18, - "learning_rate": 0.00027355441625024333, - "loss": 0.0769, + "epoch": 0.11, + "learning_rate": 0.0002842193923982005, + "loss": 0.1, "step": 16300 }, { - "epoch": 0.18, - "learning_rate": 0.0002735381919657343, - "loss": 0.0884, + "epoch": 0.11, + "learning_rate": 0.0002842097110438436, + "loss": 0.0976, "step": 16310 }, { - "epoch": 0.18, - "learning_rate": 0.00027352196768122523, - "loss": 0.0808, + "epoch": 0.11, + "learning_rate": 0.0002842000296894867, + "loss": 0.0956, "step": 16320 }, { - "epoch": 0.18, - "learning_rate": 0.0002735057433967162, - "loss": 0.0812, + "epoch": 0.11, + "learning_rate": 0.0002841903483351297, + "loss": 0.1034, "step": 16330 }, { - "epoch": 0.18, - "learning_rate": 0.00027348951911220713, - "loss": 0.082, + "epoch": 0.11, + "learning_rate": 0.0002841806669807728, + "loss": 0.0926, "step": 16340 }, { - "epoch": 0.18, - "learning_rate": 0.00027347329482769805, - "loss": 0.0843, + "epoch": 0.11, + "learning_rate": 0.00028417098562641586, + "loss": 0.102, "step": 16350 }, { - "epoch": 0.18, - "learning_rate": 0.00027345707054318903, - "loss": 0.0783, + "epoch": 0.11, + "learning_rate": 0.00028416130427205894, + "loss": 0.0967, "step": 16360 }, { - "epoch": 0.18, - "learning_rate": 0.00027344084625867995, - "loss": 0.0893, + "epoch": 0.11, + "learning_rate": 0.000284151622917702, + "loss": 0.0974, "step": 16370 }, { - "epoch": 0.18, - "learning_rate": 0.0002734246219741709, - "loss": 0.0849, + "epoch": 0.11, + "learning_rate": 0.0002841419415633451, + "loss": 0.0878, "step": 16380 }, { - "epoch": 0.18, - "learning_rate": 0.00027340839768966185, - "loss": 0.0844, + "epoch": 0.11, + "learning_rate": 0.0002841322602089882, + "loss": 0.0982, "step": 16390 }, { - "epoch": 0.18, - "learning_rate": 0.0002733921734051528, - "loss": 0.0831, + "epoch": 0.11, + "learning_rate": 0.0002841225788546312, + "loss": 0.0962, "step": 16400 }, { - "epoch": 0.18, - "learning_rate": 0.00027337594912064375, - "loss": 0.0858, + "epoch": 0.11, + "learning_rate": 0.0002841128975002743, + "loss": 0.0977, "step": 16410 }, { - "epoch": 0.18, - "learning_rate": 0.00027335972483613467, - "loss": 0.0789, + "epoch": 0.11, + "learning_rate": 0.00028410321614591737, + "loss": 0.0946, "step": 16420 }, { - "epoch": 0.18, - "learning_rate": 0.00027334350055162565, - "loss": 0.0707, + "epoch": 0.11, + "learning_rate": 0.0002840935347915604, + "loss": 0.1005, "step": 16430 }, { - "epoch": 0.18, - "learning_rate": 0.0002733272762671166, - "loss": 0.0818, + "epoch": 0.11, + "learning_rate": 0.0002840838534372035, + "loss": 0.0946, "step": 16440 }, { - "epoch": 0.18, - "learning_rate": 0.00027331105198260755, - "loss": 0.0765, + "epoch": 0.11, + "learning_rate": 0.00028407417208284655, + "loss": 0.1006, "step": 16450 }, { - "epoch": 0.18, - "learning_rate": 0.0002732948276980985, - "loss": 0.0836, + "epoch": 0.11, + "learning_rate": 0.00028406449072848963, + "loss": 0.1001, "step": 16460 }, { - "epoch": 0.18, - "learning_rate": 0.00027327860341358945, - "loss": 0.0802, + "epoch": 0.11, + "learning_rate": 0.00028405480937413266, + "loss": 0.099, "step": 16470 }, { - "epoch": 0.18, - "learning_rate": 0.0002732623791290804, - "loss": 0.0945, + "epoch": 0.11, + "learning_rate": 0.00028404512801977574, + "loss": 0.094, "step": 16480 }, { - "epoch": 0.18, - "learning_rate": 0.00027324615484457135, - "loss": 0.0826, + "epoch": 0.11, + "learning_rate": 0.0002840354466654188, + "loss": 0.0894, "step": 16490 }, { - "epoch": 0.18, - "learning_rate": 0.00027322993056006227, - "loss": 0.0798, + "epoch": 0.11, + "learning_rate": 0.0002840257653110619, + "loss": 0.0975, "step": 16500 }, { - "epoch": 0.18, - "learning_rate": 0.00027321370627555325, - "loss": 0.0963, + "epoch": 0.11, + "learning_rate": 0.000284016083956705, + "loss": 0.0951, "step": 16510 }, { - "epoch": 0.18, - "learning_rate": 0.00027319748199104417, - "loss": 0.0834, + "epoch": 0.11, + "learning_rate": 0.00028400640260234806, + "loss": 0.0971, "step": 16520 }, { - "epoch": 0.18, - "learning_rate": 0.0002731812577065351, - "loss": 0.0883, + "epoch": 0.11, + "learning_rate": 0.00028399672124799114, + "loss": 0.0979, "step": 16530 }, { - "epoch": 0.18, - "learning_rate": 0.00027316503342202607, - "loss": 0.0924, + "epoch": 0.11, + "learning_rate": 0.00028398703989363416, + "loss": 0.0917, "step": 16540 }, { - "epoch": 0.18, - "learning_rate": 0.000273148809137517, - "loss": 0.0785, + "epoch": 0.11, + "learning_rate": 0.00028397735853927724, + "loss": 0.0933, "step": 16550 }, { - "epoch": 0.18, - "learning_rate": 0.00027313258485300797, - "loss": 0.0859, + "epoch": 0.11, + "learning_rate": 0.00028396767718492027, + "loss": 0.0916, "step": 16560 }, { - "epoch": 0.18, - "learning_rate": 0.0002731163605684989, - "loss": 0.0902, + "epoch": 0.11, + "learning_rate": 0.00028395799583056335, + "loss": 0.0933, "step": 16570 }, { - "epoch": 0.18, - "learning_rate": 0.00027310013628398987, - "loss": 0.09, + "epoch": 0.11, + "learning_rate": 0.00028394831447620643, + "loss": 0.1018, "step": 16580 }, { - "epoch": 0.18, - "learning_rate": 0.0002730839119994808, - "loss": 0.0858, + "epoch": 0.11, + "learning_rate": 0.0002839386331218495, + "loss": 0.0857, "step": 16590 }, { - "epoch": 0.18, - "learning_rate": 0.00027306768771497177, - "loss": 0.0908, + "epoch": 0.11, + "learning_rate": 0.0002839289517674926, + "loss": 0.0895, "step": 16600 }, { - "epoch": 0.18, - "learning_rate": 0.0002730514634304627, - "loss": 0.0912, + "epoch": 0.11, + "learning_rate": 0.0002839192704131356, + "loss": 0.0986, "step": 16610 }, { - "epoch": 0.18, - "learning_rate": 0.00027303523914595367, - "loss": 0.0878, + "epoch": 0.11, + "learning_rate": 0.0002839095890587787, + "loss": 0.0917, "step": 16620 }, { - "epoch": 0.18, - "learning_rate": 0.0002730190148614446, - "loss": 0.0884, + "epoch": 0.11, + "learning_rate": 0.00028389990770442177, + "loss": 0.0929, "step": 16630 }, { - "epoch": 0.18, - "learning_rate": 0.00027300279057693557, - "loss": 0.0851, + "epoch": 0.11, + "learning_rate": 0.00028389022635006485, + "loss": 0.0973, "step": 16640 }, { - "epoch": 0.18, - "learning_rate": 0.0002729865662924265, - "loss": 0.0772, + "epoch": 0.11, + "learning_rate": 0.00028388054499570793, + "loss": 0.0982, "step": 16650 }, { - "epoch": 0.18, - "learning_rate": 0.00027297034200791747, - "loss": 0.0799, + "epoch": 0.11, + "learning_rate": 0.000283870863641351, + "loss": 0.1178, "step": 16660 }, { - "epoch": 0.18, - "learning_rate": 0.0002729541177234084, - "loss": 0.0876, + "epoch": 0.11, + "learning_rate": 0.00028386118228699404, + "loss": 0.094, "step": 16670 }, { - "epoch": 0.18, - "learning_rate": 0.0002729378934388993, - "loss": 0.0866, + "epoch": 0.11, + "learning_rate": 0.0002838515009326371, + "loss": 0.0945, "step": 16680 }, { - "epoch": 0.18, - "learning_rate": 0.0002729216691543903, - "loss": 0.0835, + "epoch": 0.11, + "learning_rate": 0.0002838418195782802, + "loss": 0.1011, "step": 16690 }, { - "epoch": 0.18, - "learning_rate": 0.0002729054448698812, - "loss": 0.0943, + "epoch": 0.11, + "learning_rate": 0.0002838321382239232, + "loss": 0.1004, "step": 16700 }, { - "epoch": 0.18, - "learning_rate": 0.00027288922058537213, - "loss": 0.0843, + "epoch": 0.11, + "learning_rate": 0.0002838224568695663, + "loss": 0.0913, "step": 16710 }, { - "epoch": 0.18, - "learning_rate": 0.0002728729963008631, - "loss": 0.0888, + "epoch": 0.11, + "learning_rate": 0.0002838127755152094, + "loss": 0.1008, "step": 16720 }, { - "epoch": 0.18, - "learning_rate": 0.00027285677201635403, - "loss": 0.0936, + "epoch": 0.11, + "learning_rate": 0.00028380309416085246, + "loss": 0.1036, "step": 16730 }, { - "epoch": 0.18, - "learning_rate": 0.000272840547731845, - "loss": 0.0931, + "epoch": 0.11, + "learning_rate": 0.00028379341280649554, + "loss": 0.0951, "step": 16740 }, { - "epoch": 0.18, - "learning_rate": 0.00027282432344733593, - "loss": 0.082, + "epoch": 0.11, + "learning_rate": 0.00028378373145213857, + "loss": 0.1009, "step": 16750 }, { - "epoch": 0.18, - "learning_rate": 0.0002728080991628269, - "loss": 0.0804, + "epoch": 0.11, + "learning_rate": 0.00028377405009778165, + "loss": 0.0869, "step": 16760 }, { - "epoch": 0.18, - "learning_rate": 0.00027279187487831783, - "loss": 0.0873, + "epoch": 0.11, + "learning_rate": 0.0002837643687434247, + "loss": 0.0986, "step": 16770 }, { - "epoch": 0.18, - "learning_rate": 0.0002727756505938088, - "loss": 0.0888, + "epoch": 0.11, + "learning_rate": 0.0002837546873890678, + "loss": 0.0959, "step": 16780 }, { - "epoch": 0.18, - "learning_rate": 0.00027275942630929973, - "loss": 0.0806, + "epoch": 0.11, + "learning_rate": 0.0002837450060347109, + "loss": 0.0997, "step": 16790 }, { - "epoch": 0.18, - "learning_rate": 0.0002727432020247907, - "loss": 0.0851, + "epoch": 0.11, + "learning_rate": 0.0002837353246803539, + "loss": 0.0886, "step": 16800 }, { - "epoch": 0.18, - "learning_rate": 0.00027272697774028163, - "loss": 0.0846, + "epoch": 0.11, + "learning_rate": 0.000283725643325997, + "loss": 0.0863, "step": 16810 }, { - "epoch": 0.18, - "learning_rate": 0.0002727107534557726, - "loss": 0.0833, + "epoch": 0.11, + "learning_rate": 0.00028371596197164007, + "loss": 0.095, "step": 16820 }, { - "epoch": 0.18, - "learning_rate": 0.00027269452917126353, - "loss": 0.083, + "epoch": 0.11, + "learning_rate": 0.0002837062806172831, + "loss": 0.085, "step": 16830 }, { - "epoch": 0.18, - "learning_rate": 0.0002726783048867545, - "loss": 0.0862, + "epoch": 0.11, + "learning_rate": 0.0002836965992629262, + "loss": 0.0993, "step": 16840 }, { - "epoch": 0.18, - "learning_rate": 0.00027266208060224543, - "loss": 0.0827, + "epoch": 0.11, + "learning_rate": 0.00028368691790856926, + "loss": 0.0941, "step": 16850 }, { - "epoch": 0.18, - "learning_rate": 0.00027264585631773635, - "loss": 0.0831, + "epoch": 0.11, + "learning_rate": 0.00028367723655421234, + "loss": 0.0962, "step": 16860 }, { - "epoch": 0.18, - "learning_rate": 0.00027262963203322733, - "loss": 0.0835, + "epoch": 0.11, + "learning_rate": 0.0002836675551998554, + "loss": 0.099, "step": 16870 }, { - "epoch": 0.18, - "learning_rate": 0.00027261340774871825, - "loss": 0.0839, + "epoch": 0.11, + "learning_rate": 0.0002836578738454985, + "loss": 0.0865, "step": 16880 }, { - "epoch": 0.18, - "learning_rate": 0.0002725971834642092, - "loss": 0.0901, + "epoch": 0.11, + "learning_rate": 0.0002836481924911415, + "loss": 0.0984, "step": 16890 }, { - "epoch": 0.18, - "learning_rate": 0.00027258095917970015, - "loss": 0.0827, + "epoch": 0.11, + "learning_rate": 0.0002836385111367846, + "loss": 0.0927, "step": 16900 }, { - "epoch": 0.18, - "learning_rate": 0.0002725647348951911, - "loss": 0.0917, + "epoch": 0.11, + "learning_rate": 0.0002836288297824277, + "loss": 0.0898, "step": 16910 }, { - "epoch": 0.18, - "learning_rate": 0.00027254851061068205, - "loss": 0.0954, + "epoch": 0.11, + "learning_rate": 0.00028361914842807076, + "loss": 0.091, "step": 16920 }, { - "epoch": 0.18, - "learning_rate": 0.000272532286326173, - "loss": 0.087, + "epoch": 0.11, + "learning_rate": 0.00028360946707371384, + "loss": 0.0903, "step": 16930 }, { - "epoch": 0.18, - "learning_rate": 0.00027251606204166395, - "loss": 0.0893, + "epoch": 0.11, + "learning_rate": 0.00028359978571935687, + "loss": 0.0881, "step": 16940 }, { - "epoch": 0.18, - "learning_rate": 0.0002724998377571549, - "loss": 0.0942, + "epoch": 0.11, + "learning_rate": 0.00028359010436499995, + "loss": 0.0926, "step": 16950 }, { - "epoch": 0.18, - "learning_rate": 0.00027248361347264585, - "loss": 0.0891, + "epoch": 0.11, + "learning_rate": 0.00028358042301064297, + "loss": 0.0982, "step": 16960 }, { - "epoch": 0.18, - "learning_rate": 0.0002724673891881368, - "loss": 0.0878, + "epoch": 0.11, + "learning_rate": 0.00028357074165628605, + "loss": 0.0906, "step": 16970 }, { - "epoch": 0.18, - "learning_rate": 0.00027245116490362775, - "loss": 0.089, + "epoch": 0.11, + "learning_rate": 0.00028356106030192913, + "loss": 0.0915, "step": 16980 }, { - "epoch": 0.18, - "learning_rate": 0.0002724349406191187, - "loss": 0.0756, + "epoch": 0.11, + "learning_rate": 0.0002835513789475722, + "loss": 0.0924, "step": 16990 }, { - "epoch": 0.18, - "learning_rate": 0.00027241871633460965, - "loss": 0.0875, + "epoch": 0.11, + "learning_rate": 0.0002835416975932153, + "loss": 0.0949, "step": 17000 }, { - "epoch": 0.18, - "eval_cer": 0.9212735956574979, - "eval_loss": 0.05866820365190506, - "eval_runtime": 119.9281, - "eval_samples_per_second": 16.677, - "eval_steps_per_second": 4.169, + "epoch": 0.11, + "eval_cer": 0.9201943283244831, + "eval_loss": 0.06401708722114563, + "eval_runtime": 120.4041, + "eval_samples_per_second": 16.611, + "eval_steps_per_second": 4.153, "step": 17000 }, { - "epoch": 0.18, - "learning_rate": 0.0002724024920501006, - "loss": 0.0736, + "epoch": 0.11, + "learning_rate": 0.00028353201623885837, + "loss": 0.1014, "step": 17010 }, { - "epoch": 0.18, - "learning_rate": 0.00027238626776559155, - "loss": 0.0832, + "epoch": 0.11, + "learning_rate": 0.00028352233488450145, + "loss": 0.0924, "step": 17020 }, { - "epoch": 0.18, - "learning_rate": 0.0002723700434810825, - "loss": 0.0712, + "epoch": 0.11, + "learning_rate": 0.0002835126535301445, + "loss": 0.0964, "step": 17030 }, { - "epoch": 0.18, - "learning_rate": 0.0002723538191965734, - "loss": 0.092, + "epoch": 0.11, + "learning_rate": 0.00028350297217578756, + "loss": 0.0907, "step": 17040 }, { - "epoch": 0.18, - "learning_rate": 0.00027233759491206437, - "loss": 0.0879, + "epoch": 0.11, + "learning_rate": 0.00028349329082143064, + "loss": 0.1097, "step": 17050 }, { - "epoch": 0.18, - "learning_rate": 0.0002723213706275553, - "loss": 0.0869, + "epoch": 0.11, + "learning_rate": 0.0002834836094670737, + "loss": 0.0916, "step": 17060 }, { - "epoch": 0.18, - "learning_rate": 0.0002723051463430462, - "loss": 0.0783, + "epoch": 0.11, + "learning_rate": 0.00028347392811271674, + "loss": 0.0922, "step": 17070 }, { - "epoch": 0.18, - "learning_rate": 0.0002722889220585372, - "loss": 0.0812, + "epoch": 0.11, + "learning_rate": 0.0002834642467583598, + "loss": 0.0875, "step": 17080 }, { - "epoch": 0.18, - "learning_rate": 0.0002722726977740281, - "loss": 0.0955, + "epoch": 0.11, + "learning_rate": 0.0002834545654040029, + "loss": 0.0863, "step": 17090 }, { - "epoch": 0.18, - "learning_rate": 0.0002722564734895191, - "loss": 0.0858, + "epoch": 0.11, + "learning_rate": 0.0002834448840496459, + "loss": 0.1121, "step": 17100 }, { - "epoch": 0.19, - "learning_rate": 0.00027224024920501, - "loss": 0.0829, + "epoch": 0.11, + "learning_rate": 0.000283435202695289, + "loss": 0.0921, "step": 17110 }, { - "epoch": 0.19, - "learning_rate": 0.000272224024920501, - "loss": 0.0859, + "epoch": 0.11, + "learning_rate": 0.0002834255213409321, + "loss": 0.0899, "step": 17120 }, { - "epoch": 0.19, - "learning_rate": 0.0002722078006359919, - "loss": 0.0855, + "epoch": 0.11, + "learning_rate": 0.00028341583998657517, + "loss": 0.0917, "step": 17130 }, { - "epoch": 0.19, - "learning_rate": 0.0002721915763514829, - "loss": 0.0893, + "epoch": 0.11, + "learning_rate": 0.00028340615863221825, + "loss": 0.092, "step": 17140 }, { - "epoch": 0.19, - "learning_rate": 0.0002721753520669738, - "loss": 0.0886, + "epoch": 0.11, + "learning_rate": 0.0002833964772778613, + "loss": 0.0889, "step": 17150 }, { - "epoch": 0.19, - "learning_rate": 0.0002721591277824648, - "loss": 0.0813, + "epoch": 0.11, + "learning_rate": 0.0002833867959235044, + "loss": 0.0928, "step": 17160 }, { - "epoch": 0.19, - "learning_rate": 0.0002721429034979557, - "loss": 0.0995, + "epoch": 0.11, + "learning_rate": 0.00028337711456914743, + "loss": 0.0906, "step": 17170 }, { - "epoch": 0.19, - "learning_rate": 0.0002721266792134467, - "loss": 0.0892, + "epoch": 0.11, + "learning_rate": 0.0002833674332147905, + "loss": 0.0987, "step": 17180 }, { - "epoch": 0.19, - "learning_rate": 0.0002721104549289376, - "loss": 0.0879, + "epoch": 0.11, + "learning_rate": 0.0002833577518604336, + "loss": 0.0935, "step": 17190 }, { - "epoch": 0.19, - "learning_rate": 0.0002720942306444286, - "loss": 0.0851, + "epoch": 0.11, + "learning_rate": 0.0002833480705060766, + "loss": 0.1067, "step": 17200 }, { - "epoch": 0.19, - "learning_rate": 0.0002720780063599195, - "loss": 0.0859, + "epoch": 0.11, + "learning_rate": 0.0002833383891517197, + "loss": 0.0941, "step": 17210 }, { - "epoch": 0.19, - "learning_rate": 0.00027206178207541044, - "loss": 0.0853, + "epoch": 0.11, + "learning_rate": 0.0002833287077973628, + "loss": 0.0891, "step": 17220 }, { - "epoch": 0.19, - "learning_rate": 0.0002720455577909014, - "loss": 0.0845, + "epoch": 0.11, + "learning_rate": 0.0002833190264430058, + "loss": 0.0937, "step": 17230 }, { - "epoch": 0.19, - "learning_rate": 0.00027202933350639234, - "loss": 0.0964, + "epoch": 0.11, + "learning_rate": 0.0002833093450886489, + "loss": 0.1014, "step": 17240 }, { - "epoch": 0.19, - "learning_rate": 0.00027201310922188326, - "loss": 0.0858, + "epoch": 0.11, + "learning_rate": 0.00028329966373429196, + "loss": 0.0965, "step": 17250 }, { - "epoch": 0.19, - "learning_rate": 0.00027199688493737424, - "loss": 0.0865, + "epoch": 0.11, + "learning_rate": 0.00028328998237993504, + "loss": 0.0962, "step": 17260 }, { - "epoch": 0.19, - "learning_rate": 0.00027198066065286516, - "loss": 0.0876, + "epoch": 0.11, + "learning_rate": 0.0002832803010255781, + "loss": 0.1005, "step": 17270 }, { - "epoch": 0.19, - "learning_rate": 0.00027196443636835614, - "loss": 0.0833, + "epoch": 0.11, + "learning_rate": 0.0002832706196712212, + "loss": 0.0978, "step": 17280 }, { - "epoch": 0.19, - "learning_rate": 0.00027194821208384706, - "loss": 0.0977, + "epoch": 0.11, + "learning_rate": 0.0002832609383168643, + "loss": 0.099, "step": 17290 }, { - "epoch": 0.19, - "learning_rate": 0.00027193198779933804, - "loss": 0.0904, + "epoch": 0.11, + "learning_rate": 0.0002832512569625073, + "loss": 0.0997, "step": 17300 }, { - "epoch": 0.19, - "learning_rate": 0.00027191576351482896, - "loss": 0.0912, + "epoch": 0.11, + "learning_rate": 0.0002832415756081504, + "loss": 0.0924, "step": 17310 }, { - "epoch": 0.19, - "learning_rate": 0.00027189953923031993, - "loss": 0.089, + "epoch": 0.11, + "learning_rate": 0.00028323189425379346, + "loss": 0.0928, "step": 17320 }, { - "epoch": 0.19, - "learning_rate": 0.00027188331494581086, - "loss": 0.0984, + "epoch": 0.11, + "learning_rate": 0.00028322221289943654, + "loss": 0.0959, "step": 17330 }, { - "epoch": 0.19, - "learning_rate": 0.00027186709066130183, - "loss": 0.0859, + "epoch": 0.11, + "learning_rate": 0.00028321253154507957, + "loss": 0.0911, "step": 17340 }, { - "epoch": 0.19, - "learning_rate": 0.00027185086637679276, - "loss": 0.0783, + "epoch": 0.11, + "learning_rate": 0.00028320285019072265, + "loss": 0.1007, "step": 17350 }, { - "epoch": 0.19, - "learning_rate": 0.00027183464209228373, - "loss": 0.0956, + "epoch": 0.11, + "learning_rate": 0.00028319316883636573, + "loss": 0.0861, "step": 17360 }, { - "epoch": 0.19, - "learning_rate": 0.00027181841780777466, - "loss": 0.0877, + "epoch": 0.11, + "learning_rate": 0.00028318348748200876, + "loss": 0.0894, "step": 17370 }, { - "epoch": 0.19, - "learning_rate": 0.00027180219352326563, - "loss": 0.0843, + "epoch": 0.11, + "learning_rate": 0.00028317380612765183, + "loss": 0.0874, "step": 17380 }, { - "epoch": 0.19, - "learning_rate": 0.00027178596923875656, - "loss": 0.0786, + "epoch": 0.11, + "learning_rate": 0.0002831641247732949, + "loss": 0.1041, "step": 17390 }, { - "epoch": 0.19, - "learning_rate": 0.0002717697449542475, - "loss": 0.0852, + "epoch": 0.11, + "learning_rate": 0.000283154443418938, + "loss": 0.0932, "step": 17400 }, { - "epoch": 0.19, - "learning_rate": 0.00027175352066973846, - "loss": 0.0811, + "epoch": 0.11, + "learning_rate": 0.0002831447620645811, + "loss": 0.0876, "step": 17410 }, { - "epoch": 0.19, - "learning_rate": 0.0002717372963852294, - "loss": 0.0789, + "epoch": 0.11, + "learning_rate": 0.00028313508071022415, + "loss": 0.0971, "step": 17420 }, { - "epoch": 0.19, - "learning_rate": 0.0002717210721007203, - "loss": 0.0799, + "epoch": 0.11, + "learning_rate": 0.00028312539935586723, + "loss": 0.0878, "step": 17430 }, { - "epoch": 0.19, - "learning_rate": 0.0002717048478162113, + "epoch": 0.11, + "learning_rate": 0.00028311571800151026, "loss": 0.0911, "step": 17440 }, { - "epoch": 0.19, - "learning_rate": 0.0002716886235317022, - "loss": 0.087, + "epoch": 0.11, + "learning_rate": 0.00028310603664715334, + "loss": 0.0871, "step": 17450 }, { - "epoch": 0.19, - "learning_rate": 0.0002716723992471932, - "loss": 0.0806, + "epoch": 0.11, + "learning_rate": 0.0002830963552927964, + "loss": 0.0888, "step": 17460 }, { - "epoch": 0.19, - "learning_rate": 0.0002716561749626841, - "loss": 0.0774, + "epoch": 0.11, + "learning_rate": 0.00028308667393843944, + "loss": 0.0856, "step": 17470 }, { - "epoch": 0.19, - "learning_rate": 0.0002716399506781751, - "loss": 0.0854, + "epoch": 0.11, + "learning_rate": 0.0002830769925840825, + "loss": 0.0913, "step": 17480 }, { - "epoch": 0.19, - "learning_rate": 0.000271623726393666, - "loss": 0.0761, + "epoch": 0.11, + "learning_rate": 0.0002830673112297256, + "loss": 0.0973, "step": 17490 }, { - "epoch": 0.19, - "learning_rate": 0.000271607502109157, - "loss": 0.0781, + "epoch": 0.11, + "learning_rate": 0.0002830576298753687, + "loss": 0.0857, "step": 17500 }, { - "epoch": 0.19, - "learning_rate": 0.0002715912778246479, - "loss": 0.0777, + "epoch": 0.11, + "learning_rate": 0.0002830479485210117, + "loss": 0.1043, "step": 17510 }, { - "epoch": 0.19, - "learning_rate": 0.0002715750535401389, - "loss": 0.082, + "epoch": 0.11, + "learning_rate": 0.0002830382671666548, + "loss": 0.0951, "step": 17520 }, { - "epoch": 0.19, - "learning_rate": 0.0002715588292556298, - "loss": 0.0859, + "epoch": 0.11, + "learning_rate": 0.00028302858581229787, + "loss": 0.1021, "step": 17530 }, { - "epoch": 0.19, - "learning_rate": 0.0002715426049711208, - "loss": 0.0875, + "epoch": 0.11, + "learning_rate": 0.00028301890445794095, + "loss": 0.0907, "step": 17540 }, { - "epoch": 0.19, - "learning_rate": 0.0002715263806866117, - "loss": 0.0868, + "epoch": 0.11, + "learning_rate": 0.00028300922310358403, + "loss": 0.0894, "step": 17550 }, { - "epoch": 0.19, - "learning_rate": 0.0002715101564021027, - "loss": 0.0794, + "epoch": 0.11, + "learning_rate": 0.0002829995417492271, + "loss": 0.1018, "step": 17560 }, { - "epoch": 0.19, - "learning_rate": 0.0002714939321175936, - "loss": 0.0943, + "epoch": 0.11, + "learning_rate": 0.00028298986039487013, + "loss": 0.0914, "step": 17570 }, { - "epoch": 0.19, - "learning_rate": 0.0002714777078330845, - "loss": 0.0904, + "epoch": 0.11, + "learning_rate": 0.0002829801790405132, + "loss": 0.0827, "step": 17580 }, { - "epoch": 0.19, - "learning_rate": 0.0002714614835485755, - "loss": 0.0911, + "epoch": 0.11, + "learning_rate": 0.0002829704976861563, + "loss": 0.1096, "step": 17590 }, { - "epoch": 0.19, - "learning_rate": 0.0002714452592640664, - "loss": 0.0902, + "epoch": 0.11, + "learning_rate": 0.0002829608163317993, + "loss": 0.1036, "step": 17600 }, { - "epoch": 0.19, - "learning_rate": 0.00027142903497955734, - "loss": 0.0915, + "epoch": 0.11, + "learning_rate": 0.0002829511349774424, + "loss": 0.1066, "step": 17610 }, { - "epoch": 0.19, - "learning_rate": 0.0002714128106950483, - "loss": 0.0863, + "epoch": 0.11, + "learning_rate": 0.0002829414536230855, + "loss": 0.0907, "step": 17620 }, { - "epoch": 0.19, - "learning_rate": 0.00027139658641053924, - "loss": 0.0789, + "epoch": 0.11, + "learning_rate": 0.00028293177226872856, + "loss": 0.0906, "step": 17630 }, { - "epoch": 0.19, - "learning_rate": 0.0002713803621260302, - "loss": 0.0766, + "epoch": 0.11, + "learning_rate": 0.00028292209091437164, + "loss": 0.0943, "step": 17640 }, { - "epoch": 0.19, - "learning_rate": 0.00027136413784152114, - "loss": 0.0813, + "epoch": 0.11, + "learning_rate": 0.00028291240956001466, + "loss": 0.0983, "step": 17650 }, { - "epoch": 0.19, - "learning_rate": 0.0002713479135570121, - "loss": 0.081, + "epoch": 0.11, + "learning_rate": 0.00028290272820565774, + "loss": 0.1, "step": 17660 }, { - "epoch": 0.19, - "learning_rate": 0.00027133168927250304, - "loss": 0.0783, + "epoch": 0.11, + "learning_rate": 0.0002828930468513008, + "loss": 0.0911, "step": 17670 }, { - "epoch": 0.19, - "learning_rate": 0.000271315464987994, - "loss": 0.0812, + "epoch": 0.11, + "learning_rate": 0.0002828833654969439, + "loss": 0.0865, "step": 17680 }, { - "epoch": 0.19, - "learning_rate": 0.00027129924070348494, - "loss": 0.0886, + "epoch": 0.11, + "learning_rate": 0.000282873684142587, + "loss": 0.0978, "step": 17690 }, { - "epoch": 0.19, - "learning_rate": 0.0002712830164189759, - "loss": 0.0758, + "epoch": 0.11, + "learning_rate": 0.00028286400278823006, + "loss": 0.0998, "step": 17700 }, { - "epoch": 0.19, - "learning_rate": 0.00027126679213446684, - "loss": 0.0801, + "epoch": 0.11, + "learning_rate": 0.0002828543214338731, + "loss": 0.0952, "step": 17710 }, { - "epoch": 0.19, - "learning_rate": 0.0002712505678499578, - "loss": 0.0862, + "epoch": 0.11, + "learning_rate": 0.00028284464007951617, + "loss": 0.0994, "step": 17720 }, { - "epoch": 0.19, - "learning_rate": 0.00027123434356544874, - "loss": 0.0839, + "epoch": 0.11, + "learning_rate": 0.00028283495872515925, + "loss": 0.0895, "step": 17730 }, { - "epoch": 0.19, - "learning_rate": 0.0002712181192809397, - "loss": 0.0905, + "epoch": 0.11, + "learning_rate": 0.0002828252773708023, + "loss": 0.0916, "step": 17740 }, { - "epoch": 0.19, - "learning_rate": 0.00027120189499643064, - "loss": 0.0941, + "epoch": 0.11, + "learning_rate": 0.00028281559601644535, + "loss": 0.0995, "step": 17750 }, { - "epoch": 0.19, - "learning_rate": 0.00027118567071192156, - "loss": 0.0797, + "epoch": 0.11, + "learning_rate": 0.00028280591466208843, + "loss": 0.0827, "step": 17760 }, { - "epoch": 0.19, - "learning_rate": 0.00027116944642741254, - "loss": 0.086, + "epoch": 0.11, + "learning_rate": 0.0002827962333077315, + "loss": 0.0811, "step": 17770 }, { - "epoch": 0.19, - "learning_rate": 0.00027115322214290346, - "loss": 0.0871, + "epoch": 0.11, + "learning_rate": 0.0002827865519533746, + "loss": 0.0821, "step": 17780 }, { - "epoch": 0.19, - "learning_rate": 0.0002711369978583944, + "epoch": 0.11, + "learning_rate": 0.0002827768705990176, "loss": 0.0881, "step": 17790 }, { - "epoch": 0.19, - "learning_rate": 0.00027112077357388536, - "loss": 0.0879, + "epoch": 0.11, + "learning_rate": 0.0002827671892446607, + "loss": 0.0891, "step": 17800 }, { - "epoch": 0.19, - "learning_rate": 0.0002711045492893763, - "loss": 0.0789, + "epoch": 0.11, + "learning_rate": 0.0002827575078903038, + "loss": 0.0851, "step": 17810 }, { - "epoch": 0.19, - "learning_rate": 0.00027108832500486726, - "loss": 0.0805, + "epoch": 0.12, + "learning_rate": 0.00028274782653594686, + "loss": 0.0837, "step": 17820 }, { - "epoch": 0.19, - "learning_rate": 0.0002710721007203582, - "loss": 0.0745, + "epoch": 0.12, + "learning_rate": 0.00028273814518158994, + "loss": 0.0888, "step": 17830 }, { - "epoch": 0.19, - "learning_rate": 0.00027105587643584916, - "loss": 0.0872, + "epoch": 0.12, + "learning_rate": 0.00028272846382723296, + "loss": 0.0865, "step": 17840 }, { - "epoch": 0.19, - "learning_rate": 0.0002710396521513401, - "loss": 0.0826, + "epoch": 0.12, + "learning_rate": 0.00028271878247287604, + "loss": 0.0865, "step": 17850 }, { - "epoch": 0.19, - "learning_rate": 0.00027102342786683106, - "loss": 0.0863, + "epoch": 0.12, + "learning_rate": 0.0002827091011185191, + "loss": 0.0948, "step": 17860 }, { - "epoch": 0.19, - "learning_rate": 0.000271007203582322, - "loss": 0.0822, + "epoch": 0.12, + "learning_rate": 0.00028269941976416215, + "loss": 0.0955, "step": 17870 }, { - "epoch": 0.19, - "learning_rate": 0.00027099097929781296, - "loss": 0.0818, + "epoch": 0.12, + "learning_rate": 0.00028268973840980523, + "loss": 0.0923, "step": 17880 }, { - "epoch": 0.19, - "learning_rate": 0.0002709747550133039, - "loss": 0.0828, + "epoch": 0.12, + "learning_rate": 0.0002826800570554483, + "loss": 0.0914, "step": 17890 }, { - "epoch": 0.19, - "learning_rate": 0.00027095853072879486, - "loss": 0.0899, + "epoch": 0.12, + "learning_rate": 0.0002826703757010914, + "loss": 0.095, "step": 17900 }, { - "epoch": 0.19, - "learning_rate": 0.0002709423064442858, - "loss": 0.0928, + "epoch": 0.12, + "learning_rate": 0.00028266069434673447, + "loss": 0.0963, "step": 17910 }, { - "epoch": 0.19, - "learning_rate": 0.00027092608215977676, - "loss": 0.086, + "epoch": 0.12, + "learning_rate": 0.00028265101299237755, + "loss": 0.0986, "step": 17920 }, { - "epoch": 0.19, - "learning_rate": 0.0002709098578752677, - "loss": 0.0733, + "epoch": 0.12, + "learning_rate": 0.0002826413316380206, + "loss": 0.105, "step": 17930 }, { - "epoch": 0.19, - "learning_rate": 0.0002708936335907586, - "loss": 0.0885, + "epoch": 0.12, + "learning_rate": 0.00028263165028366365, + "loss": 0.0948, "step": 17940 }, { - "epoch": 0.19, - "learning_rate": 0.0002708774093062496, - "loss": 0.0862, + "epoch": 0.12, + "learning_rate": 0.00028262196892930673, + "loss": 0.1032, "step": 17950 }, { - "epoch": 0.19, - "learning_rate": 0.0002708611850217405, - "loss": 0.1001, + "epoch": 0.12, + "learning_rate": 0.0002826122875749498, + "loss": 0.0888, "step": 17960 }, { - "epoch": 0.19, - "learning_rate": 0.0002708449607372315, - "loss": 0.0904, + "epoch": 0.12, + "learning_rate": 0.00028260260622059284, + "loss": 0.1002, "step": 17970 }, { - "epoch": 0.19, - "learning_rate": 0.0002708287364527224, - "loss": 0.0926, + "epoch": 0.12, + "learning_rate": 0.0002825929248662359, + "loss": 0.0967, "step": 17980 }, { - "epoch": 0.19, - "learning_rate": 0.0002708125121682133, - "loss": 0.0842, + "epoch": 0.12, + "learning_rate": 0.000282583243511879, + "loss": 0.0935, "step": 17990 }, { - "epoch": 0.19, - "learning_rate": 0.0002707962878837043, - "loss": 0.0879, + "epoch": 0.12, + "learning_rate": 0.000282573562157522, + "loss": 0.1026, "step": 18000 }, { - "epoch": 0.19, - "eval_cer": 0.92140788527426, - "eval_loss": 0.057557813823223114, - "eval_runtime": 119.6241, - "eval_samples_per_second": 16.719, - "eval_steps_per_second": 4.18, + "epoch": 0.12, + "eval_cer": 0.9202557903061801, + "eval_loss": 0.06353824585676193, + "eval_runtime": 120.4302, + "eval_samples_per_second": 16.607, + "eval_steps_per_second": 4.152, "step": 18000 }, { - "epoch": 0.19, - "learning_rate": 0.0002707800635991952, - "loss": 0.0872, + "epoch": 0.12, + "learning_rate": 0.0002825638808031651, + "loss": 0.092, "step": 18010 }, { - "epoch": 0.19, - "learning_rate": 0.0002707638393146862, - "loss": 0.0824, + "epoch": 0.12, + "learning_rate": 0.0002825541994488082, + "loss": 0.0913, "step": 18020 }, { - "epoch": 0.2, - "learning_rate": 0.0002707476150301771, - "loss": 0.0874, + "epoch": 0.12, + "learning_rate": 0.00028254451809445126, + "loss": 0.097, "step": 18030 }, { - "epoch": 0.2, - "learning_rate": 0.0002707313907456681, - "loss": 0.0929, + "epoch": 0.12, + "learning_rate": 0.00028253483674009434, + "loss": 0.1017, "step": 18040 }, { - "epoch": 0.2, - "learning_rate": 0.000270715166461159, - "loss": 0.0897, + "epoch": 0.12, + "learning_rate": 0.0002825251553857374, + "loss": 0.1009, "step": 18050 }, { - "epoch": 0.2, - "learning_rate": 0.00027069894217665, - "loss": 0.0876, + "epoch": 0.12, + "learning_rate": 0.0002825154740313805, + "loss": 0.0962, "step": 18060 }, { - "epoch": 0.2, - "learning_rate": 0.0002706827178921409, - "loss": 0.0778, + "epoch": 0.12, + "learning_rate": 0.00028250579267702353, + "loss": 0.0942, "step": 18070 }, { - "epoch": 0.2, - "learning_rate": 0.0002706664936076319, - "loss": 0.0837, + "epoch": 0.12, + "learning_rate": 0.0002824961113226666, + "loss": 0.0949, "step": 18080 }, { - "epoch": 0.2, - "learning_rate": 0.0002706502693231228, - "loss": 0.0882, + "epoch": 0.12, + "learning_rate": 0.0002824864299683097, + "loss": 0.1029, "step": 18090 }, { - "epoch": 0.2, - "learning_rate": 0.0002706340450386138, - "loss": 0.0909, + "epoch": 0.12, + "learning_rate": 0.00028247674861395277, + "loss": 0.1035, "step": 18100 }, { - "epoch": 0.2, - "learning_rate": 0.0002706178207541047, - "loss": 0.0843, + "epoch": 0.12, + "learning_rate": 0.0002824670672595958, + "loss": 0.0965, "step": 18110 }, { - "epoch": 0.2, - "learning_rate": 0.00027060159646959565, - "loss": 0.0813, + "epoch": 0.12, + "learning_rate": 0.00028245738590523887, + "loss": 0.0962, "step": 18120 }, { - "epoch": 0.2, - "learning_rate": 0.0002705853721850866, - "loss": 0.0884, + "epoch": 0.12, + "learning_rate": 0.00028244770455088195, + "loss": 0.088, "step": 18130 }, { - "epoch": 0.2, - "learning_rate": 0.00027056914790057755, - "loss": 0.0926, + "epoch": 0.12, + "learning_rate": 0.000282438023196525, + "loss": 0.0988, "step": 18140 }, { - "epoch": 0.2, - "learning_rate": 0.0002705529236160685, - "loss": 0.0878, + "epoch": 0.12, + "learning_rate": 0.00028242834184216806, + "loss": 0.0946, "step": 18150 }, { - "epoch": 0.2, - "learning_rate": 0.00027053669933155944, - "loss": 0.0821, + "epoch": 0.12, + "learning_rate": 0.00028241866048781114, + "loss": 0.0929, "step": 18160 }, { - "epoch": 0.2, - "learning_rate": 0.00027052047504705037, - "loss": 0.0835, + "epoch": 0.12, + "learning_rate": 0.0002824089791334542, + "loss": 0.09, "step": 18170 }, { - "epoch": 0.2, - "learning_rate": 0.00027050425076254134, - "loss": 0.0742, + "epoch": 0.12, + "learning_rate": 0.0002823992977790973, + "loss": 0.0985, "step": 18180 }, { - "epoch": 0.2, - "learning_rate": 0.00027048802647803227, - "loss": 0.0952, + "epoch": 0.12, + "learning_rate": 0.0002823896164247404, + "loss": 0.0932, "step": 18190 }, { - "epoch": 0.2, - "learning_rate": 0.00027047180219352324, - "loss": 0.0782, + "epoch": 0.12, + "learning_rate": 0.00028237993507038346, + "loss": 0.094, "step": 18200 }, { - "epoch": 0.2, - "learning_rate": 0.00027045557790901417, - "loss": 0.0877, + "epoch": 0.12, + "learning_rate": 0.0002823702537160265, + "loss": 0.098, "step": 18210 }, { - "epoch": 0.2, - "learning_rate": 0.00027043935362450514, - "loss": 0.0841, + "epoch": 0.12, + "learning_rate": 0.00028236057236166956, + "loss": 0.1014, "step": 18220 }, { - "epoch": 0.2, - "learning_rate": 0.00027042312933999607, - "loss": 0.093, + "epoch": 0.12, + "learning_rate": 0.00028235089100731264, + "loss": 0.096, "step": 18230 }, { - "epoch": 0.2, - "learning_rate": 0.00027040690505548704, - "loss": 0.0897, + "epoch": 0.12, + "learning_rate": 0.00028234120965295567, + "loss": 0.0929, "step": 18240 }, { - "epoch": 0.2, - "learning_rate": 0.00027039068077097797, - "loss": 0.0925, + "epoch": 0.12, + "learning_rate": 0.00028233152829859875, + "loss": 0.0936, "step": 18250 }, { - "epoch": 0.2, - "learning_rate": 0.00027037445648646894, - "loss": 0.0926, + "epoch": 0.12, + "learning_rate": 0.0002823218469442418, + "loss": 0.0903, "step": 18260 }, { - "epoch": 0.2, - "learning_rate": 0.00027035823220195987, - "loss": 0.0951, + "epoch": 0.12, + "learning_rate": 0.0002823121655898849, + "loss": 0.0991, "step": 18270 }, { - "epoch": 0.2, - "learning_rate": 0.00027034200791745084, - "loss": 0.0924, + "epoch": 0.12, + "learning_rate": 0.00028230248423552793, + "loss": 0.0946, "step": 18280 }, { - "epoch": 0.2, - "learning_rate": 0.00027032578363294176, - "loss": 0.0991, + "epoch": 0.12, + "learning_rate": 0.000282292802881171, + "loss": 0.0826, "step": 18290 }, { - "epoch": 0.2, - "learning_rate": 0.0002703095593484327, - "loss": 0.0799, + "epoch": 0.12, + "learning_rate": 0.0002822831215268141, + "loss": 0.0882, "step": 18300 }, { - "epoch": 0.2, - "learning_rate": 0.00027029333506392366, - "loss": 0.0832, + "epoch": 0.12, + "learning_rate": 0.00028227344017245717, + "loss": 0.0983, "step": 18310 }, { - "epoch": 0.2, - "learning_rate": 0.0002702771107794146, - "loss": 0.0761, + "epoch": 0.12, + "learning_rate": 0.00028226375881810025, + "loss": 0.0921, "step": 18320 }, { - "epoch": 0.2, - "learning_rate": 0.00027026088649490556, - "loss": 0.0828, + "epoch": 0.12, + "learning_rate": 0.00028225407746374333, + "loss": 0.0873, "step": 18330 }, { - "epoch": 0.2, - "learning_rate": 0.0002702446622103965, - "loss": 0.0781, + "epoch": 0.12, + "learning_rate": 0.0002822443961093864, + "loss": 0.0965, "step": 18340 }, { - "epoch": 0.2, - "learning_rate": 0.0002702284379258874, - "loss": 0.0846, + "epoch": 0.12, + "learning_rate": 0.00028223471475502944, + "loss": 0.0926, "step": 18350 }, { - "epoch": 0.2, - "learning_rate": 0.0002702122136413784, - "loss": 0.0757, + "epoch": 0.12, + "learning_rate": 0.0002822250334006725, + "loss": 0.0923, "step": 18360 }, { - "epoch": 0.2, - "learning_rate": 0.0002701959893568693, - "loss": 0.079, + "epoch": 0.12, + "learning_rate": 0.00028221535204631554, + "loss": 0.0907, "step": 18370 }, { - "epoch": 0.2, - "learning_rate": 0.0002701797650723603, - "loss": 0.0814, + "epoch": 0.12, + "learning_rate": 0.0002822056706919586, + "loss": 0.0938, "step": 18380 }, { - "epoch": 0.2, - "learning_rate": 0.0002701635407878512, - "loss": 0.0753, + "epoch": 0.12, + "learning_rate": 0.0002821959893376017, + "loss": 0.0832, "step": 18390 }, { - "epoch": 0.2, - "learning_rate": 0.0002701473165033422, - "loss": 0.088, + "epoch": 0.12, + "learning_rate": 0.0002821863079832448, + "loss": 0.09, "step": 18400 }, { - "epoch": 0.2, - "learning_rate": 0.0002701310922188331, - "loss": 0.0838, + "epoch": 0.12, + "learning_rate": 0.00028217662662888786, + "loss": 0.0877, "step": 18410 }, { - "epoch": 0.2, - "learning_rate": 0.0002701148679343241, - "loss": 0.0897, + "epoch": 0.12, + "learning_rate": 0.0002821669452745309, + "loss": 0.0963, "step": 18420 }, { - "epoch": 0.2, - "learning_rate": 0.000270098643649815, - "loss": 0.0804, + "epoch": 0.12, + "learning_rate": 0.00028215726392017397, + "loss": 0.0967, "step": 18430 }, { - "epoch": 0.2, - "learning_rate": 0.000270082419365306, - "loss": 0.0922, + "epoch": 0.12, + "learning_rate": 0.00028214758256581705, + "loss": 0.0871, "step": 18440 }, { - "epoch": 0.2, - "learning_rate": 0.0002700661950807969, - "loss": 0.0693, + "epoch": 0.12, + "learning_rate": 0.0002821379012114601, + "loss": 0.0901, "step": 18450 }, { - "epoch": 0.2, - "learning_rate": 0.0002700499707962879, - "loss": 0.085, + "epoch": 0.12, + "learning_rate": 0.0002821282198571032, + "loss": 0.0924, "step": 18460 }, { - "epoch": 0.2, - "learning_rate": 0.0002700337465117788, - "loss": 0.0693, + "epoch": 0.12, + "learning_rate": 0.0002821185385027463, + "loss": 0.0951, "step": 18470 }, { - "epoch": 0.2, - "learning_rate": 0.00027001752222726973, - "loss": 0.0822, + "epoch": 0.12, + "learning_rate": 0.0002821088571483893, + "loss": 0.0811, "step": 18480 }, { - "epoch": 0.2, - "learning_rate": 0.0002700012979427607, - "loss": 0.0759, + "epoch": 0.12, + "learning_rate": 0.0002820991757940324, + "loss": 0.0957, "step": 18490 }, { - "epoch": 0.2, - "learning_rate": 0.00026998507365825163, - "loss": 0.0815, + "epoch": 0.12, + "learning_rate": 0.00028208949443967547, + "loss": 0.0866, "step": 18500 }, { - "epoch": 0.2, - "learning_rate": 0.0002699688493737426, - "loss": 0.0828, + "epoch": 0.12, + "learning_rate": 0.0002820798130853185, + "loss": 0.0875, "step": 18510 }, { - "epoch": 0.2, - "learning_rate": 0.00026995262508923353, - "loss": 0.0785, + "epoch": 0.12, + "learning_rate": 0.0002820701317309616, + "loss": 0.0944, "step": 18520 }, { - "epoch": 0.2, - "learning_rate": 0.00026993640080472445, - "loss": 0.1061, + "epoch": 0.12, + "learning_rate": 0.00028206045037660466, + "loss": 0.0905, "step": 18530 }, { - "epoch": 0.2, - "learning_rate": 0.00026992017652021543, - "loss": 0.0905, + "epoch": 0.12, + "learning_rate": 0.00028205076902224774, + "loss": 0.0974, "step": 18540 }, { - "epoch": 0.2, - "learning_rate": 0.00026990395223570635, - "loss": 0.0787, + "epoch": 0.12, + "learning_rate": 0.0002820410876678908, + "loss": 0.0958, "step": 18550 }, { - "epoch": 0.2, - "learning_rate": 0.0002698877279511973, - "loss": 0.0852, + "epoch": 0.12, + "learning_rate": 0.00028203140631353384, + "loss": 0.0816, "step": 18560 }, { - "epoch": 0.2, - "learning_rate": 0.00026987150366668825, - "loss": 0.0829, + "epoch": 0.12, + "learning_rate": 0.0002820217249591769, + "loss": 0.0899, "step": 18570 }, { - "epoch": 0.2, - "learning_rate": 0.0002698552793821792, - "loss": 0.0781, + "epoch": 0.12, + "learning_rate": 0.00028201204360482, + "loss": 0.0881, "step": 18580 }, { - "epoch": 0.2, - "learning_rate": 0.00026983905509767015, - "loss": 0.084, + "epoch": 0.12, + "learning_rate": 0.0002820023622504631, + "loss": 0.0823, "step": 18590 }, { - "epoch": 0.2, - "learning_rate": 0.0002698228308131611, - "loss": 0.0913, + "epoch": 0.12, + "learning_rate": 0.00028199268089610616, + "loss": 0.0909, "step": 18600 }, { - "epoch": 0.2, - "learning_rate": 0.00026980660652865205, - "loss": 0.0799, + "epoch": 0.12, + "learning_rate": 0.0002819829995417492, + "loss": 0.0881, "step": 18610 }, { - "epoch": 0.2, - "learning_rate": 0.000269790382244143, - "loss": 0.0809, + "epoch": 0.12, + "learning_rate": 0.00028197331818739227, + "loss": 0.1171, "step": 18620 }, { - "epoch": 0.2, - "learning_rate": 0.00026977415795963395, - "loss": 0.0804, + "epoch": 0.12, + "learning_rate": 0.00028196363683303535, + "loss": 0.1105, "step": 18630 }, { - "epoch": 0.2, - "learning_rate": 0.0002697579336751249, - "loss": 0.0837, + "epoch": 0.12, + "learning_rate": 0.00028195395547867837, + "loss": 0.098, "step": 18640 }, { - "epoch": 0.2, - "learning_rate": 0.00026974170939061585, - "loss": 0.0825, + "epoch": 0.12, + "learning_rate": 0.00028194427412432145, + "loss": 0.099, "step": 18650 }, { - "epoch": 0.2, - "learning_rate": 0.0002697254851061068, - "loss": 0.0836, + "epoch": 0.12, + "learning_rate": 0.00028193459276996453, + "loss": 0.0884, "step": 18660 }, { - "epoch": 0.2, - "learning_rate": 0.00026970926082159775, - "loss": 0.082, + "epoch": 0.12, + "learning_rate": 0.0002819249114156076, + "loss": 0.0907, "step": 18670 }, { - "epoch": 0.2, - "learning_rate": 0.00026969303653708867, - "loss": 0.0763, + "epoch": 0.12, + "learning_rate": 0.0002819152300612507, + "loss": 0.0944, "step": 18680 }, { - "epoch": 0.2, - "learning_rate": 0.00026967681225257965, - "loss": 0.077, + "epoch": 0.12, + "learning_rate": 0.00028190554870689377, + "loss": 0.0934, "step": 18690 }, { - "epoch": 0.2, - "learning_rate": 0.00026966058796807057, - "loss": 0.0765, + "epoch": 0.12, + "learning_rate": 0.0002818958673525368, + "loss": 0.0949, "step": 18700 }, { - "epoch": 0.2, - "learning_rate": 0.0002696443636835615, - "loss": 0.0845, + "epoch": 0.12, + "learning_rate": 0.0002818861859981799, + "loss": 0.0893, "step": 18710 }, { - "epoch": 0.2, - "learning_rate": 0.00026962813939905247, - "loss": 0.0875, + "epoch": 0.12, + "learning_rate": 0.00028187650464382295, + "loss": 0.0894, "step": 18720 }, { - "epoch": 0.2, - "learning_rate": 0.0002696119151145434, - "loss": 0.0925, + "epoch": 0.12, + "learning_rate": 0.00028186682328946603, + "loss": 0.0959, "step": 18730 }, { - "epoch": 0.2, - "learning_rate": 0.00026959569083003437, - "loss": 0.095, + "epoch": 0.12, + "learning_rate": 0.0002818571419351091, + "loss": 0.1003, "step": 18740 }, { - "epoch": 0.2, - "learning_rate": 0.0002695794665455253, - "loss": 0.0847, + "epoch": 0.12, + "learning_rate": 0.00028184746058075214, + "loss": 0.0946, "step": 18750 }, { - "epoch": 0.2, - "learning_rate": 0.00026956324226101627, - "loss": 0.0844, + "epoch": 0.12, + "learning_rate": 0.0002818377792263952, + "loss": 0.0904, "step": 18760 }, { - "epoch": 0.2, - "learning_rate": 0.0002695470179765072, - "loss": 0.0962, + "epoch": 0.12, + "learning_rate": 0.00028182809787203825, + "loss": 0.0956, "step": 18770 }, { - "epoch": 0.2, - "learning_rate": 0.00026953079369199817, - "loss": 0.084, + "epoch": 0.12, + "learning_rate": 0.0002818184165176813, + "loss": 0.092, "step": 18780 }, { - "epoch": 0.2, - "learning_rate": 0.00026951456940748914, - "loss": 0.0858, + "epoch": 0.12, + "learning_rate": 0.0002818087351633244, + "loss": 0.0924, "step": 18790 }, { - "epoch": 0.2, - "learning_rate": 0.00026949834512298007, - "loss": 0.0733, + "epoch": 0.12, + "learning_rate": 0.0002817990538089675, + "loss": 0.0845, "step": 18800 }, { - "epoch": 0.2, - "learning_rate": 0.000269482120838471, - "loss": 0.0903, + "epoch": 0.12, + "learning_rate": 0.00028178937245461056, + "loss": 0.0935, "step": 18810 }, { - "epoch": 0.2, - "learning_rate": 0.00026946589655396197, - "loss": 0.0817, + "epoch": 0.12, + "learning_rate": 0.00028177969110025364, + "loss": 0.0915, "step": 18820 }, { - "epoch": 0.2, - "learning_rate": 0.0002694496722694529, - "loss": 0.0783, + "epoch": 0.12, + "learning_rate": 0.0002817700097458967, + "loss": 0.0903, "step": 18830 }, { - "epoch": 0.2, - "learning_rate": 0.00026943344798494387, - "loss": 0.0954, + "epoch": 0.12, + "learning_rate": 0.00028176032839153975, + "loss": 0.0943, "step": 18840 }, { - "epoch": 0.2, - "learning_rate": 0.0002694172237004348, - "loss": 0.0798, + "epoch": 0.12, + "learning_rate": 0.00028175064703718283, + "loss": 0.0873, "step": 18850 }, { - "epoch": 0.2, - "learning_rate": 0.0002694009994159257, - "loss": 0.081, + "epoch": 0.12, + "learning_rate": 0.0002817409656828259, + "loss": 0.0861, "step": 18860 }, { - "epoch": 0.2, - "learning_rate": 0.0002693847751314167, - "loss": 0.0808, + "epoch": 0.12, + "learning_rate": 0.000281731284328469, + "loss": 0.0841, "step": 18870 }, { - "epoch": 0.2, - "learning_rate": 0.0002693685508469076, - "loss": 0.0851, + "epoch": 0.12, + "learning_rate": 0.000281721602974112, + "loss": 0.0964, "step": 18880 }, { - "epoch": 0.2, - "learning_rate": 0.0002693523265623986, - "loss": 0.0781, + "epoch": 0.12, + "learning_rate": 0.0002817119216197551, + "loss": 0.0873, "step": 18890 }, { - "epoch": 0.2, - "learning_rate": 0.0002693361022778895, - "loss": 0.0865, + "epoch": 0.12, + "learning_rate": 0.0002817022402653982, + "loss": 0.0849, "step": 18900 }, { - "epoch": 0.2, - "learning_rate": 0.0002693198779933805, - "loss": 0.0879, + "epoch": 0.12, + "learning_rate": 0.0002816925589110412, + "loss": 0.091, "step": 18910 }, { - "epoch": 0.2, - "learning_rate": 0.0002693036537088714, - "loss": 0.0801, + "epoch": 0.12, + "learning_rate": 0.0002816828775566843, + "loss": 0.0938, "step": 18920 }, { - "epoch": 0.2, - "learning_rate": 0.0002692874294243624, - "loss": 0.0756, + "epoch": 0.12, + "learning_rate": 0.00028167319620232736, + "loss": 0.0951, "step": 18930 }, { - "epoch": 0.2, - "learning_rate": 0.0002692712051398533, - "loss": 0.0856, + "epoch": 0.12, + "learning_rate": 0.00028166351484797044, + "loss": 0.096, "step": 18940 }, { - "epoch": 0.2, - "learning_rate": 0.0002692549808553443, - "loss": 0.0854, + "epoch": 0.12, + "learning_rate": 0.0002816538334936135, + "loss": 0.0972, "step": 18950 }, { - "epoch": 0.21, - "learning_rate": 0.0002692387565708352, - "loss": 0.0786, + "epoch": 0.12, + "learning_rate": 0.0002816441521392566, + "loss": 0.0955, "step": 18960 }, { - "epoch": 0.21, - "learning_rate": 0.0002692225322863262, - "loss": 0.0826, + "epoch": 0.12, + "learning_rate": 0.0002816344707848997, + "loss": 0.0916, "step": 18970 }, { - "epoch": 0.21, - "learning_rate": 0.0002692063080018171, - "loss": 0.0815, + "epoch": 0.12, + "learning_rate": 0.0002816247894305427, + "loss": 0.1013, "step": 18980 }, { - "epoch": 0.21, - "learning_rate": 0.00026919008371730803, - "loss": 0.0796, + "epoch": 0.12, + "learning_rate": 0.0002816151080761858, + "loss": 0.0868, "step": 18990 }, { - "epoch": 0.21, - "learning_rate": 0.000269173859432799, - "loss": 0.079, + "epoch": 0.12, + "learning_rate": 0.00028160542672182886, + "loss": 0.1049, "step": 19000 }, { - "epoch": 0.21, - "eval_cer": 0.9213469248561246, - "eval_loss": 0.05497489497065544, - "eval_runtime": 119.921, - "eval_samples_per_second": 16.678, - "eval_steps_per_second": 4.169, + "epoch": 0.12, + "eval_cer": 0.9201301547847701, + "eval_loss": 0.061801835894584656, + "eval_runtime": 120.5064, + "eval_samples_per_second": 16.597, + "eval_steps_per_second": 4.149, "step": 19000 }, { - "epoch": 0.21, - "learning_rate": 0.00026915763514828993, - "loss": 0.0819, + "epoch": 0.12, + "learning_rate": 0.0002815957453674719, + "loss": 0.0817, "step": 19010 }, { - "epoch": 0.21, - "learning_rate": 0.0002691414108637809, - "loss": 0.073, + "epoch": 0.12, + "learning_rate": 0.00028158606401311497, + "loss": 0.087, "step": 19020 }, { - "epoch": 0.21, - "learning_rate": 0.00026912518657927183, - "loss": 0.0776, + "epoch": 0.12, + "learning_rate": 0.00028157638265875805, + "loss": 0.0936, "step": 19030 }, { - "epoch": 0.21, - "learning_rate": 0.00026910896229476275, - "loss": 0.0742, + "epoch": 0.12, + "learning_rate": 0.00028156670130440113, + "loss": 0.0906, "step": 19040 }, { - "epoch": 0.21, - "learning_rate": 0.00026909273801025373, - "loss": 0.0901, + "epoch": 0.12, + "learning_rate": 0.00028155701995004415, + "loss": 0.0897, "step": 19050 }, { - "epoch": 0.21, - "learning_rate": 0.00026907651372574465, - "loss": 0.0749, + "epoch": 0.12, + "learning_rate": 0.00028154733859568723, + "loss": 0.0822, "step": 19060 }, { - "epoch": 0.21, - "learning_rate": 0.00026906028944123563, - "loss": 0.0778, + "epoch": 0.12, + "learning_rate": 0.0002815376572413303, + "loss": 0.0894, "step": 19070 }, { - "epoch": 0.21, - "learning_rate": 0.00026904406515672655, - "loss": 0.0864, + "epoch": 0.12, + "learning_rate": 0.0002815279758869734, + "loss": 0.0967, "step": 19080 }, { - "epoch": 0.21, - "learning_rate": 0.00026902784087221753, - "loss": 0.0807, + "epoch": 0.12, + "learning_rate": 0.0002815182945326165, + "loss": 0.0817, "step": 19090 }, { - "epoch": 0.21, - "learning_rate": 0.00026901161658770845, - "loss": 0.0915, + "epoch": 0.12, + "learning_rate": 0.00028150861317825955, + "loss": 0.0874, "step": 19100 }, { - "epoch": 0.21, - "learning_rate": 0.00026899539230319943, - "loss": 0.0948, + "epoch": 0.12, + "learning_rate": 0.00028149893182390263, + "loss": 0.0824, "step": 19110 }, { - "epoch": 0.21, - "learning_rate": 0.00026897916801869035, - "loss": 0.0784, + "epoch": 0.12, + "learning_rate": 0.00028148925046954566, + "loss": 0.0837, "step": 19120 }, { - "epoch": 0.21, - "learning_rate": 0.00026896294373418133, - "loss": 0.078, + "epoch": 0.12, + "learning_rate": 0.00028147956911518874, + "loss": 0.0946, "step": 19130 }, { - "epoch": 0.21, - "learning_rate": 0.00026894671944967225, - "loss": 0.0783, + "epoch": 0.12, + "learning_rate": 0.0002814698877608318, + "loss": 0.0835, "step": 19140 }, { - "epoch": 0.21, - "learning_rate": 0.00026893049516516323, - "loss": 0.0849, + "epoch": 0.12, + "learning_rate": 0.00028146020640647484, + "loss": 0.0969, "step": 19150 }, { - "epoch": 0.21, - "learning_rate": 0.00026891427088065415, - "loss": 0.0937, + "epoch": 0.12, + "learning_rate": 0.0002814505250521179, + "loss": 0.0824, "step": 19160 }, { - "epoch": 0.21, - "learning_rate": 0.0002688980465961451, - "loss": 0.0789, + "epoch": 0.12, + "learning_rate": 0.000281440843697761, + "loss": 0.087, "step": 19170 }, { - "epoch": 0.21, - "learning_rate": 0.00026888182231163605, - "loss": 0.0893, + "epoch": 0.12, + "learning_rate": 0.0002814311623434041, + "loss": 0.0855, "step": 19180 }, { - "epoch": 0.21, - "learning_rate": 0.00026886559802712697, - "loss": 0.0793, + "epoch": 0.12, + "learning_rate": 0.0002814214809890471, + "loss": 0.0852, "step": 19190 }, { - "epoch": 0.21, - "learning_rate": 0.00026884937374261795, - "loss": 0.0801, + "epoch": 0.12, + "learning_rate": 0.0002814117996346902, + "loss": 0.0853, "step": 19200 }, { - "epoch": 0.21, - "learning_rate": 0.00026883314945810887, - "loss": 0.0781, + "epoch": 0.12, + "learning_rate": 0.00028140211828033327, + "loss": 0.0883, "step": 19210 }, { - "epoch": 0.21, - "learning_rate": 0.0002688169251735998, - "loss": 0.0872, + "epoch": 0.12, + "learning_rate": 0.00028139243692597635, + "loss": 0.0913, "step": 19220 }, { - "epoch": 0.21, - "learning_rate": 0.00026880070088909077, - "loss": 0.0802, + "epoch": 0.12, + "learning_rate": 0.00028138275557161943, + "loss": 0.0953, "step": 19230 }, { - "epoch": 0.21, - "learning_rate": 0.0002687844766045817, - "loss": 0.0795, + "epoch": 0.12, + "learning_rate": 0.0002813730742172625, + "loss": 0.0886, "step": 19240 }, { - "epoch": 0.21, - "learning_rate": 0.00026876825232007267, - "loss": 0.0779, + "epoch": 0.12, + "learning_rate": 0.00028136339286290553, + "loss": 0.0885, "step": 19250 }, { - "epoch": 0.21, - "learning_rate": 0.0002687520280355636, - "loss": 0.0893, + "epoch": 0.12, + "learning_rate": 0.0002813537115085486, + "loss": 0.0913, "step": 19260 }, { - "epoch": 0.21, - "learning_rate": 0.00026873580375105457, - "loss": 0.085, + "epoch": 0.12, + "learning_rate": 0.0002813440301541917, + "loss": 0.0874, "step": 19270 }, { - "epoch": 0.21, - "learning_rate": 0.0002687195794665455, - "loss": 0.0808, + "epoch": 0.12, + "learning_rate": 0.0002813343487998347, + "loss": 0.0911, "step": 19280 }, { - "epoch": 0.21, - "learning_rate": 0.00026870335518203647, - "loss": 0.0876, + "epoch": 0.12, + "learning_rate": 0.0002813246674454778, + "loss": 0.0937, "step": 19290 }, { - "epoch": 0.21, - "learning_rate": 0.0002686871308975274, - "loss": 0.0789, + "epoch": 0.12, + "learning_rate": 0.0002813149860911209, + "loss": 0.0878, "step": 19300 }, { - "epoch": 0.21, - "learning_rate": 0.00026867090661301837, - "loss": 0.0782, + "epoch": 0.12, + "learning_rate": 0.00028130530473676396, + "loss": 0.0914, "step": 19310 }, { - "epoch": 0.21, - "learning_rate": 0.0002686546823285093, - "loss": 0.0782, + "epoch": 0.12, + "learning_rate": 0.00028129562338240704, + "loss": 0.094, "step": 19320 }, { - "epoch": 0.21, - "learning_rate": 0.00026863845804400027, - "loss": 0.0835, + "epoch": 0.12, + "learning_rate": 0.00028128594202805006, + "loss": 0.0918, "step": 19330 }, { - "epoch": 0.21, - "learning_rate": 0.0002686222337594912, - "loss": 0.0828, + "epoch": 0.12, + "learning_rate": 0.00028127626067369314, + "loss": 0.0973, "step": 19340 }, { - "epoch": 0.21, - "learning_rate": 0.00026860600947498217, - "loss": 0.0829, + "epoch": 0.12, + "learning_rate": 0.0002812665793193362, + "loss": 0.0961, "step": 19350 }, { - "epoch": 0.21, - "learning_rate": 0.0002685897851904731, - "loss": 0.0847, + "epoch": 0.12, + "learning_rate": 0.0002812568979649793, + "loss": 0.092, "step": 19360 }, { - "epoch": 0.21, - "learning_rate": 0.000268573560905964, - "loss": 0.0848, + "epoch": 0.13, + "learning_rate": 0.0002812472166106224, + "loss": 0.0907, "step": 19370 }, { - "epoch": 0.21, - "learning_rate": 0.000268557336621455, - "loss": 0.0852, + "epoch": 0.13, + "learning_rate": 0.0002812375352562654, + "loss": 0.0929, "step": 19380 }, { - "epoch": 0.21, - "learning_rate": 0.0002685411123369459, - "loss": 0.0953, + "epoch": 0.13, + "learning_rate": 0.0002812278539019085, + "loss": 0.1038, "step": 19390 }, { - "epoch": 0.21, - "learning_rate": 0.00026852488805243684, - "loss": 0.0961, + "epoch": 0.13, + "learning_rate": 0.00028121817254755157, + "loss": 0.1033, "step": 19400 }, { - "epoch": 0.21, - "learning_rate": 0.0002685086637679278, - "loss": 0.0766, + "epoch": 0.13, + "learning_rate": 0.0002812084911931946, + "loss": 0.0982, "step": 19410 }, { - "epoch": 0.21, - "learning_rate": 0.00026849243948341874, - "loss": 0.0759, + "epoch": 0.13, + "learning_rate": 0.0002811988098388377, + "loss": 0.0934, "step": 19420 }, { - "epoch": 0.21, - "learning_rate": 0.0002684762151989097, - "loss": 0.0746, + "epoch": 0.13, + "learning_rate": 0.00028118912848448075, + "loss": 0.0902, "step": 19430 }, { - "epoch": 0.21, - "learning_rate": 0.00026845999091440064, - "loss": 0.0758, + "epoch": 0.13, + "learning_rate": 0.00028117944713012383, + "loss": 0.0876, "step": 19440 }, { - "epoch": 0.21, - "learning_rate": 0.0002684437666298916, - "loss": 0.0824, + "epoch": 0.13, + "learning_rate": 0.0002811697657757669, + "loss": 0.0883, "step": 19450 }, { - "epoch": 0.21, - "learning_rate": 0.00026842754234538254, - "loss": 0.0776, + "epoch": 0.13, + "learning_rate": 0.00028116008442141, + "loss": 0.0987, "step": 19460 }, { - "epoch": 0.21, - "learning_rate": 0.0002684113180608735, - "loss": 0.0978, + "epoch": 0.13, + "learning_rate": 0.000281150403067053, + "loss": 0.0868, "step": 19470 }, { - "epoch": 0.21, - "learning_rate": 0.00026839509377636443, - "loss": 0.0763, + "epoch": 0.13, + "learning_rate": 0.0002811407217126961, + "loss": 0.0942, "step": 19480 }, { - "epoch": 0.21, - "learning_rate": 0.0002683788694918554, - "loss": 0.082, + "epoch": 0.13, + "learning_rate": 0.0002811310403583392, + "loss": 0.0883, "step": 19490 }, { - "epoch": 0.21, - "learning_rate": 0.00026836264520734633, - "loss": 0.0791, + "epoch": 0.13, + "learning_rate": 0.00028112135900398226, + "loss": 0.0852, "step": 19500 }, { - "epoch": 0.21, - "learning_rate": 0.0002683464209228373, - "loss": 0.0728, + "epoch": 0.13, + "learning_rate": 0.00028111167764962534, + "loss": 0.0836, "step": 19510 }, { - "epoch": 0.21, - "learning_rate": 0.00026833019663832823, - "loss": 0.0961, + "epoch": 0.13, + "learning_rate": 0.00028110199629526836, + "loss": 0.0858, "step": 19520 }, { - "epoch": 0.21, - "learning_rate": 0.0002683139723538192, - "loss": 0.0916, + "epoch": 0.13, + "learning_rate": 0.00028109231494091144, + "loss": 0.0841, "step": 19530 }, { - "epoch": 0.21, - "learning_rate": 0.00026829774806931013, - "loss": 0.0832, + "epoch": 0.13, + "learning_rate": 0.0002810826335865545, + "loss": 0.0911, "step": 19540 }, { - "epoch": 0.21, - "learning_rate": 0.00026828152378480106, - "loss": 0.0876, + "epoch": 0.13, + "learning_rate": 0.00028107295223219755, + "loss": 0.0891, "step": 19550 }, { - "epoch": 0.21, - "learning_rate": 0.00026826529950029203, - "loss": 0.086, + "epoch": 0.13, + "learning_rate": 0.00028106327087784063, + "loss": 0.091, "step": 19560 }, { - "epoch": 0.21, - "learning_rate": 0.00026824907521578296, - "loss": 0.0852, + "epoch": 0.13, + "learning_rate": 0.0002810535895234837, + "loss": 0.0977, "step": 19570 }, { - "epoch": 0.21, - "learning_rate": 0.0002682328509312739, - "loss": 0.0769, + "epoch": 0.13, + "learning_rate": 0.0002810439081691268, + "loss": 0.0923, "step": 19580 }, { - "epoch": 0.21, - "learning_rate": 0.00026821662664676486, - "loss": 0.0827, + "epoch": 0.13, + "learning_rate": 0.00028103422681476987, + "loss": 0.0925, "step": 19590 }, { - "epoch": 0.21, - "learning_rate": 0.0002682004023622558, - "loss": 0.0856, + "epoch": 0.13, + "learning_rate": 0.00028102454546041295, + "loss": 0.089, "step": 19600 }, { - "epoch": 0.21, - "learning_rate": 0.00026818417807774675, - "loss": 0.0735, + "epoch": 0.13, + "learning_rate": 0.00028101486410605597, + "loss": 0.091, "step": 19610 }, { - "epoch": 0.21, - "learning_rate": 0.0002681679537932377, - "loss": 0.0827, + "epoch": 0.13, + "learning_rate": 0.00028100518275169905, + "loss": 0.0954, "step": 19620 }, { - "epoch": 0.21, - "learning_rate": 0.00026815172950872865, - "loss": 0.0788, + "epoch": 0.13, + "learning_rate": 0.00028099550139734213, + "loss": 0.0941, "step": 19630 }, { - "epoch": 0.21, - "learning_rate": 0.0002681355052242196, - "loss": 0.0792, + "epoch": 0.13, + "learning_rate": 0.0002809858200429852, + "loss": 0.0894, "step": 19640 }, { - "epoch": 0.21, - "learning_rate": 0.00026811928093971055, - "loss": 0.08, + "epoch": 0.13, + "learning_rate": 0.00028097613868862824, + "loss": 0.0888, "step": 19650 }, { - "epoch": 0.21, - "learning_rate": 0.0002681030566552015, - "loss": 0.0742, + "epoch": 0.13, + "learning_rate": 0.0002809664573342713, + "loss": 0.0767, "step": 19660 }, { - "epoch": 0.21, - "learning_rate": 0.00026808683237069245, - "loss": 0.0861, + "epoch": 0.13, + "learning_rate": 0.0002809567759799144, + "loss": 0.0934, "step": 19670 }, { - "epoch": 0.21, - "learning_rate": 0.0002680706080861834, - "loss": 0.0855, + "epoch": 0.13, + "learning_rate": 0.0002809470946255574, + "loss": 0.0837, "step": 19680 }, { - "epoch": 0.21, - "learning_rate": 0.00026805438380167435, - "loss": 0.0848, + "epoch": 0.13, + "learning_rate": 0.0002809374132712005, + "loss": 0.0877, "step": 19690 }, { - "epoch": 0.21, - "learning_rate": 0.0002680381595171653, - "loss": 0.0841, + "epoch": 0.13, + "learning_rate": 0.0002809277319168436, + "loss": 0.0977, "step": 19700 }, { - "epoch": 0.21, - "learning_rate": 0.00026802193523265625, - "loss": 0.0769, + "epoch": 0.13, + "learning_rate": 0.00028091805056248666, + "loss": 0.0953, "step": 19710 }, { - "epoch": 0.21, - "learning_rate": 0.0002680057109481472, - "loss": 0.0859, + "epoch": 0.13, + "learning_rate": 0.00028090836920812974, + "loss": 0.0901, "step": 19720 }, { - "epoch": 0.21, - "learning_rate": 0.0002679894866636381, - "loss": 0.0852, + "epoch": 0.13, + "learning_rate": 0.0002808986878537728, + "loss": 0.0872, "step": 19730 }, { - "epoch": 0.21, - "learning_rate": 0.0002679732623791291, - "loss": 0.0763, + "epoch": 0.13, + "learning_rate": 0.0002808890064994159, + "loss": 0.094, "step": 19740 }, { - "epoch": 0.21, - "learning_rate": 0.00026795703809462, - "loss": 0.0837, + "epoch": 0.13, + "learning_rate": 0.0002808793251450589, + "loss": 0.0804, "step": 19750 }, { - "epoch": 0.21, - "learning_rate": 0.0002679408138101109, - "loss": 0.0815, + "epoch": 0.13, + "learning_rate": 0.000280869643790702, + "loss": 0.0929, "step": 19760 }, { - "epoch": 0.21, - "learning_rate": 0.0002679245895256019, - "loss": 0.0865, + "epoch": 0.13, + "learning_rate": 0.0002808599624363451, + "loss": 0.0794, "step": 19770 }, { - "epoch": 0.21, - "learning_rate": 0.0002679083652410928, - "loss": 0.0833, + "epoch": 0.13, + "learning_rate": 0.0002808502810819881, + "loss": 0.0907, "step": 19780 }, { - "epoch": 0.21, - "learning_rate": 0.0002678921409565838, - "loss": 0.092, + "epoch": 0.13, + "learning_rate": 0.0002808405997276312, + "loss": 0.0979, "step": 19790 }, { - "epoch": 0.21, - "learning_rate": 0.0002678759166720747, - "loss": 0.075, + "epoch": 0.13, + "learning_rate": 0.00028083091837327427, + "loss": 0.0928, "step": 19800 }, { - "epoch": 0.21, - "learning_rate": 0.0002678596923875657, - "loss": 0.0904, + "epoch": 0.13, + "learning_rate": 0.00028082123701891735, + "loss": 0.0865, "step": 19810 }, { - "epoch": 0.21, - "learning_rate": 0.0002678434681030566, - "loss": 0.0865, + "epoch": 0.13, + "learning_rate": 0.0002808115556645604, + "loss": 0.1105, "step": 19820 }, { - "epoch": 0.21, - "learning_rate": 0.0002678272438185476, - "loss": 0.0851, + "epoch": 0.13, + "learning_rate": 0.00028080187431020346, + "loss": 0.088, "step": 19830 }, { - "epoch": 0.21, - "learning_rate": 0.0002678110195340385, - "loss": 0.0782, + "epoch": 0.13, + "learning_rate": 0.00028079219295584654, + "loss": 0.0871, "step": 19840 }, { - "epoch": 0.21, - "learning_rate": 0.0002677947952495295, - "loss": 0.0756, + "epoch": 0.13, + "learning_rate": 0.0002807825116014896, + "loss": 0.0994, "step": 19850 }, { - "epoch": 0.21, - "learning_rate": 0.0002677785709650204, - "loss": 0.0764, + "epoch": 0.13, + "learning_rate": 0.0002807728302471327, + "loss": 0.0874, "step": 19860 }, { - "epoch": 0.21, - "learning_rate": 0.0002677623466805114, - "loss": 0.0792, + "epoch": 0.13, + "learning_rate": 0.0002807631488927758, + "loss": 0.0849, "step": 19870 }, { - "epoch": 0.22, - "learning_rate": 0.0002677461223960023, - "loss": 0.0814, + "epoch": 0.13, + "learning_rate": 0.00028075346753841886, + "loss": 0.0859, "step": 19880 }, { - "epoch": 0.22, - "learning_rate": 0.0002677298981114933, - "loss": 0.0775, + "epoch": 0.13, + "learning_rate": 0.0002807437861840619, + "loss": 0.0839, "step": 19890 }, { - "epoch": 0.22, - "learning_rate": 0.0002677136738269842, - "loss": 0.0805, + "epoch": 0.13, + "learning_rate": 0.00028073410482970496, + "loss": 0.0876, "step": 19900 }, { - "epoch": 0.22, - "learning_rate": 0.00026769744954247514, - "loss": 0.0756, + "epoch": 0.13, + "learning_rate": 0.00028072442347534804, + "loss": 0.0905, "step": 19910 }, { - "epoch": 0.22, - "learning_rate": 0.0002676812252579661, - "loss": 0.0827, + "epoch": 0.13, + "learning_rate": 0.00028071474212099107, + "loss": 0.0839, "step": 19920 }, { - "epoch": 0.22, - "learning_rate": 0.00026766500097345704, - "loss": 0.0796, + "epoch": 0.13, + "learning_rate": 0.00028070506076663415, + "loss": 0.0942, "step": 19930 }, { - "epoch": 0.22, - "learning_rate": 0.00026764877668894796, - "loss": 0.0812, + "epoch": 0.13, + "learning_rate": 0.0002806953794122772, + "loss": 0.0983, "step": 19940 }, { - "epoch": 0.22, - "learning_rate": 0.00026763255240443894, - "loss": 0.0852, + "epoch": 0.13, + "learning_rate": 0.0002806856980579203, + "loss": 0.0908, "step": 19950 }, { - "epoch": 0.22, - "learning_rate": 0.00026761632811992986, - "loss": 0.0865, + "epoch": 0.13, + "learning_rate": 0.00028067601670356333, + "loss": 0.0869, "step": 19960 }, { - "epoch": 0.22, - "learning_rate": 0.00026760010383542084, - "loss": 0.0873, + "epoch": 0.13, + "learning_rate": 0.0002806663353492064, + "loss": 0.098, "step": 19970 }, { - "epoch": 0.22, - "learning_rate": 0.00026758387955091176, - "loss": 0.0809, + "epoch": 0.13, + "learning_rate": 0.0002806566539948495, + "loss": 0.0949, "step": 19980 }, { - "epoch": 0.22, - "learning_rate": 0.00026756765526640274, - "loss": 0.0778, + "epoch": 0.13, + "learning_rate": 0.00028064697264049257, + "loss": 0.0903, "step": 19990 }, { - "epoch": 0.22, - "learning_rate": 0.00026755143098189366, - "loss": 0.0808, + "epoch": 0.13, + "learning_rate": 0.00028063729128613565, + "loss": 0.0893, "step": 20000 }, { - "epoch": 0.22, - "eval_cer": 0.9214794475042452, - "eval_loss": 0.05358384922146797, - "eval_runtime": 119.5234, - "eval_samples_per_second": 16.733, - "eval_steps_per_second": 4.183, + "epoch": 0.13, + "eval_cer": 0.9201129815840018, + "eval_loss": 0.0617336705327034, + "eval_runtime": 120.5228, + "eval_samples_per_second": 16.594, + "eval_steps_per_second": 4.149, "step": 20000 }, { - "epoch": 0.22, - "learning_rate": 0.00026753520669738464, - "loss": 0.085, + "epoch": 0.13, + "learning_rate": 0.00028062760993177873, + "loss": 0.0877, "step": 20010 }, { - "epoch": 0.22, - "learning_rate": 0.00026751898241287556, - "loss": 0.0851, + "epoch": 0.13, + "learning_rate": 0.00028061792857742176, + "loss": 0.0923, "step": 20020 }, { - "epoch": 0.22, - "learning_rate": 0.00026750275812836654, - "loss": 0.0826, + "epoch": 0.13, + "learning_rate": 0.00028060824722306484, + "loss": 0.0889, "step": 20030 }, { - "epoch": 0.22, - "learning_rate": 0.00026748653384385746, - "loss": 0.0797, + "epoch": 0.13, + "learning_rate": 0.0002805985658687079, + "loss": 0.0913, "step": 20040 }, { - "epoch": 0.22, - "learning_rate": 0.00026747030955934844, - "loss": 0.0958, + "epoch": 0.13, + "learning_rate": 0.00028058888451435094, + "loss": 0.096, "step": 20050 }, { - "epoch": 0.22, - "learning_rate": 0.00026745408527483936, - "loss": 0.0862, + "epoch": 0.13, + "learning_rate": 0.000280579203159994, + "loss": 0.0952, "step": 20060 }, { - "epoch": 0.22, - "learning_rate": 0.00026743786099033034, - "loss": 0.0823, + "epoch": 0.13, + "learning_rate": 0.0002805695218056371, + "loss": 0.0936, "step": 20070 }, { - "epoch": 0.22, - "learning_rate": 0.00026742163670582126, - "loss": 0.0798, + "epoch": 0.13, + "learning_rate": 0.0002805598404512802, + "loss": 0.0893, "step": 20080 }, { - "epoch": 0.22, - "learning_rate": 0.0002674054124213122, - "loss": 0.0767, + "epoch": 0.13, + "learning_rate": 0.00028055015909692326, + "loss": 0.0956, "step": 20090 }, { - "epoch": 0.22, - "learning_rate": 0.00026738918813680316, - "loss": 0.0762, + "epoch": 0.13, + "learning_rate": 0.0002805404777425663, + "loss": 0.0822, "step": 20100 }, { - "epoch": 0.22, - "learning_rate": 0.0002673729638522941, - "loss": 0.0801, + "epoch": 0.13, + "learning_rate": 0.00028053079638820937, + "loss": 0.0889, "step": 20110 }, { - "epoch": 0.22, - "learning_rate": 0.000267356739567785, - "loss": 0.0813, + "epoch": 0.13, + "learning_rate": 0.00028052111503385245, + "loss": 0.0948, "step": 20120 }, { - "epoch": 0.22, - "learning_rate": 0.000267340515283276, - "loss": 0.0858, + "epoch": 0.13, + "learning_rate": 0.0002805114336794955, + "loss": 0.0932, "step": 20130 }, { - "epoch": 0.22, - "learning_rate": 0.0002673242909987669, - "loss": 0.077, + "epoch": 0.13, + "learning_rate": 0.0002805017523251386, + "loss": 0.0903, "step": 20140 }, { - "epoch": 0.22, - "learning_rate": 0.0002673080667142579, - "loss": 0.0792, + "epoch": 0.13, + "learning_rate": 0.00028049207097078163, + "loss": 0.0974, "step": 20150 }, { - "epoch": 0.22, - "learning_rate": 0.0002672918424297488, - "loss": 0.0857, + "epoch": 0.13, + "learning_rate": 0.0002804823896164247, + "loss": 0.0844, "step": 20160 }, { - "epoch": 0.22, - "learning_rate": 0.0002672756181452398, - "loss": 0.0836, + "epoch": 0.13, + "learning_rate": 0.0002804727082620678, + "loss": 0.0987, "step": 20170 }, { - "epoch": 0.22, - "learning_rate": 0.0002672593938607307, - "loss": 0.0749, + "epoch": 0.13, + "learning_rate": 0.0002804630269077108, + "loss": 0.0943, "step": 20180 }, { - "epoch": 0.22, - "learning_rate": 0.0002672431695762217, - "loss": 0.0817, + "epoch": 0.13, + "learning_rate": 0.0002804533455533539, + "loss": 0.0893, "step": 20190 }, { - "epoch": 0.22, - "learning_rate": 0.0002672269452917126, - "loss": 0.0797, + "epoch": 0.13, + "learning_rate": 0.000280443664198997, + "loss": 0.0872, "step": 20200 }, { - "epoch": 0.22, - "learning_rate": 0.0002672107210072036, - "loss": 0.0723, + "epoch": 0.13, + "learning_rate": 0.00028043398284464005, + "loss": 0.0928, "step": 20210 }, { - "epoch": 0.22, - "learning_rate": 0.0002671944967226945, - "loss": 0.0861, + "epoch": 0.13, + "learning_rate": 0.00028042430149028313, + "loss": 0.0956, "step": 20220 }, { - "epoch": 0.22, - "learning_rate": 0.0002671782724381855, - "loss": 0.0911, + "epoch": 0.13, + "learning_rate": 0.0002804146201359262, + "loss": 0.0847, "step": 20230 }, { - "epoch": 0.22, - "learning_rate": 0.0002671620481536764, - "loss": 0.0908, + "epoch": 0.13, + "learning_rate": 0.00028040493878156924, + "loss": 0.0894, "step": 20240 }, { - "epoch": 0.22, - "learning_rate": 0.0002671458238691674, - "loss": 0.0815, + "epoch": 0.13, + "learning_rate": 0.0002803952574272123, + "loss": 0.0932, "step": 20250 }, { - "epoch": 0.22, - "learning_rate": 0.0002671295995846583, - "loss": 0.0957, + "epoch": 0.13, + "learning_rate": 0.0002803855760728554, + "loss": 0.0895, "step": 20260 }, { - "epoch": 0.22, - "learning_rate": 0.0002671133753001492, - "loss": 0.0844, + "epoch": 0.13, + "learning_rate": 0.0002803758947184985, + "loss": 0.0924, "step": 20270 }, { - "epoch": 0.22, - "learning_rate": 0.0002670971510156402, - "loss": 0.0762, + "epoch": 0.13, + "learning_rate": 0.00028036621336414156, + "loss": 0.0878, "step": 20280 }, { - "epoch": 0.22, - "learning_rate": 0.0002670809267311311, - "loss": 0.0908, + "epoch": 0.13, + "learning_rate": 0.0002803565320097846, + "loss": 0.082, "step": 20290 }, { - "epoch": 0.22, - "learning_rate": 0.00026706470244662205, - "loss": 0.0868, + "epoch": 0.13, + "learning_rate": 0.00028034685065542766, + "loss": 0.0905, "step": 20300 }, { - "epoch": 0.22, - "learning_rate": 0.000267048478162113, - "loss": 0.0824, + "epoch": 0.13, + "learning_rate": 0.00028033716930107074, + "loss": 0.0831, "step": 20310 }, { - "epoch": 0.22, - "learning_rate": 0.00026703225387760394, - "loss": 0.073, + "epoch": 0.13, + "learning_rate": 0.00028032748794671377, + "loss": 0.0863, "step": 20320 }, { - "epoch": 0.22, - "learning_rate": 0.0002670160295930949, - "loss": 0.0888, + "epoch": 0.13, + "learning_rate": 0.00028031780659235685, + "loss": 0.0847, "step": 20330 }, { - "epoch": 0.22, - "learning_rate": 0.00026699980530858584, - "loss": 0.0734, + "epoch": 0.13, + "learning_rate": 0.00028030812523799993, + "loss": 0.0892, "step": 20340 }, { - "epoch": 0.22, - "learning_rate": 0.0002669835810240768, - "loss": 0.0856, + "epoch": 0.13, + "learning_rate": 0.000280298443883643, + "loss": 0.0942, "step": 20350 }, { - "epoch": 0.22, - "learning_rate": 0.00026696735673956774, - "loss": 0.0818, + "epoch": 0.13, + "learning_rate": 0.0002802887625292861, + "loss": 0.0878, "step": 20360 }, { - "epoch": 0.22, - "learning_rate": 0.0002669511324550587, - "loss": 0.0825, + "epoch": 0.13, + "learning_rate": 0.00028027908117492917, + "loss": 0.0905, "step": 20370 }, { - "epoch": 0.22, - "learning_rate": 0.00026693490817054964, - "loss": 0.0854, + "epoch": 0.13, + "learning_rate": 0.0002802693998205722, + "loss": 0.0888, "step": 20380 }, { - "epoch": 0.22, - "learning_rate": 0.0002669186838860406, - "loss": 0.082, + "epoch": 0.13, + "learning_rate": 0.0002802597184662153, + "loss": 0.0854, "step": 20390 }, { - "epoch": 0.22, - "learning_rate": 0.00026690245960153154, - "loss": 0.084, + "epoch": 0.13, + "learning_rate": 0.00028025003711185835, + "loss": 0.0857, "step": 20400 }, { - "epoch": 0.22, - "learning_rate": 0.0002668862353170225, - "loss": 0.081, + "epoch": 0.13, + "learning_rate": 0.00028024035575750143, + "loss": 0.0841, "step": 20410 }, { - "epoch": 0.22, - "learning_rate": 0.00026687001103251344, - "loss": 0.076, + "epoch": 0.13, + "learning_rate": 0.00028023067440314446, + "loss": 0.0917, "step": 20420 }, { - "epoch": 0.22, - "learning_rate": 0.0002668537867480044, - "loss": 0.0803, + "epoch": 0.13, + "learning_rate": 0.00028022099304878754, + "loss": 0.0919, "step": 20430 }, { - "epoch": 0.22, - "learning_rate": 0.00026683756246349534, - "loss": 0.0818, + "epoch": 0.13, + "learning_rate": 0.0002802113116944306, + "loss": 0.095, "step": 20440 }, { - "epoch": 0.22, - "learning_rate": 0.00026682133817898626, - "loss": 0.082, + "epoch": 0.13, + "learning_rate": 0.00028020163034007364, + "loss": 0.0873, "step": 20450 }, { - "epoch": 0.22, - "learning_rate": 0.00026680511389447724, - "loss": 0.0874, + "epoch": 0.13, + "learning_rate": 0.0002801919489857167, + "loss": 0.0891, "step": 20460 }, { - "epoch": 0.22, - "learning_rate": 0.00026678888960996816, - "loss": 0.0714, + "epoch": 0.13, + "learning_rate": 0.0002801822676313598, + "loss": 0.081, "step": 20470 }, { - "epoch": 0.22, - "learning_rate": 0.0002667726653254591, - "loss": 0.0893, + "epoch": 0.13, + "learning_rate": 0.0002801725862770029, + "loss": 0.088, "step": 20480 }, { - "epoch": 0.22, - "learning_rate": 0.00026675644104095006, - "loss": 0.0721, + "epoch": 0.13, + "learning_rate": 0.00028016290492264596, + "loss": 0.0876, "step": 20490 }, { - "epoch": 0.22, - "learning_rate": 0.000266740216756441, - "loss": 0.0772, + "epoch": 0.13, + "learning_rate": 0.00028015322356828904, + "loss": 0.0932, "step": 20500 }, { - "epoch": 0.22, - "learning_rate": 0.00026672399247193196, - "loss": 0.0769, + "epoch": 0.13, + "learning_rate": 0.0002801435422139321, + "loss": 0.1059, "step": 20510 }, { - "epoch": 0.22, - "learning_rate": 0.0002667077681874229, - "loss": 0.0808, + "epoch": 0.13, + "learning_rate": 0.00028013386085957515, + "loss": 0.0906, "step": 20520 }, { - "epoch": 0.22, - "learning_rate": 0.00026669154390291386, - "loss": 0.0774, + "epoch": 0.13, + "learning_rate": 0.00028012417950521823, + "loss": 0.0893, "step": 20530 }, { - "epoch": 0.22, - "learning_rate": 0.0002666753196184048, - "loss": 0.0785, + "epoch": 0.13, + "learning_rate": 0.0002801144981508613, + "loss": 0.0891, "step": 20540 }, { - "epoch": 0.22, - "learning_rate": 0.00026665909533389576, - "loss": 0.0721, + "epoch": 0.13, + "learning_rate": 0.00028010481679650433, + "loss": 0.0956, "step": 20550 }, { - "epoch": 0.22, - "learning_rate": 0.0002666428710493867, - "loss": 0.0748, + "epoch": 0.13, + "learning_rate": 0.0002800951354421474, + "loss": 0.0828, "step": 20560 }, { - "epoch": 0.22, - "learning_rate": 0.00026662664676487766, - "loss": 0.0757, + "epoch": 0.13, + "learning_rate": 0.0002800854540877905, + "loss": 0.0866, "step": 20570 }, { - "epoch": 0.22, - "learning_rate": 0.0002666104224803686, - "loss": 0.072, + "epoch": 0.13, + "learning_rate": 0.0002800757727334336, + "loss": 0.0918, "step": 20580 }, { - "epoch": 0.22, - "learning_rate": 0.00026659419819585956, - "loss": 0.0826, + "epoch": 0.13, + "learning_rate": 0.0002800660913790766, + "loss": 0.0956, "step": 20590 }, { - "epoch": 0.22, - "learning_rate": 0.0002665779739113505, - "loss": 0.0853, + "epoch": 0.13, + "learning_rate": 0.0002800564100247197, + "loss": 0.1036, "step": 20600 }, { - "epoch": 0.22, - "learning_rate": 0.00026656174962684146, - "loss": 0.0728, + "epoch": 0.13, + "learning_rate": 0.00028004672867036276, + "loss": 0.0942, "step": 20610 }, { - "epoch": 0.22, - "learning_rate": 0.0002665455253423324, - "loss": 0.072, + "epoch": 0.13, + "learning_rate": 0.00028003704731600584, + "loss": 0.0904, "step": 20620 }, { - "epoch": 0.22, - "learning_rate": 0.0002665293010578233, - "loss": 0.0726, + "epoch": 0.13, + "learning_rate": 0.0002800273659616489, + "loss": 0.0893, "step": 20630 }, { - "epoch": 0.22, - "learning_rate": 0.0002665130767733143, - "loss": 0.0801, + "epoch": 0.13, + "learning_rate": 0.000280017684607292, + "loss": 0.0894, "step": 20640 }, { - "epoch": 0.22, - "learning_rate": 0.0002664968524888052, - "loss": 0.0839, + "epoch": 0.13, + "learning_rate": 0.0002800080032529351, + "loss": 0.0861, "step": 20650 }, { - "epoch": 0.22, - "learning_rate": 0.00026648062820429613, - "loss": 0.0825, + "epoch": 0.13, + "learning_rate": 0.0002799983218985781, + "loss": 0.0985, "step": 20660 }, { - "epoch": 0.22, - "learning_rate": 0.0002664644039197871, - "loss": 0.0776, + "epoch": 0.13, + "learning_rate": 0.0002799886405442212, + "loss": 0.0885, "step": 20670 }, { - "epoch": 0.22, - "learning_rate": 0.00026644817963527803, - "loss": 0.0739, + "epoch": 0.13, + "learning_rate": 0.00027997895918986426, + "loss": 0.0958, "step": 20680 }, { - "epoch": 0.22, - "learning_rate": 0.000266431955350769, - "loss": 0.0756, + "epoch": 0.13, + "learning_rate": 0.0002799692778355073, + "loss": 0.0909, "step": 20690 }, { - "epoch": 0.22, - "learning_rate": 0.00026641573106625993, - "loss": 0.0788, + "epoch": 0.13, + "learning_rate": 0.00027995959648115037, + "loss": 0.0896, "step": 20700 }, { - "epoch": 0.22, - "learning_rate": 0.0002663995067817509, - "loss": 0.087, + "epoch": 0.13, + "learning_rate": 0.00027994991512679345, + "loss": 0.0867, "step": 20710 }, { - "epoch": 0.22, - "learning_rate": 0.0002663832824972418, - "loss": 0.0834, + "epoch": 0.13, + "learning_rate": 0.00027994023377243653, + "loss": 0.0924, "step": 20720 }, { - "epoch": 0.22, - "learning_rate": 0.0002663670582127328, - "loss": 0.0855, + "epoch": 0.13, + "learning_rate": 0.00027993055241807955, + "loss": 0.0919, "step": 20730 }, { - "epoch": 0.22, - "learning_rate": 0.0002663508339282237, - "loss": 0.0904, + "epoch": 0.13, + "learning_rate": 0.00027992087106372263, + "loss": 0.0937, "step": 20740 }, { - "epoch": 0.22, - "learning_rate": 0.0002663346096437147, - "loss": 0.076, + "epoch": 0.13, + "learning_rate": 0.0002799111897093657, + "loss": 0.0841, "step": 20750 }, { - "epoch": 0.22, - "learning_rate": 0.0002663183853592056, - "loss": 0.082, + "epoch": 0.13, + "learning_rate": 0.0002799015083550088, + "loss": 0.0913, "step": 20760 }, { - "epoch": 0.22, - "learning_rate": 0.0002663021610746966, - "loss": 0.0729, + "epoch": 0.13, + "learning_rate": 0.00027989182700065187, + "loss": 0.0917, "step": 20770 }, { - "epoch": 0.22, - "learning_rate": 0.0002662859367901875, - "loss": 0.0777, + "epoch": 0.13, + "learning_rate": 0.00027988214564629495, + "loss": 0.0824, "step": 20780 }, { - "epoch": 0.22, - "learning_rate": 0.0002662697125056785, - "loss": 0.0724, + "epoch": 0.13, + "learning_rate": 0.000279872464291938, + "loss": 0.0915, "step": 20790 }, { - "epoch": 0.22, - "learning_rate": 0.0002662534882211694, - "loss": 0.0826, + "epoch": 0.13, + "learning_rate": 0.00027986278293758106, + "loss": 0.0903, "step": 20800 }, { - "epoch": 0.23, - "learning_rate": 0.00026623726393666035, - "loss": 0.0726, + "epoch": 0.13, + "learning_rate": 0.00027985310158322414, + "loss": 0.0961, "step": 20810 }, { - "epoch": 0.23, - "learning_rate": 0.0002662210396521513, - "loss": 0.0861, + "epoch": 0.13, + "learning_rate": 0.00027984342022886716, + "loss": 0.0852, "step": 20820 }, { - "epoch": 0.23, - "learning_rate": 0.00026620481536764225, - "loss": 0.073, + "epoch": 0.13, + "learning_rate": 0.00027983373887451024, + "loss": 0.0901, "step": 20830 }, { - "epoch": 0.23, - "learning_rate": 0.00026618859108313317, - "loss": 0.0703, + "epoch": 0.13, + "learning_rate": 0.0002798240575201533, + "loss": 0.0975, "step": 20840 }, { - "epoch": 0.23, - "learning_rate": 0.00026617236679862415, - "loss": 0.0781, + "epoch": 0.13, + "learning_rate": 0.0002798143761657964, + "loss": 0.1021, "step": 20850 }, { - "epoch": 0.23, - "learning_rate": 0.00026615614251411507, - "loss": 0.0681, + "epoch": 0.13, + "learning_rate": 0.0002798046948114395, + "loss": 0.0892, "step": 20860 }, { - "epoch": 0.23, - "learning_rate": 0.00026613991822960605, - "loss": 0.0856, + "epoch": 0.13, + "learning_rate": 0.0002797950134570825, + "loss": 0.0838, "step": 20870 }, { - "epoch": 0.23, - "learning_rate": 0.00026612369394509697, - "loss": 0.0858, + "epoch": 0.13, + "learning_rate": 0.0002797853321027256, + "loss": 0.0859, "step": 20880 }, { - "epoch": 0.23, - "learning_rate": 0.00026610746966058795, - "loss": 0.0839, + "epoch": 0.13, + "learning_rate": 0.00027977565074836867, + "loss": 0.0897, "step": 20890 }, { - "epoch": 0.23, - "learning_rate": 0.00026609124537607887, - "loss": 0.0917, + "epoch": 0.13, + "learning_rate": 0.00027976596939401175, + "loss": 0.0892, "step": 20900 }, { - "epoch": 0.23, - "learning_rate": 0.00026607502109156985, - "loss": 0.0867, + "epoch": 0.13, + "learning_rate": 0.00027975628803965483, + "loss": 0.0871, "step": 20910 }, { - "epoch": 0.23, - "learning_rate": 0.00026605879680706077, - "loss": 0.0681, + "epoch": 0.14, + "learning_rate": 0.0002797466066852979, + "loss": 0.085, "step": 20920 }, { - "epoch": 0.23, - "learning_rate": 0.00026604257252255175, - "loss": 0.0779, + "epoch": 0.14, + "learning_rate": 0.00027973692533094093, + "loss": 0.0877, "step": 20930 }, { - "epoch": 0.23, - "learning_rate": 0.00026602634823804267, - "loss": 0.0734, + "epoch": 0.14, + "learning_rate": 0.000279727243976584, + "loss": 0.0885, "step": 20940 }, { - "epoch": 0.23, - "learning_rate": 0.00026601012395353364, - "loss": 0.0874, + "epoch": 0.14, + "learning_rate": 0.00027971756262222704, + "loss": 0.0845, "step": 20950 }, { - "epoch": 0.23, - "learning_rate": 0.00026599389966902457, - "loss": 0.069, + "epoch": 0.14, + "learning_rate": 0.0002797078812678701, + "loss": 0.0914, "step": 20960 }, { - "epoch": 0.23, - "learning_rate": 0.00026597767538451554, - "loss": 0.0783, + "epoch": 0.14, + "learning_rate": 0.0002796981999135132, + "loss": 0.0927, "step": 20970 }, { - "epoch": 0.23, - "learning_rate": 0.00026596145110000647, - "loss": 0.0889, + "epoch": 0.14, + "learning_rate": 0.0002796885185591563, + "loss": 0.0908, "step": 20980 }, { - "epoch": 0.23, - "learning_rate": 0.0002659452268154974, - "loss": 0.0734, - "step": 20990 + "epoch": 0.14, + "learning_rate": 0.00027967883720479936, + "loss": 0.0919, + "step": 20990 }, { - "epoch": 0.23, - "learning_rate": 0.00026592900253098837, - "loss": 0.0684, + "epoch": 0.14, + "learning_rate": 0.00027966915585044244, + "loss": 0.0834, "step": 21000 }, { - "epoch": 0.23, - "eval_cer": 0.9213963999780896, - "eval_loss": 0.053616225719451904, - "eval_runtime": 119.4751, - "eval_samples_per_second": 16.74, - "eval_steps_per_second": 4.185, + "epoch": 0.14, + "eval_cer": 0.9202223477573156, + "eval_loss": 0.05823448300361633, + "eval_runtime": 120.3243, + "eval_samples_per_second": 16.622, + "eval_steps_per_second": 4.155, "step": 21000 }, { - "epoch": 0.23, - "learning_rate": 0.0002659127782464793, - "loss": 0.0817, + "epoch": 0.14, + "learning_rate": 0.00027965947449608546, + "loss": 0.0809, "step": 21010 }, { - "epoch": 0.23, - "learning_rate": 0.0002658965539619702, - "loss": 0.0782, + "epoch": 0.14, + "learning_rate": 0.00027964979314172854, + "loss": 0.0962, "step": 21020 }, { - "epoch": 0.23, - "learning_rate": 0.0002658803296774612, - "loss": 0.0735, + "epoch": 0.14, + "learning_rate": 0.0002796401117873716, + "loss": 0.0888, "step": 21030 }, { - "epoch": 0.23, - "learning_rate": 0.0002658641053929521, - "loss": 0.0729, + "epoch": 0.14, + "learning_rate": 0.0002796304304330147, + "loss": 0.1118, "step": 21040 }, { - "epoch": 0.23, - "learning_rate": 0.0002658478811084431, - "loss": 0.0763, + "epoch": 0.14, + "learning_rate": 0.0002796207490786578, + "loss": 0.0849, "step": 21050 }, { - "epoch": 0.23, - "learning_rate": 0.000265831656823934, - "loss": 0.0828, + "epoch": 0.14, + "learning_rate": 0.0002796110677243008, + "loss": 0.0872, "step": 21060 }, { - "epoch": 0.23, - "learning_rate": 0.000265815432539425, - "loss": 0.0758, + "epoch": 0.14, + "learning_rate": 0.0002796013863699439, + "loss": 0.0928, "step": 21070 }, { - "epoch": 0.23, - "learning_rate": 0.0002657992082549159, - "loss": 0.0788, + "epoch": 0.14, + "learning_rate": 0.00027959170501558697, + "loss": 0.0871, "step": 21080 }, { - "epoch": 0.23, - "learning_rate": 0.0002657829839704069, - "loss": 0.0772, + "epoch": 0.14, + "learning_rate": 0.00027958202366123, + "loss": 0.0832, "step": 21090 }, { - "epoch": 0.23, - "learning_rate": 0.0002657667596858978, - "loss": 0.0781, + "epoch": 0.14, + "learning_rate": 0.00027957234230687307, + "loss": 0.0811, "step": 21100 }, { - "epoch": 0.23, - "learning_rate": 0.0002657505354013888, - "loss": 0.0717, + "epoch": 0.14, + "learning_rate": 0.00027956266095251615, + "loss": 0.0977, "step": 21110 }, { - "epoch": 0.23, - "learning_rate": 0.00026573431111687976, - "loss": 0.0867, + "epoch": 0.14, + "learning_rate": 0.00027955297959815923, + "loss": 0.0911, "step": 21120 }, { - "epoch": 0.23, - "learning_rate": 0.0002657180868323707, - "loss": 0.086, + "epoch": 0.14, + "learning_rate": 0.0002795432982438023, + "loss": 0.0842, "step": 21130 }, { - "epoch": 0.23, - "learning_rate": 0.0002657018625478616, - "loss": 0.0754, + "epoch": 0.14, + "learning_rate": 0.0002795336168894454, + "loss": 0.0876, "step": 21140 }, { - "epoch": 0.23, - "learning_rate": 0.0002656856382633526, - "loss": 0.0747, + "epoch": 0.14, + "learning_rate": 0.0002795239355350884, + "loss": 0.0853, "step": 21150 }, { - "epoch": 0.23, - "learning_rate": 0.0002656694139788435, - "loss": 0.0853, + "epoch": 0.14, + "learning_rate": 0.0002795142541807315, + "loss": 0.0926, "step": 21160 }, { - "epoch": 0.23, - "learning_rate": 0.00026565318969433443, - "loss": 0.0834, + "epoch": 0.14, + "learning_rate": 0.0002795045728263746, + "loss": 0.0926, "step": 21170 }, { - "epoch": 0.23, - "learning_rate": 0.0002656369654098254, - "loss": 0.0713, + "epoch": 0.14, + "learning_rate": 0.00027949489147201766, + "loss": 0.0858, "step": 21180 }, { - "epoch": 0.23, - "learning_rate": 0.00026562074112531633, - "loss": 0.0846, + "epoch": 0.14, + "learning_rate": 0.0002794852101176607, + "loss": 0.0838, "step": 21190 }, { - "epoch": 0.23, - "learning_rate": 0.0002656045168408073, - "loss": 0.0779, + "epoch": 0.14, + "learning_rate": 0.00027947552876330376, + "loss": 0.0829, "step": 21200 }, { - "epoch": 0.23, - "learning_rate": 0.00026558829255629823, - "loss": 0.0849, + "epoch": 0.14, + "learning_rate": 0.00027946584740894684, + "loss": 0.0883, "step": 21210 }, { - "epoch": 0.23, - "learning_rate": 0.0002655720682717892, - "loss": 0.0879, + "epoch": 0.14, + "learning_rate": 0.00027945616605458987, + "loss": 0.0827, "step": 21220 }, { - "epoch": 0.23, - "learning_rate": 0.00026555584398728013, - "loss": 0.0791, + "epoch": 0.14, + "learning_rate": 0.00027944648470023295, + "loss": 0.0829, "step": 21230 }, { - "epoch": 0.23, - "learning_rate": 0.0002655396197027711, - "loss": 0.0756, + "epoch": 0.14, + "learning_rate": 0.000279436803345876, + "loss": 0.0826, "step": 21240 }, { - "epoch": 0.23, - "learning_rate": 0.00026552339541826203, - "loss": 0.0824, + "epoch": 0.14, + "learning_rate": 0.0002794271219915191, + "loss": 0.0762, "step": 21250 }, { - "epoch": 0.23, - "learning_rate": 0.000265507171133753, - "loss": 0.0818, + "epoch": 0.14, + "learning_rate": 0.0002794174406371622, + "loss": 0.0883, "step": 21260 }, { - "epoch": 0.23, - "learning_rate": 0.00026549094684924393, - "loss": 0.0836, + "epoch": 0.14, + "learning_rate": 0.00027940775928280527, + "loss": 0.095, "step": 21270 }, { - "epoch": 0.23, - "learning_rate": 0.0002654747225647349, - "loss": 0.0869, + "epoch": 0.14, + "learning_rate": 0.00027939807792844835, + "loss": 0.0813, "step": 21280 }, { - "epoch": 0.23, - "learning_rate": 0.00026545849828022583, - "loss": 0.0799, + "epoch": 0.14, + "learning_rate": 0.00027938839657409137, + "loss": 0.0904, "step": 21290 }, { - "epoch": 0.23, - "learning_rate": 0.0002654422739957168, - "loss": 0.0779, + "epoch": 0.14, + "learning_rate": 0.00027937871521973445, + "loss": 0.0799, "step": 21300 }, { - "epoch": 0.23, - "learning_rate": 0.00026542604971120773, - "loss": 0.0734, + "epoch": 0.14, + "learning_rate": 0.00027936903386537753, + "loss": 0.0824, "step": 21310 }, { - "epoch": 0.23, - "learning_rate": 0.00026540982542669865, - "loss": 0.0751, + "epoch": 0.14, + "learning_rate": 0.0002793593525110206, + "loss": 0.0868, "step": 21320 }, { - "epoch": 0.23, - "learning_rate": 0.00026539360114218963, - "loss": 0.0794, + "epoch": 0.14, + "learning_rate": 0.00027934967115666364, + "loss": 0.0898, "step": 21330 }, { - "epoch": 0.23, - "learning_rate": 0.00026537737685768055, - "loss": 0.0916, + "epoch": 0.14, + "learning_rate": 0.0002793399898023067, + "loss": 0.0923, "step": 21340 }, { - "epoch": 0.23, - "learning_rate": 0.00026536115257317147, - "loss": 0.0758, + "epoch": 0.14, + "learning_rate": 0.0002793303084479498, + "loss": 0.0995, "step": 21350 }, { - "epoch": 0.23, - "learning_rate": 0.00026534492828866245, - "loss": 0.0725, + "epoch": 0.14, + "learning_rate": 0.0002793206270935928, + "loss": 0.0846, "step": 21360 }, { - "epoch": 0.23, - "learning_rate": 0.00026532870400415337, - "loss": 0.0722, + "epoch": 0.14, + "learning_rate": 0.0002793109457392359, + "loss": 0.0831, "step": 21370 }, { - "epoch": 0.23, - "learning_rate": 0.00026531247971964435, - "loss": 0.0836, + "epoch": 0.14, + "learning_rate": 0.000279301264384879, + "loss": 0.0853, "step": 21380 }, { - "epoch": 0.23, - "learning_rate": 0.00026529625543513527, - "loss": 0.0838, + "epoch": 0.14, + "learning_rate": 0.00027929158303052206, + "loss": 0.0807, "step": 21390 }, { - "epoch": 0.23, - "learning_rate": 0.00026528003115062625, - "loss": 0.0784, + "epoch": 0.14, + "learning_rate": 0.00027928190167616514, + "loss": 0.0855, "step": 21400 }, { - "epoch": 0.23, - "learning_rate": 0.00026526380686611717, - "loss": 0.0732, + "epoch": 0.14, + "learning_rate": 0.0002792722203218082, + "loss": 0.0817, "step": 21410 }, { - "epoch": 0.23, - "learning_rate": 0.00026524758258160815, - "loss": 0.0694, + "epoch": 0.14, + "learning_rate": 0.0002792625389674513, + "loss": 0.0828, "step": 21420 }, { - "epoch": 0.23, - "learning_rate": 0.00026523135829709907, - "loss": 0.0736, + "epoch": 0.14, + "learning_rate": 0.0002792528576130943, + "loss": 0.079, "step": 21430 }, { - "epoch": 0.23, - "learning_rate": 0.00026521513401259005, - "loss": 0.0784, + "epoch": 0.14, + "learning_rate": 0.0002792431762587374, + "loss": 0.0984, "step": 21440 }, { - "epoch": 0.23, - "learning_rate": 0.00026519890972808097, - "loss": 0.0747, + "epoch": 0.14, + "learning_rate": 0.0002792334949043805, + "loss": 0.0875, "step": 21450 }, { - "epoch": 0.23, - "learning_rate": 0.00026518268544357195, - "loss": 0.0728, + "epoch": 0.14, + "learning_rate": 0.0002792238135500235, + "loss": 0.0795, "step": 21460 }, { - "epoch": 0.23, - "learning_rate": 0.00026516646115906287, - "loss": 0.0795, + "epoch": 0.14, + "learning_rate": 0.0002792141321956666, + "loss": 0.088, "step": 21470 }, { - "epoch": 0.23, - "learning_rate": 0.00026515023687455385, - "loss": 0.0772, + "epoch": 0.14, + "learning_rate": 0.00027920445084130967, + "loss": 0.0871, "step": 21480 }, { - "epoch": 0.23, - "learning_rate": 0.00026513401259004477, - "loss": 0.0714, + "epoch": 0.14, + "learning_rate": 0.00027919476948695275, + "loss": 0.0846, "step": 21490 }, { - "epoch": 0.23, - "learning_rate": 0.0002651177883055357, - "loss": 0.0764, + "epoch": 0.14, + "learning_rate": 0.0002791850881325958, + "loss": 0.0867, "step": 21500 }, { - "epoch": 0.23, - "learning_rate": 0.00026510156402102667, - "loss": 0.0844, + "epoch": 0.14, + "learning_rate": 0.00027917540677823886, + "loss": 0.0869, "step": 21510 }, { - "epoch": 0.23, - "learning_rate": 0.0002650853397365176, - "loss": 0.0767, + "epoch": 0.14, + "learning_rate": 0.00027916572542388194, + "loss": 0.082, "step": 21520 }, { - "epoch": 0.23, - "learning_rate": 0.0002650691154520085, - "loss": 0.0803, + "epoch": 0.14, + "learning_rate": 0.000279156044069525, + "loss": 0.0821, "step": 21530 }, { - "epoch": 0.23, - "learning_rate": 0.0002650528911674995, - "loss": 0.0702, + "epoch": 0.14, + "learning_rate": 0.0002791463627151681, + "loss": 0.0959, "step": 21540 }, { - "epoch": 0.23, - "learning_rate": 0.0002650366668829904, - "loss": 0.0709, + "epoch": 0.14, + "learning_rate": 0.0002791366813608112, + "loss": 0.0878, "step": 21550 }, { - "epoch": 0.23, - "learning_rate": 0.0002650204425984814, - "loss": 0.0767, + "epoch": 0.14, + "learning_rate": 0.0002791270000064542, + "loss": 0.0863, "step": 21560 }, { - "epoch": 0.23, - "learning_rate": 0.0002650042183139723, - "loss": 0.0797, + "epoch": 0.14, + "learning_rate": 0.0002791173186520973, + "loss": 0.0894, "step": 21570 }, { - "epoch": 0.23, - "learning_rate": 0.0002649879940294633, - "loss": 0.078, + "epoch": 0.14, + "learning_rate": 0.00027910763729774036, + "loss": 0.0915, "step": 21580 }, { - "epoch": 0.23, - "learning_rate": 0.0002649717697449542, - "loss": 0.0817, + "epoch": 0.14, + "learning_rate": 0.0002790979559433834, + "loss": 0.0836, "step": 21590 }, { - "epoch": 0.23, - "learning_rate": 0.0002649555454604452, - "loss": 0.0822, + "epoch": 0.14, + "learning_rate": 0.00027908827458902647, + "loss": 0.0846, "step": 21600 }, { - "epoch": 0.23, - "learning_rate": 0.0002649393211759361, - "loss": 0.0852, + "epoch": 0.14, + "learning_rate": 0.00027907859323466955, + "loss": 0.0864, "step": 21610 }, { - "epoch": 0.23, - "learning_rate": 0.0002649230968914271, - "loss": 0.0844, + "epoch": 0.14, + "learning_rate": 0.0002790689118803126, + "loss": 0.0886, "step": 21620 }, { - "epoch": 0.23, - "learning_rate": 0.000264906872606918, - "loss": 0.0737, + "epoch": 0.14, + "learning_rate": 0.0002790592305259557, + "loss": 0.0809, "step": 21630 }, { - "epoch": 0.23, - "learning_rate": 0.000264890648322409, - "loss": 0.0777, + "epoch": 0.14, + "learning_rate": 0.00027904954917159873, + "loss": 0.0842, "step": 21640 }, { - "epoch": 0.23, - "learning_rate": 0.0002648744240378999, - "loss": 0.0825, + "epoch": 0.14, + "learning_rate": 0.0002790398678172418, + "loss": 0.0854, "step": 21650 }, { - "epoch": 0.23, - "learning_rate": 0.0002648581997533909, - "loss": 0.0823, + "epoch": 0.14, + "learning_rate": 0.0002790301864628849, + "loss": 0.0841, "step": 21660 }, { - "epoch": 0.23, - "learning_rate": 0.0002648419754688818, - "loss": 0.0784, + "epoch": 0.14, + "learning_rate": 0.00027902050510852797, + "loss": 0.0806, "step": 21670 }, { - "epoch": 0.23, - "learning_rate": 0.00026482575118437273, - "loss": 0.0783, + "epoch": 0.14, + "learning_rate": 0.00027901082375417105, + "loss": 0.094, "step": 21680 }, { - "epoch": 0.23, - "learning_rate": 0.0002648095268998637, - "loss": 0.0731, + "epoch": 0.14, + "learning_rate": 0.00027900114239981413, + "loss": 0.0861, "step": 21690 }, { - "epoch": 0.23, - "learning_rate": 0.00026479330261535463, - "loss": 0.0776, + "epoch": 0.14, + "learning_rate": 0.00027899146104545716, + "loss": 0.0838, "step": 21700 }, { - "epoch": 0.23, - "learning_rate": 0.00026477707833084556, - "loss": 0.085, + "epoch": 0.14, + "learning_rate": 0.00027898177969110023, + "loss": 0.091, "step": 21710 }, { - "epoch": 0.23, - "learning_rate": 0.00026476085404633653, - "loss": 0.0726, + "epoch": 0.14, + "learning_rate": 0.0002789720983367433, + "loss": 0.0874, "step": 21720 }, { - "epoch": 0.24, - "learning_rate": 0.00026474462976182746, - "loss": 0.0802, + "epoch": 0.14, + "learning_rate": 0.00027896241698238634, + "loss": 0.0942, "step": 21730 }, { - "epoch": 0.24, - "learning_rate": 0.00026472840547731843, - "loss": 0.0807, + "epoch": 0.14, + "learning_rate": 0.0002789527356280294, + "loss": 0.0922, "step": 21740 }, { - "epoch": 0.24, - "learning_rate": 0.00026471218119280936, - "loss": 0.0786, + "epoch": 0.14, + "learning_rate": 0.0002789430542736725, + "loss": 0.0884, "step": 21750 }, { - "epoch": 0.24, - "learning_rate": 0.00026469595690830033, - "loss": 0.0822, + "epoch": 0.14, + "learning_rate": 0.0002789333729193156, + "loss": 0.0837, "step": 21760 }, { - "epoch": 0.24, - "learning_rate": 0.00026467973262379125, - "loss": 0.0906, + "epoch": 0.14, + "learning_rate": 0.00027892369156495866, + "loss": 0.0817, "step": 21770 }, { - "epoch": 0.24, - "learning_rate": 0.00026466350833928223, - "loss": 0.0782, + "epoch": 0.14, + "learning_rate": 0.0002789140102106017, + "loss": 0.0761, "step": 21780 }, { - "epoch": 0.24, - "learning_rate": 0.00026464728405477315, - "loss": 0.0952, + "epoch": 0.14, + "learning_rate": 0.00027890432885624476, + "loss": 0.0959, "step": 21790 }, { - "epoch": 0.24, - "learning_rate": 0.00026463105977026413, - "loss": 0.0848, + "epoch": 0.14, + "learning_rate": 0.00027889464750188784, + "loss": 0.0828, "step": 21800 }, { - "epoch": 0.24, - "learning_rate": 0.00026461483548575505, - "loss": 0.0791, + "epoch": 0.14, + "learning_rate": 0.0002788849661475309, + "loss": 0.0794, "step": 21810 }, { - "epoch": 0.24, - "learning_rate": 0.00026459861120124603, - "loss": 0.0764, + "epoch": 0.14, + "learning_rate": 0.000278875284793174, + "loss": 0.0823, "step": 21820 }, { - "epoch": 0.24, - "learning_rate": 0.00026458238691673695, - "loss": 0.0763, + "epoch": 0.14, + "learning_rate": 0.00027886560343881703, + "loss": 0.0945, "step": 21830 }, { - "epoch": 0.24, - "learning_rate": 0.00026456616263222793, - "loss": 0.0694, + "epoch": 0.14, + "learning_rate": 0.0002788559220844601, + "loss": 0.0778, "step": 21840 }, { - "epoch": 0.24, - "learning_rate": 0.00026454993834771885, - "loss": 0.0808, + "epoch": 0.14, + "learning_rate": 0.0002788462407301032, + "loss": 0.0832, "step": 21850 }, { - "epoch": 0.24, - "learning_rate": 0.0002645337140632098, - "loss": 0.0724, + "epoch": 0.14, + "learning_rate": 0.0002788365593757462, + "loss": 0.086, "step": 21860 }, { - "epoch": 0.24, - "learning_rate": 0.00026451748977870075, - "loss": 0.0878, + "epoch": 0.14, + "learning_rate": 0.0002788268780213893, + "loss": 0.0821, "step": 21870 }, { - "epoch": 0.24, - "learning_rate": 0.0002645012654941917, - "loss": 0.0743, + "epoch": 0.14, + "learning_rate": 0.0002788171966670324, + "loss": 0.0882, "step": 21880 }, { - "epoch": 0.24, - "learning_rate": 0.0002644850412096826, - "loss": 0.0784, + "epoch": 0.14, + "learning_rate": 0.00027880751531267545, + "loss": 0.0738, "step": 21890 }, { - "epoch": 0.24, - "learning_rate": 0.0002644688169251736, - "loss": 0.0821, + "epoch": 0.14, + "learning_rate": 0.00027879783395831853, + "loss": 0.083, "step": 21900 }, { - "epoch": 0.24, - "learning_rate": 0.0002644525926406645, + "epoch": 0.14, + "learning_rate": 0.0002787881526039616, "loss": 0.086, "step": 21910 }, { - "epoch": 0.24, - "learning_rate": 0.0002644363683561555, - "loss": 0.0805, + "epoch": 0.14, + "learning_rate": 0.00027877847124960464, + "loss": 0.0844, "step": 21920 }, { - "epoch": 0.24, - "learning_rate": 0.0002644201440716464, - "loss": 0.0754, + "epoch": 0.14, + "learning_rate": 0.0002787687898952477, + "loss": 0.0889, "step": 21930 }, { - "epoch": 0.24, - "learning_rate": 0.0002644039197871374, - "loss": 0.0682, + "epoch": 0.14, + "learning_rate": 0.0002787591085408908, + "loss": 0.0853, "step": 21940 }, { - "epoch": 0.24, - "learning_rate": 0.0002643876955026283, - "loss": 0.0766, + "epoch": 0.14, + "learning_rate": 0.0002787494271865339, + "loss": 0.0814, "step": 21950 }, { - "epoch": 0.24, - "learning_rate": 0.0002643714712181193, - "loss": 0.0782, + "epoch": 0.14, + "learning_rate": 0.0002787397458321769, + "loss": 0.0881, "step": 21960 }, { - "epoch": 0.24, - "learning_rate": 0.0002643552469336102, - "loss": 0.079, + "epoch": 0.14, + "learning_rate": 0.00027873006447782, + "loss": 0.0802, "step": 21970 }, { - "epoch": 0.24, - "learning_rate": 0.00026433902264910117, - "loss": 0.0777, + "epoch": 0.14, + "learning_rate": 0.00027872038312346306, + "loss": 0.0876, "step": 21980 }, { - "epoch": 0.24, - "learning_rate": 0.0002643227983645921, - "loss": 0.0823, + "epoch": 0.14, + "learning_rate": 0.0002787107017691061, + "loss": 0.1003, "step": 21990 }, { - "epoch": 0.24, - "learning_rate": 0.00026430657408008307, - "loss": 0.0789, + "epoch": 0.14, + "learning_rate": 0.00027870102041474917, + "loss": 0.0815, "step": 22000 }, { - "epoch": 0.24, - "eval_cer": 0.9213937495251272, - "eval_loss": 0.05299902334809303, - "eval_runtime": 119.4931, - "eval_samples_per_second": 16.737, - "eval_steps_per_second": 4.184, + "epoch": 0.14, + "eval_cer": 0.9202078861145633, + "eval_loss": 0.05837943032383919, + "eval_runtime": 120.4265, + "eval_samples_per_second": 16.608, + "eval_steps_per_second": 4.152, "step": 22000 }, { - "epoch": 0.24, - "learning_rate": 0.000264290349795574, - "loss": 0.0876, + "epoch": 0.14, + "learning_rate": 0.00027869133906039225, + "loss": 0.0908, "step": 22010 }, { - "epoch": 0.24, - "learning_rate": 0.00026427412551106497, - "loss": 0.0739, + "epoch": 0.14, + "learning_rate": 0.00027868165770603533, + "loss": 0.0827, "step": 22020 }, { - "epoch": 0.24, - "learning_rate": 0.0002642579012265559, - "loss": 0.0767, + "epoch": 0.14, + "learning_rate": 0.0002786719763516784, + "loss": 0.0863, "step": 22030 }, { - "epoch": 0.24, - "learning_rate": 0.0002642416769420468, - "loss": 0.075, + "epoch": 0.14, + "learning_rate": 0.0002786622949973215, + "loss": 0.0861, "step": 22040 }, { - "epoch": 0.24, - "learning_rate": 0.0002642254526575378, - "loss": 0.0737, + "epoch": 0.14, + "learning_rate": 0.00027865261364296457, + "loss": 0.0893, "step": 22050 }, { - "epoch": 0.24, - "learning_rate": 0.0002642092283730287, - "loss": 0.0668, + "epoch": 0.14, + "learning_rate": 0.0002786429322886076, + "loss": 0.0987, "step": 22060 }, { - "epoch": 0.24, - "learning_rate": 0.00026419300408851964, - "loss": 0.0823, + "epoch": 0.14, + "learning_rate": 0.0002786332509342507, + "loss": 0.0806, "step": 22070 }, { - "epoch": 0.24, - "learning_rate": 0.0002641767798040106, - "loss": 0.0818, + "epoch": 0.14, + "learning_rate": 0.00027862356957989375, + "loss": 0.0958, "step": 22080 }, { - "epoch": 0.24, - "learning_rate": 0.00026416055551950154, - "loss": 0.0752, + "epoch": 0.14, + "learning_rate": 0.00027861388822553683, + "loss": 0.0992, "step": 22090 }, { - "epoch": 0.24, - "learning_rate": 0.0002641443312349925, - "loss": 0.0883, + "epoch": 0.14, + "learning_rate": 0.00027860420687117986, + "loss": 0.0949, "step": 22100 }, { - "epoch": 0.24, - "learning_rate": 0.00026412810695048344, - "loss": 0.0765, + "epoch": 0.14, + "learning_rate": 0.00027859452551682294, + "loss": 0.0819, "step": 22110 }, { - "epoch": 0.24, - "learning_rate": 0.0002641118826659744, - "loss": 0.0901, + "epoch": 0.14, + "learning_rate": 0.000278584844162466, + "loss": 0.0935, "step": 22120 }, { - "epoch": 0.24, - "learning_rate": 0.00026409565838146534, - "loss": 0.0739, + "epoch": 0.14, + "learning_rate": 0.00027857516280810904, + "loss": 0.0851, "step": 22130 }, { - "epoch": 0.24, - "learning_rate": 0.0002640794340969563, - "loss": 0.0742, + "epoch": 0.14, + "learning_rate": 0.0002785654814537521, + "loss": 0.0844, "step": 22140 }, { - "epoch": 0.24, - "learning_rate": 0.00026406320981244724, - "loss": 0.0705, + "epoch": 0.14, + "learning_rate": 0.0002785558000993952, + "loss": 0.0854, "step": 22150 }, { - "epoch": 0.24, - "learning_rate": 0.0002640469855279382, - "loss": 0.0716, + "epoch": 0.14, + "learning_rate": 0.0002785461187450383, + "loss": 0.079, "step": 22160 }, { - "epoch": 0.24, - "learning_rate": 0.00026403076124342914, - "loss": 0.0777, + "epoch": 0.14, + "learning_rate": 0.00027853643739068136, + "loss": 0.0878, "step": 22170 }, { - "epoch": 0.24, - "learning_rate": 0.0002640145369589201, - "loss": 0.0707, + "epoch": 0.14, + "learning_rate": 0.00027852675603632444, + "loss": 0.0863, "step": 22180 }, { - "epoch": 0.24, - "learning_rate": 0.00026399831267441104, - "loss": 0.076, + "epoch": 0.14, + "learning_rate": 0.0002785170746819675, + "loss": 0.0834, "step": 22190 }, { - "epoch": 0.24, - "learning_rate": 0.000263982088389902, - "loss": 0.0703, + "epoch": 0.14, + "learning_rate": 0.00027850739332761055, + "loss": 0.0865, "step": 22200 }, { - "epoch": 0.24, - "learning_rate": 0.00026396586410539294, - "loss": 0.0745, + "epoch": 0.14, + "learning_rate": 0.00027849771197325363, + "loss": 0.0854, "step": 22210 }, { - "epoch": 0.24, - "learning_rate": 0.00026394963982088386, - "loss": 0.0756, + "epoch": 0.14, + "learning_rate": 0.0002784880306188967, + "loss": 0.0752, "step": 22220 }, { - "epoch": 0.24, - "learning_rate": 0.00026393341553637484, - "loss": 0.0806, + "epoch": 0.14, + "learning_rate": 0.00027847834926453973, + "loss": 0.0943, "step": 22230 }, { - "epoch": 0.24, - "learning_rate": 0.00026391719125186576, - "loss": 0.0739, + "epoch": 0.14, + "learning_rate": 0.0002784686679101828, + "loss": 0.0914, "step": 22240 }, { - "epoch": 0.24, - "learning_rate": 0.00026390096696735674, - "loss": 0.0805, + "epoch": 0.14, + "learning_rate": 0.0002784589865558259, + "loss": 0.0916, "step": 22250 }, { - "epoch": 0.24, - "learning_rate": 0.00026388474268284766, - "loss": 0.0761, + "epoch": 0.14, + "learning_rate": 0.00027844930520146897, + "loss": 0.0776, "step": 22260 }, { - "epoch": 0.24, - "learning_rate": 0.0002638685183983386, - "loss": 0.0867, + "epoch": 0.14, + "learning_rate": 0.000278439623847112, + "loss": 0.0932, "step": 22270 }, { - "epoch": 0.24, - "learning_rate": 0.00026385229411382956, - "loss": 0.0748, + "epoch": 0.14, + "learning_rate": 0.0002784299424927551, + "loss": 0.0895, "step": 22280 }, { - "epoch": 0.24, - "learning_rate": 0.0002638360698293205, - "loss": 0.071, + "epoch": 0.14, + "learning_rate": 0.00027842026113839816, + "loss": 0.0972, "step": 22290 }, { - "epoch": 0.24, - "learning_rate": 0.00026381984554481146, - "loss": 0.0756, + "epoch": 0.14, + "learning_rate": 0.00027841057978404124, + "loss": 0.0865, "step": 22300 }, { - "epoch": 0.24, - "learning_rate": 0.0002638036212603024, - "loss": 0.0749, + "epoch": 0.14, + "learning_rate": 0.0002784008984296843, + "loss": 0.0883, "step": 22310 }, { - "epoch": 0.24, - "learning_rate": 0.00026378739697579336, - "loss": 0.0711, + "epoch": 0.14, + "learning_rate": 0.0002783912170753274, + "loss": 0.0872, "step": 22320 }, { - "epoch": 0.24, - "learning_rate": 0.0002637711726912843, - "loss": 0.075, + "epoch": 0.14, + "learning_rate": 0.0002783815357209704, + "loss": 0.1006, "step": 22330 }, { - "epoch": 0.24, - "learning_rate": 0.00026375494840677526, - "loss": 0.0738, + "epoch": 0.14, + "learning_rate": 0.0002783718543666135, + "loss": 0.0807, "step": 22340 }, { - "epoch": 0.24, - "learning_rate": 0.0002637387241222662, - "loss": 0.072, + "epoch": 0.14, + "learning_rate": 0.0002783621730122566, + "loss": 0.0862, "step": 22350 }, { - "epoch": 0.24, - "learning_rate": 0.00026372249983775716, - "loss": 0.0764, + "epoch": 0.14, + "learning_rate": 0.0002783524916578996, + "loss": 0.091, "step": 22360 }, { - "epoch": 0.24, - "learning_rate": 0.0002637062755532481, - "loss": 0.0662, + "epoch": 0.14, + "learning_rate": 0.0002783428103035427, + "loss": 0.0831, "step": 22370 }, { - "epoch": 0.24, - "learning_rate": 0.00026369005126873906, - "loss": 0.0786, + "epoch": 0.14, + "learning_rate": 0.00027833312894918577, + "loss": 0.0741, "step": 22380 }, { - "epoch": 0.24, - "learning_rate": 0.00026367382698423, - "loss": 0.0721, + "epoch": 0.14, + "learning_rate": 0.00027832344759482885, + "loss": 0.0913, "step": 22390 }, { - "epoch": 0.24, - "learning_rate": 0.0002636576026997209, - "loss": 0.084, + "epoch": 0.14, + "learning_rate": 0.00027831376624047193, + "loss": 0.0852, "step": 22400 }, { - "epoch": 0.24, - "learning_rate": 0.0002636413784152119, - "loss": 0.0744, + "epoch": 0.14, + "learning_rate": 0.00027830408488611495, + "loss": 0.0787, "step": 22410 }, { - "epoch": 0.24, - "learning_rate": 0.0002636251541307028, - "loss": 0.0695, + "epoch": 0.14, + "learning_rate": 0.00027829440353175803, + "loss": 0.0924, "step": 22420 }, { - "epoch": 0.24, - "learning_rate": 0.0002636089298461938, - "loss": 0.0798, + "epoch": 0.14, + "learning_rate": 0.0002782847221774011, + "loss": 0.0769, "step": 22430 }, { - "epoch": 0.24, - "learning_rate": 0.0002635927055616847, - "loss": 0.0717, + "epoch": 0.14, + "learning_rate": 0.0002782750408230442, + "loss": 0.0869, "step": 22440 }, { - "epoch": 0.24, - "learning_rate": 0.0002635764812771756, - "loss": 0.0798, + "epoch": 0.14, + "learning_rate": 0.00027826535946868727, + "loss": 0.0888, "step": 22450 }, { - "epoch": 0.24, - "learning_rate": 0.0002635602569926666, - "loss": 0.0737, + "epoch": 0.14, + "learning_rate": 0.00027825567811433035, + "loss": 0.0938, "step": 22460 }, { - "epoch": 0.24, - "learning_rate": 0.0002635440327081575, - "loss": 0.075, + "epoch": 0.15, + "learning_rate": 0.0002782459967599734, + "loss": 0.0889, "step": 22470 }, { - "epoch": 0.24, - "learning_rate": 0.0002635278084236485, - "loss": 0.0771, + "epoch": 0.15, + "learning_rate": 0.00027823631540561646, + "loss": 0.0837, "step": 22480 }, { - "epoch": 0.24, - "learning_rate": 0.0002635115841391394, - "loss": 0.0767, + "epoch": 0.15, + "learning_rate": 0.00027822663405125954, + "loss": 0.0864, "step": 22490 }, { - "epoch": 0.24, - "learning_rate": 0.0002634953598546304, - "loss": 0.0752, + "epoch": 0.15, + "learning_rate": 0.00027821695269690256, + "loss": 0.0951, "step": 22500 }, { - "epoch": 0.24, - "learning_rate": 0.0002634791355701213, - "loss": 0.0791, + "epoch": 0.15, + "learning_rate": 0.00027820727134254564, + "loss": 0.0865, "step": 22510 }, { - "epoch": 0.24, - "learning_rate": 0.0002634629112856123, - "loss": 0.0794, + "epoch": 0.15, + "learning_rate": 0.0002781975899881887, + "loss": 0.0865, "step": 22520 }, { - "epoch": 0.24, - "learning_rate": 0.0002634466870011032, - "loss": 0.0664, + "epoch": 0.15, + "learning_rate": 0.0002781879086338318, + "loss": 0.085, "step": 22530 }, { - "epoch": 0.24, - "learning_rate": 0.0002634304627165942, - "loss": 0.0804, + "epoch": 0.15, + "learning_rate": 0.0002781782272794749, + "loss": 0.0851, "step": 22540 }, { - "epoch": 0.24, - "learning_rate": 0.0002634142384320851, - "loss": 0.0865, + "epoch": 0.15, + "learning_rate": 0.0002781685459251179, + "loss": 0.0882, "step": 22550 }, { - "epoch": 0.24, - "learning_rate": 0.0002633980141475761, - "loss": 0.0827, + "epoch": 0.15, + "learning_rate": 0.000278158864570761, + "loss": 0.0921, "step": 22560 }, { - "epoch": 0.24, - "learning_rate": 0.000263381789863067, - "loss": 0.0723, + "epoch": 0.15, + "learning_rate": 0.00027814918321640407, + "loss": 0.0955, "step": 22570 }, { - "epoch": 0.24, - "learning_rate": 0.00026336556557855794, - "loss": 0.0821, + "epoch": 0.15, + "learning_rate": 0.00027813950186204715, + "loss": 0.0897, "step": 22580 }, { - "epoch": 0.24, - "learning_rate": 0.0002633493412940489, - "loss": 0.0897, + "epoch": 0.15, + "learning_rate": 0.0002781298205076902, + "loss": 0.0882, "step": 22590 }, { - "epoch": 0.24, - "learning_rate": 0.00026333311700953984, - "loss": 0.0923, + "epoch": 0.15, + "learning_rate": 0.00027812013915333325, + "loss": 0.0851, "step": 22600 }, { - "epoch": 0.24, - "learning_rate": 0.0002633168927250308, - "loss": 0.0765, + "epoch": 0.15, + "learning_rate": 0.00027811045779897633, + "loss": 0.0875, "step": 22610 }, { - "epoch": 0.24, - "learning_rate": 0.00026330066844052174, - "loss": 0.075, + "epoch": 0.15, + "learning_rate": 0.0002781007764446194, + "loss": 0.0901, "step": 22620 }, { - "epoch": 0.24, - "learning_rate": 0.00026328444415601266, - "loss": 0.0732, + "epoch": 0.15, + "learning_rate": 0.00027809109509026244, + "loss": 0.0803, "step": 22630 }, { - "epoch": 0.24, - "learning_rate": 0.00026326821987150364, - "loss": 0.0767, + "epoch": 0.15, + "learning_rate": 0.0002780814137359055, + "loss": 0.0953, "step": 22640 }, { - "epoch": 0.24, - "learning_rate": 0.00026325199558699456, - "loss": 0.0776, + "epoch": 0.15, + "learning_rate": 0.0002780717323815486, + "loss": 0.0928, "step": 22650 }, { - "epoch": 0.25, - "learning_rate": 0.00026323577130248554, - "loss": 0.0806, + "epoch": 0.15, + "learning_rate": 0.0002780620510271917, + "loss": 0.0852, "step": 22660 }, { - "epoch": 0.25, - "learning_rate": 0.00026321954701797646, - "loss": 0.0769, + "epoch": 0.15, + "learning_rate": 0.00027805236967283476, + "loss": 0.0895, "step": 22670 }, { - "epoch": 0.25, - "learning_rate": 0.00026320332273346744, - "loss": 0.075, + "epoch": 0.15, + "learning_rate": 0.00027804268831847784, + "loss": 0.0824, "step": 22680 }, { - "epoch": 0.25, - "learning_rate": 0.00026318709844895836, - "loss": 0.0814, + "epoch": 0.15, + "learning_rate": 0.00027803300696412086, + "loss": 0.0882, "step": 22690 }, { - "epoch": 0.25, - "learning_rate": 0.00026317087416444934, - "loss": 0.0702, + "epoch": 0.15, + "learning_rate": 0.00027802332560976394, + "loss": 0.0834, "step": 22700 }, { - "epoch": 0.25, - "learning_rate": 0.00026315464987994026, - "loss": 0.0754, + "epoch": 0.15, + "learning_rate": 0.000278013644255407, + "loss": 0.0839, "step": 22710 }, { - "epoch": 0.25, - "learning_rate": 0.00026313842559543124, - "loss": 0.0815, + "epoch": 0.15, + "learning_rate": 0.0002780039629010501, + "loss": 0.0845, "step": 22720 }, { - "epoch": 0.25, - "learning_rate": 0.00026312220131092216, - "loss": 0.0777, + "epoch": 0.15, + "learning_rate": 0.0002779942815466932, + "loss": 0.0868, "step": 22730 }, { - "epoch": 0.25, - "learning_rate": 0.00026310597702641314, - "loss": 0.0759, + "epoch": 0.15, + "learning_rate": 0.0002779846001923362, + "loss": 0.0835, "step": 22740 }, { - "epoch": 0.25, - "learning_rate": 0.00026308975274190406, - "loss": 0.0693, + "epoch": 0.15, + "learning_rate": 0.0002779749188379793, + "loss": 0.0873, "step": 22750 }, { - "epoch": 0.25, - "learning_rate": 0.000263073528457395, - "loss": 0.0807, + "epoch": 0.15, + "learning_rate": 0.0002779652374836223, + "loss": 0.0964, "step": 22760 }, { - "epoch": 0.25, - "learning_rate": 0.00026305730417288596, - "loss": 0.077, + "epoch": 0.15, + "learning_rate": 0.0002779555561292654, + "loss": 0.0862, "step": 22770 }, { - "epoch": 0.25, - "learning_rate": 0.0002630410798883769, - "loss": 0.0756, + "epoch": 0.15, + "learning_rate": 0.00027794587477490847, + "loss": 0.0854, "step": 22780 }, { - "epoch": 0.25, - "learning_rate": 0.00026302485560386786, - "loss": 0.0706, + "epoch": 0.15, + "learning_rate": 0.00027793619342055155, + "loss": 0.0942, "step": 22790 }, { - "epoch": 0.25, - "learning_rate": 0.0002630086313193588, - "loss": 0.0751, + "epoch": 0.15, + "learning_rate": 0.00027792651206619463, + "loss": 0.0959, "step": 22800 }, { - "epoch": 0.25, - "learning_rate": 0.0002629924070348497, - "loss": 0.0791, + "epoch": 0.15, + "learning_rate": 0.0002779168307118377, + "loss": 0.0846, "step": 22810 }, { - "epoch": 0.25, - "learning_rate": 0.0002629761827503407, - "loss": 0.0737, + "epoch": 0.15, + "learning_rate": 0.0002779071493574808, + "loss": 0.083, "step": 22820 }, { - "epoch": 0.25, - "learning_rate": 0.0002629599584658316, - "loss": 0.0777, + "epoch": 0.15, + "learning_rate": 0.0002778974680031238, + "loss": 0.091, "step": 22830 }, { - "epoch": 0.25, - "learning_rate": 0.0002629437341813226, - "loss": 0.0804, + "epoch": 0.15, + "learning_rate": 0.0002778877866487669, + "loss": 0.0762, "step": 22840 }, { - "epoch": 0.25, - "learning_rate": 0.0002629275098968135, - "loss": 0.0739, + "epoch": 0.15, + "learning_rate": 0.00027787810529441, + "loss": 0.0788, "step": 22850 }, { - "epoch": 0.25, - "learning_rate": 0.0002629112856123045, - "loss": 0.0774, + "epoch": 0.15, + "learning_rate": 0.00027786842394005306, + "loss": 0.0962, "step": 22860 }, { - "epoch": 0.25, - "learning_rate": 0.0002628950613277954, - "loss": 0.0748, + "epoch": 0.15, + "learning_rate": 0.0002778587425856961, + "loss": 0.0805, "step": 22870 }, { - "epoch": 0.25, - "learning_rate": 0.0002628788370432864, - "loss": 0.071, + "epoch": 0.15, + "learning_rate": 0.00027784906123133916, + "loss": 0.0905, "step": 22880 }, { - "epoch": 0.25, - "learning_rate": 0.0002628626127587773, - "loss": 0.0694, + "epoch": 0.15, + "learning_rate": 0.00027783937987698224, + "loss": 0.0842, "step": 22890 }, { - "epoch": 0.25, - "learning_rate": 0.0002628463884742683, - "loss": 0.0779, + "epoch": 0.15, + "learning_rate": 0.00027782969852262527, + "loss": 0.0782, "step": 22900 }, { - "epoch": 0.25, - "learning_rate": 0.0002628301641897592, - "loss": 0.0904, + "epoch": 0.15, + "learning_rate": 0.00027782001716826835, + "loss": 0.0891, "step": 22910 }, { - "epoch": 0.25, - "learning_rate": 0.0002628139399052502, - "loss": 0.0732, + "epoch": 0.15, + "learning_rate": 0.0002778103358139114, + "loss": 0.0791, "step": 22920 }, { - "epoch": 0.25, - "learning_rate": 0.0002627977156207411, - "loss": 0.0808, + "epoch": 0.15, + "learning_rate": 0.0002778006544595545, + "loss": 0.0859, "step": 22930 }, { - "epoch": 0.25, - "learning_rate": 0.0002627814913362321, - "loss": 0.0681, + "epoch": 0.15, + "learning_rate": 0.0002777909731051976, + "loss": 0.0843, "step": 22940 }, { - "epoch": 0.25, - "learning_rate": 0.000262765267051723, - "loss": 0.0794, + "epoch": 0.15, + "learning_rate": 0.00027778129175084067, + "loss": 0.0767, "step": 22950 }, { - "epoch": 0.25, - "learning_rate": 0.0002627490427672139, - "loss": 0.0777, + "epoch": 0.15, + "learning_rate": 0.00027777161039648375, + "loss": 0.0834, "step": 22960 }, { - "epoch": 0.25, - "learning_rate": 0.0002627328184827049, - "loss": 0.0738, + "epoch": 0.15, + "learning_rate": 0.00027776192904212677, + "loss": 0.0858, "step": 22970 }, { - "epoch": 0.25, - "learning_rate": 0.0002627165941981958, - "loss": 0.0755, + "epoch": 0.15, + "learning_rate": 0.00027775224768776985, + "loss": 0.0829, "step": 22980 }, { - "epoch": 0.25, - "learning_rate": 0.00026270036991368675, - "loss": 0.085, + "epoch": 0.15, + "learning_rate": 0.00027774256633341293, + "loss": 0.096, "step": 22990 }, { - "epoch": 0.25, - "learning_rate": 0.0002626841456291777, - "loss": 0.088, + "epoch": 0.15, + "learning_rate": 0.00027773288497905596, + "loss": 0.0801, "step": 23000 }, { - "epoch": 0.25, - "eval_cer": 0.9214856318944907, - "eval_loss": 0.052428290247917175, - "eval_runtime": 119.4918, - "eval_samples_per_second": 16.738, - "eval_steps_per_second": 4.184, + "epoch": 0.15, + "eval_cer": 0.9202295785786917, + "eval_loss": 0.06064927205443382, + "eval_runtime": 120.4894, + "eval_samples_per_second": 16.599, + "eval_steps_per_second": 4.15, "step": 23000 }, { - "epoch": 0.25, - "learning_rate": 0.00026266792134466865, - "loss": 0.0769, + "epoch": 0.15, + "learning_rate": 0.00027772320362469904, + "loss": 0.0825, "step": 23010 }, { - "epoch": 0.25, - "learning_rate": 0.0002626516970601596, - "loss": 0.0814, + "epoch": 0.15, + "learning_rate": 0.0002777135222703421, + "loss": 0.0786, "step": 23020 }, { - "epoch": 0.25, - "learning_rate": 0.00026263547277565055, - "loss": 0.0733, + "epoch": 0.15, + "learning_rate": 0.0002777038409159852, + "loss": 0.0859, "step": 23030 }, { - "epoch": 0.25, - "learning_rate": 0.0002626192484911415, - "loss": 0.0729, + "epoch": 0.15, + "learning_rate": 0.0002776941595616282, + "loss": 0.0909, "step": 23040 }, { - "epoch": 0.25, - "learning_rate": 0.00026260302420663245, - "loss": 0.076, + "epoch": 0.15, + "learning_rate": 0.0002776844782072713, + "loss": 0.0806, "step": 23050 }, { - "epoch": 0.25, - "learning_rate": 0.0002625867999221234, - "loss": 0.0886, + "epoch": 0.15, + "learning_rate": 0.0002776747968529144, + "loss": 0.0754, "step": 23060 }, { - "epoch": 0.25, - "learning_rate": 0.00026257057563761435, - "loss": 0.0811, + "epoch": 0.15, + "learning_rate": 0.00027766511549855746, + "loss": 0.0807, "step": 23070 }, { - "epoch": 0.25, - "learning_rate": 0.0002625543513531053, - "loss": 0.0702, + "epoch": 0.15, + "learning_rate": 0.00027765543414420054, + "loss": 0.0853, "step": 23080 }, { - "epoch": 0.25, - "learning_rate": 0.00026253812706859625, - "loss": 0.0745, + "epoch": 0.15, + "learning_rate": 0.0002776457527898436, + "loss": 0.0819, "step": 23090 }, { - "epoch": 0.25, - "learning_rate": 0.0002625219027840872, - "loss": 0.0833, + "epoch": 0.15, + "learning_rate": 0.0002776360714354867, + "loss": 0.0742, "step": 23100 }, { - "epoch": 0.25, - "learning_rate": 0.00026250567849957814, - "loss": 0.0722, + "epoch": 0.15, + "learning_rate": 0.0002776263900811297, + "loss": 0.0853, "step": 23110 }, { - "epoch": 0.25, - "learning_rate": 0.0002624894542150691, - "loss": 0.0739, + "epoch": 0.15, + "learning_rate": 0.0002776167087267728, + "loss": 0.0893, "step": 23120 }, { - "epoch": 0.25, - "learning_rate": 0.00026247322993056004, - "loss": 0.0757, + "epoch": 0.15, + "learning_rate": 0.0002776070273724159, + "loss": 0.0786, "step": 23130 }, { - "epoch": 0.25, - "learning_rate": 0.00026245700564605097, - "loss": 0.0695, + "epoch": 0.15, + "learning_rate": 0.0002775973460180589, + "loss": 0.0899, "step": 23140 }, { - "epoch": 0.25, - "learning_rate": 0.00026244078136154194, - "loss": 0.0825, + "epoch": 0.15, + "learning_rate": 0.000277587664663702, + "loss": 0.0777, "step": 23150 }, { - "epoch": 0.25, - "learning_rate": 0.00026242455707703287, - "loss": 0.066, + "epoch": 0.15, + "learning_rate": 0.00027757798330934507, + "loss": 0.0835, "step": 23160 }, { - "epoch": 0.25, - "learning_rate": 0.0002624083327925238, - "loss": 0.0892, + "epoch": 0.15, + "learning_rate": 0.00027756830195498815, + "loss": 0.0871, "step": 23170 }, { - "epoch": 0.25, - "learning_rate": 0.00026239210850801477, - "loss": 0.0815, + "epoch": 0.15, + "learning_rate": 0.0002775586206006312, + "loss": 0.084, "step": 23180 }, { - "epoch": 0.25, - "learning_rate": 0.0002623758842235057, - "loss": 0.0775, + "epoch": 0.15, + "learning_rate": 0.00027754893924627426, + "loss": 0.0844, "step": 23190 }, { - "epoch": 0.25, - "learning_rate": 0.00026235965993899667, - "loss": 0.0795, + "epoch": 0.15, + "learning_rate": 0.00027753925789191733, + "loss": 0.0889, "step": 23200 }, { - "epoch": 0.25, - "learning_rate": 0.0002623434356544876, - "loss": 0.0745, + "epoch": 0.15, + "learning_rate": 0.0002775295765375604, + "loss": 0.0907, "step": 23210 }, { - "epoch": 0.25, - "learning_rate": 0.00026232721136997856, - "loss": 0.0748, + "epoch": 0.15, + "learning_rate": 0.0002775198951832035, + "loss": 0.0862, "step": 23220 }, { - "epoch": 0.25, - "learning_rate": 0.0002623109870854695, - "loss": 0.0688, + "epoch": 0.15, + "learning_rate": 0.0002775102138288466, + "loss": 0.0866, "step": 23230 }, { - "epoch": 0.25, - "learning_rate": 0.00026229476280096046, - "loss": 0.0798, + "epoch": 0.15, + "learning_rate": 0.0002775005324744896, + "loss": 0.0837, "step": 23240 }, { - "epoch": 0.25, - "learning_rate": 0.0002622785385164514, - "loss": 0.0801, + "epoch": 0.15, + "learning_rate": 0.0002774908511201327, + "loss": 0.0837, "step": 23250 }, { - "epoch": 0.25, - "learning_rate": 0.00026226231423194236, - "loss": 0.0833, + "epoch": 0.15, + "learning_rate": 0.00027748116976577576, + "loss": 0.0831, "step": 23260 }, { - "epoch": 0.25, - "learning_rate": 0.0002622460899474333, - "loss": 0.0803, + "epoch": 0.15, + "learning_rate": 0.0002774714884114188, + "loss": 0.0838, "step": 23270 }, { - "epoch": 0.25, - "learning_rate": 0.00026222986566292426, - "loss": 0.0798, + "epoch": 0.15, + "learning_rate": 0.00027746180705706186, + "loss": 0.084, "step": 23280 }, { - "epoch": 0.25, - "learning_rate": 0.0002622136413784152, - "loss": 0.071, + "epoch": 0.15, + "learning_rate": 0.00027745212570270494, + "loss": 0.0949, "step": 23290 }, { - "epoch": 0.25, - "learning_rate": 0.00026219741709390616, - "loss": 0.0816, + "epoch": 0.15, + "learning_rate": 0.000277442444348348, + "loss": 0.0867, "step": 23300 }, { - "epoch": 0.25, - "learning_rate": 0.0002621811928093971, - "loss": 0.0781, + "epoch": 0.15, + "learning_rate": 0.0002774327629939911, + "loss": 0.0979, "step": 23310 }, { - "epoch": 0.25, - "learning_rate": 0.000262164968524888, - "loss": 0.0805, + "epoch": 0.15, + "learning_rate": 0.00027742308163963413, + "loss": 0.0777, "step": 23320 }, { - "epoch": 0.25, - "learning_rate": 0.000262148744240379, - "loss": 0.077, + "epoch": 0.15, + "learning_rate": 0.0002774134002852772, + "loss": 0.0789, "step": 23330 }, { - "epoch": 0.25, - "learning_rate": 0.0002621325199558699, - "loss": 0.074, + "epoch": 0.15, + "learning_rate": 0.0002774037189309203, + "loss": 0.0872, "step": 23340 }, { - "epoch": 0.25, - "learning_rate": 0.00026211629567136083, - "loss": 0.0779, + "epoch": 0.15, + "learning_rate": 0.00027739403757656337, + "loss": 0.0829, "step": 23350 }, { - "epoch": 0.25, - "learning_rate": 0.0002621000713868518, - "loss": 0.0756, + "epoch": 0.15, + "learning_rate": 0.00027738435622220645, + "loss": 0.0835, "step": 23360 }, { - "epoch": 0.25, - "learning_rate": 0.00026208384710234273, - "loss": 0.0748, + "epoch": 0.15, + "learning_rate": 0.0002773746748678495, + "loss": 0.087, "step": 23370 }, { - "epoch": 0.25, - "learning_rate": 0.0002620676228178337, - "loss": 0.0759, + "epoch": 0.15, + "learning_rate": 0.00027736499351349255, + "loss": 0.1009, "step": 23380 }, { - "epoch": 0.25, - "learning_rate": 0.00026205139853332463, - "loss": 0.0777, + "epoch": 0.15, + "learning_rate": 0.00027735531215913563, + "loss": 0.09, "step": 23390 }, { - "epoch": 0.25, - "learning_rate": 0.0002620351742488156, - "loss": 0.0694, + "epoch": 0.15, + "learning_rate": 0.00027734563080477866, + "loss": 0.0763, "step": 23400 }, { - "epoch": 0.25, - "learning_rate": 0.00026201894996430653, - "loss": 0.0839, + "epoch": 0.15, + "learning_rate": 0.00027733594945042174, + "loss": 0.0835, "step": 23410 }, { - "epoch": 0.25, - "learning_rate": 0.0002620027256797975, - "loss": 0.0758, + "epoch": 0.15, + "learning_rate": 0.0002773262680960648, + "loss": 0.0953, "step": 23420 }, { - "epoch": 0.25, - "learning_rate": 0.00026198650139528843, - "loss": 0.0763, + "epoch": 0.15, + "learning_rate": 0.0002773165867417079, + "loss": 0.0795, "step": 23430 }, { - "epoch": 0.25, - "learning_rate": 0.0002619702771107794, - "loss": 0.0712, + "epoch": 0.15, + "learning_rate": 0.000277306905387351, + "loss": 0.0847, "step": 23440 }, { - "epoch": 0.25, - "learning_rate": 0.00026195405282627033, - "loss": 0.0726, + "epoch": 0.15, + "learning_rate": 0.00027729722403299406, + "loss": 0.084, "step": 23450 }, { - "epoch": 0.25, - "learning_rate": 0.0002619378285417613, - "loss": 0.079, + "epoch": 0.15, + "learning_rate": 0.0002772875426786371, + "loss": 0.0885, "step": 23460 }, { - "epoch": 0.25, - "learning_rate": 0.00026192160425725223, - "loss": 0.0702, + "epoch": 0.15, + "learning_rate": 0.00027727786132428016, + "loss": 0.0782, "step": 23470 }, { - "epoch": 0.25, - "learning_rate": 0.0002619053799727432, - "loss": 0.0703, + "epoch": 0.15, + "learning_rate": 0.00027726817996992324, + "loss": 0.0843, "step": 23480 }, { - "epoch": 0.25, - "learning_rate": 0.00026188915568823413, - "loss": 0.0753, + "epoch": 0.15, + "learning_rate": 0.0002772584986155663, + "loss": 0.1056, "step": 23490 }, { - "epoch": 0.25, - "learning_rate": 0.00026187293140372505, - "loss": 0.0801, + "epoch": 0.15, + "learning_rate": 0.0002772488172612094, + "loss": 0.0892, "step": 23500 }, { - "epoch": 0.25, - "learning_rate": 0.000261856707119216, - "loss": 0.0741, + "epoch": 0.15, + "learning_rate": 0.00027723913590685243, + "loss": 0.0827, "step": 23510 }, { - "epoch": 0.25, - "learning_rate": 0.00026184048283470695, - "loss": 0.0661, + "epoch": 0.15, + "learning_rate": 0.0002772294545524955, + "loss": 0.0775, "step": 23520 }, { - "epoch": 0.25, - "learning_rate": 0.0002618242585501979, - "loss": 0.0762, + "epoch": 0.15, + "learning_rate": 0.0002772197731981386, + "loss": 0.0886, "step": 23530 }, { - "epoch": 0.25, - "learning_rate": 0.00026180803426568885, - "loss": 0.0697, + "epoch": 0.15, + "learning_rate": 0.0002772100918437816, + "loss": 0.0802, "step": 23540 }, { - "epoch": 0.25, - "learning_rate": 0.0002617918099811798, - "loss": 0.0786, + "epoch": 0.15, + "learning_rate": 0.0002772004104894247, + "loss": 0.0841, "step": 23550 }, { - "epoch": 0.25, - "learning_rate": 0.00026177558569667075, - "loss": 0.0856, + "epoch": 0.15, + "learning_rate": 0.0002771907291350678, + "loss": 0.0892, "step": 23560 }, { - "epoch": 0.25, - "learning_rate": 0.0002617593614121617, - "loss": 0.0704, + "epoch": 0.15, + "learning_rate": 0.00027718104778071085, + "loss": 0.0921, "step": 23570 }, { - "epoch": 0.26, - "learning_rate": 0.00026174313712765265, - "loss": 0.0729, + "epoch": 0.15, + "learning_rate": 0.00027717136642635393, + "loss": 0.0875, "step": 23580 }, { - "epoch": 0.26, - "learning_rate": 0.0002617269128431436, - "loss": 0.0742, + "epoch": 0.15, + "learning_rate": 0.000277161685071997, + "loss": 0.0791, "step": 23590 }, { - "epoch": 0.26, - "learning_rate": 0.00026171068855863455, - "loss": 0.0823, + "epoch": 0.15, + "learning_rate": 0.00027715200371764004, + "loss": 0.0801, "step": 23600 }, { - "epoch": 0.26, - "learning_rate": 0.0002616944642741255, - "loss": 0.0777, + "epoch": 0.15, + "learning_rate": 0.0002771423223632831, + "loss": 0.0805, "step": 23610 }, { - "epoch": 0.26, - "learning_rate": 0.00026167823998961645, - "loss": 0.076, + "epoch": 0.15, + "learning_rate": 0.0002771326410089262, + "loss": 0.0831, "step": 23620 }, { - "epoch": 0.26, - "learning_rate": 0.0002616620157051074, - "loss": 0.0742, + "epoch": 0.15, + "learning_rate": 0.0002771229596545693, + "loss": 0.0806, "step": 23630 }, { - "epoch": 0.26, - "learning_rate": 0.00026164579142059835, - "loss": 0.0753, + "epoch": 0.15, + "learning_rate": 0.0002771132783002123, + "loss": 0.0813, "step": 23640 }, { - "epoch": 0.26, - "learning_rate": 0.00026162956713608927, - "loss": 0.0718, + "epoch": 0.15, + "learning_rate": 0.0002771035969458554, + "loss": 0.08, "step": 23650 }, { - "epoch": 0.26, - "learning_rate": 0.00026161334285158025, - "loss": 0.0857, + "epoch": 0.15, + "learning_rate": 0.00027709391559149846, + "loss": 0.0829, "step": 23660 }, { - "epoch": 0.26, - "learning_rate": 0.00026159711856707117, - "loss": 0.0772, + "epoch": 0.15, + "learning_rate": 0.0002770842342371415, + "loss": 0.0822, "step": 23670 }, { - "epoch": 0.26, - "learning_rate": 0.0002615808942825621, - "loss": 0.0742, + "epoch": 0.15, + "learning_rate": 0.00027707455288278457, + "loss": 0.0754, "step": 23680 }, { - "epoch": 0.26, - "learning_rate": 0.00026156466999805307, - "loss": 0.0717, + "epoch": 0.15, + "learning_rate": 0.00027706487152842765, + "loss": 0.0773, "step": 23690 }, { - "epoch": 0.26, - "learning_rate": 0.000261548445713544, - "loss": 0.0699, + "epoch": 0.15, + "learning_rate": 0.00027705519017407073, + "loss": 0.0754, "step": 23700 }, { - "epoch": 0.26, - "learning_rate": 0.00026153222142903497, - "loss": 0.0719, + "epoch": 0.15, + "learning_rate": 0.0002770455088197138, + "loss": 0.0874, "step": 23710 }, { - "epoch": 0.26, - "learning_rate": 0.0002615159971445259, - "loss": 0.0728, + "epoch": 0.15, + "learning_rate": 0.0002770358274653569, + "loss": 0.0813, "step": 23720 }, { - "epoch": 0.26, - "learning_rate": 0.00026149977286001687, - "loss": 0.0715, + "epoch": 0.15, + "learning_rate": 0.00027702614611099997, + "loss": 0.0836, "step": 23730 }, { - "epoch": 0.26, - "learning_rate": 0.0002614835485755078, - "loss": 0.0661, + "epoch": 0.15, + "learning_rate": 0.000277016464756643, + "loss": 0.085, "step": 23740 }, { - "epoch": 0.26, - "learning_rate": 0.00026146732429099877, - "loss": 0.077, + "epoch": 0.15, + "learning_rate": 0.00027700678340228607, + "loss": 0.0947, "step": 23750 }, { - "epoch": 0.26, - "learning_rate": 0.0002614511000064897, - "loss": 0.0775, + "epoch": 0.15, + "learning_rate": 0.00027699710204792915, + "loss": 0.0881, "step": 23760 }, { - "epoch": 0.26, - "learning_rate": 0.00026143487572198067, - "loss": 0.0747, + "epoch": 0.15, + "learning_rate": 0.0002769874206935722, + "loss": 0.0918, "step": 23770 }, { - "epoch": 0.26, - "learning_rate": 0.0002614186514374716, - "loss": 0.0774, + "epoch": 0.15, + "learning_rate": 0.00027697773933921526, + "loss": 0.0887, "step": 23780 }, { - "epoch": 0.26, - "learning_rate": 0.00026140242715296257, - "loss": 0.0764, + "epoch": 0.15, + "learning_rate": 0.00027696805798485834, + "loss": 0.0871, "step": 23790 }, { - "epoch": 0.26, - "learning_rate": 0.0002613862028684535, - "loss": 0.08, + "epoch": 0.15, + "learning_rate": 0.0002769583766305014, + "loss": 0.0891, "step": 23800 }, { - "epoch": 0.26, - "learning_rate": 0.00026136997858394447, - "loss": 0.0708, + "epoch": 0.15, + "learning_rate": 0.00027694869527614444, + "loss": 0.0802, "step": 23810 }, { - "epoch": 0.26, - "learning_rate": 0.0002613537542994354, - "loss": 0.0702, + "epoch": 0.15, + "learning_rate": 0.0002769390139217875, + "loss": 0.0794, "step": 23820 }, { - "epoch": 0.26, - "learning_rate": 0.0002613375300149263, - "loss": 0.0739, + "epoch": 0.15, + "learning_rate": 0.0002769293325674306, + "loss": 0.099, "step": 23830 }, { - "epoch": 0.26, - "learning_rate": 0.0002613213057304173, - "loss": 0.0774, + "epoch": 0.15, + "learning_rate": 0.0002769196512130737, + "loss": 0.0877, "step": 23840 }, { - "epoch": 0.26, - "learning_rate": 0.0002613050814459082, - "loss": 0.0756, + "epoch": 0.15, + "learning_rate": 0.00027690996985871676, + "loss": 0.076, "step": 23850 }, { - "epoch": 0.26, - "learning_rate": 0.00026128885716139913, - "loss": 0.0876, + "epoch": 0.15, + "learning_rate": 0.00027690028850435984, + "loss": 0.0859, "step": 23860 }, { - "epoch": 0.26, - "learning_rate": 0.0002612726328768901, - "loss": 0.0738, + "epoch": 0.15, + "learning_rate": 0.0002768906071500029, + "loss": 0.0943, "step": 23870 }, { - "epoch": 0.26, - "learning_rate": 0.00026125640859238103, - "loss": 0.0818, + "epoch": 0.15, + "learning_rate": 0.00027688092579564595, + "loss": 0.0795, "step": 23880 }, { - "epoch": 0.26, - "learning_rate": 0.000261240184307872, - "loss": 0.081, + "epoch": 0.15, + "learning_rate": 0.00027687124444128903, + "loss": 0.0917, "step": 23890 }, { - "epoch": 0.26, - "learning_rate": 0.00026122396002336293, - "loss": 0.0694, + "epoch": 0.15, + "learning_rate": 0.0002768615630869321, + "loss": 0.0919, "step": 23900 }, { - "epoch": 0.26, - "learning_rate": 0.0002612077357388539, - "loss": 0.0726, + "epoch": 0.15, + "learning_rate": 0.00027685188173257513, + "loss": 0.0935, "step": 23910 }, { - "epoch": 0.26, - "learning_rate": 0.00026119151145434483, - "loss": 0.0749, + "epoch": 0.15, + "learning_rate": 0.0002768422003782182, + "loss": 0.0776, "step": 23920 }, { - "epoch": 0.26, - "learning_rate": 0.0002611752871698358, - "loss": 0.0749, + "epoch": 0.15, + "learning_rate": 0.0002768325190238613, + "loss": 0.0901, "step": 23930 }, { - "epoch": 0.26, - "learning_rate": 0.00026115906288532673, - "loss": 0.0768, + "epoch": 0.15, + "learning_rate": 0.00027682283766950437, + "loss": 0.0854, "step": 23940 }, { - "epoch": 0.26, - "learning_rate": 0.0002611428386008177, - "loss": 0.0685, + "epoch": 0.15, + "learning_rate": 0.0002768131563151474, + "loss": 0.0786, "step": 23950 }, { - "epoch": 0.26, - "learning_rate": 0.00026112661431630863, - "loss": 0.0728, + "epoch": 0.15, + "learning_rate": 0.0002768034749607905, + "loss": 0.0867, "step": 23960 }, { - "epoch": 0.26, - "learning_rate": 0.0002611103900317996, - "loss": 0.0705, + "epoch": 0.15, + "learning_rate": 0.00027679379360643356, + "loss": 0.0776, "step": 23970 }, { - "epoch": 0.26, - "learning_rate": 0.00026109416574729053, - "loss": 0.0793, + "epoch": 0.15, + "learning_rate": 0.00027678411225207664, + "loss": 0.0895, "step": 23980 }, { - "epoch": 0.26, - "learning_rate": 0.0002610779414627815, - "loss": 0.0663, + "epoch": 0.15, + "learning_rate": 0.0002767744308977197, + "loss": 0.0833, "step": 23990 }, { - "epoch": 0.26, - "learning_rate": 0.00026106171717827243, - "loss": 0.076, + "epoch": 0.15, + "learning_rate": 0.0002767647495433628, + "loss": 0.0764, "step": 24000 }, { - "epoch": 0.26, - "eval_cer": 0.9213513422777286, - "eval_loss": 0.05190052092075348, - "eval_runtime": 119.4469, - "eval_samples_per_second": 16.744, - "eval_steps_per_second": 4.186, + "epoch": 0.15, + "eval_cer": 0.920127443226754, + "eval_loss": 0.05912618711590767, + "eval_runtime": 120.5476, + "eval_samples_per_second": 16.591, + "eval_steps_per_second": 4.148, "step": 24000 }, { - "epoch": 0.26, - "learning_rate": 0.00026104549289376335, - "loss": 0.0717, + "epoch": 0.15, + "learning_rate": 0.0002767550681890058, + "loss": 0.089, "step": 24010 }, { - "epoch": 0.26, - "learning_rate": 0.00026102926860925433, - "loss": 0.0735, + "epoch": 0.16, + "learning_rate": 0.0002767453868346489, + "loss": 0.0763, "step": 24020 }, { - "epoch": 0.26, - "learning_rate": 0.00026101304432474525, - "loss": 0.0713, + "epoch": 0.16, + "learning_rate": 0.000276735705480292, + "loss": 0.1077, "step": 24030 }, { - "epoch": 0.26, - "learning_rate": 0.0002609968200402362, - "loss": 0.0768, + "epoch": 0.16, + "learning_rate": 0.000276726024125935, + "loss": 0.084, "step": 24040 }, { - "epoch": 0.26, - "learning_rate": 0.00026098059575572715, - "loss": 0.0675, + "epoch": 0.16, + "learning_rate": 0.0002767163427715781, + "loss": 0.0774, "step": 24050 }, { - "epoch": 0.26, - "learning_rate": 0.0002609643714712181, - "loss": 0.0671, + "epoch": 0.16, + "learning_rate": 0.00027670666141722117, + "loss": 0.0827, "step": 24060 }, { - "epoch": 0.26, - "learning_rate": 0.00026094814718670905, - "loss": 0.0721, + "epoch": 0.16, + "learning_rate": 0.00027669698006286425, + "loss": 0.0831, "step": 24070 }, { - "epoch": 0.26, - "learning_rate": 0.0002609319229022, - "loss": 0.0797, + "epoch": 0.16, + "learning_rate": 0.0002766872987085073, + "loss": 0.0865, "step": 24080 }, { - "epoch": 0.26, - "learning_rate": 0.00026091569861769095, - "loss": 0.0728, + "epoch": 0.16, + "learning_rate": 0.00027667761735415035, + "loss": 0.0803, "step": 24090 }, { - "epoch": 0.26, - "learning_rate": 0.0002608994743331819, - "loss": 0.0745, + "epoch": 0.16, + "learning_rate": 0.00027666793599979343, + "loss": 0.0828, "step": 24100 }, { - "epoch": 0.26, - "learning_rate": 0.00026088325004867285, - "loss": 0.0733, + "epoch": 0.16, + "learning_rate": 0.0002766582546454365, + "loss": 0.0902, "step": 24110 }, { - "epoch": 0.26, - "learning_rate": 0.0002608670257641638, - "loss": 0.0789, + "epoch": 0.16, + "learning_rate": 0.0002766485732910796, + "loss": 0.0817, "step": 24120 }, { - "epoch": 0.26, - "learning_rate": 0.00026085080147965475, - "loss": 0.0685, + "epoch": 0.16, + "learning_rate": 0.00027663889193672267, + "loss": 0.0863, "step": 24130 }, { - "epoch": 0.26, - "learning_rate": 0.00026083457719514567, - "loss": 0.0769, + "epoch": 0.16, + "learning_rate": 0.0002766292105823657, + "loss": 0.0878, "step": 24140 }, { - "epoch": 0.26, - "learning_rate": 0.00026081835291063665, - "loss": 0.0689, + "epoch": 0.16, + "learning_rate": 0.0002766195292280088, + "loss": 0.0832, "step": 24150 }, { - "epoch": 0.26, - "learning_rate": 0.00026080212862612757, - "loss": 0.0637, + "epoch": 0.16, + "learning_rate": 0.00027660984787365186, + "loss": 0.0952, "step": 24160 }, { - "epoch": 0.26, - "learning_rate": 0.00026078590434161855, - "loss": 0.084, + "epoch": 0.16, + "learning_rate": 0.0002766001665192949, + "loss": 0.1014, "step": 24170 }, { - "epoch": 0.26, - "learning_rate": 0.00026076968005710947, - "loss": 0.0877, + "epoch": 0.16, + "learning_rate": 0.00027659048516493796, + "loss": 0.0823, "step": 24180 }, { - "epoch": 0.26, - "learning_rate": 0.0002607534557726004, - "loss": 0.0711, + "epoch": 0.16, + "learning_rate": 0.00027658080381058104, + "loss": 0.0901, "step": 24190 }, { - "epoch": 0.26, - "learning_rate": 0.00026073723148809137, - "loss": 0.0736, + "epoch": 0.16, + "learning_rate": 0.0002765711224562241, + "loss": 0.0863, "step": 24200 }, { - "epoch": 0.26, - "learning_rate": 0.0002607210072035823, - "loss": 0.0752, + "epoch": 0.16, + "learning_rate": 0.0002765614411018672, + "loss": 0.0839, "step": 24210 }, { - "epoch": 0.26, - "learning_rate": 0.0002607047829190732, - "loss": 0.0722, + "epoch": 0.16, + "learning_rate": 0.0002765517597475102, + "loss": 0.0868, "step": 24220 }, { - "epoch": 0.26, - "learning_rate": 0.0002606885586345642, - "loss": 0.0739, + "epoch": 0.16, + "learning_rate": 0.0002765420783931533, + "loss": 0.0877, "step": 24230 }, { - "epoch": 0.26, - "learning_rate": 0.0002606723343500551, - "loss": 0.0752, + "epoch": 0.16, + "learning_rate": 0.0002765323970387964, + "loss": 0.0801, "step": 24240 }, { - "epoch": 0.26, - "learning_rate": 0.0002606561100655461, - "loss": 0.0757, + "epoch": 0.16, + "learning_rate": 0.00027652271568443947, + "loss": 0.0874, "step": 24250 }, { - "epoch": 0.26, - "learning_rate": 0.000260639885781037, - "loss": 0.0703, + "epoch": 0.16, + "learning_rate": 0.00027651303433008255, + "loss": 0.0953, "step": 24260 }, { - "epoch": 0.26, - "learning_rate": 0.000260623661496528, - "loss": 0.0726, + "epoch": 0.16, + "learning_rate": 0.0002765033529757256, + "loss": 0.0825, "step": 24270 }, { - "epoch": 0.26, - "learning_rate": 0.0002606074372120189, - "loss": 0.0742, + "epoch": 0.16, + "learning_rate": 0.00027649367162136865, + "loss": 0.0843, "step": 24280 }, { - "epoch": 0.26, - "learning_rate": 0.0002605912129275099, - "loss": 0.078, + "epoch": 0.16, + "learning_rate": 0.00027648399026701173, + "loss": 0.085, "step": 24290 }, { - "epoch": 0.26, - "learning_rate": 0.0002605749886430008, - "loss": 0.0679, + "epoch": 0.16, + "learning_rate": 0.0002764743089126548, + "loss": 0.0968, "step": 24300 }, { - "epoch": 0.26, - "learning_rate": 0.0002605587643584918, - "loss": 0.0709, + "epoch": 0.16, + "learning_rate": 0.00027646462755829784, + "loss": 0.0835, "step": 24310 }, { - "epoch": 0.26, - "learning_rate": 0.0002605425400739827, - "loss": 0.0703, + "epoch": 0.16, + "learning_rate": 0.0002764549462039409, + "loss": 0.0902, "step": 24320 }, { - "epoch": 0.26, - "learning_rate": 0.0002605263157894737, - "loss": 0.0748, + "epoch": 0.16, + "learning_rate": 0.000276445264849584, + "loss": 0.0896, "step": 24330 }, { - "epoch": 0.26, - "learning_rate": 0.0002605100915049646, - "loss": 0.0829, + "epoch": 0.16, + "learning_rate": 0.0002764355834952271, + "loss": 0.0869, "step": 24340 }, { - "epoch": 0.26, - "learning_rate": 0.0002604938672204556, - "loss": 0.0766, + "epoch": 0.16, + "learning_rate": 0.00027642590214087016, + "loss": 0.0846, "step": 24350 }, { - "epoch": 0.26, - "learning_rate": 0.0002604776429359465, - "loss": 0.0716, + "epoch": 0.16, + "learning_rate": 0.0002764162207865132, + "loss": 0.0834, "step": 24360 }, { - "epoch": 0.26, - "learning_rate": 0.00026046141865143744, - "loss": 0.072, + "epoch": 0.16, + "learning_rate": 0.00027640653943215626, + "loss": 0.0743, "step": 24370 }, { - "epoch": 0.26, - "learning_rate": 0.0002604451943669284, - "loss": 0.076, + "epoch": 0.16, + "learning_rate": 0.00027639685807779934, + "loss": 0.0856, "step": 24380 }, { - "epoch": 0.26, - "learning_rate": 0.00026042897008241934, - "loss": 0.0754, + "epoch": 0.16, + "learning_rate": 0.0002763871767234424, + "loss": 0.0804, "step": 24390 }, { - "epoch": 0.26, - "learning_rate": 0.00026041274579791026, - "loss": 0.0704, + "epoch": 0.16, + "learning_rate": 0.0002763774953690855, + "loss": 0.0856, "step": 24400 }, { - "epoch": 0.26, - "learning_rate": 0.00026039652151340124, - "loss": 0.0757, + "epoch": 0.16, + "learning_rate": 0.0002763678140147285, + "loss": 0.0962, "step": 24410 }, { - "epoch": 0.26, - "learning_rate": 0.00026038029722889216, - "loss": 0.0761, + "epoch": 0.16, + "learning_rate": 0.0002763581326603716, + "loss": 0.0898, "step": 24420 }, { - "epoch": 0.26, - "learning_rate": 0.00026036407294438313, - "loss": 0.072, + "epoch": 0.16, + "learning_rate": 0.0002763484513060147, + "loss": 0.0944, "step": 24430 }, { - "epoch": 0.26, - "learning_rate": 0.00026034784865987406, - "loss": 0.0671, + "epoch": 0.16, + "learning_rate": 0.0002763387699516577, + "loss": 0.0858, "step": 24440 }, { - "epoch": 0.26, - "learning_rate": 0.00026033162437536503, - "loss": 0.0755, + "epoch": 0.16, + "learning_rate": 0.0002763290885973008, + "loss": 0.0812, "step": 24450 }, { - "epoch": 0.26, - "learning_rate": 0.00026031540009085596, - "loss": 0.0697, + "epoch": 0.16, + "learning_rate": 0.00027631940724294387, + "loss": 0.084, "step": 24460 }, { - "epoch": 0.26, - "learning_rate": 0.00026029917580634693, - "loss": 0.0672, + "epoch": 0.16, + "learning_rate": 0.00027630972588858695, + "loss": 0.0755, "step": 24470 }, { - "epoch": 0.26, - "learning_rate": 0.00026028295152183786, - "loss": 0.0823, + "epoch": 0.16, + "learning_rate": 0.00027630004453423003, + "loss": 0.085, "step": 24480 }, { - "epoch": 0.26, - "learning_rate": 0.00026026672723732883, - "loss": 0.0871, + "epoch": 0.16, + "learning_rate": 0.0002762903631798731, + "loss": 0.0766, "step": 24490 }, { - "epoch": 0.26, - "learning_rate": 0.00026025050295281976, - "loss": 0.0716, + "epoch": 0.16, + "learning_rate": 0.00027628068182551614, + "loss": 0.0846, "step": 24500 }, { - "epoch": 0.27, - "learning_rate": 0.00026023427866831073, - "loss": 0.0729, + "epoch": 0.16, + "learning_rate": 0.0002762710004711592, + "loss": 0.0878, "step": 24510 }, { - "epoch": 0.27, - "learning_rate": 0.00026021805438380166, - "loss": 0.0711, + "epoch": 0.16, + "learning_rate": 0.0002762613191168023, + "loss": 0.0907, "step": 24520 }, { - "epoch": 0.27, - "learning_rate": 0.00026020183009929263, - "loss": 0.0681, + "epoch": 0.16, + "learning_rate": 0.0002762516377624454, + "loss": 0.0784, "step": 24530 }, { - "epoch": 0.27, - "learning_rate": 0.00026018560581478356, - "loss": 0.0692, + "epoch": 0.16, + "learning_rate": 0.0002762419564080884, + "loss": 0.0869, "step": 24540 }, { - "epoch": 0.27, - "learning_rate": 0.0002601693815302745, - "loss": 0.0698, + "epoch": 0.16, + "learning_rate": 0.0002762322750537315, + "loss": 0.0841, "step": 24550 }, { - "epoch": 0.27, - "learning_rate": 0.00026015315724576545, - "loss": 0.0668, + "epoch": 0.16, + "learning_rate": 0.00027622259369937456, + "loss": 0.0877, "step": 24560 }, { - "epoch": 0.27, - "learning_rate": 0.0002601369329612564, - "loss": 0.0745, + "epoch": 0.16, + "learning_rate": 0.0002762129123450176, + "loss": 0.0771, "step": 24570 }, { - "epoch": 0.27, - "learning_rate": 0.0002601207086767473, - "loss": 0.0719, + "epoch": 0.16, + "learning_rate": 0.00027620323099066067, + "loss": 0.0892, "step": 24580 }, { - "epoch": 0.27, - "learning_rate": 0.0002601044843922383, - "loss": 0.077, + "epoch": 0.16, + "learning_rate": 0.00027619354963630375, + "loss": 0.0895, "step": 24590 }, { - "epoch": 0.27, - "learning_rate": 0.0002600882601077292, - "loss": 0.0704, + "epoch": 0.16, + "learning_rate": 0.0002761838682819468, + "loss": 0.089, "step": 24600 }, { - "epoch": 0.27, - "learning_rate": 0.0002600720358232202, - "loss": 0.0635, + "epoch": 0.16, + "learning_rate": 0.0002761741869275899, + "loss": 0.0774, "step": 24610 }, { - "epoch": 0.27, - "learning_rate": 0.0002600558115387111, - "loss": 0.071, + "epoch": 0.16, + "learning_rate": 0.000276164505573233, + "loss": 0.0892, "step": 24620 }, { - "epoch": 0.27, - "learning_rate": 0.0002600395872542021, - "loss": 0.0658, + "epoch": 0.16, + "learning_rate": 0.00027615482421887606, + "loss": 0.0756, "step": 24630 }, { - "epoch": 0.27, - "learning_rate": 0.000260023362969693, - "loss": 0.0666, + "epoch": 0.16, + "learning_rate": 0.0002761451428645191, + "loss": 0.0872, "step": 24640 }, { - "epoch": 0.27, - "learning_rate": 0.000260007138685184, - "loss": 0.0805, + "epoch": 0.16, + "learning_rate": 0.00027613546151016217, + "loss": 0.1005, "step": 24650 }, { - "epoch": 0.27, - "learning_rate": 0.0002599909144006749, - "loss": 0.0914, + "epoch": 0.16, + "learning_rate": 0.00027612578015580525, + "loss": 0.0867, "step": 24660 }, { - "epoch": 0.27, - "learning_rate": 0.0002599746901161659, - "loss": 0.0752, + "epoch": 0.16, + "learning_rate": 0.00027611609880144833, + "loss": 0.0829, "step": 24670 }, { - "epoch": 0.27, - "learning_rate": 0.0002599584658316568, - "loss": 0.0749, + "epoch": 0.16, + "learning_rate": 0.00027610641744709136, + "loss": 0.0862, "step": 24680 }, { - "epoch": 0.27, - "learning_rate": 0.0002599422415471478, - "loss": 0.0754, + "epoch": 0.16, + "learning_rate": 0.00027609673609273443, + "loss": 0.0864, "step": 24690 }, { - "epoch": 0.27, - "learning_rate": 0.0002599260172626387, - "loss": 0.0688, + "epoch": 0.16, + "learning_rate": 0.0002760870547383775, + "loss": 0.0763, "step": 24700 }, { - "epoch": 0.27, - "learning_rate": 0.0002599097929781297, - "loss": 0.0741, + "epoch": 0.16, + "learning_rate": 0.00027607737338402054, + "loss": 0.0859, "step": 24710 }, { - "epoch": 0.27, - "learning_rate": 0.0002598935686936206, - "loss": 0.0787, + "epoch": 0.16, + "learning_rate": 0.0002760676920296636, + "loss": 0.0757, "step": 24720 }, { - "epoch": 0.27, - "learning_rate": 0.0002598773444091115, - "loss": 0.0658, + "epoch": 0.16, + "learning_rate": 0.0002760580106753067, + "loss": 0.088, "step": 24730 }, { - "epoch": 0.27, - "learning_rate": 0.0002598611201246025, - "loss": 0.0737, + "epoch": 0.16, + "learning_rate": 0.0002760483293209498, + "loss": 0.0835, "step": 24740 }, { - "epoch": 0.27, - "learning_rate": 0.0002598448958400934, - "loss": 0.0743, + "epoch": 0.16, + "learning_rate": 0.00027603864796659286, + "loss": 0.0874, "step": 24750 }, { - "epoch": 0.27, - "learning_rate": 0.00025982867155558434, - "loss": 0.0681, + "epoch": 0.16, + "learning_rate": 0.00027602896661223594, + "loss": 0.0854, "step": 24760 }, { - "epoch": 0.27, - "learning_rate": 0.0002598124472710753, - "loss": 0.0834, + "epoch": 0.16, + "learning_rate": 0.000276019285257879, + "loss": 0.074, "step": 24770 }, { - "epoch": 0.27, - "learning_rate": 0.00025979622298656624, - "loss": 0.0739, + "epoch": 0.16, + "learning_rate": 0.00027600960390352204, + "loss": 0.0841, "step": 24780 }, { - "epoch": 0.27, - "learning_rate": 0.0002597799987020572, - "loss": 0.0717, + "epoch": 0.16, + "learning_rate": 0.0002759999225491651, + "loss": 0.0771, "step": 24790 }, { - "epoch": 0.27, - "learning_rate": 0.00025976377441754814, - "loss": 0.0667, + "epoch": 0.16, + "learning_rate": 0.0002759902411948082, + "loss": 0.0853, "step": 24800 }, { - "epoch": 0.27, - "learning_rate": 0.0002597475501330391, - "loss": 0.074, + "epoch": 0.16, + "learning_rate": 0.00027598055984045123, + "loss": 0.0791, "step": 24810 }, { - "epoch": 0.27, - "learning_rate": 0.00025973132584853004, - "loss": 0.0837, + "epoch": 0.16, + "learning_rate": 0.0002759708784860943, + "loss": 0.0776, "step": 24820 }, { - "epoch": 0.27, - "learning_rate": 0.000259715101564021, - "loss": 0.0689, + "epoch": 0.16, + "learning_rate": 0.0002759611971317374, + "loss": 0.0794, "step": 24830 }, { - "epoch": 0.27, - "learning_rate": 0.00025969887727951194, - "loss": 0.0741, + "epoch": 0.16, + "learning_rate": 0.00027595151577738047, + "loss": 0.0813, "step": 24840 }, { - "epoch": 0.27, - "learning_rate": 0.0002596826529950029, - "loss": 0.0714, + "epoch": 0.16, + "learning_rate": 0.0002759418344230235, + "loss": 0.0743, "step": 24850 }, { - "epoch": 0.27, - "learning_rate": 0.00025966642871049384, - "loss": 0.0705, + "epoch": 0.16, + "learning_rate": 0.0002759321530686666, + "loss": 0.0851, "step": 24860 }, { - "epoch": 0.27, - "learning_rate": 0.0002596502044259848, - "loss": 0.0885, + "epoch": 0.16, + "learning_rate": 0.00027592247171430965, + "loss": 0.0773, "step": 24870 }, { - "epoch": 0.27, - "learning_rate": 0.00025963398014147574, - "loss": 0.0771, + "epoch": 0.16, + "learning_rate": 0.00027591279035995273, + "loss": 0.0703, "step": 24880 }, { - "epoch": 0.27, - "learning_rate": 0.0002596177558569667, - "loss": 0.0752, + "epoch": 0.16, + "learning_rate": 0.0002759031090055958, + "loss": 0.0789, "step": 24890 }, { - "epoch": 0.27, - "learning_rate": 0.00025960153157245764, - "loss": 0.076, + "epoch": 0.16, + "learning_rate": 0.0002758934276512389, + "loss": 0.0783, "step": 24900 }, { - "epoch": 0.27, - "learning_rate": 0.00025958530728794856, - "loss": 0.0835, + "epoch": 0.16, + "learning_rate": 0.000275883746296882, + "loss": 0.0737, "step": 24910 }, { - "epoch": 0.27, - "learning_rate": 0.00025956908300343954, - "loss": 0.073, + "epoch": 0.16, + "learning_rate": 0.000275874064942525, + "loss": 0.0856, "step": 24920 }, { - "epoch": 0.27, - "learning_rate": 0.00025955285871893046, - "loss": 0.0668, + "epoch": 0.16, + "learning_rate": 0.0002758643835881681, + "loss": 0.0797, "step": 24930 }, { - "epoch": 0.27, - "learning_rate": 0.0002595366344344214, - "loss": 0.0735, + "epoch": 0.16, + "learning_rate": 0.0002758547022338111, + "loss": 0.0841, "step": 24940 }, { - "epoch": 0.27, - "learning_rate": 0.00025952041014991236, - "loss": 0.0704, + "epoch": 0.16, + "learning_rate": 0.0002758450208794542, + "loss": 0.0802, "step": 24950 }, { - "epoch": 0.27, - "learning_rate": 0.0002595041858654033, - "loss": 0.0726, + "epoch": 0.16, + "learning_rate": 0.00027583533952509726, + "loss": 0.0742, "step": 24960 }, { - "epoch": 0.27, - "learning_rate": 0.00025948796158089426, - "loss": 0.0757, + "epoch": 0.16, + "learning_rate": 0.00027582565817074034, + "loss": 0.0802, "step": 24970 }, { - "epoch": 0.27, - "learning_rate": 0.0002594717372963852, - "loss": 0.0804, + "epoch": 0.16, + "learning_rate": 0.0002758159768163834, + "loss": 0.0788, "step": 24980 }, { - "epoch": 0.27, - "learning_rate": 0.00025945551301187616, - "loss": 0.0635, + "epoch": 0.16, + "learning_rate": 0.00027580629546202645, + "loss": 0.0785, "step": 24990 }, { - "epoch": 0.27, - "learning_rate": 0.0002594392887273671, - "loss": 0.0714, + "epoch": 0.16, + "learning_rate": 0.00027579661410766953, + "loss": 0.0779, "step": 25000 }, { - "epoch": 0.27, - "eval_cer": 0.9212815470163851, - "eval_loss": 0.05058603733778, - "eval_runtime": 119.4621, - "eval_samples_per_second": 16.742, - "eval_steps_per_second": 4.185, + "epoch": 0.16, + "eval_cer": 0.9200786351824652, + "eval_loss": 0.055601075291633606, + "eval_runtime": 120.6339, + "eval_samples_per_second": 16.579, + "eval_steps_per_second": 4.145, "step": 25000 }, { - "epoch": 0.27, - "learning_rate": 0.00025942306444285806, - "loss": 0.0663, + "epoch": 0.16, + "learning_rate": 0.0002757869327533126, + "loss": 0.0794, "step": 25010 }, { - "epoch": 0.27, - "learning_rate": 0.000259406840158349, - "loss": 0.0744, + "epoch": 0.16, + "learning_rate": 0.0002757772513989557, + "loss": 0.0827, "step": 25020 }, { - "epoch": 0.27, - "learning_rate": 0.00025939061587383996, - "loss": 0.073, + "epoch": 0.16, + "learning_rate": 0.00027576757004459877, + "loss": 0.082, "step": 25030 }, { - "epoch": 0.27, - "learning_rate": 0.0002593743915893309, - "loss": 0.0765, + "epoch": 0.16, + "learning_rate": 0.00027575788869024185, + "loss": 0.0755, "step": 25040 }, { - "epoch": 0.27, - "learning_rate": 0.00025935816730482186, - "loss": 0.0702, + "epoch": 0.16, + "learning_rate": 0.0002757482073358849, + "loss": 0.0875, "step": 25050 }, { - "epoch": 0.27, - "learning_rate": 0.0002593419430203128, - "loss": 0.076, + "epoch": 0.16, + "learning_rate": 0.00027573852598152795, + "loss": 0.0743, "step": 25060 }, { - "epoch": 0.27, - "learning_rate": 0.00025932571873580376, - "loss": 0.0804, + "epoch": 0.16, + "learning_rate": 0.00027572884462717103, + "loss": 0.084, "step": 25070 }, { - "epoch": 0.27, - "learning_rate": 0.0002593094944512947, - "loss": 0.0705, + "epoch": 0.16, + "learning_rate": 0.00027571916327281406, + "loss": 0.079, "step": 25080 }, { - "epoch": 0.27, - "learning_rate": 0.0002592932701667856, - "loss": 0.0661, + "epoch": 0.16, + "learning_rate": 0.00027570948191845714, + "loss": 0.0709, "step": 25090 }, { - "epoch": 0.27, - "learning_rate": 0.0002592770458822766, - "loss": 0.0816, + "epoch": 0.16, + "learning_rate": 0.0002756998005641002, + "loss": 0.0891, "step": 25100 }, { - "epoch": 0.27, - "learning_rate": 0.0002592608215977675, - "loss": 0.0686, + "epoch": 0.16, + "learning_rate": 0.0002756901192097433, + "loss": 0.0788, "step": 25110 }, { - "epoch": 0.27, - "learning_rate": 0.0002592445973132584, - "loss": 0.0747, + "epoch": 0.16, + "learning_rate": 0.0002756804378553864, + "loss": 0.0821, "step": 25120 }, { - "epoch": 0.27, - "learning_rate": 0.0002592283730287494, - "loss": 0.0675, + "epoch": 0.16, + "learning_rate": 0.0002756707565010294, + "loss": 0.0805, "step": 25130 }, { - "epoch": 0.27, - "learning_rate": 0.0002592121487442403, - "loss": 0.0729, + "epoch": 0.16, + "learning_rate": 0.0002756610751466725, + "loss": 0.0893, "step": 25140 }, { - "epoch": 0.27, - "learning_rate": 0.0002591959244597313, - "loss": 0.0743, + "epoch": 0.16, + "learning_rate": 0.00027565139379231556, + "loss": 0.0821, "step": 25150 }, { - "epoch": 0.27, - "learning_rate": 0.0002591797001752222, - "loss": 0.0726, + "epoch": 0.16, + "learning_rate": 0.00027564171243795864, + "loss": 0.084, "step": 25160 }, { - "epoch": 0.27, - "learning_rate": 0.0002591634758907132, - "loss": 0.0767, + "epoch": 0.16, + "learning_rate": 0.0002756320310836017, + "loss": 0.0861, "step": 25170 }, { - "epoch": 0.27, - "learning_rate": 0.0002591472516062041, - "loss": 0.0734, + "epoch": 0.16, + "learning_rate": 0.00027562234972924475, + "loss": 0.0722, "step": 25180 }, { - "epoch": 0.27, - "learning_rate": 0.0002591310273216951, - "loss": 0.0731, + "epoch": 0.16, + "learning_rate": 0.00027561266837488783, + "loss": 0.0849, "step": 25190 }, { - "epoch": 0.27, - "learning_rate": 0.000259114803037186, - "loss": 0.0645, + "epoch": 0.16, + "learning_rate": 0.0002756029870205309, + "loss": 0.0809, "step": 25200 }, { - "epoch": 0.27, - "learning_rate": 0.000259098578752677, - "loss": 0.069, + "epoch": 0.16, + "learning_rate": 0.00027559330566617393, + "loss": 0.0845, "step": 25210 }, { - "epoch": 0.27, - "learning_rate": 0.0002590823544681679, - "loss": 0.0792, + "epoch": 0.16, + "learning_rate": 0.000275583624311817, + "loss": 0.0745, "step": 25220 }, { - "epoch": 0.27, - "learning_rate": 0.0002590661301836589, - "loss": 0.0754, + "epoch": 0.16, + "learning_rate": 0.0002755739429574601, + "loss": 0.0786, "step": 25230 }, { - "epoch": 0.27, - "learning_rate": 0.0002590499058991498, - "loss": 0.0651, + "epoch": 0.16, + "learning_rate": 0.00027556426160310317, + "loss": 0.09, "step": 25240 }, { - "epoch": 0.27, - "learning_rate": 0.0002590336816146408, - "loss": 0.0732, + "epoch": 0.16, + "learning_rate": 0.00027555458024874625, + "loss": 0.0857, "step": 25250 }, { - "epoch": 0.27, - "learning_rate": 0.0002590174573301317, - "loss": 0.0763, + "epoch": 0.16, + "learning_rate": 0.00027554489889438933, + "loss": 0.0831, "step": 25260 }, { - "epoch": 0.27, - "learning_rate": 0.00025900123304562264, - "loss": 0.0748, + "epoch": 0.16, + "learning_rate": 0.00027553521754003236, + "loss": 0.0783, "step": 25270 }, { - "epoch": 0.27, - "learning_rate": 0.0002589850087611136, - "loss": 0.0685, + "epoch": 0.16, + "learning_rate": 0.00027552553618567544, + "loss": 0.0744, "step": 25280 }, { - "epoch": 0.27, - "learning_rate": 0.00025896878447660454, - "loss": 0.0753, + "epoch": 0.16, + "learning_rate": 0.0002755158548313185, + "loss": 0.0801, "step": 25290 }, { - "epoch": 0.27, - "learning_rate": 0.00025895256019209547, - "loss": 0.0754, + "epoch": 0.16, + "learning_rate": 0.0002755061734769616, + "loss": 0.0843, "step": 25300 }, { - "epoch": 0.27, - "learning_rate": 0.00025893633590758644, - "loss": 0.0777, + "epoch": 0.16, + "learning_rate": 0.0002754964921226047, + "loss": 0.0846, "step": 25310 }, { - "epoch": 0.27, - "learning_rate": 0.00025892011162307737, - "loss": 0.0728, + "epoch": 0.16, + "learning_rate": 0.0002754868107682477, + "loss": 0.0823, "step": 25320 }, { - "epoch": 0.27, - "learning_rate": 0.00025890388733856834, - "loss": 0.078, + "epoch": 0.16, + "learning_rate": 0.0002754771294138908, + "loss": 0.0865, "step": 25330 }, { - "epoch": 0.27, - "learning_rate": 0.00025888766305405927, - "loss": 0.0802, + "epoch": 0.16, + "learning_rate": 0.0002754674480595338, + "loss": 0.0809, "step": 25340 }, { - "epoch": 0.27, - "learning_rate": 0.00025887143876955024, - "loss": 0.0837, + "epoch": 0.16, + "learning_rate": 0.0002754577667051769, + "loss": 0.0823, "step": 25350 }, { - "epoch": 0.27, - "learning_rate": 0.00025885521448504117, - "loss": 0.0735, + "epoch": 0.16, + "learning_rate": 0.00027544808535081997, + "loss": 0.074, "step": 25360 }, { - "epoch": 0.27, - "learning_rate": 0.00025883899020053214, - "loss": 0.0696, + "epoch": 0.16, + "learning_rate": 0.00027543840399646305, + "loss": 0.0783, "step": 25370 }, { - "epoch": 0.27, - "learning_rate": 0.00025882276591602306, - "loss": 0.0832, + "epoch": 0.16, + "learning_rate": 0.00027542872264210613, + "loss": 0.0785, "step": 25380 }, { - "epoch": 0.27, - "learning_rate": 0.00025880654163151404, - "loss": 0.0684, + "epoch": 0.16, + "learning_rate": 0.0002754190412877492, + "loss": 0.0791, "step": 25390 }, { - "epoch": 0.27, - "learning_rate": 0.00025879031734700496, - "loss": 0.073, + "epoch": 0.16, + "learning_rate": 0.0002754093599333923, + "loss": 0.09, "step": 25400 }, { - "epoch": 0.27, - "learning_rate": 0.00025877409306249594, - "loss": 0.0666, + "epoch": 0.16, + "learning_rate": 0.0002753996785790353, + "loss": 0.0897, "step": 25410 }, { - "epoch": 0.27, - "learning_rate": 0.00025875786877798686, - "loss": 0.0673, + "epoch": 0.16, + "learning_rate": 0.0002753899972246784, + "loss": 0.0906, "step": 25420 }, { - "epoch": 0.28, - "learning_rate": 0.00025874164449347784, - "loss": 0.0676, + "epoch": 0.16, + "learning_rate": 0.00027538031587032147, + "loss": 0.0755, "step": 25430 }, { - "epoch": 0.28, - "learning_rate": 0.00025872542020896876, - "loss": 0.0697, + "epoch": 0.16, + "learning_rate": 0.00027537063451596455, + "loss": 0.0797, "step": 25440 }, { - "epoch": 0.28, - "learning_rate": 0.0002587091959244597, - "loss": 0.0661, + "epoch": 0.16, + "learning_rate": 0.0002753609531616076, + "loss": 0.0794, "step": 25450 }, { - "epoch": 0.28, - "learning_rate": 0.00025869297163995066, - "loss": 0.0643, + "epoch": 0.16, + "learning_rate": 0.00027535127180725066, + "loss": 0.0806, "step": 25460 }, { - "epoch": 0.28, - "learning_rate": 0.0002586767473554416, - "loss": 0.0813, + "epoch": 0.16, + "learning_rate": 0.00027534159045289374, + "loss": 0.0858, "step": 25470 }, { - "epoch": 0.28, - "learning_rate": 0.0002586605230709325, - "loss": 0.0796, + "epoch": 0.16, + "learning_rate": 0.00027533190909853676, + "loss": 0.0756, "step": 25480 }, { - "epoch": 0.28, - "learning_rate": 0.0002586442987864235, - "loss": 0.071, + "epoch": 0.16, + "learning_rate": 0.00027532222774417984, + "loss": 0.0768, "step": 25490 }, { - "epoch": 0.28, - "learning_rate": 0.0002586280745019144, - "loss": 0.0799, + "epoch": 0.16, + "learning_rate": 0.0002753125463898229, + "loss": 0.0827, "step": 25500 }, { - "epoch": 0.28, - "learning_rate": 0.0002586118502174054, - "loss": 0.0672, + "epoch": 0.16, + "learning_rate": 0.000275302865035466, + "loss": 0.086, "step": 25510 }, { - "epoch": 0.28, - "learning_rate": 0.0002585956259328963, - "loss": 0.0745, + "epoch": 0.16, + "learning_rate": 0.0002752931836811091, + "loss": 0.077, "step": 25520 }, { - "epoch": 0.28, - "learning_rate": 0.0002585794016483873, - "loss": 0.0698, + "epoch": 0.16, + "learning_rate": 0.00027528350232675216, + "loss": 0.081, "step": 25530 }, { - "epoch": 0.28, - "learning_rate": 0.0002585631773638782, - "loss": 0.0715, + "epoch": 0.16, + "learning_rate": 0.00027527382097239524, + "loss": 0.0796, "step": 25540 }, { - "epoch": 0.28, - "learning_rate": 0.0002585469530793692, - "loss": 0.0728, + "epoch": 0.16, + "learning_rate": 0.00027526413961803827, + "loss": 0.0907, "step": 25550 }, { - "epoch": 0.28, - "learning_rate": 0.0002585307287948601, - "loss": 0.0765, + "epoch": 0.16, + "learning_rate": 0.00027525445826368135, + "loss": 0.0859, "step": 25560 }, { - "epoch": 0.28, - "learning_rate": 0.0002585145045103511, - "loss": 0.0646, + "epoch": 0.17, + "learning_rate": 0.0002752447769093244, + "loss": 0.0851, "step": 25570 }, { - "epoch": 0.28, - "learning_rate": 0.000258498280225842, - "loss": 0.0764, + "epoch": 0.17, + "learning_rate": 0.00027523509555496745, + "loss": 0.0849, "step": 25580 }, { - "epoch": 0.28, - "learning_rate": 0.000258482055941333, - "loss": 0.0687, + "epoch": 0.17, + "learning_rate": 0.00027522541420061053, + "loss": 0.0801, "step": 25590 }, { - "epoch": 0.28, - "learning_rate": 0.0002584658316568239, - "loss": 0.0658, + "epoch": 0.17, + "learning_rate": 0.0002752157328462536, + "loss": 0.0787, "step": 25600 }, { - "epoch": 0.28, - "learning_rate": 0.0002584496073723149, - "loss": 0.0703, + "epoch": 0.17, + "learning_rate": 0.0002752060514918967, + "loss": 0.0805, "step": 25610 }, { - "epoch": 0.28, - "learning_rate": 0.0002584333830878058, - "loss": 0.0726, + "epoch": 0.17, + "learning_rate": 0.0002751963701375397, + "loss": 0.0807, "step": 25620 }, { - "epoch": 0.28, - "learning_rate": 0.00025841715880329673, - "loss": 0.0731, + "epoch": 0.17, + "learning_rate": 0.0002751866887831828, + "loss": 0.0777, "step": 25630 }, { - "epoch": 0.28, - "learning_rate": 0.0002584009345187877, - "loss": 0.0674, + "epoch": 0.17, + "learning_rate": 0.0002751770074288259, + "loss": 0.0858, "step": 25640 }, { - "epoch": 0.28, - "learning_rate": 0.00025838471023427863, - "loss": 0.0682, + "epoch": 0.17, + "learning_rate": 0.00027516732607446896, + "loss": 0.0756, "step": 25650 }, { - "epoch": 0.28, - "learning_rate": 0.00025836848594976955, - "loss": 0.0781, + "epoch": 0.17, + "learning_rate": 0.00027515764472011204, + "loss": 0.081, "step": 25660 }, { - "epoch": 0.28, - "learning_rate": 0.0002583522616652605, - "loss": 0.0694, + "epoch": 0.17, + "learning_rate": 0.0002751479633657551, + "loss": 0.0802, "step": 25670 }, { - "epoch": 0.28, - "learning_rate": 0.00025833603738075145, - "loss": 0.0683, + "epoch": 0.17, + "learning_rate": 0.0002751382820113982, + "loss": 0.0764, "step": 25680 }, { - "epoch": 0.28, - "learning_rate": 0.0002583198130962424, - "loss": 0.075, + "epoch": 0.17, + "learning_rate": 0.0002751286006570412, + "loss": 0.0846, "step": 25690 }, { - "epoch": 0.28, - "learning_rate": 0.00025830358881173335, - "loss": 0.0728, + "epoch": 0.17, + "learning_rate": 0.0002751189193026843, + "loss": 0.0765, "step": 25700 }, { - "epoch": 0.28, - "learning_rate": 0.0002582873645272243, - "loss": 0.0696, + "epoch": 0.17, + "learning_rate": 0.0002751092379483274, + "loss": 0.0857, "step": 25710 }, { - "epoch": 0.28, - "learning_rate": 0.00025827114024271525, - "loss": 0.0733, + "epoch": 0.17, + "learning_rate": 0.0002750995565939704, + "loss": 0.0816, "step": 25720 }, { - "epoch": 0.28, - "learning_rate": 0.0002582549159582062, - "loss": 0.073, + "epoch": 0.17, + "learning_rate": 0.0002750898752396135, + "loss": 0.0754, "step": 25730 }, { - "epoch": 0.28, - "learning_rate": 0.00025823869167369715, - "loss": 0.0812, + "epoch": 0.17, + "learning_rate": 0.00027508019388525657, + "loss": 0.0789, "step": 25740 }, { - "epoch": 0.28, - "learning_rate": 0.0002582224673891881, - "loss": 0.0737, + "epoch": 0.17, + "learning_rate": 0.00027507051253089965, + "loss": 0.081, "step": 25750 }, { - "epoch": 0.28, - "learning_rate": 0.00025820624310467905, - "loss": 0.0689, + "epoch": 0.17, + "learning_rate": 0.00027506083117654267, + "loss": 0.0821, "step": 25760 }, { - "epoch": 0.28, - "learning_rate": 0.00025819001882017, - "loss": 0.0719, + "epoch": 0.17, + "learning_rate": 0.00027505114982218575, + "loss": 0.074, "step": 25770 }, { - "epoch": 0.28, - "learning_rate": 0.00025817379453566095, - "loss": 0.0758, + "epoch": 0.17, + "learning_rate": 0.00027504146846782883, + "loss": 0.078, "step": 25780 }, { - "epoch": 0.28, - "learning_rate": 0.0002581575702511519, - "loss": 0.0686, + "epoch": 0.17, + "learning_rate": 0.0002750317871134719, + "loss": 0.0847, "step": 25790 }, { - "epoch": 0.28, - "learning_rate": 0.00025814134596664285, - "loss": 0.077, + "epoch": 0.17, + "learning_rate": 0.000275022105759115, + "loss": 0.0789, "step": 25800 }, { - "epoch": 0.28, - "learning_rate": 0.00025812512168213377, - "loss": 0.0625, + "epoch": 0.17, + "learning_rate": 0.00027501242440475807, + "loss": 0.0776, "step": 25810 }, { - "epoch": 0.28, - "learning_rate": 0.00025810889739762475, - "loss": 0.0683, + "epoch": 0.17, + "learning_rate": 0.0002750027430504011, + "loss": 0.0773, "step": 25820 }, { - "epoch": 0.28, - "learning_rate": 0.00025809267311311567, - "loss": 0.0747, + "epoch": 0.17, + "learning_rate": 0.0002749930616960442, + "loss": 0.0928, "step": 25830 }, { - "epoch": 0.28, - "learning_rate": 0.00025807644882860665, - "loss": 0.0607, + "epoch": 0.17, + "learning_rate": 0.00027498338034168726, + "loss": 0.0805, "step": 25840 }, { - "epoch": 0.28, - "learning_rate": 0.00025806022454409757, - "loss": 0.068, + "epoch": 0.17, + "learning_rate": 0.0002749736989873303, + "loss": 0.0892, "step": 25850 }, { - "epoch": 0.28, - "learning_rate": 0.00025804400025958855, - "loss": 0.0688, + "epoch": 0.17, + "learning_rate": 0.00027496401763297336, + "loss": 0.0801, "step": 25860 }, { - "epoch": 0.28, - "learning_rate": 0.00025802777597507947, - "loss": 0.0677, + "epoch": 0.17, + "learning_rate": 0.00027495433627861644, + "loss": 0.0929, "step": 25870 }, { - "epoch": 0.28, - "learning_rate": 0.00025801155169057045, - "loss": 0.075, + "epoch": 0.17, + "learning_rate": 0.0002749446549242595, + "loss": 0.085, "step": 25880 }, { - "epoch": 0.28, - "learning_rate": 0.00025799532740606137, - "loss": 0.0745, + "epoch": 0.17, + "learning_rate": 0.0002749349735699026, + "loss": 0.0845, "step": 25890 }, { - "epoch": 0.28, - "learning_rate": 0.00025797910312155234, - "loss": 0.0688, + "epoch": 0.17, + "learning_rate": 0.0002749252922155456, + "loss": 0.0766, "step": 25900 }, { - "epoch": 0.28, - "learning_rate": 0.00025796287883704327, - "loss": 0.0807, + "epoch": 0.17, + "learning_rate": 0.0002749156108611887, + "loss": 0.0809, "step": 25910 }, { - "epoch": 0.28, - "learning_rate": 0.00025794665455253424, - "loss": 0.0778, + "epoch": 0.17, + "learning_rate": 0.0002749059295068318, + "loss": 0.0844, "step": 25920 }, { - "epoch": 0.28, - "learning_rate": 0.00025793043026802517, - "loss": 0.0787, + "epoch": 0.17, + "learning_rate": 0.00027489624815247487, + "loss": 0.085, "step": 25930 }, { - "epoch": 0.28, - "learning_rate": 0.00025791420598351614, - "loss": 0.0666, + "epoch": 0.17, + "learning_rate": 0.00027488656679811795, + "loss": 0.0703, "step": 25940 }, { - "epoch": 0.28, - "learning_rate": 0.00025789798169900707, - "loss": 0.0633, + "epoch": 0.17, + "learning_rate": 0.00027487688544376097, + "loss": 0.0917, "step": 25950 }, { - "epoch": 0.28, - "learning_rate": 0.000257881757414498, - "loss": 0.0777, + "epoch": 0.17, + "learning_rate": 0.00027486720408940405, + "loss": 0.0807, "step": 25960 }, { - "epoch": 0.28, - "learning_rate": 0.00025786553312998897, - "loss": 0.0673, + "epoch": 0.17, + "learning_rate": 0.00027485752273504713, + "loss": 0.0723, "step": 25970 }, { - "epoch": 0.28, - "learning_rate": 0.0002578493088454799, - "loss": 0.0698, + "epoch": 0.17, + "learning_rate": 0.00027484784138069016, + "loss": 0.0756, "step": 25980 }, { - "epoch": 0.28, - "learning_rate": 0.0002578330845609708, - "loss": 0.0685, + "epoch": 0.17, + "learning_rate": 0.00027483816002633324, + "loss": 0.079, "step": 25990 }, { - "epoch": 0.28, - "learning_rate": 0.0002578168602764618, - "loss": 0.0664, + "epoch": 0.17, + "learning_rate": 0.0002748284786719763, + "loss": 0.0839, "step": 26000 }, { - "epoch": 0.28, - "eval_cer": 0.921349575309087, - "eval_loss": 0.049505751579999924, - "eval_runtime": 119.4812, - "eval_samples_per_second": 16.739, - "eval_steps_per_second": 4.185, + "epoch": 0.17, + "eval_cer": 0.920187097503107, + "eval_loss": 0.05482678487896919, + "eval_runtime": 120.4443, + "eval_samples_per_second": 16.605, + "eval_steps_per_second": 4.151, "step": 26000 }, { - "epoch": 0.28, - "learning_rate": 0.0002578006359919527, - "loss": 0.0735, + "epoch": 0.17, + "learning_rate": 0.0002748187973176194, + "loss": 0.0831, "step": 26010 }, { - "epoch": 0.28, - "learning_rate": 0.0002577844117074437, - "loss": 0.0849, + "epoch": 0.17, + "learning_rate": 0.0002748091159632625, + "loss": 0.0743, "step": 26020 }, { - "epoch": 0.28, - "learning_rate": 0.0002577681874229346, - "loss": 0.0825, + "epoch": 0.17, + "learning_rate": 0.00027479943460890555, + "loss": 0.0838, "step": 26030 }, { - "epoch": 0.28, - "learning_rate": 0.0002577519631384256, - "loss": 0.0799, + "epoch": 0.17, + "learning_rate": 0.0002747897532545486, + "loss": 0.0825, "step": 26040 }, { - "epoch": 0.28, - "learning_rate": 0.0002577357388539165, - "loss": 0.0759, + "epoch": 0.17, + "learning_rate": 0.00027478007190019166, + "loss": 0.0739, "step": 26050 }, { - "epoch": 0.28, - "learning_rate": 0.0002577195145694075, - "loss": 0.0773, + "epoch": 0.17, + "learning_rate": 0.00027477039054583474, + "loss": 0.0756, "step": 26060 }, { - "epoch": 0.28, - "learning_rate": 0.0002577032902848984, - "loss": 0.0693, + "epoch": 0.17, + "learning_rate": 0.0002747607091914778, + "loss": 0.0819, "step": 26070 }, { - "epoch": 0.28, - "learning_rate": 0.0002576870660003894, - "loss": 0.0721, + "epoch": 0.17, + "learning_rate": 0.0002747510278371209, + "loss": 0.0735, "step": 26080 }, { - "epoch": 0.28, - "learning_rate": 0.0002576708417158803, - "loss": 0.0724, + "epoch": 0.17, + "learning_rate": 0.0002747413464827639, + "loss": 0.0777, "step": 26090 }, { - "epoch": 0.28, - "learning_rate": 0.0002576546174313713, - "loss": 0.0665, + "epoch": 0.17, + "learning_rate": 0.000274731665128407, + "loss": 0.0859, "step": 26100 }, { - "epoch": 0.28, - "learning_rate": 0.0002576383931468622, - "loss": 0.0711, + "epoch": 0.17, + "learning_rate": 0.0002747219837740501, + "loss": 0.072, "step": 26110 }, { - "epoch": 0.28, - "learning_rate": 0.0002576221688623532, - "loss": 0.0672, + "epoch": 0.17, + "learning_rate": 0.0002747123024196931, + "loss": 0.0829, "step": 26120 }, { - "epoch": 0.28, - "learning_rate": 0.0002576059445778441, - "loss": 0.0772, + "epoch": 0.17, + "learning_rate": 0.0002747026210653362, + "loss": 0.0791, "step": 26130 }, { - "epoch": 0.28, - "learning_rate": 0.00025758972029333503, - "loss": 0.0747, + "epoch": 0.17, + "learning_rate": 0.00027469293971097927, + "loss": 0.0851, "step": 26140 }, { - "epoch": 0.28, - "learning_rate": 0.000257573496008826, - "loss": 0.0724, + "epoch": 0.17, + "learning_rate": 0.00027468325835662235, + "loss": 0.0768, "step": 26150 }, { - "epoch": 0.28, - "learning_rate": 0.00025755727172431693, - "loss": 0.0744, + "epoch": 0.17, + "learning_rate": 0.00027467357700226543, + "loss": 0.0778, "step": 26160 }, { - "epoch": 0.28, - "learning_rate": 0.00025754104743980785, - "loss": 0.0716, + "epoch": 0.17, + "learning_rate": 0.0002746638956479085, + "loss": 0.0812, "step": 26170 }, { - "epoch": 0.28, - "learning_rate": 0.00025752482315529883, - "loss": 0.0738, + "epoch": 0.17, + "learning_rate": 0.00027465421429355153, + "loss": 0.0753, "step": 26180 }, { - "epoch": 0.28, - "learning_rate": 0.00025750859887078975, - "loss": 0.0744, + "epoch": 0.17, + "learning_rate": 0.0002746445329391946, + "loss": 0.0906, "step": 26190 }, { - "epoch": 0.28, - "learning_rate": 0.00025749237458628073, - "loss": 0.0722, + "epoch": 0.17, + "learning_rate": 0.0002746348515848377, + "loss": 0.0908, "step": 26200 }, { - "epoch": 0.28, - "learning_rate": 0.00025747615030177165, - "loss": 0.0728, + "epoch": 0.17, + "learning_rate": 0.0002746251702304808, + "loss": 0.0823, "step": 26210 }, { - "epoch": 0.28, - "learning_rate": 0.00025745992601726263, - "loss": 0.0752, + "epoch": 0.17, + "learning_rate": 0.0002746154888761238, + "loss": 0.0855, "step": 26220 }, { - "epoch": 0.28, - "learning_rate": 0.00025744370173275355, - "loss": 0.0762, + "epoch": 0.17, + "learning_rate": 0.0002746058075217669, + "loss": 0.0875, "step": 26230 }, { - "epoch": 0.28, - "learning_rate": 0.00025742747744824453, - "loss": 0.08, + "epoch": 0.17, + "learning_rate": 0.00027459612616740996, + "loss": 0.0872, "step": 26240 }, { - "epoch": 0.28, - "learning_rate": 0.00025741125316373545, - "loss": 0.0802, + "epoch": 0.17, + "learning_rate": 0.000274586444813053, + "loss": 0.0768, "step": 26250 }, { - "epoch": 0.28, - "learning_rate": 0.00025739502887922643, - "loss": 0.0706, + "epoch": 0.17, + "learning_rate": 0.00027457676345869606, + "loss": 0.0801, "step": 26260 }, { - "epoch": 0.28, - "learning_rate": 0.00025737880459471735, - "loss": 0.0679, + "epoch": 0.17, + "learning_rate": 0.00027456708210433914, + "loss": 0.0858, "step": 26270 }, { - "epoch": 0.28, - "learning_rate": 0.00025736258031020833, - "loss": 0.0767, + "epoch": 0.17, + "learning_rate": 0.0002745574007499822, + "loss": 0.081, "step": 26280 }, { - "epoch": 0.28, - "learning_rate": 0.00025734635602569925, - "loss": 0.0718, + "epoch": 0.17, + "learning_rate": 0.0002745477193956253, + "loss": 0.086, "step": 26290 }, { - "epoch": 0.28, - "learning_rate": 0.0002573301317411902, - "loss": 0.0778, + "epoch": 0.17, + "learning_rate": 0.0002745380380412684, + "loss": 0.0765, "step": 26300 }, { - "epoch": 0.28, - "learning_rate": 0.00025731390745668115, - "loss": 0.0794, + "epoch": 0.17, + "learning_rate": 0.00027452835668691146, + "loss": 0.0692, "step": 26310 }, { - "epoch": 0.28, - "learning_rate": 0.00025729768317217207, - "loss": 0.0838, + "epoch": 0.17, + "learning_rate": 0.0002745186753325545, + "loss": 0.0889, "step": 26320 }, { - "epoch": 0.28, - "learning_rate": 0.00025728145888766305, - "loss": 0.077, + "epoch": 0.17, + "learning_rate": 0.00027450899397819757, + "loss": 0.0822, "step": 26330 }, { - "epoch": 0.28, - "learning_rate": 0.00025726523460315397, - "loss": 0.0735, + "epoch": 0.17, + "learning_rate": 0.00027449931262384065, + "loss": 0.0715, "step": 26340 }, { - "epoch": 0.29, - "learning_rate": 0.0002572490103186449, - "loss": 0.0676, + "epoch": 0.17, + "learning_rate": 0.0002744896312694837, + "loss": 0.0917, "step": 26350 }, { - "epoch": 0.29, - "learning_rate": 0.00025723278603413587, - "loss": 0.0812, + "epoch": 0.17, + "learning_rate": 0.00027447994991512675, + "loss": 0.076, "step": 26360 }, { - "epoch": 0.29, - "learning_rate": 0.0002572165617496268, - "loss": 0.0775, + "epoch": 0.17, + "learning_rate": 0.00027447026856076983, + "loss": 0.0844, "step": 26370 }, { - "epoch": 0.29, - "learning_rate": 0.00025720033746511777, - "loss": 0.0795, + "epoch": 0.17, + "learning_rate": 0.0002744605872064129, + "loss": 0.0737, "step": 26380 }, { - "epoch": 0.29, - "learning_rate": 0.0002571841131806087, - "loss": 0.0697, + "epoch": 0.17, + "learning_rate": 0.00027445090585205594, + "loss": 0.086, "step": 26390 }, { - "epoch": 0.29, - "learning_rate": 0.00025716788889609967, - "loss": 0.0703, + "epoch": 0.17, + "learning_rate": 0.000274441224497699, + "loss": 0.0738, "step": 26400 }, { - "epoch": 0.29, - "learning_rate": 0.0002571516646115906, - "loss": 0.0774, + "epoch": 0.17, + "learning_rate": 0.0002744315431433421, + "loss": 0.0801, "step": 26410 }, { - "epoch": 0.29, - "learning_rate": 0.00025713544032708157, + "epoch": 0.17, + "learning_rate": 0.0002744218617889852, "loss": 0.0762, "step": 26420 }, { - "epoch": 0.29, - "learning_rate": 0.0002571192160425725, - "loss": 0.072, + "epoch": 0.17, + "learning_rate": 0.00027441218043462826, + "loss": 0.0787, "step": 26430 }, { - "epoch": 0.29, - "learning_rate": 0.00025710299175806347, - "loss": 0.0777, + "epoch": 0.17, + "learning_rate": 0.00027440249908027134, + "loss": 0.0816, "step": 26440 }, { - "epoch": 0.29, - "learning_rate": 0.0002570867674735544, - "loss": 0.0737, + "epoch": 0.17, + "learning_rate": 0.0002743928177259144, + "loss": 0.0835, "step": 26450 }, { - "epoch": 0.29, - "learning_rate": 0.00025707054318904537, - "loss": 0.0728, + "epoch": 0.17, + "learning_rate": 0.00027438313637155744, + "loss": 0.0803, "step": 26460 }, { - "epoch": 0.29, - "learning_rate": 0.0002570543189045363, - "loss": 0.074, + "epoch": 0.17, + "learning_rate": 0.0002743734550172005, + "loss": 0.0749, "step": 26470 }, { - "epoch": 0.29, - "learning_rate": 0.00025703809462002727, - "loss": 0.0714, + "epoch": 0.17, + "learning_rate": 0.0002743637736628436, + "loss": 0.0834, "step": 26480 }, { - "epoch": 0.29, - "learning_rate": 0.0002570218703355182, - "loss": 0.0746, + "epoch": 0.17, + "learning_rate": 0.00027435409230848663, + "loss": 0.08, "step": 26490 }, { - "epoch": 0.29, - "learning_rate": 0.0002570056460510091, - "loss": 0.0639, + "epoch": 0.17, + "learning_rate": 0.0002743444109541297, + "loss": 0.0812, "step": 26500 }, { - "epoch": 0.29, - "learning_rate": 0.0002569894217665001, - "loss": 0.0803, + "epoch": 0.17, + "learning_rate": 0.0002743347295997728, + "loss": 0.0787, "step": 26510 }, { - "epoch": 0.29, - "learning_rate": 0.000256973197481991, - "loss": 0.0712, + "epoch": 0.17, + "learning_rate": 0.00027432504824541587, + "loss": 0.0733, "step": 26520 }, { - "epoch": 0.29, - "learning_rate": 0.000256956973197482, - "loss": 0.0726, + "epoch": 0.17, + "learning_rate": 0.0002743153668910589, + "loss": 0.0841, "step": 26530 }, { - "epoch": 0.29, - "learning_rate": 0.0002569407489129729, - "loss": 0.0785, + "epoch": 0.17, + "learning_rate": 0.000274305685536702, + "loss": 0.0779, "step": 26540 }, { - "epoch": 0.29, - "learning_rate": 0.00025692452462846384, - "loss": 0.0783, + "epoch": 0.17, + "learning_rate": 0.00027429600418234505, + "loss": 0.0809, "step": 26550 }, { - "epoch": 0.29, - "learning_rate": 0.0002569083003439548, - "loss": 0.0787, + "epoch": 0.17, + "learning_rate": 0.00027428632282798813, + "loss": 0.0848, "step": 26560 }, { - "epoch": 0.29, - "learning_rate": 0.00025689207605944574, - "loss": 0.0697, + "epoch": 0.17, + "learning_rate": 0.0002742766414736312, + "loss": 0.0786, "step": 26570 }, { - "epoch": 0.29, - "learning_rate": 0.0002568758517749367, - "loss": 0.075, + "epoch": 0.17, + "learning_rate": 0.0002742669601192743, + "loss": 0.0825, "step": 26580 }, { - "epoch": 0.29, - "learning_rate": 0.00025685962749042763, - "loss": 0.0761, + "epoch": 0.17, + "learning_rate": 0.0002742572787649173, + "loss": 0.08, "step": 26590 }, { - "epoch": 0.29, - "learning_rate": 0.0002568434032059186, - "loss": 0.0692, + "epoch": 0.17, + "learning_rate": 0.0002742475974105604, + "loss": 0.0862, "step": 26600 }, { - "epoch": 0.29, - "learning_rate": 0.00025682717892140953, - "loss": 0.0694, + "epoch": 0.17, + "learning_rate": 0.0002742379160562035, + "loss": 0.0827, "step": 26610 }, { - "epoch": 0.29, - "learning_rate": 0.0002568109546369005, - "loss": 0.0734, + "epoch": 0.17, + "learning_rate": 0.0002742282347018465, + "loss": 0.0763, "step": 26620 }, { - "epoch": 0.29, - "learning_rate": 0.00025679473035239143, - "loss": 0.0673, + "epoch": 0.17, + "learning_rate": 0.0002742185533474896, + "loss": 0.0829, "step": 26630 }, { - "epoch": 0.29, - "learning_rate": 0.0002567785060678824, - "loss": 0.0728, + "epoch": 0.17, + "learning_rate": 0.00027420887199313266, + "loss": 0.0751, "step": 26640 }, { - "epoch": 0.29, - "learning_rate": 0.00025676228178337333, - "loss": 0.0655, + "epoch": 0.17, + "learning_rate": 0.00027419919063877574, + "loss": 0.0729, "step": 26650 }, { - "epoch": 0.29, - "learning_rate": 0.0002567460574988643, - "loss": 0.0735, + "epoch": 0.17, + "learning_rate": 0.0002741895092844188, + "loss": 0.0825, "step": 26660 }, { - "epoch": 0.29, - "learning_rate": 0.00025672983321435523, - "loss": 0.0734, + "epoch": 0.17, + "learning_rate": 0.00027417982793006185, + "loss": 0.0695, "step": 26670 }, { - "epoch": 0.29, - "learning_rate": 0.00025671360892984616, - "loss": 0.0756, + "epoch": 0.17, + "learning_rate": 0.00027417014657570493, + "loss": 0.0834, "step": 26680 }, { - "epoch": 0.29, - "learning_rate": 0.00025669738464533713, - "loss": 0.0657, + "epoch": 0.17, + "learning_rate": 0.000274160465221348, + "loss": 0.0731, "step": 26690 }, { - "epoch": 0.29, - "learning_rate": 0.00025668116036082806, - "loss": 0.0799, + "epoch": 0.17, + "learning_rate": 0.0002741507838669911, + "loss": 0.0814, "step": 26700 }, { - "epoch": 0.29, - "learning_rate": 0.00025666493607631903, - "loss": 0.078, + "epoch": 0.17, + "learning_rate": 0.00027414110251263417, + "loss": 0.0836, "step": 26710 }, { - "epoch": 0.29, - "learning_rate": 0.00025664871179180995, - "loss": 0.0658, + "epoch": 0.17, + "learning_rate": 0.0002741314211582772, + "loss": 0.0917, "step": 26720 }, { - "epoch": 0.29, - "learning_rate": 0.0002566324875073009, - "loss": 0.0573, + "epoch": 0.17, + "learning_rate": 0.0002741217398039203, + "loss": 0.0819, "step": 26730 }, { - "epoch": 0.29, - "learning_rate": 0.00025661626322279185, - "loss": 0.083, + "epoch": 0.17, + "learning_rate": 0.00027411205844956335, + "loss": 0.0858, "step": 26740 }, { - "epoch": 0.29, - "learning_rate": 0.0002566000389382828, - "loss": 0.0658, + "epoch": 0.17, + "learning_rate": 0.0002741023770952064, + "loss": 0.0969, "step": 26750 }, { - "epoch": 0.29, - "learning_rate": 0.00025658381465377375, - "loss": 0.0717, + "epoch": 0.17, + "learning_rate": 0.00027409269574084946, + "loss": 0.0806, "step": 26760 }, { - "epoch": 0.29, - "learning_rate": 0.0002565675903692647, - "loss": 0.0637, + "epoch": 0.17, + "learning_rate": 0.00027408301438649254, + "loss": 0.0853, "step": 26770 }, { - "epoch": 0.29, - "learning_rate": 0.00025655136608475565, - "loss": 0.0683, + "epoch": 0.17, + "learning_rate": 0.0002740733330321356, + "loss": 0.0944, "step": 26780 }, { - "epoch": 0.29, - "learning_rate": 0.0002565351418002466, - "loss": 0.0665, + "epoch": 0.17, + "learning_rate": 0.0002740636516777787, + "loss": 0.0825, "step": 26790 }, { - "epoch": 0.29, - "learning_rate": 0.00025651891751573755, - "loss": 0.0654, + "epoch": 0.17, + "learning_rate": 0.0002740539703234218, + "loss": 0.0841, "step": 26800 }, { - "epoch": 0.29, - "learning_rate": 0.0002565026932312285, - "loss": 0.0683, + "epoch": 0.17, + "learning_rate": 0.0002740442889690648, + "loss": 0.0775, "step": 26810 }, { - "epoch": 0.29, - "learning_rate": 0.00025648646894671945, - "loss": 0.0689, + "epoch": 0.17, + "learning_rate": 0.0002740346076147079, + "loss": 0.0874, "step": 26820 }, { - "epoch": 0.29, - "learning_rate": 0.0002564702446622104, - "loss": 0.0632, + "epoch": 0.17, + "learning_rate": 0.00027402492626035096, + "loss": 0.0888, "step": 26830 }, { - "epoch": 0.29, - "learning_rate": 0.00025645402037770135, - "loss": 0.0721, + "epoch": 0.17, + "learning_rate": 0.00027401524490599404, + "loss": 0.0874, "step": 26840 }, { - "epoch": 0.29, - "learning_rate": 0.0002564377960931923, - "loss": 0.0687, + "epoch": 0.17, + "learning_rate": 0.0002740055635516371, + "loss": 0.0806, "step": 26850 }, { - "epoch": 0.29, - "learning_rate": 0.0002564215718086832, - "loss": 0.0672, + "epoch": 0.17, + "learning_rate": 0.00027399588219728015, + "loss": 0.0848, "step": 26860 }, { - "epoch": 0.29, - "learning_rate": 0.0002564053475241742, - "loss": 0.0639, + "epoch": 0.17, + "learning_rate": 0.00027398620084292323, + "loss": 0.0849, "step": 26870 }, { - "epoch": 0.29, - "learning_rate": 0.0002563891232396651, - "loss": 0.0707, + "epoch": 0.17, + "learning_rate": 0.0002739765194885663, + "loss": 0.0748, "step": 26880 }, { - "epoch": 0.29, - "learning_rate": 0.0002563728989551561, - "loss": 0.0637, + "epoch": 0.17, + "learning_rate": 0.00027396683813420933, + "loss": 0.0871, "step": 26890 }, { - "epoch": 0.29, - "learning_rate": 0.000256356674670647, - "loss": 0.0691, + "epoch": 0.17, + "learning_rate": 0.0002739571567798524, + "loss": 0.0712, "step": 26900 }, { - "epoch": 0.29, - "learning_rate": 0.0002563404503861379, - "loss": 0.0753, + "epoch": 0.17, + "learning_rate": 0.0002739474754254955, + "loss": 0.0749, "step": 26910 }, { - "epoch": 0.29, - "learning_rate": 0.0002563242261016289, - "loss": 0.0807, + "epoch": 0.17, + "learning_rate": 0.00027393779407113857, + "loss": 0.0809, "step": 26920 }, { - "epoch": 0.29, - "learning_rate": 0.0002563080018171198, - "loss": 0.088, + "epoch": 0.17, + "learning_rate": 0.00027392811271678165, + "loss": 0.093, "step": 26930 }, { - "epoch": 0.29, - "learning_rate": 0.0002562917775326108, - "loss": 0.0712, + "epoch": 0.17, + "learning_rate": 0.00027391843136242473, + "loss": 0.0829, "step": 26940 }, { - "epoch": 0.29, - "learning_rate": 0.0002562755532481017, - "loss": 0.074, + "epoch": 0.17, + "learning_rate": 0.00027390875000806776, + "loss": 0.0739, "step": 26950 }, { - "epoch": 0.29, - "learning_rate": 0.0002562593289635927, - "loss": 0.0624, + "epoch": 0.17, + "learning_rate": 0.00027389906865371084, + "loss": 0.0842, "step": 26960 }, { - "epoch": 0.29, - "learning_rate": 0.0002562431046790836, - "loss": 0.0707, + "epoch": 0.17, + "learning_rate": 0.0002738893872993539, + "loss": 0.0819, "step": 26970 }, { - "epoch": 0.29, - "learning_rate": 0.0002562268803945746, - "loss": 0.0697, + "epoch": 0.17, + "learning_rate": 0.000273879705944997, + "loss": 0.0789, "step": 26980 }, { - "epoch": 0.29, - "learning_rate": 0.0002562106561100655, - "loss": 0.0789, + "epoch": 0.17, + "learning_rate": 0.00027387002459064, + "loss": 0.0716, "step": 26990 }, { - "epoch": 0.29, - "learning_rate": 0.0002561944318255565, - "loss": 0.0791, + "epoch": 0.17, + "learning_rate": 0.0002738603432362831, + "loss": 0.0811, "step": 27000 }, { - "epoch": 0.29, - "eval_cer": 0.9214635447864706, - "eval_loss": 0.04918750375509262, - "eval_runtime": 119.567, - "eval_samples_per_second": 16.727, - "eval_steps_per_second": 4.182, + "epoch": 0.17, + "eval_cer": 0.9201509433962264, + "eval_loss": 0.053227175027132034, + "eval_runtime": 120.4018, + "eval_samples_per_second": 16.611, + "eval_steps_per_second": 4.153, "step": 27000 }, { - "epoch": 0.29, - "learning_rate": 0.0002561782075410474, - "loss": 0.0691, + "epoch": 0.17, + "learning_rate": 0.0002738506618819262, + "loss": 0.0779, "step": 27010 }, { - "epoch": 0.29, - "learning_rate": 0.0002561619832565384, - "loss": 0.0724, + "epoch": 0.17, + "learning_rate": 0.0002738409805275692, + "loss": 0.0745, "step": 27020 }, { - "epoch": 0.29, - "learning_rate": 0.0002561457589720293, - "loss": 0.0648, + "epoch": 0.17, + "learning_rate": 0.0002738312991732123, + "loss": 0.0749, "step": 27030 }, { - "epoch": 0.29, - "learning_rate": 0.00025612953468752024, - "loss": 0.078, + "epoch": 0.17, + "learning_rate": 0.00027382161781885537, + "loss": 0.0808, "step": 27040 }, { - "epoch": 0.29, - "learning_rate": 0.0002561133104030112, - "loss": 0.0735, + "epoch": 0.17, + "learning_rate": 0.00027381193646449845, + "loss": 0.0819, "step": 27050 }, { - "epoch": 0.29, - "learning_rate": 0.00025609708611850214, - "loss": 0.0669, + "epoch": 0.17, + "learning_rate": 0.0002738022551101415, + "loss": 0.0769, "step": 27060 }, { - "epoch": 0.29, - "learning_rate": 0.0002560808618339931, - "loss": 0.0694, + "epoch": 0.17, + "learning_rate": 0.0002737925737557846, + "loss": 0.0761, "step": 27070 }, { - "epoch": 0.29, - "learning_rate": 0.00025606463754948404, - "loss": 0.0659, + "epoch": 0.17, + "learning_rate": 0.0002737828924014277, + "loss": 0.0797, "step": 27080 }, { - "epoch": 0.29, - "learning_rate": 0.00025604841326497496, - "loss": 0.0714, + "epoch": 0.17, + "learning_rate": 0.0002737732110470707, + "loss": 0.0828, "step": 27090 }, { - "epoch": 0.29, - "learning_rate": 0.00025603218898046594, - "loss": 0.0835, + "epoch": 0.17, + "learning_rate": 0.0002737635296927138, + "loss": 0.0703, "step": 27100 }, { - "epoch": 0.29, - "learning_rate": 0.00025601596469595686, - "loss": 0.0659, + "epoch": 0.17, + "learning_rate": 0.00027375384833835687, + "loss": 0.0821, "step": 27110 }, { - "epoch": 0.29, - "learning_rate": 0.00025599974041144784, - "loss": 0.0687, + "epoch": 0.18, + "learning_rate": 0.00027374416698399995, + "loss": 0.0785, "step": 27120 }, { - "epoch": 0.29, - "learning_rate": 0.00025598351612693876, - "loss": 0.072, + "epoch": 0.18, + "learning_rate": 0.000273734485629643, + "loss": 0.0789, "step": 27130 }, { - "epoch": 0.29, - "learning_rate": 0.00025596729184242974, - "loss": 0.0687, + "epoch": 0.18, + "learning_rate": 0.00027372480427528606, + "loss": 0.0783, "step": 27140 }, { - "epoch": 0.29, - "learning_rate": 0.00025595106755792066, - "loss": 0.0719, + "epoch": 0.18, + "learning_rate": 0.00027371512292092914, + "loss": 0.0768, "step": 27150 }, { - "epoch": 0.29, - "learning_rate": 0.00025593484327341164, - "loss": 0.0801, + "epoch": 0.18, + "learning_rate": 0.00027370544156657216, + "loss": 0.0781, "step": 27160 }, { - "epoch": 0.29, - "learning_rate": 0.00025591861898890256, - "loss": 0.0721, + "epoch": 0.18, + "learning_rate": 0.00027369576021221524, + "loss": 0.078, "step": 27170 }, { - "epoch": 0.29, - "learning_rate": 0.00025590239470439354, - "loss": 0.0666, + "epoch": 0.18, + "learning_rate": 0.0002736860788578583, + "loss": 0.0853, "step": 27180 }, { - "epoch": 0.29, - "learning_rate": 0.00025588617041988446, - "loss": 0.0699, + "epoch": 0.18, + "learning_rate": 0.0002736763975035014, + "loss": 0.0755, "step": 27190 }, { - "epoch": 0.29, - "learning_rate": 0.00025586994613537544, - "loss": 0.0749, + "epoch": 0.18, + "learning_rate": 0.0002736667161491445, + "loss": 0.0833, "step": 27200 }, { - "epoch": 0.29, - "learning_rate": 0.00025585372185086636, - "loss": 0.0681, + "epoch": 0.18, + "learning_rate": 0.00027365703479478756, + "loss": 0.0771, "step": 27210 }, { - "epoch": 0.29, - "learning_rate": 0.00025583749756635733, - "loss": 0.0695, + "epoch": 0.18, + "learning_rate": 0.00027364735344043064, + "loss": 0.0918, "step": 27220 }, { - "epoch": 0.29, - "learning_rate": 0.00025582127328184826, - "loss": 0.0675, + "epoch": 0.18, + "learning_rate": 0.00027363767208607367, + "loss": 0.0806, "step": 27230 }, { - "epoch": 0.29, - "learning_rate": 0.0002558050489973392, - "loss": 0.0708, + "epoch": 0.18, + "learning_rate": 0.00027362799073171675, + "loss": 0.0797, "step": 27240 }, { - "epoch": 0.29, - "learning_rate": 0.00025578882471283016, - "loss": 0.0783, + "epoch": 0.18, + "learning_rate": 0.0002736183093773598, + "loss": 0.0776, "step": 27250 }, { - "epoch": 0.29, - "learning_rate": 0.0002557726004283211, - "loss": 0.0656, + "epoch": 0.18, + "learning_rate": 0.00027360862802300285, + "loss": 0.0858, "step": 27260 }, { - "epoch": 0.29, - "learning_rate": 0.000255756376143812, - "loss": 0.0733, + "epoch": 0.18, + "learning_rate": 0.00027359894666864593, + "loss": 0.0947, "step": 27270 }, { - "epoch": 0.3, - "learning_rate": 0.000255740151859303, - "loss": 0.0688, + "epoch": 0.18, + "learning_rate": 0.000273589265314289, + "loss": 0.0747, "step": 27280 }, { - "epoch": 0.3, - "learning_rate": 0.0002557239275747939, - "loss": 0.0718, + "epoch": 0.18, + "learning_rate": 0.0002735795839599321, + "loss": 0.077, "step": 27290 }, { - "epoch": 0.3, - "learning_rate": 0.0002557077032902849, - "loss": 0.0651, + "epoch": 0.18, + "learning_rate": 0.0002735699026055751, + "loss": 0.0754, "step": 27300 }, { - "epoch": 0.3, - "learning_rate": 0.0002556914790057758, - "loss": 0.0751, + "epoch": 0.18, + "learning_rate": 0.0002735602212512182, + "loss": 0.0749, "step": 27310 }, { - "epoch": 0.3, - "learning_rate": 0.0002556752547212668, - "loss": 0.0681, + "epoch": 0.18, + "learning_rate": 0.0002735505398968613, + "loss": 0.0684, "step": 27320 }, { - "epoch": 0.3, - "learning_rate": 0.0002556590304367577, - "loss": 0.0694, + "epoch": 0.18, + "learning_rate": 0.00027354085854250436, + "loss": 0.0828, "step": 27330 }, { - "epoch": 0.3, - "learning_rate": 0.0002556428061522487, - "loss": 0.0674, + "epoch": 0.18, + "learning_rate": 0.00027353117718814744, + "loss": 0.0797, "step": 27340 }, { - "epoch": 0.3, - "learning_rate": 0.0002556265818677396, - "loss": 0.069, + "epoch": 0.18, + "learning_rate": 0.0002735214958337905, + "loss": 0.0794, "step": 27350 }, { - "epoch": 0.3, - "learning_rate": 0.0002556103575832306, - "loss": 0.0602, + "epoch": 0.18, + "learning_rate": 0.00027351181447943354, + "loss": 0.0773, "step": 27360 }, { - "epoch": 0.3, - "learning_rate": 0.0002555941332987215, - "loss": 0.0659, + "epoch": 0.18, + "learning_rate": 0.0002735021331250766, + "loss": 0.0813, "step": 27370 }, { - "epoch": 0.3, - "learning_rate": 0.0002555779090142125, - "loss": 0.0672, + "epoch": 0.18, + "learning_rate": 0.0002734924517707197, + "loss": 0.0784, "step": 27380 }, { - "epoch": 0.3, - "learning_rate": 0.0002555616847297034, - "loss": 0.0651, + "epoch": 0.18, + "learning_rate": 0.0002734827704163627, + "loss": 0.0845, "step": 27390 }, { - "epoch": 0.3, - "learning_rate": 0.0002555454604451944, - "loss": 0.0805, + "epoch": 0.18, + "learning_rate": 0.0002734730890620058, + "loss": 0.0761, "step": 27400 }, { - "epoch": 0.3, - "learning_rate": 0.0002555292361606853, - "loss": 0.0679, + "epoch": 0.18, + "learning_rate": 0.0002734634077076489, + "loss": 0.0854, "step": 27410 }, { - "epoch": 0.3, - "learning_rate": 0.0002555130118761762, - "loss": 0.0618, + "epoch": 0.18, + "learning_rate": 0.00027345372635329197, + "loss": 0.0752, "step": 27420 }, { - "epoch": 0.3, - "learning_rate": 0.0002554967875916672, - "loss": 0.0709, + "epoch": 0.18, + "learning_rate": 0.00027344404499893505, + "loss": 0.0779, "step": 27430 }, { - "epoch": 0.3, - "learning_rate": 0.0002554805633071581, - "loss": 0.072, + "epoch": 0.18, + "learning_rate": 0.00027343436364457807, + "loss": 0.0785, "step": 27440 }, { - "epoch": 0.3, - "learning_rate": 0.00025546433902264904, - "loss": 0.0549, + "epoch": 0.18, + "learning_rate": 0.00027342468229022115, + "loss": 0.0779, "step": 27450 }, { - "epoch": 0.3, - "learning_rate": 0.00025544811473814, - "loss": 0.0629, + "epoch": 0.18, + "learning_rate": 0.00027341500093586423, + "loss": 0.0951, "step": 27460 }, { - "epoch": 0.3, - "learning_rate": 0.00025543189045363094, - "loss": 0.0757, + "epoch": 0.18, + "learning_rate": 0.0002734053195815073, + "loss": 0.0843, "step": 27470 }, { - "epoch": 0.3, - "learning_rate": 0.0002554156661691219, - "loss": 0.0695, + "epoch": 0.18, + "learning_rate": 0.0002733956382271504, + "loss": 0.0827, "step": 27480 }, { - "epoch": 0.3, - "learning_rate": 0.00025539944188461284, - "loss": 0.0735, + "epoch": 0.18, + "learning_rate": 0.00027338595687279347, + "loss": 0.0877, "step": 27490 }, { - "epoch": 0.3, - "learning_rate": 0.0002553832176001038, - "loss": 0.0715, + "epoch": 0.18, + "learning_rate": 0.0002733762755184365, + "loss": 0.0796, "step": 27500 }, { - "epoch": 0.3, - "learning_rate": 0.00025536699331559474, - "loss": 0.0549, + "epoch": 0.18, + "learning_rate": 0.0002733665941640796, + "loss": 0.0841, "step": 27510 }, { - "epoch": 0.3, - "learning_rate": 0.0002553507690310857, - "loss": 0.0752, + "epoch": 0.18, + "learning_rate": 0.00027335691280972265, + "loss": 0.0837, "step": 27520 }, { - "epoch": 0.3, - "learning_rate": 0.00025533454474657664, - "loss": 0.0699, + "epoch": 0.18, + "learning_rate": 0.0002733472314553657, + "loss": 0.0779, "step": 27530 }, { - "epoch": 0.3, - "learning_rate": 0.0002553183204620676, - "loss": 0.0692, + "epoch": 0.18, + "learning_rate": 0.00027333755010100876, + "loss": 0.0806, "step": 27540 }, { - "epoch": 0.3, - "learning_rate": 0.00025530209617755854, - "loss": 0.069, + "epoch": 0.18, + "learning_rate": 0.00027332786874665184, + "loss": 0.081, "step": 27550 }, { - "epoch": 0.3, - "learning_rate": 0.0002552858718930495, - "loss": 0.066, + "epoch": 0.18, + "learning_rate": 0.0002733181873922949, + "loss": 0.0768, "step": 27560 }, { - "epoch": 0.3, - "learning_rate": 0.00025526964760854044, - "loss": 0.0707, + "epoch": 0.18, + "learning_rate": 0.000273308506037938, + "loss": 0.0863, "step": 27570 }, { - "epoch": 0.3, - "learning_rate": 0.0002552534233240314, - "loss": 0.0688, + "epoch": 0.18, + "learning_rate": 0.000273298824683581, + "loss": 0.0853, "step": 27580 }, { - "epoch": 0.3, - "learning_rate": 0.00025523719903952234, - "loss": 0.0778, + "epoch": 0.18, + "learning_rate": 0.0002732891433292241, + "loss": 0.0769, "step": 27590 }, { - "epoch": 0.3, - "learning_rate": 0.00025522097475501326, - "loss": 0.0683, + "epoch": 0.18, + "learning_rate": 0.0002732794619748672, + "loss": 0.0859, "step": 27600 }, { - "epoch": 0.3, - "learning_rate": 0.00025520475047050424, - "loss": 0.0778, + "epoch": 0.18, + "learning_rate": 0.00027326978062051026, + "loss": 0.0886, "step": 27610 }, { - "epoch": 0.3, - "learning_rate": 0.00025518852618599516, - "loss": 0.0644, + "epoch": 0.18, + "learning_rate": 0.00027326009926615334, + "loss": 0.0889, "step": 27620 }, { - "epoch": 0.3, - "learning_rate": 0.0002551723019014861, - "loss": 0.0653, + "epoch": 0.18, + "learning_rate": 0.00027325041791179637, + "loss": 0.0818, "step": 27630 }, { - "epoch": 0.3, - "learning_rate": 0.00025515607761697706, - "loss": 0.0719, + "epoch": 0.18, + "learning_rate": 0.00027324073655743945, + "loss": 0.0787, "step": 27640 }, { - "epoch": 0.3, - "learning_rate": 0.000255139853332468, - "loss": 0.0744, + "epoch": 0.18, + "learning_rate": 0.00027323105520308253, + "loss": 0.0778, "step": 27650 }, { - "epoch": 0.3, - "learning_rate": 0.00025512362904795896, - "loss": 0.0663, + "epoch": 0.18, + "learning_rate": 0.00027322137384872556, + "loss": 0.0811, "step": 27660 }, { - "epoch": 0.3, - "learning_rate": 0.0002551074047634499, - "loss": 0.0709, + "epoch": 0.18, + "learning_rate": 0.00027321169249436863, + "loss": 0.0693, "step": 27670 }, { - "epoch": 0.3, - "learning_rate": 0.00025509118047894086, - "loss": 0.0718, + "epoch": 0.18, + "learning_rate": 0.0002732020111400117, + "loss": 0.076, "step": 27680 }, { - "epoch": 0.3, - "learning_rate": 0.0002550749561944318, - "loss": 0.0732, + "epoch": 0.18, + "learning_rate": 0.0002731923297856548, + "loss": 0.0781, "step": 27690 }, { - "epoch": 0.3, - "learning_rate": 0.00025505873190992276, - "loss": 0.0746, + "epoch": 0.18, + "learning_rate": 0.0002731826484312979, + "loss": 0.0887, "step": 27700 }, { - "epoch": 0.3, - "learning_rate": 0.0002550425076254137, - "loss": 0.0673, + "epoch": 0.18, + "learning_rate": 0.00027317296707694095, + "loss": 0.0725, "step": 27710 }, { - "epoch": 0.3, - "learning_rate": 0.00025502628334090466, - "loss": 0.0625, + "epoch": 0.18, + "learning_rate": 0.000273163285722584, + "loss": 0.0751, "step": 27720 }, { - "epoch": 0.3, - "learning_rate": 0.0002550100590563956, - "loss": 0.069, + "epoch": 0.18, + "learning_rate": 0.00027315360436822706, + "loss": 0.0814, "step": 27730 }, { - "epoch": 0.3, - "learning_rate": 0.00025499383477188656, - "loss": 0.0745, + "epoch": 0.18, + "learning_rate": 0.00027314392301387014, + "loss": 0.0779, "step": 27740 }, { - "epoch": 0.3, - "learning_rate": 0.0002549776104873775, - "loss": 0.0746, + "epoch": 0.18, + "learning_rate": 0.0002731342416595132, + "loss": 0.0761, "step": 27750 }, { - "epoch": 0.3, - "learning_rate": 0.00025496138620286846, - "loss": 0.0769, + "epoch": 0.18, + "learning_rate": 0.00027312456030515624, + "loss": 0.0833, "step": 27760 }, { - "epoch": 0.3, - "learning_rate": 0.0002549451619183594, - "loss": 0.0667, + "epoch": 0.18, + "learning_rate": 0.0002731148789507993, + "loss": 0.0798, "step": 27770 }, { - "epoch": 0.3, - "learning_rate": 0.0002549289376338503, - "loss": 0.0623, + "epoch": 0.18, + "learning_rate": 0.0002731051975964424, + "loss": 0.0674, "step": 27780 }, { - "epoch": 0.3, - "learning_rate": 0.0002549127133493413, - "loss": 0.0809, + "epoch": 0.18, + "learning_rate": 0.00027309551624208543, + "loss": 0.0888, "step": 27790 }, { - "epoch": 0.3, - "learning_rate": 0.0002548964890648322, - "loss": 0.0736, + "epoch": 0.18, + "learning_rate": 0.0002730858348877285, + "loss": 0.0796, "step": 27800 }, { - "epoch": 0.3, - "learning_rate": 0.00025488026478032313, - "loss": 0.0725, + "epoch": 0.18, + "learning_rate": 0.0002730761535333716, + "loss": 0.0758, "step": 27810 }, { - "epoch": 0.3, - "learning_rate": 0.0002548640404958141, - "loss": 0.0807, + "epoch": 0.18, + "learning_rate": 0.00027306647217901467, + "loss": 0.0817, "step": 27820 }, { - "epoch": 0.3, - "learning_rate": 0.000254847816211305, - "loss": 0.0754, + "epoch": 0.18, + "learning_rate": 0.00027305679082465775, + "loss": 0.0794, "step": 27830 }, { - "epoch": 0.3, - "learning_rate": 0.000254831591926796, - "loss": 0.0658, + "epoch": 0.18, + "learning_rate": 0.00027304710947030083, + "loss": 0.0787, "step": 27840 }, { - "epoch": 0.3, - "learning_rate": 0.0002548153676422869, - "loss": 0.0747, + "epoch": 0.18, + "learning_rate": 0.0002730374281159439, + "loss": 0.074, "step": 27850 }, { - "epoch": 0.3, - "learning_rate": 0.0002547991433577779, - "loss": 0.0815, + "epoch": 0.18, + "learning_rate": 0.00027302774676158693, + "loss": 0.0822, "step": 27860 }, { - "epoch": 0.3, - "learning_rate": 0.0002547829190732688, - "loss": 0.0693, + "epoch": 0.18, + "learning_rate": 0.00027301806540723, + "loss": 0.0654, "step": 27870 }, { - "epoch": 0.3, - "learning_rate": 0.0002547666947887598, - "loss": 0.0692, + "epoch": 0.18, + "learning_rate": 0.0002730083840528731, + "loss": 0.075, "step": 27880 }, { - "epoch": 0.3, - "learning_rate": 0.0002547504705042507, - "loss": 0.0642, + "epoch": 0.18, + "learning_rate": 0.0002729987026985162, + "loss": 0.0814, "step": 27890 }, { - "epoch": 0.3, - "learning_rate": 0.0002547342462197417, - "loss": 0.0714, + "epoch": 0.18, + "learning_rate": 0.0002729890213441592, + "loss": 0.0844, "step": 27900 }, { - "epoch": 0.3, - "learning_rate": 0.0002547180219352326, - "loss": 0.0717, + "epoch": 0.18, + "learning_rate": 0.0002729793399898023, + "loss": 0.0843, "step": 27910 }, { - "epoch": 0.3, - "learning_rate": 0.0002547017976507236, - "loss": 0.0737, + "epoch": 0.18, + "learning_rate": 0.00027296965863544536, + "loss": 0.0772, "step": 27920 }, { - "epoch": 0.3, - "learning_rate": 0.0002546855733662145, - "loss": 0.0735, + "epoch": 0.18, + "learning_rate": 0.0002729599772810884, + "loss": 0.0782, "step": 27930 }, { - "epoch": 0.3, - "learning_rate": 0.0002546693490817055, - "loss": 0.0635, + "epoch": 0.18, + "learning_rate": 0.00027295029592673146, + "loss": 0.0783, "step": 27940 }, { - "epoch": 0.3, - "learning_rate": 0.0002546531247971964, - "loss": 0.0702, + "epoch": 0.18, + "learning_rate": 0.00027294061457237454, + "loss": 0.0855, "step": 27950 }, { - "epoch": 0.3, - "learning_rate": 0.00025463690051268735, - "loss": 0.0697, + "epoch": 0.18, + "learning_rate": 0.0002729309332180176, + "loss": 0.0796, "step": 27960 }, { - "epoch": 0.3, - "learning_rate": 0.0002546206762281783, - "loss": 0.0705, + "epoch": 0.18, + "learning_rate": 0.0002729212518636607, + "loss": 0.0756, "step": 27970 }, { - "epoch": 0.3, - "learning_rate": 0.00025460445194366925, - "loss": 0.0704, + "epoch": 0.18, + "learning_rate": 0.0002729115705093038, + "loss": 0.0781, "step": 27980 }, { - "epoch": 0.3, - "learning_rate": 0.00025458822765916017, - "loss": 0.0618, + "epoch": 0.18, + "learning_rate": 0.00027290188915494686, + "loss": 0.0796, "step": 27990 }, { - "epoch": 0.3, - "learning_rate": 0.00025457200337465115, - "loss": 0.0702, + "epoch": 0.18, + "learning_rate": 0.0002728922078005899, + "loss": 0.0817, "step": 28000 }, { - "epoch": 0.3, - "eval_cer": 0.9214573603962251, - "eval_loss": 0.0485168993473053, - "eval_runtime": 119.6492, - "eval_samples_per_second": 16.716, - "eval_steps_per_second": 4.179, + "epoch": 0.18, + "eval_cer": 0.9201979437351712, + "eval_loss": 0.053717296570539474, + "eval_runtime": 120.3699, + "eval_samples_per_second": 16.615, + "eval_steps_per_second": 4.154, "step": 28000 }, { - "epoch": 0.3, - "learning_rate": 0.00025455577909014207, - "loss": 0.0642, + "epoch": 0.18, + "learning_rate": 0.00027288252644623297, + "loss": 0.0819, "step": 28010 }, { - "epoch": 0.3, - "learning_rate": 0.00025453955480563305, - "loss": 0.064, + "epoch": 0.18, + "learning_rate": 0.00027287284509187605, + "loss": 0.0742, "step": 28020 }, { - "epoch": 0.3, - "learning_rate": 0.00025452333052112397, - "loss": 0.0683, + "epoch": 0.18, + "learning_rate": 0.0002728631637375191, + "loss": 0.0732, "step": 28030 }, { - "epoch": 0.3, - "learning_rate": 0.00025450710623661494, - "loss": 0.0665, + "epoch": 0.18, + "learning_rate": 0.00027285348238316215, + "loss": 0.081, "step": 28040 }, { - "epoch": 0.3, - "learning_rate": 0.00025449088195210587, - "loss": 0.0757, + "epoch": 0.18, + "learning_rate": 0.00027284380102880523, + "loss": 0.0746, "step": 28050 }, { - "epoch": 0.3, - "learning_rate": 0.00025447465766759684, - "loss": 0.0719, + "epoch": 0.18, + "learning_rate": 0.0002728341196744483, + "loss": 0.081, "step": 28060 }, { - "epoch": 0.3, - "learning_rate": 0.00025445843338308777, - "loss": 0.0672, + "epoch": 0.18, + "learning_rate": 0.00027282443832009134, + "loss": 0.0778, "step": 28070 }, { - "epoch": 0.3, - "learning_rate": 0.00025444220909857874, - "loss": 0.0815, + "epoch": 0.18, + "learning_rate": 0.0002728147569657344, + "loss": 0.0768, "step": 28080 }, { - "epoch": 0.3, - "learning_rate": 0.00025442598481406967, - "loss": 0.0634, + "epoch": 0.18, + "learning_rate": 0.0002728050756113775, + "loss": 0.0745, "step": 28090 }, { - "epoch": 0.3, - "learning_rate": 0.00025440976052956064, - "loss": 0.0675, + "epoch": 0.18, + "learning_rate": 0.0002727953942570206, + "loss": 0.0773, "step": 28100 }, { - "epoch": 0.3, - "learning_rate": 0.00025439353624505157, - "loss": 0.0758, + "epoch": 0.18, + "learning_rate": 0.00027278571290266366, + "loss": 0.0875, "step": 28110 }, { - "epoch": 0.3, - "learning_rate": 0.00025437731196054254, - "loss": 0.0689, + "epoch": 0.18, + "learning_rate": 0.00027277603154830674, + "loss": 0.0791, "step": 28120 }, { - "epoch": 0.3, - "learning_rate": 0.00025436108767603347, - "loss": 0.0698, + "epoch": 0.18, + "learning_rate": 0.00027276635019394976, + "loss": 0.0788, "step": 28130 }, { - "epoch": 0.3, - "learning_rate": 0.0002543448633915244, - "loss": 0.0733, + "epoch": 0.18, + "learning_rate": 0.00027275666883959284, + "loss": 0.0736, "step": 28140 }, { - "epoch": 0.3, - "learning_rate": 0.00025432863910701537, - "loss": 0.0744, + "epoch": 0.18, + "learning_rate": 0.0002727469874852359, + "loss": 0.0827, "step": 28150 }, { - "epoch": 0.3, - "learning_rate": 0.0002543124148225063, - "loss": 0.0682, + "epoch": 0.18, + "learning_rate": 0.00027273730613087895, + "loss": 0.0776, "step": 28160 }, { - "epoch": 0.3, - "learning_rate": 0.00025429619053799726, - "loss": 0.0727, + "epoch": 0.18, + "learning_rate": 0.00027272762477652203, + "loss": 0.075, "step": 28170 }, { - "epoch": 0.3, - "learning_rate": 0.0002542799662534882, - "loss": 0.0802, + "epoch": 0.18, + "learning_rate": 0.0002727179434221651, + "loss": 0.0919, "step": 28180 }, { - "epoch": 0.3, - "learning_rate": 0.00025426374196897916, - "loss": 0.0688, + "epoch": 0.18, + "learning_rate": 0.0002727082620678082, + "loss": 0.0821, "step": 28190 }, { - "epoch": 0.31, - "learning_rate": 0.0002542475176844701, - "loss": 0.0712, + "epoch": 0.18, + "learning_rate": 0.00027269858071345127, + "loss": 0.0789, "step": 28200 }, { - "epoch": 0.31, - "learning_rate": 0.00025423129339996106, - "loss": 0.0695, + "epoch": 0.18, + "learning_rate": 0.0002726888993590943, + "loss": 0.0772, "step": 28210 }, { - "epoch": 0.31, - "learning_rate": 0.000254215069115452, - "loss": 0.0617, + "epoch": 0.18, + "learning_rate": 0.0002726792180047374, + "loss": 0.0771, "step": 28220 }, { - "epoch": 0.31, - "learning_rate": 0.00025419884483094296, - "loss": 0.0732, + "epoch": 0.18, + "learning_rate": 0.00027266953665038045, + "loss": 0.0711, "step": 28230 }, { - "epoch": 0.31, - "learning_rate": 0.0002541826205464339, - "loss": 0.0741, + "epoch": 0.18, + "learning_rate": 0.00027265985529602353, + "loss": 0.0816, "step": 28240 }, { - "epoch": 0.31, - "learning_rate": 0.00025416639626192486, - "loss": 0.0725, + "epoch": 0.18, + "learning_rate": 0.0002726501739416666, + "loss": 0.0687, "step": 28250 }, { - "epoch": 0.31, - "learning_rate": 0.0002541501719774158, - "loss": 0.0632, + "epoch": 0.18, + "learning_rate": 0.0002726404925873097, + "loss": 0.0809, "step": 28260 }, { - "epoch": 0.31, - "learning_rate": 0.00025413394769290676, - "loss": 0.0743, + "epoch": 0.18, + "learning_rate": 0.0002726308112329527, + "loss": 0.0729, "step": 28270 }, { - "epoch": 0.31, - "learning_rate": 0.0002541177234083977, - "loss": 0.0678, + "epoch": 0.18, + "learning_rate": 0.0002726211298785958, + "loss": 0.0775, "step": 28280 }, { - "epoch": 0.31, - "learning_rate": 0.0002541014991238886, - "loss": 0.0676, + "epoch": 0.18, + "learning_rate": 0.0002726114485242389, + "loss": 0.0865, "step": 28290 }, { - "epoch": 0.31, - "learning_rate": 0.0002540852748393796, - "loss": 0.0692, + "epoch": 0.18, + "learning_rate": 0.0002726017671698819, + "loss": 0.0814, "step": 28300 }, { - "epoch": 0.31, - "learning_rate": 0.0002540690505548705, - "loss": 0.0792, + "epoch": 0.18, + "learning_rate": 0.000272592085815525, + "loss": 0.0798, "step": 28310 }, { - "epoch": 0.31, - "learning_rate": 0.00025405282627036143, - "loss": 0.0765, + "epoch": 0.18, + "learning_rate": 0.00027258240446116806, + "loss": 0.0732, "step": 28320 }, { - "epoch": 0.31, - "learning_rate": 0.0002540366019858524, - "loss": 0.068, + "epoch": 0.18, + "learning_rate": 0.00027257272310681114, + "loss": 0.0769, "step": 28330 }, { - "epoch": 0.31, - "learning_rate": 0.00025402037770134333, - "loss": 0.0689, + "epoch": 0.18, + "learning_rate": 0.0002725630417524542, + "loss": 0.0745, "step": 28340 }, { - "epoch": 0.31, - "learning_rate": 0.0002540041534168343, - "loss": 0.0657, + "epoch": 0.18, + "learning_rate": 0.00027255336039809725, + "loss": 0.0775, "step": 28350 }, { - "epoch": 0.31, - "learning_rate": 0.00025398792913232523, - "loss": 0.0769, + "epoch": 0.18, + "learning_rate": 0.00027254367904374033, + "loss": 0.0753, "step": 28360 }, { - "epoch": 0.31, - "learning_rate": 0.0002539717048478162, - "loss": 0.0721, + "epoch": 0.18, + "learning_rate": 0.0002725339976893834, + "loss": 0.0876, "step": 28370 }, { - "epoch": 0.31, - "learning_rate": 0.00025395548056330713, - "loss": 0.0681, + "epoch": 0.18, + "learning_rate": 0.0002725243163350265, + "loss": 0.08, "step": 28380 }, { - "epoch": 0.31, - "learning_rate": 0.0002539392562787981, - "loss": 0.0762, + "epoch": 0.18, + "learning_rate": 0.00027251463498066957, + "loss": 0.068, "step": 28390 }, { - "epoch": 0.31, - "learning_rate": 0.00025392303199428903, - "loss": 0.0756, + "epoch": 0.18, + "learning_rate": 0.0002725049536263126, + "loss": 0.0776, "step": 28400 }, { - "epoch": 0.31, - "learning_rate": 0.00025390680770978, - "loss": 0.07, + "epoch": 0.18, + "learning_rate": 0.00027249527227195567, + "loss": 0.0744, "step": 28410 }, { - "epoch": 0.31, - "learning_rate": 0.00025389058342527093, - "loss": 0.0773, + "epoch": 0.18, + "learning_rate": 0.00027248559091759875, + "loss": 0.0809, "step": 28420 }, { - "epoch": 0.31, - "learning_rate": 0.0002538743591407619, - "loss": 0.0669, + "epoch": 0.18, + "learning_rate": 0.0002724759095632418, + "loss": 0.083, "step": 28430 }, { - "epoch": 0.31, - "learning_rate": 0.00025385813485625283, - "loss": 0.0681, + "epoch": 0.18, + "learning_rate": 0.00027246622820888486, + "loss": 0.0825, "step": 28440 }, { - "epoch": 0.31, - "learning_rate": 0.0002538419105717438, - "loss": 0.0765, + "epoch": 0.18, + "learning_rate": 0.00027245654685452794, + "loss": 0.0816, "step": 28450 }, { - "epoch": 0.31, - "learning_rate": 0.0002538256862872347, - "loss": 0.076, + "epoch": 0.18, + "learning_rate": 0.000272446865500171, + "loss": 0.0747, "step": 28460 }, { - "epoch": 0.31, - "learning_rate": 0.00025380946200272565, - "loss": 0.0809, + "epoch": 0.18, + "learning_rate": 0.0002724371841458141, + "loss": 0.0783, "step": 28470 }, { - "epoch": 0.31, - "learning_rate": 0.0002537932377182166, - "loss": 0.0728, + "epoch": 0.18, + "learning_rate": 0.0002724275027914572, + "loss": 0.0781, "step": 28480 }, { - "epoch": 0.31, - "learning_rate": 0.00025377701343370755, - "loss": 0.0705, + "epoch": 0.18, + "learning_rate": 0.0002724178214371002, + "loss": 0.0797, "step": 28490 }, { - "epoch": 0.31, - "learning_rate": 0.00025376078914919847, - "loss": 0.072, + "epoch": 0.18, + "learning_rate": 0.0002724081400827433, + "loss": 0.0757, "step": 28500 }, { - "epoch": 0.31, - "learning_rate": 0.00025374456486468945, - "loss": 0.0739, + "epoch": 0.18, + "learning_rate": 0.00027239845872838636, + "loss": 0.0729, "step": 28510 }, { - "epoch": 0.31, - "learning_rate": 0.00025372834058018037, - "loss": 0.0765, + "epoch": 0.18, + "learning_rate": 0.00027238877737402944, + "loss": 0.0818, "step": 28520 }, { - "epoch": 0.31, - "learning_rate": 0.00025371211629567135, - "loss": 0.0727, + "epoch": 0.18, + "learning_rate": 0.00027237909601967247, + "loss": 0.0791, "step": 28530 }, { - "epoch": 0.31, - "learning_rate": 0.00025369589201116227, - "loss": 0.0914, + "epoch": 0.18, + "learning_rate": 0.00027236941466531555, + "loss": 0.0792, "step": 28540 }, { - "epoch": 0.31, - "learning_rate": 0.00025367966772665325, - "loss": 0.0792, + "epoch": 0.18, + "learning_rate": 0.0002723597333109586, + "loss": 0.0747, "step": 28550 }, { - "epoch": 0.31, - "learning_rate": 0.00025366344344214417, - "loss": 0.0823, + "epoch": 0.18, + "learning_rate": 0.00027235005195660165, + "loss": 0.077, "step": 28560 }, { - "epoch": 0.31, - "learning_rate": 0.00025364721915763515, - "loss": 0.0746, + "epoch": 0.18, + "learning_rate": 0.00027234037060224473, + "loss": 0.0883, "step": 28570 }, { - "epoch": 0.31, - "learning_rate": 0.00025363099487312607, - "loss": 0.0694, + "epoch": 0.18, + "learning_rate": 0.0002723306892478878, + "loss": 0.0691, "step": 28580 }, { - "epoch": 0.31, - "learning_rate": 0.00025361477058861705, - "loss": 0.0769, + "epoch": 0.18, + "learning_rate": 0.0002723210078935309, + "loss": 0.0784, "step": 28590 }, { - "epoch": 0.31, - "learning_rate": 0.00025359854630410797, - "loss": 0.0777, + "epoch": 0.18, + "learning_rate": 0.00027231132653917397, + "loss": 0.0868, "step": 28600 }, { - "epoch": 0.31, - "learning_rate": 0.00025358232201959895, - "loss": 0.071, + "epoch": 0.18, + "learning_rate": 0.00027230164518481705, + "loss": 0.0763, "step": 28610 }, { - "epoch": 0.31, - "learning_rate": 0.00025356609773508987, - "loss": 0.0751, + "epoch": 0.18, + "learning_rate": 0.00027229196383046013, + "loss": 0.0785, "step": 28620 }, { - "epoch": 0.31, - "learning_rate": 0.00025354987345058085, - "loss": 0.0691, + "epoch": 0.18, + "learning_rate": 0.00027228228247610316, + "loss": 0.072, "step": 28630 }, { - "epoch": 0.31, - "learning_rate": 0.00025353364916607177, - "loss": 0.0785, + "epoch": 0.18, + "learning_rate": 0.00027227260112174624, + "loss": 0.0868, "step": 28640 }, { - "epoch": 0.31, - "learning_rate": 0.0002535174248815627, - "loss": 0.0787, + "epoch": 0.18, + "learning_rate": 0.0002722629197673893, + "loss": 0.0797, "step": 28650 }, { - "epoch": 0.31, - "learning_rate": 0.00025350120059705367, - "loss": 0.0783, + "epoch": 0.18, + "learning_rate": 0.0002722532384130324, + "loss": 0.0797, "step": 28660 }, { - "epoch": 0.31, - "learning_rate": 0.0002534849763125446, - "loss": 0.0817, + "epoch": 0.19, + "learning_rate": 0.0002722435570586754, + "loss": 0.0763, "step": 28670 }, { - "epoch": 0.31, - "learning_rate": 0.0002534687520280355, - "loss": 0.0656, + "epoch": 0.19, + "learning_rate": 0.0002722338757043185, + "loss": 0.0912, "step": 28680 }, { - "epoch": 0.31, - "learning_rate": 0.0002534525277435265, - "loss": 0.0761, + "epoch": 0.19, + "learning_rate": 0.0002722241943499616, + "loss": 0.078, "step": 28690 }, { - "epoch": 0.31, - "learning_rate": 0.0002534363034590174, - "loss": 0.0732, + "epoch": 0.19, + "learning_rate": 0.0002722145129956046, + "loss": 0.0954, "step": 28700 }, { - "epoch": 0.31, - "learning_rate": 0.0002534200791745084, - "loss": 0.0746, + "epoch": 0.19, + "learning_rate": 0.0002722048316412477, + "loss": 0.0721, "step": 28710 }, { - "epoch": 0.31, - "learning_rate": 0.0002534038548899993, - "loss": 0.0799, + "epoch": 0.19, + "learning_rate": 0.00027219515028689077, + "loss": 0.0746, "step": 28720 }, { - "epoch": 0.31, - "learning_rate": 0.0002533876306054903, - "loss": 0.0645, + "epoch": 0.19, + "learning_rate": 0.00027218546893253385, + "loss": 0.0763, "step": 28730 }, { - "epoch": 0.31, - "learning_rate": 0.0002533714063209812, - "loss": 0.0671, + "epoch": 0.19, + "learning_rate": 0.0002721757875781769, + "loss": 0.0749, "step": 28740 }, { - "epoch": 0.31, - "learning_rate": 0.0002533551820364722, - "loss": 0.073, + "epoch": 0.19, + "learning_rate": 0.00027216610622382, + "loss": 0.0769, "step": 28750 }, { - "epoch": 0.31, - "learning_rate": 0.0002533389577519631, - "loss": 0.0738, + "epoch": 0.19, + "learning_rate": 0.0002721564248694631, + "loss": 0.076, "step": 28760 }, { - "epoch": 0.31, - "learning_rate": 0.0002533227334674541, - "loss": 0.0725, + "epoch": 0.19, + "learning_rate": 0.0002721467435151061, + "loss": 0.0794, "step": 28770 }, { - "epoch": 0.31, - "learning_rate": 0.000253306509182945, - "loss": 0.0688, + "epoch": 0.19, + "learning_rate": 0.0002721370621607492, + "loss": 0.0742, "step": 28780 }, { - "epoch": 0.31, - "learning_rate": 0.000253290284898436, - "loss": 0.0695, + "epoch": 0.19, + "learning_rate": 0.00027212738080639227, + "loss": 0.0766, "step": 28790 }, { - "epoch": 0.31, - "learning_rate": 0.0002532740606139269, - "loss": 0.0708, + "epoch": 0.19, + "learning_rate": 0.0002721176994520353, + "loss": 0.0746, "step": 28800 }, { - "epoch": 0.31, - "learning_rate": 0.0002532578363294179, - "loss": 0.0711, + "epoch": 0.19, + "learning_rate": 0.0002721080180976784, + "loss": 0.078, "step": 28810 }, { - "epoch": 0.31, - "learning_rate": 0.0002532416120449088, - "loss": 0.0645, + "epoch": 0.19, + "learning_rate": 0.00027209833674332146, + "loss": 0.0838, "step": 28820 }, { - "epoch": 0.31, - "learning_rate": 0.00025322538776039973, - "loss": 0.0794, + "epoch": 0.19, + "learning_rate": 0.00027208865538896454, + "loss": 0.076, "step": 28830 }, { - "epoch": 0.31, - "learning_rate": 0.0002532091634758907, - "loss": 0.0697, + "epoch": 0.19, + "learning_rate": 0.00027207897403460756, + "loss": 0.0832, "step": 28840 }, { - "epoch": 0.31, - "learning_rate": 0.00025319293919138163, - "loss": 0.0688, + "epoch": 0.19, + "learning_rate": 0.00027206929268025064, + "loss": 0.0815, "step": 28850 }, { - "epoch": 0.31, - "learning_rate": 0.00025317671490687256, - "loss": 0.0738, + "epoch": 0.19, + "learning_rate": 0.0002720596113258937, + "loss": 0.0901, "step": 28860 }, { - "epoch": 0.31, - "learning_rate": 0.00025316049062236353, - "loss": 0.071, + "epoch": 0.19, + "learning_rate": 0.0002720499299715368, + "loss": 0.0766, "step": 28870 }, { - "epoch": 0.31, - "learning_rate": 0.00025314426633785445, - "loss": 0.0642, + "epoch": 0.19, + "learning_rate": 0.0002720402486171799, + "loss": 0.0735, "step": 28880 }, { - "epoch": 0.31, - "learning_rate": 0.00025312804205334543, - "loss": 0.0685, + "epoch": 0.19, + "learning_rate": 0.00027203056726282296, + "loss": 0.0751, "step": 28890 }, { - "epoch": 0.31, - "learning_rate": 0.00025311181776883635, - "loss": 0.0721, + "epoch": 0.19, + "learning_rate": 0.00027202088590846604, + "loss": 0.0845, "step": 28900 }, { - "epoch": 0.31, - "learning_rate": 0.00025309559348432733, - "loss": 0.0699, + "epoch": 0.19, + "learning_rate": 0.00027201120455410907, + "loss": 0.0843, "step": 28910 }, { - "epoch": 0.31, - "learning_rate": 0.00025307936919981825, - "loss": 0.0727, + "epoch": 0.19, + "learning_rate": 0.00027200152319975215, + "loss": 0.0805, "step": 28920 }, { - "epoch": 0.31, - "learning_rate": 0.00025306314491530923, - "loss": 0.0711, + "epoch": 0.19, + "learning_rate": 0.00027199184184539517, + "loss": 0.0756, "step": 28930 }, { - "epoch": 0.31, - "learning_rate": 0.00025304692063080015, - "loss": 0.0677, + "epoch": 0.19, + "learning_rate": 0.00027198216049103825, + "loss": 0.0776, "step": 28940 }, { - "epoch": 0.31, - "learning_rate": 0.00025303069634629113, - "loss": 0.0677, + "epoch": 0.19, + "learning_rate": 0.00027197247913668133, + "loss": 0.0888, "step": 28950 }, { - "epoch": 0.31, - "learning_rate": 0.00025301447206178205, - "loss": 0.0658, + "epoch": 0.19, + "learning_rate": 0.0002719627977823244, + "loss": 0.0812, "step": 28960 }, { - "epoch": 0.31, - "learning_rate": 0.00025299824777727303, - "loss": 0.0707, + "epoch": 0.19, + "learning_rate": 0.0002719531164279675, + "loss": 0.0766, "step": 28970 }, { - "epoch": 0.31, - "learning_rate": 0.00025298202349276395, - "loss": 0.0609, + "epoch": 0.19, + "learning_rate": 0.0002719434350736105, + "loss": 0.0796, "step": 28980 }, { - "epoch": 0.31, - "learning_rate": 0.00025296579920825493, - "loss": 0.074, + "epoch": 0.19, + "learning_rate": 0.0002719337537192536, + "loss": 0.0813, "step": 28990 }, { - "epoch": 0.31, - "learning_rate": 0.00025294957492374585, - "loss": 0.0709, + "epoch": 0.19, + "learning_rate": 0.0002719240723648967, + "loss": 0.0809, "step": 29000 }, { - "epoch": 0.31, - "eval_cer": 0.9213345560756333, - "eval_loss": 0.04926983639597893, - "eval_runtime": 119.3913, - "eval_samples_per_second": 16.752, - "eval_steps_per_second": 4.188, + "epoch": 0.19, + "eval_cer": 0.9201111738786578, + "eval_loss": 0.052740730345249176, + "eval_runtime": 120.2847, + "eval_samples_per_second": 16.627, + "eval_steps_per_second": 4.157, "step": 29000 }, { - "epoch": 0.31, - "learning_rate": 0.0002529333506392368, - "loss": 0.0691, + "epoch": 0.19, + "learning_rate": 0.00027191439101053975, + "loss": 0.0852, "step": 29010 }, { - "epoch": 0.31, - "learning_rate": 0.00025291712635472775, - "loss": 0.0638, + "epoch": 0.19, + "learning_rate": 0.00027190470965618283, + "loss": 0.075, "step": 29020 }, { - "epoch": 0.31, - "learning_rate": 0.0002529009020702187, - "loss": 0.0687, + "epoch": 0.19, + "learning_rate": 0.0002718950283018259, + "loss": 0.0823, "step": 29030 }, { - "epoch": 0.31, - "learning_rate": 0.0002528846777857096, - "loss": 0.0749, + "epoch": 0.19, + "learning_rate": 0.00027188534694746894, + "loss": 0.0825, "step": 29040 }, { - "epoch": 0.31, - "learning_rate": 0.0002528684535012006, - "loss": 0.0732, + "epoch": 0.19, + "learning_rate": 0.000271875665593112, + "loss": 0.0711, "step": 29050 }, { - "epoch": 0.31, - "learning_rate": 0.0002528522292166915, - "loss": 0.0702, + "epoch": 0.19, + "learning_rate": 0.0002718659842387551, + "loss": 0.0705, "step": 29060 }, { - "epoch": 0.31, - "learning_rate": 0.0002528360049321825, - "loss": 0.0718, + "epoch": 0.19, + "learning_rate": 0.0002718563028843981, + "loss": 0.0979, "step": 29070 }, { - "epoch": 0.31, - "learning_rate": 0.0002528197806476734, - "loss": 0.0767, + "epoch": 0.19, + "learning_rate": 0.0002718466215300412, + "loss": 0.0734, "step": 29080 }, { - "epoch": 0.31, - "learning_rate": 0.00025280355636316437, - "loss": 0.0804, + "epoch": 0.19, + "learning_rate": 0.0002718369401756843, + "loss": 0.0762, "step": 29090 }, { - "epoch": 0.31, - "learning_rate": 0.0002527873320786553, - "loss": 0.0663, + "epoch": 0.19, + "learning_rate": 0.00027182725882132736, + "loss": 0.0731, "step": 29100 }, { - "epoch": 0.31, - "learning_rate": 0.00025277110779414627, - "loss": 0.0682, + "epoch": 0.19, + "learning_rate": 0.00027181757746697044, + "loss": 0.0786, "step": 29110 }, { - "epoch": 0.31, - "learning_rate": 0.0002527548835096372, - "loss": 0.081, + "epoch": 0.19, + "learning_rate": 0.00027180789611261347, + "loss": 0.0737, "step": 29120 }, { - "epoch": 0.32, - "learning_rate": 0.00025273865922512817, - "loss": 0.0736, + "epoch": 0.19, + "learning_rate": 0.00027179821475825655, + "loss": 0.0719, "step": 29130 }, { - "epoch": 0.32, - "learning_rate": 0.0002527224349406191, - "loss": 0.0658, + "epoch": 0.19, + "learning_rate": 0.00027178853340389963, + "loss": 0.0713, "step": 29140 }, { - "epoch": 0.32, - "learning_rate": 0.00025270621065611007, - "loss": 0.0681, + "epoch": 0.19, + "learning_rate": 0.0002717788520495427, + "loss": 0.0765, "step": 29150 }, { - "epoch": 0.32, - "learning_rate": 0.000252689986371601, - "loss": 0.0678, + "epoch": 0.19, + "learning_rate": 0.0002717691706951858, + "loss": 0.0749, "step": 29160 }, { - "epoch": 0.32, - "learning_rate": 0.00025267376208709197, - "loss": 0.0671, + "epoch": 0.19, + "learning_rate": 0.0002717594893408288, + "loss": 0.0789, "step": 29170 }, { - "epoch": 0.32, - "learning_rate": 0.0002526575378025829, - "loss": 0.0692, + "epoch": 0.19, + "learning_rate": 0.0002717498079864719, + "loss": 0.0747, "step": 29180 }, { - "epoch": 0.32, - "learning_rate": 0.0002526413135180738, - "loss": 0.0772, + "epoch": 0.19, + "learning_rate": 0.000271740126632115, + "loss": 0.0769, "step": 29190 }, { - "epoch": 0.32, - "learning_rate": 0.0002526250892335648, - "loss": 0.0656, + "epoch": 0.19, + "learning_rate": 0.000271730445277758, + "loss": 0.0768, "step": 29200 }, { - "epoch": 0.32, - "learning_rate": 0.0002526088649490557, - "loss": 0.0665, + "epoch": 0.19, + "learning_rate": 0.0002717207639234011, + "loss": 0.0799, "step": 29210 }, { - "epoch": 0.32, - "learning_rate": 0.00025259264066454664, - "loss": 0.0705, + "epoch": 0.19, + "learning_rate": 0.00027171108256904416, + "loss": 0.0719, "step": 29220 }, { - "epoch": 0.32, - "learning_rate": 0.0002525764163800376, - "loss": 0.0752, + "epoch": 0.19, + "learning_rate": 0.00027170140121468724, + "loss": 0.0848, "step": 29230 }, { - "epoch": 0.32, - "learning_rate": 0.00025256019209552854, - "loss": 0.0751, + "epoch": 0.19, + "learning_rate": 0.0002716917198603303, + "loss": 0.0782, "step": 29240 }, { - "epoch": 0.32, - "learning_rate": 0.0002525439678110195, - "loss": 0.074, + "epoch": 0.19, + "learning_rate": 0.0002716820385059734, + "loss": 0.0922, "step": 29250 }, { - "epoch": 0.32, - "learning_rate": 0.00025252774352651044, - "loss": 0.0773, + "epoch": 0.19, + "learning_rate": 0.0002716723571516164, + "loss": 0.0744, "step": 29260 }, { - "epoch": 0.32, - "learning_rate": 0.0002525115192420014, - "loss": 0.0657, + "epoch": 0.19, + "learning_rate": 0.0002716626757972595, + "loss": 0.0815, "step": 29270 }, { - "epoch": 0.32, - "learning_rate": 0.00025249529495749234, - "loss": 0.0699, + "epoch": 0.19, + "learning_rate": 0.0002716529944429026, + "loss": 0.0841, "step": 29280 }, { - "epoch": 0.32, - "learning_rate": 0.0002524790706729833, - "loss": 0.0766, + "epoch": 0.19, + "learning_rate": 0.00027164331308854566, + "loss": 0.0812, "step": 29290 }, { - "epoch": 0.32, - "learning_rate": 0.00025246284638847424, - "loss": 0.066, + "epoch": 0.19, + "learning_rate": 0.00027163363173418874, + "loss": 0.0699, "step": 29300 }, { - "epoch": 0.32, - "learning_rate": 0.0002524466221039652, - "loss": 0.0685, + "epoch": 0.19, + "learning_rate": 0.00027162395037983177, + "loss": 0.0743, "step": 29310 }, { - "epoch": 0.32, - "learning_rate": 0.00025243039781945614, - "loss": 0.0707, + "epoch": 0.19, + "learning_rate": 0.00027161426902547485, + "loss": 0.0787, "step": 29320 }, { - "epoch": 0.32, - "learning_rate": 0.0002524141735349471, - "loss": 0.0643, + "epoch": 0.19, + "learning_rate": 0.0002716045876711179, + "loss": 0.0727, "step": 29330 }, { - "epoch": 0.32, - "learning_rate": 0.00025239794925043804, - "loss": 0.0733, + "epoch": 0.19, + "learning_rate": 0.00027159490631676095, + "loss": 0.0782, "step": 29340 }, { - "epoch": 0.32, - "learning_rate": 0.000252381724965929, - "loss": 0.0739, + "epoch": 0.19, + "learning_rate": 0.00027158522496240403, + "loss": 0.0759, "step": 29350 }, { - "epoch": 0.32, - "learning_rate": 0.00025236550068141994, - "loss": 0.0649, + "epoch": 0.19, + "learning_rate": 0.0002715755436080471, + "loss": 0.0752, "step": 29360 }, { - "epoch": 0.32, - "learning_rate": 0.00025234927639691086, - "loss": 0.0683, + "epoch": 0.19, + "learning_rate": 0.0002715658622536902, + "loss": 0.078, "step": 29370 }, { - "epoch": 0.32, - "learning_rate": 0.00025233305211240183, - "loss": 0.0685, + "epoch": 0.19, + "learning_rate": 0.0002715561808993333, + "loss": 0.0759, "step": 29380 }, { - "epoch": 0.32, - "learning_rate": 0.00025231682782789276, - "loss": 0.0714, + "epoch": 0.19, + "learning_rate": 0.00027154649954497635, + "loss": 0.0761, "step": 29390 }, { - "epoch": 0.32, - "learning_rate": 0.0002523006035433837, - "loss": 0.0754, + "epoch": 0.19, + "learning_rate": 0.0002715368181906194, + "loss": 0.075, "step": 29400 }, { - "epoch": 0.32, - "learning_rate": 0.00025228437925887466, - "loss": 0.0847, + "epoch": 0.19, + "learning_rate": 0.00027152713683626246, + "loss": 0.0936, "step": 29410 }, { - "epoch": 0.32, - "learning_rate": 0.0002522681549743656, - "loss": 0.0652, + "epoch": 0.19, + "learning_rate": 0.00027151745548190554, + "loss": 0.0746, "step": 29420 }, { - "epoch": 0.32, - "learning_rate": 0.00025225193068985656, - "loss": 0.0646, + "epoch": 0.19, + "learning_rate": 0.0002715077741275486, + "loss": 0.0789, "step": 29430 }, { - "epoch": 0.32, - "learning_rate": 0.0002522357064053475, - "loss": 0.0722, + "epoch": 0.19, + "learning_rate": 0.00027149809277319164, + "loss": 0.08, "step": 29440 }, { - "epoch": 0.32, - "learning_rate": 0.00025221948212083846, - "loss": 0.0745, + "epoch": 0.19, + "learning_rate": 0.0002714884114188347, + "loss": 0.0837, "step": 29450 }, { - "epoch": 0.32, - "learning_rate": 0.0002522032578363294, - "loss": 0.0788, + "epoch": 0.19, + "learning_rate": 0.0002714787300644778, + "loss": 0.0749, "step": 29460 }, { - "epoch": 0.32, - "learning_rate": 0.00025218703355182036, - "loss": 0.0743, + "epoch": 0.19, + "learning_rate": 0.00027146904871012083, + "loss": 0.0818, "step": 29470 }, { - "epoch": 0.32, - "learning_rate": 0.0002521708092673113, - "loss": 0.0706, + "epoch": 0.19, + "learning_rate": 0.0002714593673557639, + "loss": 0.0722, "step": 29480 }, { - "epoch": 0.32, - "learning_rate": 0.00025215458498280226, - "loss": 0.0714, + "epoch": 0.19, + "learning_rate": 0.000271449686001407, + "loss": 0.0967, "step": 29490 }, { - "epoch": 0.32, - "learning_rate": 0.0002521383606982932, - "loss": 0.073, + "epoch": 0.19, + "learning_rate": 0.00027144000464705007, + "loss": 0.0828, "step": 29500 }, { - "epoch": 0.32, - "learning_rate": 0.00025212213641378415, - "loss": 0.0696, + "epoch": 0.19, + "learning_rate": 0.00027143032329269315, + "loss": 0.0768, "step": 29510 }, { - "epoch": 0.32, - "learning_rate": 0.0002521059121292751, - "loss": 0.0684, + "epoch": 0.19, + "learning_rate": 0.00027142064193833623, + "loss": 0.0781, "step": 29520 }, { - "epoch": 0.32, - "learning_rate": 0.00025208968784476605, - "loss": 0.0716, + "epoch": 0.19, + "learning_rate": 0.0002714109605839793, + "loss": 0.0662, "step": 29530 }, { - "epoch": 0.32, - "learning_rate": 0.000252073463560257, - "loss": 0.0666, + "epoch": 0.19, + "learning_rate": 0.00027140127922962233, + "loss": 0.069, "step": 29540 }, { - "epoch": 0.32, - "learning_rate": 0.0002520572392757479, - "loss": 0.0665, + "epoch": 0.19, + "learning_rate": 0.0002713915978752654, + "loss": 0.0932, "step": 29550 }, { - "epoch": 0.32, - "learning_rate": 0.0002520410149912389, - "loss": 0.0661, + "epoch": 0.19, + "learning_rate": 0.0002713819165209085, + "loss": 0.0911, "step": 29560 }, { - "epoch": 0.32, - "learning_rate": 0.0002520247907067298, - "loss": 0.0755, + "epoch": 0.19, + "learning_rate": 0.0002713722351665515, + "loss": 0.0965, "step": 29570 }, { - "epoch": 0.32, - "learning_rate": 0.0002520085664222207, - "loss": 0.0686, + "epoch": 0.19, + "learning_rate": 0.0002713625538121946, + "loss": 0.0692, "step": 29580 }, { - "epoch": 0.32, - "learning_rate": 0.0002519923421377117, - "loss": 0.068, + "epoch": 0.19, + "learning_rate": 0.0002713528724578377, + "loss": 0.0808, "step": 29590 }, { - "epoch": 0.32, - "learning_rate": 0.0002519761178532026, - "loss": 0.0761, + "epoch": 0.19, + "learning_rate": 0.00027134319110348076, + "loss": 0.0854, "step": 29600 }, { - "epoch": 0.32, - "learning_rate": 0.0002519598935686936, - "loss": 0.0756, + "epoch": 0.19, + "learning_rate": 0.0002713335097491238, + "loss": 0.0773, "step": 29610 }, { - "epoch": 0.32, - "learning_rate": 0.0002519436692841845, - "loss": 0.0677, + "epoch": 0.19, + "learning_rate": 0.00027132382839476686, + "loss": 0.0854, "step": 29620 }, { - "epoch": 0.32, - "learning_rate": 0.0002519274449996755, - "loss": 0.0733, + "epoch": 0.19, + "learning_rate": 0.00027131414704040994, + "loss": 0.0898, "step": 29630 }, { - "epoch": 0.32, - "learning_rate": 0.0002519112207151664, - "loss": 0.073, + "epoch": 0.19, + "learning_rate": 0.000271304465686053, + "loss": 0.0866, "step": 29640 }, { - "epoch": 0.32, - "learning_rate": 0.0002518949964306574, - "loss": 0.0682, + "epoch": 0.19, + "learning_rate": 0.0002712947843316961, + "loss": 0.0827, "step": 29650 }, { - "epoch": 0.32, - "learning_rate": 0.0002518787721461483, - "loss": 0.0762, + "epoch": 0.19, + "learning_rate": 0.0002712851029773392, + "loss": 0.0718, "step": 29660 }, { - "epoch": 0.32, - "learning_rate": 0.0002518625478616393, - "loss": 0.0697, + "epoch": 0.19, + "learning_rate": 0.00027127542162298226, + "loss": 0.0798, "step": 29670 }, { - "epoch": 0.32, - "learning_rate": 0.0002518463235771302, - "loss": 0.0677, + "epoch": 0.19, + "learning_rate": 0.0002712657402686253, + "loss": 0.0828, "step": 29680 }, { - "epoch": 0.32, - "learning_rate": 0.0002518300992926212, - "loss": 0.0702, + "epoch": 0.19, + "learning_rate": 0.00027125605891426837, + "loss": 0.0723, "step": 29690 }, { - "epoch": 0.32, - "learning_rate": 0.0002518138750081121, - "loss": 0.0749, + "epoch": 0.19, + "learning_rate": 0.00027124637755991145, + "loss": 0.0764, "step": 29700 }, { - "epoch": 0.32, - "learning_rate": 0.0002517976507236031, - "loss": 0.0627, + "epoch": 0.19, + "learning_rate": 0.0002712366962055545, + "loss": 0.0803, "step": 29710 }, { - "epoch": 0.32, - "learning_rate": 0.000251781426439094, - "loss": 0.0771, + "epoch": 0.19, + "learning_rate": 0.00027122701485119755, + "loss": 0.0694, "step": 29720 }, { - "epoch": 0.32, - "learning_rate": 0.00025176520215458494, - "loss": 0.0746, + "epoch": 0.19, + "learning_rate": 0.00027121733349684063, + "loss": 0.0819, "step": 29730 }, { - "epoch": 0.32, - "learning_rate": 0.0002517489778700759, - "loss": 0.065, + "epoch": 0.19, + "learning_rate": 0.0002712076521424837, + "loss": 0.0692, "step": 29740 }, { - "epoch": 0.32, - "learning_rate": 0.00025173275358556684, - "loss": 0.0683, + "epoch": 0.19, + "learning_rate": 0.00027119797078812674, + "loss": 0.0838, "step": 29750 }, { - "epoch": 0.32, - "learning_rate": 0.00025171652930105776, - "loss": 0.0727, + "epoch": 0.19, + "learning_rate": 0.0002711882894337698, + "loss": 0.078, "step": 29760 }, { - "epoch": 0.32, - "learning_rate": 0.00025170030501654874, - "loss": 0.0634, + "epoch": 0.19, + "learning_rate": 0.0002711786080794129, + "loss": 0.0891, "step": 29770 }, { - "epoch": 0.32, - "learning_rate": 0.00025168408073203966, - "loss": 0.077, + "epoch": 0.19, + "learning_rate": 0.000271168926725056, + "loss": 0.0801, "step": 29780 }, { - "epoch": 0.32, - "learning_rate": 0.00025166785644753064, - "loss": 0.0801, + "epoch": 0.19, + "learning_rate": 0.00027115924537069906, + "loss": 0.0661, "step": 29790 }, { - "epoch": 0.32, - "learning_rate": 0.00025165163216302156, - "loss": 0.0642, + "epoch": 0.19, + "learning_rate": 0.00027114956401634214, + "loss": 0.0785, "step": 29800 }, { - "epoch": 0.32, - "learning_rate": 0.00025163540787851254, - "loss": 0.0726, + "epoch": 0.19, + "learning_rate": 0.00027113988266198516, + "loss": 0.078, "step": 29810 }, { - "epoch": 0.32, - "learning_rate": 0.00025161918359400346, - "loss": 0.0717, + "epoch": 0.19, + "learning_rate": 0.00027113020130762824, + "loss": 0.0828, "step": 29820 }, { - "epoch": 0.32, - "learning_rate": 0.00025160295930949444, - "loss": 0.064, + "epoch": 0.19, + "learning_rate": 0.0002711205199532713, + "loss": 0.0862, "step": 29830 }, { - "epoch": 0.32, - "learning_rate": 0.00025158673502498536, - "loss": 0.0746, + "epoch": 0.19, + "learning_rate": 0.00027111083859891435, + "loss": 0.0788, "step": 29840 }, { - "epoch": 0.32, - "learning_rate": 0.00025157051074047634, - "loss": 0.0734, + "epoch": 0.19, + "learning_rate": 0.00027110115724455743, + "loss": 0.0786, "step": 29850 }, { - "epoch": 0.32, - "learning_rate": 0.00025155428645596726, - "loss": 0.0679, + "epoch": 0.19, + "learning_rate": 0.0002710914758902005, + "loss": 0.0845, "step": 29860 }, { - "epoch": 0.32, - "learning_rate": 0.00025153806217145824, - "loss": 0.0681, + "epoch": 0.19, + "learning_rate": 0.0002710817945358436, + "loss": 0.08, "step": 29870 }, { - "epoch": 0.32, - "learning_rate": 0.00025152183788694916, - "loss": 0.0642, + "epoch": 0.19, + "learning_rate": 0.00027107211318148667, + "loss": 0.0781, "step": 29880 }, { - "epoch": 0.32, - "learning_rate": 0.00025150561360244014, - "loss": 0.0655, + "epoch": 0.19, + "learning_rate": 0.0002710624318271297, + "loss": 0.0749, "step": 29890 }, { - "epoch": 0.32, - "learning_rate": 0.00025148938931793106, - "loss": 0.0655, + "epoch": 0.19, + "learning_rate": 0.00027105275047277277, + "loss": 0.0724, "step": 29900 }, { - "epoch": 0.32, - "learning_rate": 0.000251473165033422, - "loss": 0.0639, + "epoch": 0.19, + "learning_rate": 0.00027104306911841585, + "loss": 0.0787, "step": 29910 }, { - "epoch": 0.32, - "learning_rate": 0.00025145694074891296, - "loss": 0.0732, + "epoch": 0.19, + "learning_rate": 0.00027103338776405893, + "loss": 0.0781, "step": 29920 }, { - "epoch": 0.32, - "learning_rate": 0.0002514407164644039, - "loss": 0.0691, + "epoch": 0.19, + "learning_rate": 0.000271023706409702, + "loss": 0.0641, "step": 29930 }, { - "epoch": 0.32, - "learning_rate": 0.0002514244921798948, - "loss": 0.0682, + "epoch": 0.19, + "learning_rate": 0.00027101402505534504, + "loss": 0.078, "step": 29940 }, { - "epoch": 0.32, - "learning_rate": 0.0002514082678953858, - "loss": 0.0687, + "epoch": 0.19, + "learning_rate": 0.0002710043437009881, + "loss": 0.0766, "step": 29950 }, { - "epoch": 0.32, - "learning_rate": 0.0002513920436108767, - "loss": 0.0721, + "epoch": 0.19, + "learning_rate": 0.0002709946623466312, + "loss": 0.0772, "step": 29960 }, { - "epoch": 0.32, - "learning_rate": 0.0002513758193263677, - "loss": 0.0669, + "epoch": 0.19, + "learning_rate": 0.0002709849809922742, + "loss": 0.0844, "step": 29970 }, { - "epoch": 0.32, - "learning_rate": 0.0002513595950418586, - "loss": 0.0788, + "epoch": 0.19, + "learning_rate": 0.0002709752996379173, + "loss": 0.0789, "step": 29980 }, { - "epoch": 0.32, - "learning_rate": 0.0002513433707573496, - "loss": 0.0705, + "epoch": 0.19, + "learning_rate": 0.0002709656182835604, + "loss": 0.0768, "step": 29990 }, { - "epoch": 0.32, - "learning_rate": 0.0002513271464728405, - "loss": 0.0676, + "epoch": 0.19, + "learning_rate": 0.00027095593692920346, + "loss": 0.0812, "step": 30000 }, { - "epoch": 0.32, - "eval_cer": 0.9213610606052575, - "eval_loss": 0.04796409234404564, - "eval_runtime": 119.4347, - "eval_samples_per_second": 16.746, - "eval_steps_per_second": 4.186, + "epoch": 0.19, + "eval_cer": 0.9201635973336346, + "eval_loss": 0.05120238661766052, + "eval_runtime": 120.611, + "eval_samples_per_second": 16.582, + "eval_steps_per_second": 4.146, "step": 30000 }, { - "epoch": 0.32, - "learning_rate": 0.0002513109221883315, - "loss": 0.0794, + "epoch": 0.19, + "learning_rate": 0.00027094625557484654, + "loss": 0.0775, "step": 30010 }, { - "epoch": 0.32, - "learning_rate": 0.0002512946979038224, - "loss": 0.0681, + "epoch": 0.19, + "learning_rate": 0.0002709365742204896, + "loss": 0.0779, "step": 30020 }, { - "epoch": 0.32, - "learning_rate": 0.0002512784736193134, - "loss": 0.0725, + "epoch": 0.19, + "learning_rate": 0.00027092689286613265, + "loss": 0.0775, "step": 30030 }, { - "epoch": 0.32, - "learning_rate": 0.0002512622493348043, - "loss": 0.0665, + "epoch": 0.19, + "learning_rate": 0.0002709172115117757, + "loss": 0.0758, "step": 30040 }, { - "epoch": 0.33, - "learning_rate": 0.0002512460250502953, - "loss": 0.061, + "epoch": 0.19, + "learning_rate": 0.0002709075301574188, + "loss": 0.0762, "step": 30050 }, { - "epoch": 0.33, - "learning_rate": 0.0002512298007657862, - "loss": 0.0745, + "epoch": 0.19, + "learning_rate": 0.0002708978488030619, + "loss": 0.0794, "step": 30060 }, { - "epoch": 0.33, - "learning_rate": 0.0002512135764812772, - "loss": 0.0734, + "epoch": 0.19, + "learning_rate": 0.00027088816744870497, + "loss": 0.0754, "step": 30070 }, { - "epoch": 0.33, - "learning_rate": 0.0002511973521967681, - "loss": 0.0756, + "epoch": 0.19, + "learning_rate": 0.000270878486094348, + "loss": 0.0857, "step": 30080 }, { - "epoch": 0.33, - "learning_rate": 0.000251181127912259, - "loss": 0.0683, + "epoch": 0.19, + "learning_rate": 0.00027086880473999107, + "loss": 0.0786, "step": 30090 }, { - "epoch": 0.33, - "learning_rate": 0.00025116490362775, - "loss": 0.0681, + "epoch": 0.19, + "learning_rate": 0.00027085912338563415, + "loss": 0.0852, "step": 30100 }, { - "epoch": 0.33, - "learning_rate": 0.0002511486793432409, - "loss": 0.0708, + "epoch": 0.19, + "learning_rate": 0.0002708494420312772, + "loss": 0.0752, "step": 30110 }, { - "epoch": 0.33, - "learning_rate": 0.0002511324550587319, - "loss": 0.0657, + "epoch": 0.19, + "learning_rate": 0.00027083976067692026, + "loss": 0.0765, "step": 30120 }, { - "epoch": 0.33, - "learning_rate": 0.0002511162307742228, - "loss": 0.0697, + "epoch": 0.19, + "learning_rate": 0.00027083007932256334, + "loss": 0.0788, "step": 30130 }, { - "epoch": 0.33, - "learning_rate": 0.00025110000648971375, - "loss": 0.0695, + "epoch": 0.19, + "learning_rate": 0.0002708203979682064, + "loss": 0.0797, "step": 30140 }, { - "epoch": 0.33, - "learning_rate": 0.0002510837822052047, - "loss": 0.0684, + "epoch": 0.19, + "learning_rate": 0.0002708107166138495, + "loss": 0.0805, "step": 30150 }, { - "epoch": 0.33, - "learning_rate": 0.00025106755792069565, - "loss": 0.0672, + "epoch": 0.19, + "learning_rate": 0.0002708010352594926, + "loss": 0.0762, "step": 30160 }, { - "epoch": 0.33, - "learning_rate": 0.0002510513336361866, - "loss": 0.0656, + "epoch": 0.19, + "learning_rate": 0.0002707913539051356, + "loss": 0.0949, "step": 30170 }, { - "epoch": 0.33, - "learning_rate": 0.00025103510935167755, - "loss": 0.0773, + "epoch": 0.19, + "learning_rate": 0.0002707816725507787, + "loss": 0.072, "step": 30180 }, { - "epoch": 0.33, - "learning_rate": 0.0002510188850671685, - "loss": 0.0712, + "epoch": 0.19, + "learning_rate": 0.00027077199119642176, + "loss": 0.0832, "step": 30190 }, { - "epoch": 0.33, - "learning_rate": 0.00025100266078265944, - "loss": 0.0708, + "epoch": 0.19, + "learning_rate": 0.00027076230984206484, + "loss": 0.0739, "step": 30200 }, { - "epoch": 0.33, - "learning_rate": 0.0002509864364981504, - "loss": 0.0806, + "epoch": 0.19, + "learning_rate": 0.00027075262848770787, + "loss": 0.0813, "step": 30210 }, { - "epoch": 0.33, - "learning_rate": 0.00025097021221364134, - "loss": 0.0679, + "epoch": 0.2, + "learning_rate": 0.00027074294713335095, + "loss": 0.073, "step": 30220 }, { - "epoch": 0.33, - "learning_rate": 0.0002509539879291323, - "loss": 0.085, + "epoch": 0.2, + "learning_rate": 0.000270733265778994, + "loss": 0.0803, "step": 30230 }, { - "epoch": 0.33, - "learning_rate": 0.00025093776364462324, - "loss": 0.0713, + "epoch": 0.2, + "learning_rate": 0.00027072358442463705, + "loss": 0.0842, "step": 30240 }, { - "epoch": 0.33, - "learning_rate": 0.0002509215393601142, - "loss": 0.0648, + "epoch": 0.2, + "learning_rate": 0.00027071390307028013, + "loss": 0.0733, "step": 30250 }, { - "epoch": 0.33, - "learning_rate": 0.00025090531507560514, - "loss": 0.067, + "epoch": 0.2, + "learning_rate": 0.0002707042217159232, + "loss": 0.0725, "step": 30260 }, { - "epoch": 0.33, - "learning_rate": 0.00025088909079109607, - "loss": 0.0671, + "epoch": 0.2, + "learning_rate": 0.0002706945403615663, + "loss": 0.0818, "step": 30270 }, { - "epoch": 0.33, - "learning_rate": 0.00025087286650658704, - "loss": 0.0706, + "epoch": 0.2, + "learning_rate": 0.00027068485900720937, + "loss": 0.0822, "step": 30280 }, { - "epoch": 0.33, - "learning_rate": 0.00025085664222207797, - "loss": 0.0657, + "epoch": 0.2, + "learning_rate": 0.00027067517765285245, + "loss": 0.0755, "step": 30290 }, { - "epoch": 0.33, - "learning_rate": 0.00025084041793756894, - "loss": 0.0686, + "epoch": 0.2, + "learning_rate": 0.00027066549629849553, + "loss": 0.0827, "step": 30300 }, { - "epoch": 0.33, - "learning_rate": 0.00025082419365305987, - "loss": 0.0705, + "epoch": 0.2, + "learning_rate": 0.00027065581494413856, + "loss": 0.0838, "step": 30310 }, { - "epoch": 0.33, - "learning_rate": 0.0002508079693685508, - "loss": 0.0695, + "epoch": 0.2, + "learning_rate": 0.00027064613358978164, + "loss": 0.0719, "step": 30320 }, { - "epoch": 0.33, - "learning_rate": 0.00025079174508404176, - "loss": 0.0661, + "epoch": 0.2, + "learning_rate": 0.0002706364522354247, + "loss": 0.0728, "step": 30330 }, { - "epoch": 0.33, - "learning_rate": 0.0002507755207995327, - "loss": 0.0705, + "epoch": 0.2, + "learning_rate": 0.00027062677088106774, + "loss": 0.0828, "step": 30340 }, { - "epoch": 0.33, - "learning_rate": 0.00025075929651502366, - "loss": 0.0793, + "epoch": 0.2, + "learning_rate": 0.0002706170895267108, + "loss": 0.0753, "step": 30350 }, { - "epoch": 0.33, - "learning_rate": 0.0002507430722305146, - "loss": 0.0743, + "epoch": 0.2, + "learning_rate": 0.0002706074081723539, + "loss": 0.0753, "step": 30360 }, { - "epoch": 0.33, - "learning_rate": 0.00025072684794600556, - "loss": 0.0687, + "epoch": 0.2, + "learning_rate": 0.000270597726817997, + "loss": 0.0805, "step": 30370 }, { - "epoch": 0.33, - "learning_rate": 0.0002507106236614965, - "loss": 0.0645, + "epoch": 0.2, + "learning_rate": 0.00027058804546364, + "loss": 0.073, "step": 30380 }, { - "epoch": 0.33, - "learning_rate": 0.00025069439937698746, - "loss": 0.0753, + "epoch": 0.2, + "learning_rate": 0.0002705783641092831, + "loss": 0.0786, "step": 30390 }, { - "epoch": 0.33, - "learning_rate": 0.0002506781750924784, - "loss": 0.0698, + "epoch": 0.2, + "learning_rate": 0.00027056868275492617, + "loss": 0.0745, "step": 30400 }, { - "epoch": 0.33, - "learning_rate": 0.00025066195080796936, - "loss": 0.0706, + "epoch": 0.2, + "learning_rate": 0.00027055900140056925, + "loss": 0.0754, "step": 30410 }, { - "epoch": 0.33, - "learning_rate": 0.0002506457265234603, - "loss": 0.0581, + "epoch": 0.2, + "learning_rate": 0.0002705493200462123, + "loss": 0.0796, "step": 30420 }, { - "epoch": 0.33, - "learning_rate": 0.00025062950223895126, - "loss": 0.0765, + "epoch": 0.2, + "learning_rate": 0.0002705396386918554, + "loss": 0.0663, "step": 30430 }, { - "epoch": 0.33, - "learning_rate": 0.0002506132779544422, - "loss": 0.0686, + "epoch": 0.2, + "learning_rate": 0.0002705299573374985, + "loss": 0.0719, "step": 30440 }, { - "epoch": 0.33, - "learning_rate": 0.0002505970536699331, - "loss": 0.0702, + "epoch": 0.2, + "learning_rate": 0.0002705202759831415, + "loss": 0.0815, "step": 30450 }, { - "epoch": 0.33, - "learning_rate": 0.0002505808293854241, - "loss": 0.0642, + "epoch": 0.2, + "learning_rate": 0.0002705105946287846, + "loss": 0.0752, "step": 30460 }, { - "epoch": 0.33, - "learning_rate": 0.000250564605100915, - "loss": 0.066, + "epoch": 0.2, + "learning_rate": 0.00027050091327442767, + "loss": 0.0749, "step": 30470 }, { - "epoch": 0.33, - "learning_rate": 0.000250548380816406, - "loss": 0.0716, + "epoch": 0.2, + "learning_rate": 0.0002704912319200707, + "loss": 0.0841, "step": 30480 }, { - "epoch": 0.33, - "learning_rate": 0.0002505321565318969, - "loss": 0.0657, + "epoch": 0.2, + "learning_rate": 0.0002704815505657138, + "loss": 0.0752, "step": 30490 }, { - "epoch": 0.33, - "learning_rate": 0.00025051593224738783, - "loss": 0.0699, + "epoch": 0.2, + "learning_rate": 0.00027047186921135685, + "loss": 0.0717, "step": 30500 }, { - "epoch": 0.33, - "learning_rate": 0.0002504997079628788, - "loss": 0.0706, + "epoch": 0.2, + "learning_rate": 0.00027046218785699993, + "loss": 0.0782, "step": 30510 }, { - "epoch": 0.33, - "learning_rate": 0.0002504834836783698, - "loss": 0.067, + "epoch": 0.2, + "learning_rate": 0.00027045250650264296, + "loss": 0.0807, "step": 30520 }, { - "epoch": 0.33, - "learning_rate": 0.0002504672593938607, - "loss": 0.0688, + "epoch": 0.2, + "learning_rate": 0.00027044282514828604, + "loss": 0.0801, "step": 30530 }, { - "epoch": 0.33, - "learning_rate": 0.0002504510351093517, - "loss": 0.0603, + "epoch": 0.2, + "learning_rate": 0.0002704331437939291, + "loss": 0.073, "step": 30540 }, { - "epoch": 0.33, - "learning_rate": 0.0002504348108248426, - "loss": 0.0757, + "epoch": 0.2, + "learning_rate": 0.0002704234624395722, + "loss": 0.0749, "step": 30550 }, { - "epoch": 0.33, - "learning_rate": 0.0002504185865403336, - "loss": 0.068, + "epoch": 0.2, + "learning_rate": 0.0002704137810852153, + "loss": 0.0749, "step": 30560 }, { - "epoch": 0.33, - "learning_rate": 0.0002504023622558245, - "loss": 0.0746, + "epoch": 0.2, + "learning_rate": 0.00027040409973085836, + "loss": 0.0975, "step": 30570 }, { - "epoch": 0.33, - "learning_rate": 0.0002503861379713155, - "loss": 0.0686, + "epoch": 0.2, + "learning_rate": 0.0002703944183765014, + "loss": 0.0806, "step": 30580 }, { - "epoch": 0.33, - "learning_rate": 0.0002503699136868064, - "loss": 0.0632, + "epoch": 0.2, + "learning_rate": 0.00027038473702214446, + "loss": 0.0846, "step": 30590 }, { - "epoch": 0.33, - "learning_rate": 0.00025035368940229733, - "loss": 0.0653, + "epoch": 0.2, + "learning_rate": 0.00027037505566778754, + "loss": 0.0839, "step": 30600 }, { - "epoch": 0.33, - "learning_rate": 0.0002503374651177883, - "loss": 0.0726, + "epoch": 0.2, + "learning_rate": 0.00027036537431343057, + "loss": 0.0798, "step": 30610 }, { - "epoch": 0.33, - "learning_rate": 0.0002503212408332792, - "loss": 0.0643, + "epoch": 0.2, + "learning_rate": 0.00027035569295907365, + "loss": 0.0803, "step": 30620 }, { - "epoch": 0.33, - "learning_rate": 0.00025030501654877015, - "loss": 0.06, + "epoch": 0.2, + "learning_rate": 0.00027034601160471673, + "loss": 0.0735, "step": 30630 }, { - "epoch": 0.33, - "learning_rate": 0.0002502887922642611, - "loss": 0.0688, + "epoch": 0.2, + "learning_rate": 0.0002703363302503598, + "loss": 0.0717, "step": 30640 }, { - "epoch": 0.33, - "learning_rate": 0.00025027256797975205, - "loss": 0.0691, + "epoch": 0.2, + "learning_rate": 0.0002703266488960029, + "loss": 0.0808, "step": 30650 }, { - "epoch": 0.33, - "learning_rate": 0.000250256343695243, - "loss": 0.0735, + "epoch": 0.2, + "learning_rate": 0.0002703169675416459, + "loss": 0.0811, "step": 30660 }, { - "epoch": 0.33, - "learning_rate": 0.00025024011941073395, - "loss": 0.0649, + "epoch": 0.2, + "learning_rate": 0.000270307286187289, + "loss": 0.0691, "step": 30670 }, { - "epoch": 0.33, - "learning_rate": 0.0002502238951262249, - "loss": 0.0705, + "epoch": 0.2, + "learning_rate": 0.0002702976048329321, + "loss": 0.0806, "step": 30680 }, { - "epoch": 0.33, - "learning_rate": 0.00025020767084171585, - "loss": 0.0578, + "epoch": 0.2, + "learning_rate": 0.00027028792347857515, + "loss": 0.0679, "step": 30690 }, { - "epoch": 0.33, - "learning_rate": 0.0002501914465572068, - "loss": 0.0695, + "epoch": 0.2, + "learning_rate": 0.00027027824212421823, + "loss": 0.0915, "step": 30700 }, { - "epoch": 0.33, - "learning_rate": 0.00025017522227269775, - "loss": 0.0684, + "epoch": 0.2, + "learning_rate": 0.00027026856076986126, + "loss": 0.078, "step": 30710 }, { - "epoch": 0.33, - "learning_rate": 0.0002501589979881887, - "loss": 0.0663, + "epoch": 0.2, + "learning_rate": 0.00027025887941550434, + "loss": 0.0737, "step": 30720 }, { - "epoch": 0.33, - "learning_rate": 0.00025014277370367965, - "loss": 0.0676, + "epoch": 0.2, + "learning_rate": 0.0002702491980611474, + "loss": 0.0758, "step": 30730 }, { - "epoch": 0.33, - "learning_rate": 0.0002501265494191706, - "loss": 0.0629, + "epoch": 0.2, + "learning_rate": 0.00027023951670679044, + "loss": 0.0794, "step": 30740 }, { - "epoch": 0.33, - "learning_rate": 0.00025011032513466155, - "loss": 0.0637, + "epoch": 0.2, + "learning_rate": 0.0002702298353524335, + "loss": 0.0793, "step": 30750 }, { - "epoch": 0.33, - "learning_rate": 0.0002500941008501525, - "loss": 0.0677, + "epoch": 0.2, + "learning_rate": 0.0002702201539980766, + "loss": 0.0714, "step": 30760 }, { - "epoch": 0.33, - "learning_rate": 0.00025007787656564345, - "loss": 0.0607, + "epoch": 0.2, + "learning_rate": 0.0002702104726437197, + "loss": 0.0713, "step": 30770 }, { - "epoch": 0.33, - "learning_rate": 0.00025006165228113437, - "loss": 0.0622, + "epoch": 0.2, + "learning_rate": 0.00027020079128936276, + "loss": 0.0775, "step": 30780 }, { - "epoch": 0.33, - "learning_rate": 0.00025004542799662535, - "loss": 0.085, + "epoch": 0.2, + "learning_rate": 0.00027019110993500584, + "loss": 0.08, "step": 30790 }, { - "epoch": 0.33, - "learning_rate": 0.00025002920371211627, - "loss": 0.0657, + "epoch": 0.2, + "learning_rate": 0.00027018142858064887, + "loss": 0.0834, "step": 30800 }, { - "epoch": 0.33, - "learning_rate": 0.00025001297942760725, - "loss": 0.073, + "epoch": 0.2, + "learning_rate": 0.00027017174722629195, + "loss": 0.0773, "step": 30810 }, { - "epoch": 0.33, - "learning_rate": 0.00024999675514309817, - "loss": 0.0681, + "epoch": 0.2, + "learning_rate": 0.00027016206587193503, + "loss": 0.0796, "step": 30820 }, { - "epoch": 0.33, - "learning_rate": 0.0002499805308585891, - "loss": 0.0674, + "epoch": 0.2, + "learning_rate": 0.0002701523845175781, + "loss": 0.0908, "step": 30830 }, { - "epoch": 0.33, - "learning_rate": 0.00024996430657408007, - "loss": 0.0735, + "epoch": 0.2, + "learning_rate": 0.0002701427031632212, + "loss": 0.0775, "step": 30840 }, { - "epoch": 0.33, - "learning_rate": 0.000249948082289571, - "loss": 0.0784, + "epoch": 0.2, + "learning_rate": 0.0002701330218088642, + "loss": 0.0743, "step": 30850 }, { - "epoch": 0.33, - "learning_rate": 0.00024993185800506197, - "loss": 0.0772, + "epoch": 0.2, + "learning_rate": 0.0002701233404545073, + "loss": 0.0795, "step": 30860 }, { - "epoch": 0.33, - "learning_rate": 0.0002499156337205529, - "loss": 0.0708, + "epoch": 0.2, + "learning_rate": 0.0002701136591001504, + "loss": 0.0799, "step": 30870 }, { - "epoch": 0.33, - "learning_rate": 0.00024989940943604387, - "loss": 0.0717, + "epoch": 0.2, + "learning_rate": 0.0002701039777457934, + "loss": 0.0793, "step": 30880 }, { - "epoch": 0.33, - "learning_rate": 0.0002498831851515348, - "loss": 0.0662, + "epoch": 0.2, + "learning_rate": 0.0002700942963914365, + "loss": 0.0777, "step": 30890 }, { - "epoch": 0.33, - "learning_rate": 0.00024986696086702577, - "loss": 0.0706, + "epoch": 0.2, + "learning_rate": 0.00027008461503707956, + "loss": 0.0707, "step": 30900 }, { - "epoch": 0.33, - "learning_rate": 0.0002498507365825167, - "loss": 0.0738, + "epoch": 0.2, + "learning_rate": 0.00027007493368272264, + "loss": 0.0761, "step": 30910 }, { - "epoch": 0.33, - "learning_rate": 0.00024983451229800767, - "loss": 0.0693, + "epoch": 0.2, + "learning_rate": 0.0002700652523283657, + "loss": 0.0801, "step": 30920 }, { - "epoch": 0.33, - "learning_rate": 0.0002498182880134986, - "loss": 0.0691, + "epoch": 0.2, + "learning_rate": 0.0002700555709740088, + "loss": 0.0653, "step": 30930 }, { - "epoch": 0.33, - "learning_rate": 0.00024980206372898957, - "loss": 0.066, + "epoch": 0.2, + "learning_rate": 0.0002700458896196518, + "loss": 0.0706, "step": 30940 }, { - "epoch": 0.33, - "learning_rate": 0.0002497858394444805, - "loss": 0.0638, + "epoch": 0.2, + "learning_rate": 0.0002700362082652949, + "loss": 0.0777, "step": 30950 }, { - "epoch": 0.33, - "learning_rate": 0.0002497696151599714, - "loss": 0.0708, + "epoch": 0.2, + "learning_rate": 0.000270026526910938, + "loss": 0.0797, "step": 30960 }, { - "epoch": 0.33, - "learning_rate": 0.0002497533908754624, - "loss": 0.0797, + "epoch": 0.2, + "learning_rate": 0.00027001684555658106, + "loss": 0.0737, "step": 30970 }, { - "epoch": 0.34, - "learning_rate": 0.0002497371665909533, - "loss": 0.066, + "epoch": 0.2, + "learning_rate": 0.0002700071642022241, + "loss": 0.0671, "step": 30980 }, { - "epoch": 0.34, - "learning_rate": 0.0002497209423064443, - "loss": 0.0659, + "epoch": 0.2, + "learning_rate": 0.00026999748284786717, + "loss": 0.0789, "step": 30990 }, { - "epoch": 0.34, - "learning_rate": 0.0002497047180219352, - "loss": 0.0692, + "epoch": 0.2, + "learning_rate": 0.00026998780149351025, + "loss": 0.0741, "step": 31000 }, { - "epoch": 0.34, - "eval_cer": 0.9214626613021498, - "eval_loss": 0.04675569757819176, - "eval_runtime": 119.7354, - "eval_samples_per_second": 16.703, - "eval_steps_per_second": 4.176, + "epoch": 0.2, + "eval_cer": 0.9201446164275223, + "eval_loss": 0.05069497600197792, + "eval_runtime": 120.4325, + "eval_samples_per_second": 16.607, + "eval_steps_per_second": 4.152, "step": 31000 }, { - "epoch": 0.34, - "learning_rate": 0.00024968849373742613, - "loss": 0.0738, + "epoch": 0.2, + "learning_rate": 0.0002699781201391533, + "loss": 0.0733, "step": 31010 }, { - "epoch": 0.34, - "learning_rate": 0.0002496722694529171, - "loss": 0.0713, + "epoch": 0.2, + "learning_rate": 0.00026996843878479635, + "loss": 0.07, "step": 31020 }, { - "epoch": 0.34, - "learning_rate": 0.00024965604516840803, - "loss": 0.063, + "epoch": 0.2, + "learning_rate": 0.00026995875743043943, + "loss": 0.0665, "step": 31030 }, { - "epoch": 0.34, - "learning_rate": 0.000249639820883899, - "loss": 0.0885, + "epoch": 0.2, + "learning_rate": 0.0002699490760760825, + "loss": 0.0767, "step": 31040 }, { - "epoch": 0.34, - "learning_rate": 0.00024962359659938993, - "loss": 0.0707, + "epoch": 0.2, + "learning_rate": 0.0002699393947217256, + "loss": 0.0745, "step": 31050 }, { - "epoch": 0.34, - "learning_rate": 0.0002496073723148809, - "loss": 0.0667, + "epoch": 0.2, + "learning_rate": 0.00026992971336736867, + "loss": 0.0752, "step": 31060 }, { - "epoch": 0.34, - "learning_rate": 0.00024959114803037183, - "loss": 0.0725, + "epoch": 0.2, + "learning_rate": 0.0002699200320130117, + "loss": 0.0675, "step": 31070 }, { - "epoch": 0.34, - "learning_rate": 0.0002495749237458628, - "loss": 0.0679, + "epoch": 0.2, + "learning_rate": 0.0002699103506586548, + "loss": 0.0761, "step": 31080 }, { - "epoch": 0.34, - "learning_rate": 0.00024955869946135373, - "loss": 0.0709, + "epoch": 0.2, + "learning_rate": 0.00026990066930429786, + "loss": 0.0768, "step": 31090 }, { - "epoch": 0.34, - "learning_rate": 0.0002495424751768447, - "loss": 0.0609, + "epoch": 0.2, + "learning_rate": 0.00026989098794994094, + "loss": 0.0741, "step": 31100 }, { - "epoch": 0.34, - "learning_rate": 0.00024952625089233563, - "loss": 0.0694, + "epoch": 0.2, + "learning_rate": 0.00026988130659558396, + "loss": 0.0683, "step": 31110 }, { - "epoch": 0.34, - "learning_rate": 0.0002495100266078266, - "loss": 0.0649, + "epoch": 0.2, + "learning_rate": 0.00026987162524122704, + "loss": 0.0705, "step": 31120 }, { - "epoch": 0.34, - "learning_rate": 0.00024949380232331753, - "loss": 0.0654, + "epoch": 0.2, + "learning_rate": 0.0002698619438868701, + "loss": 0.08, "step": 31130 }, { - "epoch": 0.34, - "learning_rate": 0.00024947757803880845, - "loss": 0.0686, + "epoch": 0.2, + "learning_rate": 0.00026985226253251315, + "loss": 0.0717, "step": 31140 }, { - "epoch": 0.34, - "learning_rate": 0.00024946135375429943, - "loss": 0.0704, + "epoch": 0.2, + "learning_rate": 0.00026984258117815623, + "loss": 0.0788, "step": 31150 }, { - "epoch": 0.34, - "learning_rate": 0.00024944512946979035, - "loss": 0.0679, + "epoch": 0.2, + "learning_rate": 0.0002698328998237993, + "loss": 0.0708, "step": 31160 }, { - "epoch": 0.34, - "learning_rate": 0.00024942890518528133, - "loss": 0.0737, + "epoch": 0.2, + "learning_rate": 0.0002698232184694424, + "loss": 0.0685, "step": 31170 }, { - "epoch": 0.34, - "learning_rate": 0.00024941268090077225, - "loss": 0.0681, + "epoch": 0.2, + "learning_rate": 0.00026981353711508547, + "loss": 0.075, "step": 31180 }, { - "epoch": 0.34, - "learning_rate": 0.0002493964566162632, - "loss": 0.0648, + "epoch": 0.2, + "learning_rate": 0.00026980385576072855, + "loss": 0.0695, "step": 31190 }, { - "epoch": 0.34, - "learning_rate": 0.00024938023233175415, - "loss": 0.071, + "epoch": 0.2, + "learning_rate": 0.00026979417440637163, + "loss": 0.0659, "step": 31200 }, { - "epoch": 0.34, - "learning_rate": 0.0002493640080472451, - "loss": 0.0628, + "epoch": 0.2, + "learning_rate": 0.00026978449305201465, + "loss": 0.0763, "step": 31210 }, { - "epoch": 0.34, - "learning_rate": 0.00024934778376273605, - "loss": 0.0798, + "epoch": 0.2, + "learning_rate": 0.00026977481169765773, + "loss": 0.0822, "step": 31220 }, { - "epoch": 0.34, - "learning_rate": 0.000249331559478227, - "loss": 0.0653, + "epoch": 0.2, + "learning_rate": 0.0002697651303433008, + "loss": 0.0754, "step": 31230 }, { - "epoch": 0.34, - "learning_rate": 0.00024931533519371795, - "loss": 0.0879, + "epoch": 0.2, + "learning_rate": 0.0002697554489889439, + "loss": 0.0788, "step": 31240 }, { - "epoch": 0.34, - "learning_rate": 0.00024929911090920887, - "loss": 0.0714, + "epoch": 0.2, + "learning_rate": 0.0002697457676345869, + "loss": 0.0839, "step": 31250 }, { - "epoch": 0.34, - "learning_rate": 0.00024928288662469985, - "loss": 0.0765, + "epoch": 0.2, + "learning_rate": 0.00026973608628023, + "loss": 0.085, "step": 31260 }, { - "epoch": 0.34, - "learning_rate": 0.00024926666234019077, - "loss": 0.0718, + "epoch": 0.2, + "learning_rate": 0.0002697264049258731, + "loss": 0.0769, "step": 31270 }, { - "epoch": 0.34, - "learning_rate": 0.00024925043805568175, - "loss": 0.0626, + "epoch": 0.2, + "learning_rate": 0.0002697167235715161, + "loss": 0.0691, "step": 31280 }, { - "epoch": 0.34, - "learning_rate": 0.00024923421377117267, - "loss": 0.0681, + "epoch": 0.2, + "learning_rate": 0.0002697070422171592, + "loss": 0.0798, "step": 31290 }, { - "epoch": 0.34, - "learning_rate": 0.00024921798948666365, - "loss": 0.069, + "epoch": 0.2, + "learning_rate": 0.00026969736086280226, + "loss": 0.0861, "step": 31300 }, { - "epoch": 0.34, - "learning_rate": 0.00024920176520215457, - "loss": 0.0714, + "epoch": 0.2, + "learning_rate": 0.00026968767950844534, + "loss": 0.0684, "step": 31310 }, { - "epoch": 0.34, - "learning_rate": 0.0002491855409176455, - "loss": 0.0774, + "epoch": 0.2, + "learning_rate": 0.0002696779981540884, + "loss": 0.0747, "step": 31320 }, { - "epoch": 0.34, - "learning_rate": 0.00024916931663313647, - "loss": 0.0794, + "epoch": 0.2, + "learning_rate": 0.0002696683167997315, + "loss": 0.0752, "step": 31330 }, { - "epoch": 0.34, - "learning_rate": 0.0002491530923486274, - "loss": 0.0601, + "epoch": 0.2, + "learning_rate": 0.0002696586354453746, + "loss": 0.0856, "step": 31340 }, { - "epoch": 0.34, - "learning_rate": 0.00024913686806411837, - "loss": 0.0595, + "epoch": 0.2, + "learning_rate": 0.0002696489540910176, + "loss": 0.0886, "step": 31350 }, { - "epoch": 0.34, - "learning_rate": 0.0002491206437796093, - "loss": 0.0664, + "epoch": 0.2, + "learning_rate": 0.0002696392727366607, + "loss": 0.0745, "step": 31360 }, { - "epoch": 0.34, - "learning_rate": 0.0002491044194951002, - "loss": 0.0603, + "epoch": 0.2, + "learning_rate": 0.00026962959138230377, + "loss": 0.0814, "step": 31370 }, { - "epoch": 0.34, - "learning_rate": 0.0002490881952105912, - "loss": 0.0704, + "epoch": 0.2, + "learning_rate": 0.0002696199100279468, + "loss": 0.0708, "step": 31380 }, { - "epoch": 0.34, - "learning_rate": 0.0002490719709260821, - "loss": 0.0694, + "epoch": 0.2, + "learning_rate": 0.00026961022867358987, + "loss": 0.0724, "step": 31390 }, { - "epoch": 0.34, - "learning_rate": 0.0002490557466415731, - "loss": 0.0716, + "epoch": 0.2, + "learning_rate": 0.00026960054731923295, + "loss": 0.0766, "step": 31400 }, { - "epoch": 0.34, - "learning_rate": 0.000249039522357064, - "loss": 0.0704, + "epoch": 0.2, + "learning_rate": 0.00026959086596487603, + "loss": 0.0956, "step": 31410 }, { - "epoch": 0.34, - "learning_rate": 0.000249023298072555, - "loss": 0.062, + "epoch": 0.2, + "learning_rate": 0.00026958118461051906, + "loss": 0.0776, "step": 31420 }, { - "epoch": 0.34, - "learning_rate": 0.0002490070737880459, - "loss": 0.0672, + "epoch": 0.2, + "learning_rate": 0.00026957150325616214, + "loss": 0.0793, "step": 31430 }, { - "epoch": 0.34, - "learning_rate": 0.0002489908495035369, - "loss": 0.0654, + "epoch": 0.2, + "learning_rate": 0.0002695618219018052, + "loss": 0.0763, "step": 31440 }, { - "epoch": 0.34, - "learning_rate": 0.0002489746252190278, - "loss": 0.0843, + "epoch": 0.2, + "learning_rate": 0.0002695521405474483, + "loss": 0.0859, "step": 31450 }, { - "epoch": 0.34, - "learning_rate": 0.0002489584009345188, - "loss": 0.0752, + "epoch": 0.2, + "learning_rate": 0.0002695424591930914, + "loss": 0.0697, "step": 31460 }, { - "epoch": 0.34, - "learning_rate": 0.0002489421766500097, - "loss": 0.0717, + "epoch": 0.2, + "learning_rate": 0.00026953277783873446, + "loss": 0.0674, "step": 31470 }, { - "epoch": 0.34, - "learning_rate": 0.0002489259523655007, - "loss": 0.0741, + "epoch": 0.2, + "learning_rate": 0.00026952309648437754, + "loss": 0.0733, "step": 31480 }, { - "epoch": 0.34, - "learning_rate": 0.0002489097280809916, - "loss": 0.0636, + "epoch": 0.2, + "learning_rate": 0.00026951341513002056, + "loss": 0.0675, "step": 31490 }, { - "epoch": 0.34, - "learning_rate": 0.0002488935037964826, - "loss": 0.0684, + "epoch": 0.2, + "learning_rate": 0.00026950373377566364, + "loss": 0.0746, "step": 31500 }, { - "epoch": 0.34, - "learning_rate": 0.0002488772795119735, - "loss": 0.0633, + "epoch": 0.2, + "learning_rate": 0.0002694940524213067, + "loss": 0.0797, "step": 31510 }, { - "epoch": 0.34, - "learning_rate": 0.00024886105522746444, - "loss": 0.0696, + "epoch": 0.2, + "learning_rate": 0.00026948437106694975, + "loss": 0.0744, "step": 31520 }, { - "epoch": 0.34, - "learning_rate": 0.0002488448309429554, - "loss": 0.0599, + "epoch": 0.2, + "learning_rate": 0.0002694746897125928, + "loss": 0.0713, "step": 31530 }, { - "epoch": 0.34, - "learning_rate": 0.00024882860665844633, - "loss": 0.0665, + "epoch": 0.2, + "learning_rate": 0.0002694650083582359, + "loss": 0.0861, "step": 31540 }, { - "epoch": 0.34, - "learning_rate": 0.00024881238237393726, - "loss": 0.0681, + "epoch": 0.2, + "learning_rate": 0.000269455327003879, + "loss": 0.0789, "step": 31550 }, { - "epoch": 0.34, - "learning_rate": 0.00024879615808942823, - "loss": 0.0692, + "epoch": 0.2, + "learning_rate": 0.000269445645649522, + "loss": 0.0719, "step": 31560 }, { - "epoch": 0.34, - "learning_rate": 0.00024877993380491916, - "loss": 0.0696, + "epoch": 0.2, + "learning_rate": 0.0002694359642951651, + "loss": 0.0753, "step": 31570 }, { - "epoch": 0.34, - "learning_rate": 0.00024876370952041013, - "loss": 0.0628, + "epoch": 0.2, + "learning_rate": 0.00026942628294080817, + "loss": 0.0907, "step": 31580 }, { - "epoch": 0.34, - "learning_rate": 0.00024874748523590106, - "loss": 0.0595, + "epoch": 0.2, + "learning_rate": 0.00026941660158645125, + "loss": 0.0691, "step": 31590 }, { - "epoch": 0.34, - "learning_rate": 0.00024873126095139203, - "loss": 0.063, + "epoch": 0.2, + "learning_rate": 0.00026940692023209433, + "loss": 0.0698, "step": 31600 }, { - "epoch": 0.34, - "learning_rate": 0.00024871503666688296, - "loss": 0.065, + "epoch": 0.2, + "learning_rate": 0.0002693972388777374, + "loss": 0.0776, "step": 31610 }, { - "epoch": 0.34, - "learning_rate": 0.00024869881238237393, - "loss": 0.0788, + "epoch": 0.2, + "learning_rate": 0.00026938755752338044, + "loss": 0.0746, "step": 31620 }, { - "epoch": 0.34, - "learning_rate": 0.00024868258809786486, - "loss": 0.0655, + "epoch": 0.2, + "learning_rate": 0.0002693778761690235, + "loss": 0.0763, "step": 31630 }, { - "epoch": 0.34, - "learning_rate": 0.00024866636381335583, - "loss": 0.057, + "epoch": 0.2, + "learning_rate": 0.0002693681948146666, + "loss": 0.0763, "step": 31640 }, { - "epoch": 0.34, - "learning_rate": 0.00024865013952884676, - "loss": 0.0638, + "epoch": 0.2, + "learning_rate": 0.0002693585134603096, + "loss": 0.0739, "step": 31650 }, { - "epoch": 0.34, - "learning_rate": 0.00024863391524433773, - "loss": 0.0623, + "epoch": 0.2, + "learning_rate": 0.0002693488321059527, + "loss": 0.0714, "step": 31660 }, { - "epoch": 0.34, - "learning_rate": 0.00024861769095982865, - "loss": 0.0685, + "epoch": 0.2, + "learning_rate": 0.0002693391507515958, + "loss": 0.0714, "step": 31670 }, { - "epoch": 0.34, - "learning_rate": 0.00024860146667531963, - "loss": 0.0704, + "epoch": 0.2, + "learning_rate": 0.00026932946939723886, + "loss": 0.0779, "step": 31680 }, { - "epoch": 0.34, - "learning_rate": 0.00024858524239081055, - "loss": 0.0642, + "epoch": 0.2, + "learning_rate": 0.00026931978804288194, + "loss": 0.0704, "step": 31690 }, { - "epoch": 0.34, - "learning_rate": 0.0002485690181063015, - "loss": 0.0683, + "epoch": 0.2, + "learning_rate": 0.00026931010668852497, + "loss": 0.0718, "step": 31700 }, { - "epoch": 0.34, - "learning_rate": 0.00024855279382179245, - "loss": 0.0678, + "epoch": 0.2, + "learning_rate": 0.00026930042533416805, + "loss": 0.0812, "step": 31710 }, { - "epoch": 0.34, - "learning_rate": 0.0002485365695372834, - "loss": 0.0634, + "epoch": 0.2, + "learning_rate": 0.0002692907439798111, + "loss": 0.0689, "step": 31720 }, { - "epoch": 0.34, - "learning_rate": 0.0002485203452527743, - "loss": 0.0601, + "epoch": 0.2, + "learning_rate": 0.0002692810626254542, + "loss": 0.0772, "step": 31730 }, { - "epoch": 0.34, - "learning_rate": 0.0002485041209682653, - "loss": 0.0631, + "epoch": 0.2, + "learning_rate": 0.0002692713812710973, + "loss": 0.0735, "step": 31740 }, { - "epoch": 0.34, - "learning_rate": 0.0002484878966837562, - "loss": 0.0659, + "epoch": 0.2, + "learning_rate": 0.0002692616999167403, + "loss": 0.078, "step": 31750 }, { - "epoch": 0.34, - "learning_rate": 0.0002484716723992472, - "loss": 0.0679, + "epoch": 0.2, + "learning_rate": 0.0002692520185623834, + "loss": 0.0779, "step": 31760 }, { - "epoch": 0.34, - "learning_rate": 0.0002484554481147381, - "loss": 0.0697, + "epoch": 0.21, + "learning_rate": 0.00026924233720802647, + "loss": 0.0795, "step": 31770 }, { - "epoch": 0.34, - "learning_rate": 0.0002484392238302291, - "loss": 0.0709, + "epoch": 0.21, + "learning_rate": 0.0002692326558536695, + "loss": 0.0859, "step": 31780 }, { - "epoch": 0.34, - "learning_rate": 0.00024842299954572, - "loss": 0.0651, + "epoch": 0.21, + "learning_rate": 0.0002692229744993126, + "loss": 0.0771, "step": 31790 }, { - "epoch": 0.34, - "learning_rate": 0.000248406775261211, - "loss": 0.0692, + "epoch": 0.21, + "learning_rate": 0.00026921329314495566, + "loss": 0.0815, "step": 31800 }, { - "epoch": 0.34, - "learning_rate": 0.0002483905509767019, - "loss": 0.0625, + "epoch": 0.21, + "learning_rate": 0.00026920361179059874, + "loss": 0.0811, "step": 31810 }, { - "epoch": 0.34, - "learning_rate": 0.0002483743266921929, - "loss": 0.0672, + "epoch": 0.21, + "learning_rate": 0.0002691939304362418, + "loss": 0.0766, "step": 31820 }, { - "epoch": 0.34, - "learning_rate": 0.0002483581024076838, - "loss": 0.0675, + "epoch": 0.21, + "learning_rate": 0.0002691842490818849, + "loss": 0.0776, "step": 31830 }, { - "epoch": 0.34, - "learning_rate": 0.0002483418781231748, - "loss": 0.0747, + "epoch": 0.21, + "learning_rate": 0.0002691745677275279, + "loss": 0.0717, "step": 31840 }, { - "epoch": 0.34, - "learning_rate": 0.0002483256538386657, - "loss": 0.0651, + "epoch": 0.21, + "learning_rate": 0.000269164886373171, + "loss": 0.0741, "step": 31850 }, { - "epoch": 0.34, - "learning_rate": 0.0002483094295541567, - "loss": 0.0925, + "epoch": 0.21, + "learning_rate": 0.0002691552050188141, + "loss": 0.079, "step": 31860 }, { - "epoch": 0.34, - "learning_rate": 0.0002482932052696476, - "loss": 0.0683, + "epoch": 0.21, + "learning_rate": 0.00026914552366445716, + "loss": 0.0749, "step": 31870 }, { - "epoch": 0.34, - "learning_rate": 0.0002482769809851385, - "loss": 0.0651, + "epoch": 0.21, + "learning_rate": 0.00026913584231010024, + "loss": 0.0799, "step": 31880 }, { - "epoch": 0.34, - "learning_rate": 0.0002482607567006295, - "loss": 0.075, + "epoch": 0.21, + "learning_rate": 0.00026912616095574327, + "loss": 0.0693, "step": 31890 }, { - "epoch": 0.35, - "learning_rate": 0.0002482445324161204, - "loss": 0.066, + "epoch": 0.21, + "learning_rate": 0.00026911647960138635, + "loss": 0.0784, "step": 31900 }, { - "epoch": 0.35, - "learning_rate": 0.00024822830813161134, - "loss": 0.0712, + "epoch": 0.21, + "learning_rate": 0.0002691067982470294, + "loss": 0.0743, "step": 31910 }, { - "epoch": 0.35, - "learning_rate": 0.0002482120838471023, - "loss": 0.0655, + "epoch": 0.21, + "learning_rate": 0.00026909711689267245, + "loss": 0.0672, "step": 31920 }, { - "epoch": 0.35, - "learning_rate": 0.00024819585956259324, - "loss": 0.0691, + "epoch": 0.21, + "learning_rate": 0.00026908743553831553, + "loss": 0.0776, "step": 31930 }, { - "epoch": 0.35, - "learning_rate": 0.0002481796352780842, - "loss": 0.0647, + "epoch": 0.21, + "learning_rate": 0.0002690777541839586, + "loss": 0.0736, "step": 31940 }, { - "epoch": 0.35, - "learning_rate": 0.00024816341099357514, - "loss": 0.0646, + "epoch": 0.21, + "learning_rate": 0.0002690680728296017, + "loss": 0.0712, "step": 31950 }, { - "epoch": 0.35, - "learning_rate": 0.0002481471867090661, - "loss": 0.0735, + "epoch": 0.21, + "learning_rate": 0.00026905839147524477, + "loss": 0.0761, "step": 31960 }, { - "epoch": 0.35, - "learning_rate": 0.00024813096242455704, - "loss": 0.0698, + "epoch": 0.21, + "learning_rate": 0.00026904871012088785, + "loss": 0.0782, "step": 31970 }, { - "epoch": 0.35, - "learning_rate": 0.000248114738140048, - "loss": 0.077, + "epoch": 0.21, + "learning_rate": 0.0002690390287665309, + "loss": 0.0872, "step": 31980 }, { - "epoch": 0.35, - "learning_rate": 0.00024809851385553894, - "loss": 0.0643, + "epoch": 0.21, + "learning_rate": 0.00026902934741217395, + "loss": 0.0729, "step": 31990 }, { - "epoch": 0.35, - "learning_rate": 0.0002480822895710299, - "loss": 0.0633, + "epoch": 0.21, + "learning_rate": 0.00026901966605781703, + "loss": 0.0764, "step": 32000 }, { - "epoch": 0.35, - "eval_cer": 0.9212753626261395, - "eval_loss": 0.04725624993443489, - "eval_runtime": 119.2878, - "eval_samples_per_second": 16.766, - "eval_steps_per_second": 4.192, + "epoch": 0.21, + "eval_cer": 0.9201102700259858, + "eval_loss": 0.05101795867085457, + "eval_runtime": 120.5294, + "eval_samples_per_second": 16.593, + "eval_steps_per_second": 4.148, "step": 32000 }, { - "epoch": 0.35, - "learning_rate": 0.00024806606528652084, - "loss": 0.0669, + "epoch": 0.21, + "learning_rate": 0.0002690099847034601, + "loss": 0.0842, "step": 32010 }, { - "epoch": 0.35, - "learning_rate": 0.0002480498410020118, - "loss": 0.07, + "epoch": 0.21, + "learning_rate": 0.00026900030334910314, + "loss": 0.0764, "step": 32020 }, { - "epoch": 0.35, - "learning_rate": 0.00024803361671750274, - "loss": 0.0695, + "epoch": 0.21, + "learning_rate": 0.0002689906219947462, + "loss": 0.0696, "step": 32030 }, { - "epoch": 0.35, - "learning_rate": 0.0002480173924329937, - "loss": 0.062, + "epoch": 0.21, + "learning_rate": 0.0002689809406403893, + "loss": 0.0819, "step": 32040 }, { - "epoch": 0.35, - "learning_rate": 0.00024800116814848464, - "loss": 0.0704, + "epoch": 0.21, + "learning_rate": 0.0002689712592860323, + "loss": 0.0687, "step": 32050 }, { - "epoch": 0.35, - "learning_rate": 0.00024798494386397556, - "loss": 0.0757, + "epoch": 0.21, + "learning_rate": 0.0002689615779316754, + "loss": 0.0786, "step": 32060 }, { - "epoch": 0.35, - "learning_rate": 0.00024796871957946654, - "loss": 0.0698, + "epoch": 0.21, + "learning_rate": 0.0002689518965773185, + "loss": 0.0714, "step": 32070 }, { - "epoch": 0.35, - "learning_rate": 0.00024795249529495746, - "loss": 0.0631, + "epoch": 0.21, + "learning_rate": 0.00026894221522296156, + "loss": 0.074, "step": 32080 }, { - "epoch": 0.35, - "learning_rate": 0.0002479362710104484, - "loss": 0.0585, + "epoch": 0.21, + "learning_rate": 0.00026893253386860464, + "loss": 0.0682, "step": 32090 }, { - "epoch": 0.35, - "learning_rate": 0.00024792004672593936, - "loss": 0.0753, + "epoch": 0.21, + "learning_rate": 0.0002689228525142477, + "loss": 0.0767, "step": 32100 }, { - "epoch": 0.35, - "learning_rate": 0.0002479038224414303, - "loss": 0.0703, + "epoch": 0.21, + "learning_rate": 0.0002689131711598908, + "loss": 0.0696, "step": 32110 }, { - "epoch": 0.35, - "learning_rate": 0.00024788759815692126, - "loss": 0.0675, + "epoch": 0.21, + "learning_rate": 0.00026890348980553383, + "loss": 0.0678, "step": 32120 }, { - "epoch": 0.35, - "learning_rate": 0.0002478713738724122, - "loss": 0.0705, + "epoch": 0.21, + "learning_rate": 0.0002688938084511769, + "loss": 0.0701, "step": 32130 }, { - "epoch": 0.35, - "learning_rate": 0.00024785514958790316, - "loss": 0.0631, + "epoch": 0.21, + "learning_rate": 0.00026888412709682, + "loss": 0.0752, "step": 32140 }, { - "epoch": 0.35, - "learning_rate": 0.0002478389253033941, - "loss": 0.0673, + "epoch": 0.21, + "learning_rate": 0.000268874445742463, + "loss": 0.0761, "step": 32150 }, { - "epoch": 0.35, - "learning_rate": 0.00024782270101888506, - "loss": 0.0626, + "epoch": 0.21, + "learning_rate": 0.0002688647643881061, + "loss": 0.0637, "step": 32160 }, { - "epoch": 0.35, - "learning_rate": 0.000247806476734376, - "loss": 0.0631, + "epoch": 0.21, + "learning_rate": 0.0002688550830337492, + "loss": 0.0762, "step": 32170 }, { - "epoch": 0.35, - "learning_rate": 0.00024779025244986696, - "loss": 0.0648, + "epoch": 0.21, + "learning_rate": 0.00026884540167939225, + "loss": 0.0688, "step": 32180 }, { - "epoch": 0.35, - "learning_rate": 0.0002477740281653579, - "loss": 0.0679, + "epoch": 0.21, + "learning_rate": 0.0002688357203250353, + "loss": 0.0734, "step": 32190 }, { - "epoch": 0.35, - "learning_rate": 0.00024775780388084886, - "loss": 0.0676, + "epoch": 0.21, + "learning_rate": 0.00026882603897067836, + "loss": 0.074, "step": 32200 }, { - "epoch": 0.35, - "learning_rate": 0.0002477415795963398, - "loss": 0.0638, + "epoch": 0.21, + "learning_rate": 0.00026881635761632144, + "loss": 0.0748, "step": 32210 }, { - "epoch": 0.35, - "learning_rate": 0.00024772535531183076, - "loss": 0.0671, + "epoch": 0.21, + "learning_rate": 0.0002688066762619645, + "loss": 0.0675, "step": 32220 }, { - "epoch": 0.35, - "learning_rate": 0.0002477091310273217, - "loss": 0.0654, + "epoch": 0.21, + "learning_rate": 0.0002687969949076076, + "loss": 0.0773, "step": 32230 }, { - "epoch": 0.35, - "learning_rate": 0.0002476929067428126, - "loss": 0.0675, + "epoch": 0.21, + "learning_rate": 0.0002687873135532507, + "loss": 0.0738, "step": 32240 }, { - "epoch": 0.35, - "learning_rate": 0.0002476766824583036, - "loss": 0.0722, + "epoch": 0.21, + "learning_rate": 0.00026877763219889376, + "loss": 0.0847, "step": 32250 }, { - "epoch": 0.35, - "learning_rate": 0.0002476604581737945, - "loss": 0.0759, + "epoch": 0.21, + "learning_rate": 0.0002687679508445368, + "loss": 0.0657, "step": 32260 }, { - "epoch": 0.35, - "learning_rate": 0.0002476442338892854, - "loss": 0.0648, + "epoch": 0.21, + "learning_rate": 0.00026875826949017986, + "loss": 0.0888, "step": 32270 }, { - "epoch": 0.35, - "learning_rate": 0.0002476280096047764, - "loss": 0.0659, + "epoch": 0.21, + "learning_rate": 0.00026874858813582294, + "loss": 0.0816, "step": 32280 }, { - "epoch": 0.35, - "learning_rate": 0.0002476117853202673, - "loss": 0.0676, + "epoch": 0.21, + "learning_rate": 0.00026873890678146597, + "loss": 0.0677, "step": 32290 }, { - "epoch": 0.35, - "learning_rate": 0.0002475955610357583, - "loss": 0.0747, + "epoch": 0.21, + "learning_rate": 0.00026872922542710905, + "loss": 0.0812, "step": 32300 }, { - "epoch": 0.35, - "learning_rate": 0.0002475793367512492, - "loss": 0.0706, + "epoch": 0.21, + "learning_rate": 0.00026871954407275213, + "loss": 0.082, "step": 32310 }, { - "epoch": 0.35, - "learning_rate": 0.0002475631124667402, - "loss": 0.0741, + "epoch": 0.21, + "learning_rate": 0.0002687098627183952, + "loss": 0.0716, "step": 32320 }, { - "epoch": 0.35, - "learning_rate": 0.0002475468881822311, - "loss": 0.0676, + "epoch": 0.21, + "learning_rate": 0.00026870018136403823, + "loss": 0.0752, "step": 32330 }, { - "epoch": 0.35, - "learning_rate": 0.0002475306638977221, - "loss": 0.0643, + "epoch": 0.21, + "learning_rate": 0.0002686905000096813, + "loss": 0.0759, "step": 32340 }, { - "epoch": 0.35, - "learning_rate": 0.000247514439613213, - "loss": 0.0606, + "epoch": 0.21, + "learning_rate": 0.0002686808186553244, + "loss": 0.0817, "step": 32350 }, { - "epoch": 0.35, - "learning_rate": 0.000247498215328704, - "loss": 0.073, + "epoch": 0.21, + "learning_rate": 0.0002686711373009675, + "loss": 0.0771, "step": 32360 }, { - "epoch": 0.35, - "learning_rate": 0.0002474819910441949, - "loss": 0.0666, + "epoch": 0.21, + "learning_rate": 0.00026866145594661055, + "loss": 0.0748, "step": 32370 }, { - "epoch": 0.35, - "learning_rate": 0.0002474657667596859, - "loss": 0.0721, + "epoch": 0.21, + "learning_rate": 0.00026865177459225363, + "loss": 0.0852, "step": 32380 }, { - "epoch": 0.35, - "learning_rate": 0.0002474495424751768, - "loss": 0.0724, + "epoch": 0.21, + "learning_rate": 0.00026864209323789666, + "loss": 0.074, "step": 32390 }, { - "epoch": 0.35, - "learning_rate": 0.0002474333181906678, - "loss": 0.0644, + "epoch": 0.21, + "learning_rate": 0.00026863241188353974, + "loss": 0.0686, "step": 32400 }, { - "epoch": 0.35, - "learning_rate": 0.0002474170939061587, - "loss": 0.0634, + "epoch": 0.21, + "learning_rate": 0.0002686227305291828, + "loss": 0.0771, "step": 32410 }, { - "epoch": 0.35, - "learning_rate": 0.00024740086962164964, - "loss": 0.0632, + "epoch": 0.21, + "learning_rate": 0.00026861304917482584, + "loss": 0.071, "step": 32420 }, { - "epoch": 0.35, - "learning_rate": 0.0002473846453371406, - "loss": 0.0676, + "epoch": 0.21, + "learning_rate": 0.0002686033678204689, + "loss": 0.0674, "step": 32430 }, { - "epoch": 0.35, - "learning_rate": 0.00024736842105263154, - "loss": 0.0734, + "epoch": 0.21, + "learning_rate": 0.000268593686466112, + "loss": 0.0728, "step": 32440 }, { - "epoch": 0.35, - "learning_rate": 0.00024735219676812247, - "loss": 0.0665, + "epoch": 0.21, + "learning_rate": 0.0002685840051117551, + "loss": 0.0703, "step": 32450 }, { - "epoch": 0.35, - "learning_rate": 0.00024733597248361344, - "loss": 0.0678, + "epoch": 0.21, + "learning_rate": 0.00026857432375739816, + "loss": 0.0761, "step": 32460 }, { - "epoch": 0.35, - "learning_rate": 0.00024731974819910437, - "loss": 0.0665, + "epoch": 0.21, + "learning_rate": 0.0002685646424030412, + "loss": 0.0734, "step": 32470 }, { - "epoch": 0.35, - "learning_rate": 0.00024730352391459534, - "loss": 0.0668, + "epoch": 0.21, + "learning_rate": 0.00026855496104868427, + "loss": 0.0733, "step": 32480 }, { - "epoch": 0.35, - "learning_rate": 0.00024728729963008626, - "loss": 0.0595, + "epoch": 0.21, + "learning_rate": 0.00026854527969432735, + "loss": 0.0773, "step": 32490 }, { - "epoch": 0.35, - "learning_rate": 0.00024727107534557724, - "loss": 0.0627, + "epoch": 0.21, + "learning_rate": 0.00026853559833997043, + "loss": 0.0741, "step": 32500 }, { - "epoch": 0.35, - "learning_rate": 0.00024725485106106816, - "loss": 0.0656, + "epoch": 0.21, + "learning_rate": 0.0002685259169856135, + "loss": 0.0712, "step": 32510 }, { - "epoch": 0.35, - "learning_rate": 0.00024723862677655914, - "loss": 0.0704, + "epoch": 0.21, + "learning_rate": 0.00026851623563125653, + "loss": 0.0743, "step": 32520 }, { - "epoch": 0.35, - "learning_rate": 0.00024722240249205006, - "loss": 0.0622, + "epoch": 0.21, + "learning_rate": 0.0002685065542768996, + "loss": 0.0747, "step": 32530 }, { - "epoch": 0.35, - "learning_rate": 0.00024720617820754104, - "loss": 0.0672, + "epoch": 0.21, + "learning_rate": 0.0002684968729225427, + "loss": 0.0778, "step": 32540 }, { - "epoch": 0.35, - "learning_rate": 0.00024718995392303196, - "loss": 0.0666, + "epoch": 0.21, + "learning_rate": 0.0002684871915681857, + "loss": 0.0709, "step": 32550 }, { - "epoch": 0.35, - "learning_rate": 0.00024717372963852294, - "loss": 0.0584, + "epoch": 0.21, + "learning_rate": 0.0002684775102138288, + "loss": 0.0802, "step": 32560 }, { - "epoch": 0.35, - "learning_rate": 0.00024715750535401386, - "loss": 0.0683, + "epoch": 0.21, + "learning_rate": 0.0002684678288594719, + "loss": 0.0811, "step": 32570 }, { - "epoch": 0.35, - "learning_rate": 0.00024714128106950484, - "loss": 0.0731, + "epoch": 0.21, + "learning_rate": 0.00026845814750511496, + "loss": 0.0812, "step": 32580 }, { - "epoch": 0.35, - "learning_rate": 0.00024712505678499576, - "loss": 0.0707, + "epoch": 0.21, + "learning_rate": 0.00026844846615075804, + "loss": 0.0709, "step": 32590 }, { - "epoch": 0.35, - "learning_rate": 0.0002471088325004867, - "loss": 0.0684, + "epoch": 0.21, + "learning_rate": 0.0002684387847964011, + "loss": 0.0788, "step": 32600 }, { - "epoch": 0.35, - "learning_rate": 0.00024709260821597766, - "loss": 0.0712, + "epoch": 0.21, + "learning_rate": 0.00026842910344204414, + "loss": 0.0733, "step": 32610 }, { - "epoch": 0.35, - "learning_rate": 0.0002470763839314686, - "loss": 0.0596, + "epoch": 0.21, + "learning_rate": 0.0002684194220876872, + "loss": 0.0817, "step": 32620 }, { - "epoch": 0.35, - "learning_rate": 0.0002470601596469595, - "loss": 0.0677, + "epoch": 0.21, + "learning_rate": 0.0002684097407333303, + "loss": 0.0931, "step": 32630 }, { - "epoch": 0.35, - "learning_rate": 0.0002470439353624505, - "loss": 0.0694, + "epoch": 0.21, + "learning_rate": 0.0002684000593789734, + "loss": 0.0763, "step": 32640 }, { - "epoch": 0.35, - "learning_rate": 0.0002470277110779414, - "loss": 0.0672, + "epoch": 0.21, + "learning_rate": 0.00026839037802461646, + "loss": 0.078, "step": 32650 }, { - "epoch": 0.35, - "learning_rate": 0.0002470114867934324, - "loss": 0.0645, + "epoch": 0.21, + "learning_rate": 0.0002683806966702595, + "loss": 0.066, "step": 32660 }, { - "epoch": 0.35, - "learning_rate": 0.0002469952625089233, - "loss": 0.0756, + "epoch": 0.21, + "learning_rate": 0.00026837101531590257, + "loss": 0.0834, "step": 32670 }, { - "epoch": 0.35, - "learning_rate": 0.0002469790382244143, - "loss": 0.0691, + "epoch": 0.21, + "learning_rate": 0.00026836133396154565, + "loss": 0.0702, "step": 32680 }, { - "epoch": 0.35, - "learning_rate": 0.0002469628139399052, - "loss": 0.0701, + "epoch": 0.21, + "learning_rate": 0.0002683516526071887, + "loss": 0.0711, "step": 32690 }, { - "epoch": 0.35, - "learning_rate": 0.0002469465896553962, - "loss": 0.0638, + "epoch": 0.21, + "learning_rate": 0.00026834197125283175, + "loss": 0.0741, "step": 32700 }, { - "epoch": 0.35, - "learning_rate": 0.0002469303653708871, - "loss": 0.0598, + "epoch": 0.21, + "learning_rate": 0.00026833228989847483, + "loss": 0.0725, "step": 32710 }, { - "epoch": 0.35, - "learning_rate": 0.0002469141410863781, - "loss": 0.0602, + "epoch": 0.21, + "learning_rate": 0.0002683226085441179, + "loss": 0.0812, "step": 32720 }, { - "epoch": 0.35, - "learning_rate": 0.000246897916801869, - "loss": 0.0662, + "epoch": 0.21, + "learning_rate": 0.000268312927189761, + "loss": 0.0792, "step": 32730 }, { - "epoch": 0.35, - "learning_rate": 0.00024688169251736, - "loss": 0.0742, + "epoch": 0.21, + "learning_rate": 0.00026830324583540407, + "loss": 0.0679, "step": 32740 }, { - "epoch": 0.35, - "learning_rate": 0.0002468654682328509, - "loss": 0.0665, + "epoch": 0.21, + "learning_rate": 0.0002682935644810471, + "loss": 0.0803, "step": 32750 }, { - "epoch": 0.35, - "learning_rate": 0.0002468492439483419, - "loss": 0.0875, + "epoch": 0.21, + "learning_rate": 0.0002682838831266902, + "loss": 0.0836, "step": 32760 }, { - "epoch": 0.35, - "learning_rate": 0.0002468330196638328, - "loss": 0.095, + "epoch": 0.21, + "learning_rate": 0.00026827420177233326, + "loss": 0.0763, "step": 32770 }, { - "epoch": 0.35, - "learning_rate": 0.0002468167953793237, - "loss": 0.0614, + "epoch": 0.21, + "learning_rate": 0.00026826452041797634, + "loss": 0.0756, "step": 32780 }, { - "epoch": 0.35, - "learning_rate": 0.0002468005710948147, - "loss": 0.0721, + "epoch": 0.21, + "learning_rate": 0.00026825483906361936, + "loss": 0.0774, "step": 32790 }, { - "epoch": 0.35, - "learning_rate": 0.0002467843468103056, - "loss": 0.0791, + "epoch": 0.21, + "learning_rate": 0.00026824515770926244, + "loss": 0.0734, "step": 32800 }, { - "epoch": 0.35, - "learning_rate": 0.00024676812252579655, - "loss": 0.0691, + "epoch": 0.21, + "learning_rate": 0.0002682354763549055, + "loss": 0.0778, "step": 32810 }, { - "epoch": 0.35, - "learning_rate": 0.0002467518982412875, - "loss": 0.0609, + "epoch": 0.21, + "learning_rate": 0.00026822579500054855, + "loss": 0.069, "step": 32820 }, { - "epoch": 0.36, - "learning_rate": 0.00024673567395677845, - "loss": 0.0733, + "epoch": 0.21, + "learning_rate": 0.00026821611364619163, + "loss": 0.084, "step": 32830 }, { - "epoch": 0.36, - "learning_rate": 0.0002467194496722694, - "loss": 0.0723, + "epoch": 0.21, + "learning_rate": 0.0002682064322918347, + "loss": 0.0795, "step": 32840 }, { - "epoch": 0.36, - "learning_rate": 0.00024670322538776035, - "loss": 0.0752, + "epoch": 0.21, + "learning_rate": 0.0002681967509374778, + "loss": 0.0684, "step": 32850 }, { - "epoch": 0.36, - "learning_rate": 0.0002466870011032513, - "loss": 0.0761, + "epoch": 0.21, + "learning_rate": 0.00026818706958312087, + "loss": 0.0713, "step": 32860 }, { - "epoch": 0.36, - "learning_rate": 0.0002466707768187423, - "loss": 0.071, + "epoch": 0.21, + "learning_rate": 0.00026817738822876395, + "loss": 0.0737, "step": 32870 }, { - "epoch": 0.36, - "learning_rate": 0.0002466545525342332, - "loss": 0.0794, + "epoch": 0.21, + "learning_rate": 0.000268167706874407, + "loss": 0.077, "step": 32880 }, { - "epoch": 0.36, - "learning_rate": 0.0002466383282497242, - "loss": 0.0633, + "epoch": 0.21, + "learning_rate": 0.00026815802552005005, + "loss": 0.079, "step": 32890 }, { - "epoch": 0.36, - "learning_rate": 0.0002466221039652151, - "loss": 0.062, + "epoch": 0.21, + "learning_rate": 0.00026814834416569313, + "loss": 0.0692, "step": 32900 }, { - "epoch": 0.36, - "learning_rate": 0.0002466058796807061, - "loss": 0.0843, + "epoch": 0.21, + "learning_rate": 0.0002681386628113362, + "loss": 0.0676, "step": 32910 }, { - "epoch": 0.36, - "learning_rate": 0.000246589655396197, - "loss": 0.0729, + "epoch": 0.21, + "learning_rate": 0.00026812898145697924, + "loss": 0.085, "step": 32920 }, { - "epoch": 0.36, - "learning_rate": 0.00024657343111168795, - "loss": 0.0655, + "epoch": 0.21, + "learning_rate": 0.0002681193001026223, + "loss": 0.0699, "step": 32930 }, { - "epoch": 0.36, - "learning_rate": 0.0002465572068271789, - "loss": 0.0611, + "epoch": 0.21, + "learning_rate": 0.0002681096187482654, + "loss": 0.0738, "step": 32940 }, { - "epoch": 0.36, - "learning_rate": 0.00024654098254266985, - "loss": 0.0679, + "epoch": 0.21, + "learning_rate": 0.0002680999373939085, + "loss": 0.0745, "step": 32950 }, { - "epoch": 0.36, - "learning_rate": 0.00024652475825816077, - "loss": 0.0691, + "epoch": 0.21, + "learning_rate": 0.0002680902560395515, + "loss": 0.089, "step": 32960 }, { - "epoch": 0.36, - "learning_rate": 0.00024650853397365175, - "loss": 0.0656, + "epoch": 0.21, + "learning_rate": 0.0002680805746851946, + "loss": 0.0745, "step": 32970 }, { - "epoch": 0.36, - "learning_rate": 0.00024649230968914267, - "loss": 0.0681, + "epoch": 0.21, + "learning_rate": 0.00026807089333083766, + "loss": 0.0806, "step": 32980 }, { - "epoch": 0.36, - "learning_rate": 0.00024647608540463364, - "loss": 0.0688, + "epoch": 0.21, + "learning_rate": 0.00026806121197648074, + "loss": 0.0702, "step": 32990 }, { - "epoch": 0.36, - "learning_rate": 0.00024645986112012457, - "loss": 0.0732, + "epoch": 0.21, + "learning_rate": 0.0002680515306221238, + "loss": 0.0741, "step": 33000 }, { - "epoch": 0.36, - "eval_cer": 0.9213460413718038, - "eval_loss": 0.04550056532025337, - "eval_runtime": 119.2971, - "eval_samples_per_second": 16.765, - "eval_steps_per_second": 4.191, + "epoch": 0.21, + "eval_cer": 0.9201437125748503, + "eval_loss": 0.049433525651693344, + "eval_runtime": 120.4106, + "eval_samples_per_second": 16.61, + "eval_steps_per_second": 4.152, "step": 33000 }, { - "epoch": 0.36, - "learning_rate": 0.00024644363683561554, - "loss": 0.0643, + "epoch": 0.21, + "learning_rate": 0.0002680418492677669, + "loss": 0.0794, "step": 33010 }, { - "epoch": 0.36, - "learning_rate": 0.00024642741255110647, - "loss": 0.0651, + "epoch": 0.21, + "learning_rate": 0.00026803216791341, + "loss": 0.0753, "step": 33020 }, { - "epoch": 0.36, - "learning_rate": 0.00024641118826659744, - "loss": 0.0699, + "epoch": 0.21, + "learning_rate": 0.000268022486559053, + "loss": 0.0753, "step": 33030 }, { - "epoch": 0.36, - "learning_rate": 0.00024639496398208837, - "loss": 0.0699, + "epoch": 0.21, + "learning_rate": 0.0002680128052046961, + "loss": 0.074, "step": 33040 }, { - "epoch": 0.36, - "learning_rate": 0.00024637873969757934, - "loss": 0.0623, + "epoch": 0.21, + "learning_rate": 0.00026800312385033917, + "loss": 0.066, "step": 33050 }, { - "epoch": 0.36, - "learning_rate": 0.00024636251541307027, - "loss": 0.0681, + "epoch": 0.21, + "learning_rate": 0.0002679934424959822, + "loss": 0.0765, "step": 33060 }, { - "epoch": 0.36, - "learning_rate": 0.00024634629112856124, - "loss": 0.0656, + "epoch": 0.21, + "learning_rate": 0.00026798376114162527, + "loss": 0.0811, "step": 33070 }, { - "epoch": 0.36, - "learning_rate": 0.00024633006684405217, - "loss": 0.069, + "epoch": 0.21, + "learning_rate": 0.00026797407978726835, + "loss": 0.0691, "step": 33080 }, { - "epoch": 0.36, - "learning_rate": 0.00024631384255954314, - "loss": 0.0576, + "epoch": 0.21, + "learning_rate": 0.00026796439843291143, + "loss": 0.0801, "step": 33090 }, { - "epoch": 0.36, - "learning_rate": 0.00024629761827503407, - "loss": 0.0775, + "epoch": 0.21, + "learning_rate": 0.00026795471707855446, + "loss": 0.0712, "step": 33100 }, { - "epoch": 0.36, - "learning_rate": 0.000246281393990525, - "loss": 0.0638, + "epoch": 0.21, + "learning_rate": 0.00026794503572419754, + "loss": 0.079, "step": 33110 }, { - "epoch": 0.36, - "learning_rate": 0.00024626516970601596, - "loss": 0.0709, + "epoch": 0.21, + "learning_rate": 0.0002679353543698406, + "loss": 0.0702, "step": 33120 }, { - "epoch": 0.36, - "learning_rate": 0.0002462489454215069, - "loss": 0.0636, + "epoch": 0.21, + "learning_rate": 0.0002679256730154837, + "loss": 0.0701, "step": 33130 }, { - "epoch": 0.36, - "learning_rate": 0.0002462327211369978, - "loss": 0.0695, + "epoch": 0.21, + "learning_rate": 0.0002679159916611268, + "loss": 0.072, "step": 33140 }, { - "epoch": 0.36, - "learning_rate": 0.0002462164968524888, - "loss": 0.0591, + "epoch": 0.21, + "learning_rate": 0.00026790631030676986, + "loss": 0.0775, "step": 33150 }, { - "epoch": 0.36, - "learning_rate": 0.0002462002725679797, - "loss": 0.0638, + "epoch": 0.21, + "learning_rate": 0.0002678966289524129, + "loss": 0.0811, "step": 33160 }, { - "epoch": 0.36, - "learning_rate": 0.0002461840482834707, - "loss": 0.0646, + "epoch": 0.21, + "learning_rate": 0.00026788694759805596, + "loss": 0.0714, "step": 33170 }, { - "epoch": 0.36, - "learning_rate": 0.0002461678239989616, - "loss": 0.0657, + "epoch": 0.21, + "learning_rate": 0.00026787726624369904, + "loss": 0.0799, "step": 33180 }, { - "epoch": 0.36, - "learning_rate": 0.0002461515997144526, - "loss": 0.0598, + "epoch": 0.21, + "learning_rate": 0.00026786758488934207, + "loss": 0.0737, "step": 33190 }, { - "epoch": 0.36, - "learning_rate": 0.0002461353754299435, - "loss": 0.0705, + "epoch": 0.21, + "learning_rate": 0.00026785790353498515, + "loss": 0.0693, "step": 33200 }, { - "epoch": 0.36, - "learning_rate": 0.0002461191511454345, - "loss": 0.0646, + "epoch": 0.21, + "learning_rate": 0.0002678482221806282, + "loss": 0.0783, "step": 33210 }, { - "epoch": 0.36, - "learning_rate": 0.0002461029268609254, - "loss": 0.0716, + "epoch": 0.21, + "learning_rate": 0.0002678385408262713, + "loss": 0.077, "step": 33220 }, { - "epoch": 0.36, - "learning_rate": 0.0002460867025764164, - "loss": 0.0777, + "epoch": 0.21, + "learning_rate": 0.0002678288594719144, + "loss": 0.071, "step": 33230 }, { - "epoch": 0.36, - "learning_rate": 0.0002460704782919073, - "loss": 0.0754, + "epoch": 0.21, + "learning_rate": 0.0002678191781175574, + "loss": 0.078, "step": 33240 }, { - "epoch": 0.36, - "learning_rate": 0.0002460542540073983, - "loss": 0.0694, + "epoch": 0.21, + "learning_rate": 0.0002678094967632005, + "loss": 0.0681, "step": 33250 }, { - "epoch": 0.36, - "learning_rate": 0.0002460380297228892, - "loss": 0.0694, + "epoch": 0.21, + "learning_rate": 0.00026779981540884357, + "loss": 0.0762, "step": 33260 }, { - "epoch": 0.36, - "learning_rate": 0.0002460218054383802, - "loss": 0.0701, + "epoch": 0.21, + "learning_rate": 0.00026779013405448665, + "loss": 0.0736, "step": 33270 }, { - "epoch": 0.36, - "learning_rate": 0.0002460055811538711, - "loss": 0.0635, + "epoch": 0.21, + "learning_rate": 0.00026778045270012973, + "loss": 0.0774, "step": 33280 }, { - "epoch": 0.36, - "learning_rate": 0.00024598935686936203, - "loss": 0.0642, + "epoch": 0.21, + "learning_rate": 0.0002677707713457728, + "loss": 0.0747, "step": 33290 }, { - "epoch": 0.36, - "learning_rate": 0.000245973132584853, - "loss": 0.0763, + "epoch": 0.21, + "learning_rate": 0.00026776108999141584, + "loss": 0.0739, "step": 33300 }, { - "epoch": 0.36, - "learning_rate": 0.00024595690830034393, - "loss": 0.0654, + "epoch": 0.21, + "learning_rate": 0.0002677514086370589, + "loss": 0.0762, "step": 33310 }, { - "epoch": 0.36, - "learning_rate": 0.00024594068401583485, - "loss": 0.0597, + "epoch": 0.22, + "learning_rate": 0.00026774172728270194, + "loss": 0.0764, "step": 33320 }, { - "epoch": 0.36, - "learning_rate": 0.00024592445973132583, - "loss": 0.0648, + "epoch": 0.22, + "learning_rate": 0.000267732045928345, + "loss": 0.0755, "step": 33330 }, { - "epoch": 0.36, - "learning_rate": 0.00024590823544681675, - "loss": 0.064, + "epoch": 0.22, + "learning_rate": 0.0002677223645739881, + "loss": 0.0848, "step": 33340 }, { - "epoch": 0.36, - "learning_rate": 0.00024589201116230773, - "loss": 0.0586, + "epoch": 0.22, + "learning_rate": 0.0002677126832196312, + "loss": 0.0733, "step": 33350 }, { - "epoch": 0.36, - "learning_rate": 0.00024587578687779865, - "loss": 0.0704, + "epoch": 0.22, + "learning_rate": 0.00026770300186527426, + "loss": 0.0696, "step": 33360 }, { - "epoch": 0.36, - "learning_rate": 0.00024585956259328963, - "loss": 0.0635, + "epoch": 0.22, + "learning_rate": 0.00026769332051091734, + "loss": 0.0724, "step": 33370 }, { - "epoch": 0.36, - "learning_rate": 0.00024584333830878055, - "loss": 0.0612, + "epoch": 0.22, + "learning_rate": 0.00026768363915656037, + "loss": 0.0797, "step": 33380 }, { - "epoch": 0.36, - "learning_rate": 0.00024582711402427153, - "loss": 0.0644, + "epoch": 0.22, + "learning_rate": 0.00026767395780220345, + "loss": 0.0715, "step": 33390 }, { - "epoch": 0.36, - "learning_rate": 0.00024581088973976245, - "loss": 0.0606, + "epoch": 0.22, + "learning_rate": 0.0002676642764478465, + "loss": 0.072, "step": 33400 }, { - "epoch": 0.36, - "learning_rate": 0.0002457946654552534, - "loss": 0.0687, + "epoch": 0.22, + "learning_rate": 0.0002676545950934896, + "loss": 0.071, "step": 33410 }, { - "epoch": 0.36, - "learning_rate": 0.00024577844117074435, - "loss": 0.0629, + "epoch": 0.22, + "learning_rate": 0.0002676449137391327, + "loss": 0.0735, "step": 33420 }, { - "epoch": 0.36, - "learning_rate": 0.0002457622168862353, - "loss": 0.0663, + "epoch": 0.22, + "learning_rate": 0.0002676352323847757, + "loss": 0.0662, "step": 33430 }, { - "epoch": 0.36, - "learning_rate": 0.00024574599260172625, - "loss": 0.0597, + "epoch": 0.22, + "learning_rate": 0.0002676255510304188, + "loss": 0.074, "step": 33440 }, { - "epoch": 0.36, - "learning_rate": 0.0002457297683172172, - "loss": 0.0697, + "epoch": 0.22, + "learning_rate": 0.00026761586967606187, + "loss": 0.0805, "step": 33450 }, { - "epoch": 0.36, - "learning_rate": 0.00024571354403270815, - "loss": 0.072, + "epoch": 0.22, + "learning_rate": 0.0002676061883217049, + "loss": 0.0646, "step": 33460 }, { - "epoch": 0.36, - "learning_rate": 0.00024569731974819907, - "loss": 0.0738, + "epoch": 0.22, + "learning_rate": 0.000267596506967348, + "loss": 0.0728, "step": 33470 }, { - "epoch": 0.36, - "learning_rate": 0.00024568109546369005, - "loss": 0.0627, + "epoch": 0.22, + "learning_rate": 0.00026758682561299105, + "loss": 0.0695, "step": 33480 }, { - "epoch": 0.36, - "learning_rate": 0.00024566487117918097, - "loss": 0.0649, + "epoch": 0.22, + "learning_rate": 0.00026757714425863413, + "loss": 0.0683, "step": 33490 }, { - "epoch": 0.36, - "learning_rate": 0.0002456486468946719, - "loss": 0.0599, + "epoch": 0.22, + "learning_rate": 0.0002675674629042772, + "loss": 0.0756, "step": 33500 }, { - "epoch": 0.36, - "learning_rate": 0.00024563242261016287, - "loss": 0.0768, + "epoch": 0.22, + "learning_rate": 0.0002675577815499203, + "loss": 0.0767, "step": 33510 }, { - "epoch": 0.36, - "learning_rate": 0.0002456161983256538, - "loss": 0.0701, + "epoch": 0.22, + "learning_rate": 0.0002675481001955633, + "loss": 0.0792, "step": 33520 }, { - "epoch": 0.36, - "learning_rate": 0.00024559997404114477, - "loss": 0.0649, + "epoch": 0.22, + "learning_rate": 0.0002675384188412064, + "loss": 0.0812, "step": 33530 }, { - "epoch": 0.36, - "learning_rate": 0.0002455837497566357, - "loss": 0.0624, + "epoch": 0.22, + "learning_rate": 0.0002675287374868495, + "loss": 0.0847, "step": 33540 }, { - "epoch": 0.36, - "learning_rate": 0.00024556752547212667, - "loss": 0.0753, + "epoch": 0.22, + "learning_rate": 0.00026751905613249256, + "loss": 0.0686, "step": 33550 }, { - "epoch": 0.36, - "learning_rate": 0.0002455513011876176, - "loss": 0.0626, + "epoch": 0.22, + "learning_rate": 0.0002675093747781356, + "loss": 0.0638, "step": 33560 }, { - "epoch": 0.36, - "learning_rate": 0.00024553507690310857, - "loss": 0.0637, + "epoch": 0.22, + "learning_rate": 0.00026749969342377866, + "loss": 0.0756, "step": 33570 }, { - "epoch": 0.36, - "learning_rate": 0.0002455188526185995, - "loss": 0.063, + "epoch": 0.22, + "learning_rate": 0.00026749001206942174, + "loss": 0.082, "step": 33580 }, { - "epoch": 0.36, - "learning_rate": 0.00024550262833409047, - "loss": 0.0587, + "epoch": 0.22, + "learning_rate": 0.00026748033071506477, + "loss": 0.0714, "step": 33590 }, { - "epoch": 0.36, - "learning_rate": 0.0002454864040495814, - "loss": 0.0637, + "epoch": 0.22, + "learning_rate": 0.00026747064936070785, + "loss": 0.081, "step": 33600 }, { - "epoch": 0.36, - "learning_rate": 0.00024547017976507237, - "loss": 0.0699, + "epoch": 0.22, + "learning_rate": 0.00026746096800635093, + "loss": 0.0659, "step": 33610 }, { - "epoch": 0.36, - "learning_rate": 0.0002454539554805633, - "loss": 0.0709, + "epoch": 0.22, + "learning_rate": 0.000267451286651994, + "loss": 0.0759, "step": 33620 }, { - "epoch": 0.36, - "learning_rate": 0.00024543773119605427, - "loss": 0.0658, + "epoch": 0.22, + "learning_rate": 0.0002674416052976371, + "loss": 0.0772, "step": 33630 }, { - "epoch": 0.36, - "learning_rate": 0.0002454215069115452, - "loss": 0.0656, + "epoch": 0.22, + "learning_rate": 0.00026743192394328017, + "loss": 0.0682, "step": 33640 }, { - "epoch": 0.36, - "learning_rate": 0.0002454052826270361, - "loss": 0.0747, + "epoch": 0.22, + "learning_rate": 0.00026742224258892325, + "loss": 0.0806, "step": 33650 }, { - "epoch": 0.36, - "learning_rate": 0.0002453890583425271, - "loss": 0.0656, + "epoch": 0.22, + "learning_rate": 0.0002674125612345663, + "loss": 0.0887, "step": 33660 }, { - "epoch": 0.36, - "learning_rate": 0.000245372834058018, - "loss": 0.0642, + "epoch": 0.22, + "learning_rate": 0.00026740287988020935, + "loss": 0.0794, "step": 33670 }, { - "epoch": 0.36, - "learning_rate": 0.00024535660977350894, - "loss": 0.0616, + "epoch": 0.22, + "learning_rate": 0.00026739319852585243, + "loss": 0.0794, "step": 33680 }, { - "epoch": 0.36, - "learning_rate": 0.0002453403854889999, - "loss": 0.0731, + "epoch": 0.22, + "learning_rate": 0.0002673835171714955, + "loss": 0.0737, "step": 33690 }, { - "epoch": 0.36, - "learning_rate": 0.00024532416120449083, - "loss": 0.0603, + "epoch": 0.22, + "learning_rate": 0.00026737383581713854, + "loss": 0.0743, "step": 33700 }, { - "epoch": 0.36, - "learning_rate": 0.0002453079369199818, - "loss": 0.0703, + "epoch": 0.22, + "learning_rate": 0.0002673641544627816, + "loss": 0.0764, "step": 33710 }, { - "epoch": 0.36, - "learning_rate": 0.00024529171263547273, - "loss": 0.0764, + "epoch": 0.22, + "learning_rate": 0.0002673544731084247, + "loss": 0.074, "step": 33720 }, { - "epoch": 0.36, - "learning_rate": 0.0002452754883509637, - "loss": 0.0651, + "epoch": 0.22, + "learning_rate": 0.0002673447917540677, + "loss": 0.0801, "step": 33730 }, { - "epoch": 0.36, - "learning_rate": 0.00024525926406645463, - "loss": 0.065, + "epoch": 0.22, + "learning_rate": 0.0002673351103997108, + "loss": 0.0737, "step": 33740 }, { - "epoch": 0.37, - "learning_rate": 0.0002452430397819456, - "loss": 0.0698, + "epoch": 0.22, + "learning_rate": 0.0002673254290453539, + "loss": 0.0766, "step": 33750 }, { - "epoch": 0.37, - "learning_rate": 0.00024522681549743653, - "loss": 0.0761, + "epoch": 0.22, + "learning_rate": 0.00026731574769099696, + "loss": 0.0751, "step": 33760 }, { - "epoch": 0.37, - "learning_rate": 0.0002452105912129275, - "loss": 0.0774, + "epoch": 0.22, + "learning_rate": 0.00026730606633664004, + "loss": 0.0693, "step": 33770 }, { - "epoch": 0.37, - "learning_rate": 0.00024519436692841843, - "loss": 0.0628, + "epoch": 0.22, + "learning_rate": 0.0002672963849822831, + "loss": 0.0652, "step": 33780 }, { - "epoch": 0.37, - "learning_rate": 0.0002451781426439094, - "loss": 0.066, + "epoch": 0.22, + "learning_rate": 0.0002672867036279262, + "loss": 0.0703, "step": 33790 }, { - "epoch": 0.37, - "learning_rate": 0.00024516191835940033, - "loss": 0.0636, + "epoch": 0.22, + "learning_rate": 0.00026727702227356923, + "loss": 0.0737, "step": 33800 }, { - "epoch": 0.37, - "learning_rate": 0.0002451456940748913, - "loss": 0.0704, + "epoch": 0.22, + "learning_rate": 0.0002672673409192123, + "loss": 0.0713, "step": 33810 }, { - "epoch": 0.37, - "learning_rate": 0.00024512946979038223, - "loss": 0.0619, + "epoch": 0.22, + "learning_rate": 0.0002672576595648554, + "loss": 0.0787, "step": 33820 }, { - "epoch": 0.37, - "learning_rate": 0.00024511324550587315, - "loss": 0.0618, + "epoch": 0.22, + "learning_rate": 0.0002672479782104984, + "loss": 0.0691, "step": 33830 }, { - "epoch": 0.37, - "learning_rate": 0.00024509702122136413, - "loss": 0.0715, + "epoch": 0.22, + "learning_rate": 0.0002672382968561415, + "loss": 0.0651, "step": 33840 }, { - "epoch": 0.37, - "learning_rate": 0.00024508079693685505, - "loss": 0.0819, + "epoch": 0.22, + "learning_rate": 0.0002672286155017846, + "loss": 0.0774, "step": 33850 }, { - "epoch": 0.37, - "learning_rate": 0.000245064572652346, - "loss": 0.0599, + "epoch": 0.22, + "learning_rate": 0.00026721893414742765, + "loss": 0.0784, "step": 33860 }, { - "epoch": 0.37, - "learning_rate": 0.00024504834836783695, - "loss": 0.0663, + "epoch": 0.22, + "learning_rate": 0.0002672092527930707, + "loss": 0.076, "step": 33870 }, { - "epoch": 0.37, - "learning_rate": 0.0002450321240833279, - "loss": 0.0742, + "epoch": 0.22, + "learning_rate": 0.00026719957143871376, + "loss": 0.0713, "step": 33880 }, { - "epoch": 0.37, - "learning_rate": 0.00024501589979881885, - "loss": 0.0749, + "epoch": 0.22, + "learning_rate": 0.00026718989008435684, + "loss": 0.0715, "step": 33890 }, { - "epoch": 0.37, - "learning_rate": 0.0002449996755143098, - "loss": 0.071, + "epoch": 0.22, + "learning_rate": 0.0002671802087299999, + "loss": 0.0727, "step": 33900 }, { - "epoch": 0.37, - "learning_rate": 0.00024498345122980075, - "loss": 0.0687, + "epoch": 0.22, + "learning_rate": 0.000267170527375643, + "loss": 0.0715, "step": 33910 }, { - "epoch": 0.37, - "learning_rate": 0.0002449672269452917, - "loss": 0.0624, + "epoch": 0.22, + "learning_rate": 0.0002671608460212861, + "loss": 0.0766, "step": 33920 }, { - "epoch": 0.37, - "learning_rate": 0.00024495100266078265, - "loss": 0.075, + "epoch": 0.22, + "learning_rate": 0.0002671511646669291, + "loss": 0.0688, "step": 33930 }, { - "epoch": 0.37, - "learning_rate": 0.0002449347783762736, - "loss": 0.0772, + "epoch": 0.22, + "learning_rate": 0.0002671414833125722, + "loss": 0.0703, "step": 33940 }, { - "epoch": 0.37, - "learning_rate": 0.00024491855409176455, - "loss": 0.0663, + "epoch": 0.22, + "learning_rate": 0.00026713180195821526, + "loss": 0.0698, "step": 33950 }, { - "epoch": 0.37, - "learning_rate": 0.0002449023298072555, - "loss": 0.0656, + "epoch": 0.22, + "learning_rate": 0.0002671221206038583, + "loss": 0.0809, "step": 33960 }, { - "epoch": 0.37, - "learning_rate": 0.00024488610552274645, - "loss": 0.0614, + "epoch": 0.22, + "learning_rate": 0.00026711243924950137, + "loss": 0.071, "step": 33970 }, { - "epoch": 0.37, - "learning_rate": 0.0002448698812382374, - "loss": 0.0663, + "epoch": 0.22, + "learning_rate": 0.00026710275789514445, + "loss": 0.0678, "step": 33980 }, { - "epoch": 0.37, - "learning_rate": 0.00024485365695372835, - "loss": 0.074, + "epoch": 0.22, + "learning_rate": 0.00026709307654078753, + "loss": 0.0734, "step": 33990 }, { - "epoch": 0.37, - "learning_rate": 0.0002448374326692193, - "loss": 0.0809, + "epoch": 0.22, + "learning_rate": 0.0002670833951864306, + "loss": 0.0736, "step": 34000 }, { - "epoch": 0.37, - "eval_cer": 0.9213972834624103, - "eval_loss": 0.04552512988448143, - "eval_runtime": 119.4461, - "eval_samples_per_second": 16.744, - "eval_steps_per_second": 4.186, + "epoch": 0.22, + "eval_cer": 0.9201382894588183, + "eval_loss": 0.049920111894607544, + "eval_runtime": 120.2767, + "eval_samples_per_second": 16.628, + "eval_steps_per_second": 4.157, "step": 34000 }, { - "epoch": 0.37, - "learning_rate": 0.0002448212083847102, - "loss": 0.0704, + "epoch": 0.22, + "learning_rate": 0.00026707371383207363, + "loss": 0.0733, "step": 34010 }, { - "epoch": 0.37, - "learning_rate": 0.0002448049841002012, - "loss": 0.0687, + "epoch": 0.22, + "learning_rate": 0.0002670640324777167, + "loss": 0.0795, "step": 34020 }, { - "epoch": 0.37, - "learning_rate": 0.0002447887598156921, - "loss": 0.0663, + "epoch": 0.22, + "learning_rate": 0.0002670543511233598, + "loss": 0.0762, "step": 34030 }, { - "epoch": 0.37, - "learning_rate": 0.000244772535531183, - "loss": 0.0606, + "epoch": 0.22, + "learning_rate": 0.00026704466976900287, + "loss": 0.0708, "step": 34040 }, { - "epoch": 0.37, - "learning_rate": 0.000244756311246674, - "loss": 0.0616, + "epoch": 0.22, + "learning_rate": 0.00026703498841464595, + "loss": 0.0761, "step": 34050 }, { - "epoch": 0.37, - "learning_rate": 0.0002447400869621649, - "loss": 0.0594, + "epoch": 0.22, + "learning_rate": 0.00026702530706028903, + "loss": 0.0775, "step": 34060 }, { - "epoch": 0.37, - "learning_rate": 0.0002447238626776559, - "loss": 0.0664, + "epoch": 0.22, + "learning_rate": 0.00026701562570593206, + "loss": 0.0704, "step": 34070 }, { - "epoch": 0.37, - "learning_rate": 0.0002447076383931468, - "loss": 0.0645, + "epoch": 0.22, + "learning_rate": 0.00026700594435157514, + "loss": 0.0771, "step": 34080 }, { - "epoch": 0.37, - "learning_rate": 0.0002446914141086378, - "loss": 0.0681, + "epoch": 0.22, + "learning_rate": 0.0002669962629972182, + "loss": 0.0743, "step": 34090 }, { - "epoch": 0.37, - "learning_rate": 0.0002446751898241287, - "loss": 0.0731, + "epoch": 0.22, + "learning_rate": 0.00026698658164286124, + "loss": 0.0754, "step": 34100 }, { - "epoch": 0.37, - "learning_rate": 0.0002446589655396197, - "loss": 0.0711, + "epoch": 0.22, + "learning_rate": 0.0002669769002885043, + "loss": 0.0862, "step": 34110 }, { - "epoch": 0.37, - "learning_rate": 0.0002446427412551106, - "loss": 0.062, + "epoch": 0.22, + "learning_rate": 0.0002669672189341474, + "loss": 0.0676, "step": 34120 }, { - "epoch": 0.37, - "learning_rate": 0.0002446265169706016, - "loss": 0.0646, + "epoch": 0.22, + "learning_rate": 0.0002669575375797905, + "loss": 0.0739, "step": 34130 }, { - "epoch": 0.37, - "learning_rate": 0.0002446102926860925, - "loss": 0.0789, + "epoch": 0.22, + "learning_rate": 0.00026694785622543356, + "loss": 0.0779, "step": 34140 }, { - "epoch": 0.37, - "learning_rate": 0.0002445940684015835, - "loss": 0.0706, + "epoch": 0.22, + "learning_rate": 0.0002669381748710766, + "loss": 0.0734, "step": 34150 }, { - "epoch": 0.37, - "learning_rate": 0.0002445778441170744, - "loss": 0.0604, + "epoch": 0.22, + "learning_rate": 0.00026692849351671967, + "loss": 0.0719, "step": 34160 }, { - "epoch": 0.37, - "learning_rate": 0.0002445616198325654, - "loss": 0.0708, + "epoch": 0.22, + "learning_rate": 0.00026691881216236275, + "loss": 0.0887, "step": 34170 }, { - "epoch": 0.37, - "learning_rate": 0.0002445453955480563, - "loss": 0.0595, + "epoch": 0.22, + "learning_rate": 0.00026690913080800583, + "loss": 0.0752, "step": 34180 }, { - "epoch": 0.37, - "learning_rate": 0.00024452917126354724, - "loss": 0.0637, + "epoch": 0.22, + "learning_rate": 0.0002668994494536489, + "loss": 0.0754, "step": 34190 }, { - "epoch": 0.37, - "learning_rate": 0.0002445129469790382, - "loss": 0.0606, + "epoch": 0.22, + "learning_rate": 0.00026688976809929193, + "loss": 0.0772, "step": 34200 }, { - "epoch": 0.37, - "learning_rate": 0.00024449672269452914, - "loss": 0.0714, + "epoch": 0.22, + "learning_rate": 0.000266880086744935, + "loss": 0.0701, "step": 34210 }, { - "epoch": 0.37, - "learning_rate": 0.00024448049841002006, - "loss": 0.0625, + "epoch": 0.22, + "learning_rate": 0.0002668704053905781, + "loss": 0.0809, "step": 34220 }, { - "epoch": 0.37, - "learning_rate": 0.00024446427412551104, - "loss": 0.062, + "epoch": 0.22, + "learning_rate": 0.0002668607240362211, + "loss": 0.0906, "step": 34230 }, { - "epoch": 0.37, - "learning_rate": 0.00024444804984100196, - "loss": 0.0722, + "epoch": 0.22, + "learning_rate": 0.0002668510426818642, + "loss": 0.0798, "step": 34240 }, { - "epoch": 0.37, - "learning_rate": 0.00024443182555649294, - "loss": 0.0688, + "epoch": 0.22, + "learning_rate": 0.0002668413613275073, + "loss": 0.0763, "step": 34250 }, { - "epoch": 0.37, - "learning_rate": 0.00024441560127198386, - "loss": 0.0645, + "epoch": 0.22, + "learning_rate": 0.00026683167997315036, + "loss": 0.0814, "step": 34260 }, { - "epoch": 0.37, - "learning_rate": 0.00024439937698747484, - "loss": 0.077, + "epoch": 0.22, + "learning_rate": 0.00026682199861879344, + "loss": 0.066, "step": 34270 }, { - "epoch": 0.37, - "learning_rate": 0.00024438315270296576, - "loss": 0.0585, + "epoch": 0.22, + "learning_rate": 0.0002668123172644365, + "loss": 0.0757, "step": 34280 }, { - "epoch": 0.37, - "learning_rate": 0.00024436692841845674, - "loss": 0.0661, + "epoch": 0.22, + "learning_rate": 0.00026680263591007954, + "loss": 0.0761, "step": 34290 }, { - "epoch": 0.37, - "learning_rate": 0.00024435070413394766, - "loss": 0.0659, + "epoch": 0.22, + "learning_rate": 0.0002667929545557226, + "loss": 0.0819, "step": 34300 }, { - "epoch": 0.37, - "learning_rate": 0.00024433447984943864, - "loss": 0.066, + "epoch": 0.22, + "learning_rate": 0.0002667832732013657, + "loss": 0.0751, "step": 34310 }, { - "epoch": 0.37, - "learning_rate": 0.00024431825556492956, - "loss": 0.0696, + "epoch": 0.22, + "learning_rate": 0.0002667735918470088, + "loss": 0.0729, "step": 34320 }, { - "epoch": 0.37, - "learning_rate": 0.00024430203128042053, - "loss": 0.072, + "epoch": 0.22, + "learning_rate": 0.0002667639104926518, + "loss": 0.0693, "step": 34330 }, { - "epoch": 0.37, - "learning_rate": 0.00024428580699591146, - "loss": 0.074, + "epoch": 0.22, + "learning_rate": 0.0002667542291382949, + "loss": 0.0788, "step": 34340 }, { - "epoch": 0.37, - "learning_rate": 0.00024426958271140243, - "loss": 0.0621, + "epoch": 0.22, + "learning_rate": 0.00026674454778393797, + "loss": 0.0725, "step": 34350 }, { - "epoch": 0.37, - "learning_rate": 0.00024425335842689336, - "loss": 0.0641, + "epoch": 0.22, + "learning_rate": 0.000266734866429581, + "loss": 0.0847, "step": 34360 }, { - "epoch": 0.37, - "learning_rate": 0.0002442371341423843, - "loss": 0.0683, + "epoch": 0.22, + "learning_rate": 0.00026672518507522407, + "loss": 0.0759, "step": 34370 }, { - "epoch": 0.37, - "learning_rate": 0.00024422090985787526, - "loss": 0.0683, + "epoch": 0.22, + "learning_rate": 0.00026671550372086715, + "loss": 0.0756, "step": 34380 }, { - "epoch": 0.37, - "learning_rate": 0.0002442046855733662, - "loss": 0.0713, + "epoch": 0.22, + "learning_rate": 0.00026670582236651023, + "loss": 0.065, "step": 34390 }, { - "epoch": 0.37, - "learning_rate": 0.00024418846128885716, - "loss": 0.0659, + "epoch": 0.22, + "learning_rate": 0.0002666961410121533, + "loss": 0.0778, "step": 34400 }, { - "epoch": 0.37, - "learning_rate": 0.0002441722370043481, - "loss": 0.0742, + "epoch": 0.22, + "learning_rate": 0.0002666864596577964, + "loss": 0.0841, "step": 34410 }, { - "epoch": 0.37, - "learning_rate": 0.000244156012719839, - "loss": 0.0641, + "epoch": 0.22, + "learning_rate": 0.00026667677830343947, + "loss": 0.0817, "step": 34420 }, { - "epoch": 0.37, - "learning_rate": 0.00024413978843532998, - "loss": 0.0577, + "epoch": 0.22, + "learning_rate": 0.0002666670969490825, + "loss": 0.0737, "step": 34430 }, { - "epoch": 0.37, - "learning_rate": 0.00024412356415082093, - "loss": 0.0626, + "epoch": 0.22, + "learning_rate": 0.0002666574155947256, + "loss": 0.0773, "step": 34440 }, { - "epoch": 0.37, - "learning_rate": 0.00024410733986631188, - "loss": 0.0678, + "epoch": 0.22, + "learning_rate": 0.00026664773424036866, + "loss": 0.0687, "step": 34450 }, { - "epoch": 0.37, - "learning_rate": 0.0002440911155818028, - "loss": 0.0668, + "epoch": 0.22, + "learning_rate": 0.00026663805288601174, + "loss": 0.0756, "step": 34460 }, { - "epoch": 0.37, - "learning_rate": 0.00024407489129729378, - "loss": 0.0577, + "epoch": 0.22, + "learning_rate": 0.00026662837153165476, + "loss": 0.073, "step": 34470 }, { - "epoch": 0.37, - "learning_rate": 0.0002440586670127847, - "loss": 0.0599, + "epoch": 0.22, + "learning_rate": 0.00026661869017729784, + "loss": 0.0703, "step": 34480 }, { - "epoch": 0.37, - "learning_rate": 0.00024404244272827568, - "loss": 0.0645, + "epoch": 0.22, + "learning_rate": 0.0002666090088229409, + "loss": 0.0788, "step": 34490 }, { - "epoch": 0.37, - "learning_rate": 0.0002440262184437666, - "loss": 0.0635, + "epoch": 0.22, + "learning_rate": 0.00026659932746858395, + "loss": 0.0712, "step": 34500 }, { - "epoch": 0.37, - "learning_rate": 0.00024400999415925755, - "loss": 0.0619, + "epoch": 0.22, + "learning_rate": 0.000266589646114227, + "loss": 0.082, "step": 34510 }, { - "epoch": 0.37, - "learning_rate": 0.0002439937698747485, - "loss": 0.0638, + "epoch": 0.22, + "learning_rate": 0.0002665799647598701, + "loss": 0.0721, "step": 34520 }, { - "epoch": 0.37, - "learning_rate": 0.00024397754559023945, - "loss": 0.0746, + "epoch": 0.22, + "learning_rate": 0.0002665702834055132, + "loss": 0.0697, "step": 34530 }, { - "epoch": 0.37, - "learning_rate": 0.00024396132130573037, - "loss": 0.0647, + "epoch": 0.22, + "learning_rate": 0.00026656060205115627, + "loss": 0.0771, "step": 34540 }, { - "epoch": 0.37, - "learning_rate": 0.00024394509702122135, - "loss": 0.0717, + "epoch": 0.22, + "learning_rate": 0.00026655092069679935, + "loss": 0.0701, "step": 34550 }, { - "epoch": 0.37, - "learning_rate": 0.00024392887273671227, - "loss": 0.0662, + "epoch": 0.22, + "learning_rate": 0.0002665412393424424, + "loss": 0.0716, "step": 34560 }, { - "epoch": 0.37, - "learning_rate": 0.00024391264845220325, - "loss": 0.0715, + "epoch": 0.22, + "learning_rate": 0.00026653155798808545, + "loss": 0.0913, "step": 34570 }, { - "epoch": 0.37, - "learning_rate": 0.00024389642416769417, - "loss": 0.0748, + "epoch": 0.22, + "learning_rate": 0.00026652187663372853, + "loss": 0.0734, "step": 34580 }, { - "epoch": 0.37, - "learning_rate": 0.00024388019988318515, - "loss": 0.0554, + "epoch": 0.22, + "learning_rate": 0.0002665121952793716, + "loss": 0.074, "step": 34590 }, { - "epoch": 0.37, - "learning_rate": 0.00024386397559867607, - "loss": 0.0678, + "epoch": 0.22, + "learning_rate": 0.00026650251392501464, + "loss": 0.0719, "step": 34600 }, { - "epoch": 0.37, - "learning_rate": 0.00024384775131416702, - "loss": 0.0613, + "epoch": 0.22, + "learning_rate": 0.0002664928325706577, + "loss": 0.0657, "step": 34610 }, { - "epoch": 0.37, - "learning_rate": 0.00024383152702965797, - "loss": 0.0605, + "epoch": 0.22, + "learning_rate": 0.0002664831512163008, + "loss": 0.0732, "step": 34620 }, { - "epoch": 0.37, - "learning_rate": 0.00024381530274514892, - "loss": 0.0702, + "epoch": 0.22, + "learning_rate": 0.0002664734698619439, + "loss": 0.0697, "step": 34630 }, { - "epoch": 0.37, - "learning_rate": 0.00024379907846063984, - "loss": 0.0586, + "epoch": 0.22, + "learning_rate": 0.0002664637885075869, + "loss": 0.0763, "step": 34640 }, { - "epoch": 0.37, - "learning_rate": 0.00024378285417613082, - "loss": 0.0707, + "epoch": 0.22, + "learning_rate": 0.00026645410715323, + "loss": 0.0827, "step": 34650 }, { - "epoch": 0.37, - "learning_rate": 0.00024376662989162174, - "loss": 0.067, + "epoch": 0.22, + "learning_rate": 0.00026644442579887306, + "loss": 0.086, "step": 34660 }, { - "epoch": 0.37, - "learning_rate": 0.00024375040560711272, - "loss": 0.0638, + "epoch": 0.22, + "learning_rate": 0.00026643474444451614, + "loss": 0.068, "step": 34670 }, { - "epoch": 0.38, - "learning_rate": 0.00024373418132260364, - "loss": 0.0639, + "epoch": 0.22, + "learning_rate": 0.0002664250630901592, + "loss": 0.0697, "step": 34680 }, { - "epoch": 0.38, - "learning_rate": 0.0002437179570380946, - "loss": 0.0683, + "epoch": 0.22, + "learning_rate": 0.0002664153817358023, + "loss": 0.0709, "step": 34690 }, { - "epoch": 0.38, - "learning_rate": 0.00024370173275358554, - "loss": 0.0663, + "epoch": 0.22, + "learning_rate": 0.0002664057003814453, + "loss": 0.0687, "step": 34700 }, { - "epoch": 0.38, - "learning_rate": 0.0002436855084690765, - "loss": 0.0659, + "epoch": 0.22, + "learning_rate": 0.0002663960190270884, + "loss": 0.0765, "step": 34710 }, { - "epoch": 0.38, - "learning_rate": 0.0002436692841845674, - "loss": 0.0684, + "epoch": 0.22, + "learning_rate": 0.0002663863376727315, + "loss": 0.0748, "step": 34720 }, { - "epoch": 0.38, - "learning_rate": 0.0002436530599000584, - "loss": 0.0737, + "epoch": 0.22, + "learning_rate": 0.0002663766563183745, + "loss": 0.0806, "step": 34730 }, { - "epoch": 0.38, - "learning_rate": 0.0002436368356155493, - "loss": 0.0607, + "epoch": 0.22, + "learning_rate": 0.0002663669749640176, + "loss": 0.0688, "step": 34740 }, { - "epoch": 0.38, - "learning_rate": 0.0002436206113310403, - "loss": 0.0701, + "epoch": 0.22, + "learning_rate": 0.00026635729360966067, + "loss": 0.0686, "step": 34750 }, { - "epoch": 0.38, - "learning_rate": 0.0002436043870465312, - "loss": 0.0662, + "epoch": 0.22, + "learning_rate": 0.00026634761225530375, + "loss": 0.07, "step": 34760 }, { - "epoch": 0.38, - "learning_rate": 0.0002435881627620222, - "loss": 0.0617, + "epoch": 0.22, + "learning_rate": 0.00026633793090094683, + "loss": 0.0713, "step": 34770 }, { - "epoch": 0.38, - "learning_rate": 0.0002435719384775131, - "loss": 0.0636, + "epoch": 0.22, + "learning_rate": 0.00026632824954658986, + "loss": 0.0693, "step": 34780 }, { - "epoch": 0.38, - "learning_rate": 0.00024355571419300406, - "loss": 0.0596, + "epoch": 0.22, + "learning_rate": 0.00026631856819223294, + "loss": 0.0708, "step": 34790 }, { - "epoch": 0.38, - "learning_rate": 0.000243539489908495, - "loss": 0.0625, + "epoch": 0.22, + "learning_rate": 0.000266308886837876, + "loss": 0.0743, "step": 34800 }, { - "epoch": 0.38, - "learning_rate": 0.00024352326562398596, - "loss": 0.0629, + "epoch": 0.22, + "learning_rate": 0.0002662992054835191, + "loss": 0.0867, "step": 34810 }, { - "epoch": 0.38, - "learning_rate": 0.00024350704133947688, - "loss": 0.0738, + "epoch": 0.22, + "learning_rate": 0.0002662895241291622, + "loss": 0.0699, "step": 34820 }, { - "epoch": 0.38, - "learning_rate": 0.00024349081705496786, - "loss": 0.0649, + "epoch": 0.22, + "learning_rate": 0.00026627984277480525, + "loss": 0.0704, "step": 34830 }, { - "epoch": 0.38, - "learning_rate": 0.00024347459277045878, - "loss": 0.0695, + "epoch": 0.22, + "learning_rate": 0.0002662701614204483, + "loss": 0.0749, "step": 34840 }, { - "epoch": 0.38, - "learning_rate": 0.00024345836848594976, - "loss": 0.0571, + "epoch": 0.22, + "learning_rate": 0.00026626048006609136, + "loss": 0.0711, "step": 34850 }, { - "epoch": 0.38, - "learning_rate": 0.00024344214420144068, - "loss": 0.0572, + "epoch": 0.22, + "learning_rate": 0.00026625079871173444, + "loss": 0.0671, "step": 34860 }, { - "epoch": 0.38, - "learning_rate": 0.00024342591991693163, - "loss": 0.0671, + "epoch": 0.23, + "learning_rate": 0.00026624111735737747, + "loss": 0.0697, "step": 34870 }, { - "epoch": 0.38, - "learning_rate": 0.00024340969563242258, - "loss": 0.0668, + "epoch": 0.23, + "learning_rate": 0.00026623143600302055, + "loss": 0.0752, "step": 34880 }, { - "epoch": 0.38, - "learning_rate": 0.00024339347134791353, - "loss": 0.062, + "epoch": 0.23, + "learning_rate": 0.0002662217546486636, + "loss": 0.0711, "step": 34890 }, { - "epoch": 0.38, - "learning_rate": 0.00024337724706340445, - "loss": 0.0566, + "epoch": 0.23, + "learning_rate": 0.0002662120732943067, + "loss": 0.0741, "step": 34900 }, { - "epoch": 0.38, - "learning_rate": 0.00024336102277889543, - "loss": 0.0582, + "epoch": 0.23, + "learning_rate": 0.0002662023919399498, + "loss": 0.0719, "step": 34910 }, { - "epoch": 0.38, - "learning_rate": 0.00024334479849438635, - "loss": 0.0631, + "epoch": 0.23, + "learning_rate": 0.0002661927105855928, + "loss": 0.0836, "step": 34920 }, { - "epoch": 0.38, - "learning_rate": 0.00024332857420987733, - "loss": 0.0623, + "epoch": 0.23, + "learning_rate": 0.0002661830292312359, + "loss": 0.065, "step": 34930 }, { - "epoch": 0.38, - "learning_rate": 0.00024331234992536825, - "loss": 0.0691, + "epoch": 0.23, + "learning_rate": 0.00026617334787687897, + "loss": 0.0741, "step": 34940 }, { - "epoch": 0.38, - "learning_rate": 0.00024329612564085923, - "loss": 0.0683, + "epoch": 0.23, + "learning_rate": 0.00026616366652252205, + "loss": 0.0703, "step": 34950 }, { - "epoch": 0.38, - "learning_rate": 0.00024327990135635015, - "loss": 0.0617, + "epoch": 0.23, + "learning_rate": 0.00026615398516816513, + "loss": 0.0747, "step": 34960 }, { - "epoch": 0.38, - "learning_rate": 0.0002432636770718411, - "loss": 0.0674, + "epoch": 0.23, + "learning_rate": 0.00026614430381380816, + "loss": 0.0693, "step": 34970 }, { - "epoch": 0.38, - "learning_rate": 0.00024324745278733205, - "loss": 0.066, + "epoch": 0.23, + "learning_rate": 0.00026613462245945123, + "loss": 0.0704, "step": 34980 }, { - "epoch": 0.38, - "learning_rate": 0.000243231228502823, - "loss": 0.0688, + "epoch": 0.23, + "learning_rate": 0.0002661249411050943, + "loss": 0.0738, "step": 34990 }, { - "epoch": 0.38, - "learning_rate": 0.00024321500421831393, - "loss": 0.0562, + "epoch": 0.23, + "learning_rate": 0.00026611525975073734, + "loss": 0.0674, "step": 35000 }, { - "epoch": 0.38, - "eval_cer": 0.9213592936366158, - "eval_loss": 0.045057717710733414, - "eval_runtime": 119.209, - "eval_samples_per_second": 16.777, - "eval_steps_per_second": 4.194, + "epoch": 0.23, + "eval_cer": 0.9201554626595865, + "eval_loss": 0.04858190566301346, + "eval_runtime": 120.2631, + "eval_samples_per_second": 16.63, + "eval_steps_per_second": 4.158, "step": 35000 }, { - "epoch": 0.38, - "learning_rate": 0.0002431987799338049, - "loss": 0.0632, + "epoch": 0.23, + "learning_rate": 0.0002661055783963804, + "loss": 0.0744, "step": 35010 }, { - "epoch": 0.38, - "learning_rate": 0.00024318255564929582, - "loss": 0.0601, + "epoch": 0.23, + "learning_rate": 0.0002660958970420235, + "loss": 0.0735, "step": 35020 }, { - "epoch": 0.38, - "learning_rate": 0.0002431663313647868, - "loss": 0.0652, + "epoch": 0.23, + "learning_rate": 0.0002660862156876666, + "loss": 0.0713, "step": 35030 }, { - "epoch": 0.38, - "learning_rate": 0.00024315010708027772, - "loss": 0.0575, + "epoch": 0.23, + "learning_rate": 0.00026607653433330966, + "loss": 0.0802, "step": 35040 }, { - "epoch": 0.38, - "learning_rate": 0.00024313388279576867, - "loss": 0.076, + "epoch": 0.23, + "learning_rate": 0.00026606685297895274, + "loss": 0.0754, "step": 35050 }, { - "epoch": 0.38, - "learning_rate": 0.00024311765851125962, - "loss": 0.0625, + "epoch": 0.23, + "learning_rate": 0.00026605717162459576, + "loss": 0.0727, "step": 35060 }, { - "epoch": 0.38, - "learning_rate": 0.00024310143422675057, - "loss": 0.0629, + "epoch": 0.23, + "learning_rate": 0.00026604749027023884, + "loss": 0.0707, "step": 35070 }, { - "epoch": 0.38, - "learning_rate": 0.00024308520994224152, - "loss": 0.0677, + "epoch": 0.23, + "learning_rate": 0.0002660378089158819, + "loss": 0.0736, "step": 35080 }, { - "epoch": 0.38, - "learning_rate": 0.00024306898565773247, - "loss": 0.0651, + "epoch": 0.23, + "learning_rate": 0.000266028127561525, + "loss": 0.065, "step": 35090 }, { - "epoch": 0.38, - "learning_rate": 0.0002430527613732234, - "loss": 0.0575, + "epoch": 0.23, + "learning_rate": 0.00026601844620716803, + "loss": 0.076, "step": 35100 }, { - "epoch": 0.38, - "learning_rate": 0.00024303653708871437, - "loss": 0.0656, + "epoch": 0.23, + "learning_rate": 0.0002660087648528111, + "loss": 0.0818, "step": 35110 }, { - "epoch": 0.38, - "learning_rate": 0.0002430203128042053, - "loss": 0.0614, + "epoch": 0.23, + "learning_rate": 0.0002659990834984542, + "loss": 0.0695, "step": 35120 }, { - "epoch": 0.38, - "learning_rate": 0.00024300408851969627, - "loss": 0.0759, + "epoch": 0.23, + "learning_rate": 0.0002659894021440972, + "loss": 0.0681, "step": 35130 }, { - "epoch": 0.38, - "learning_rate": 0.0002429878642351872, - "loss": 0.0643, + "epoch": 0.23, + "learning_rate": 0.0002659797207897403, + "loss": 0.0723, "step": 35140 }, { - "epoch": 0.38, - "learning_rate": 0.00024297163995067814, - "loss": 0.0669, + "epoch": 0.23, + "learning_rate": 0.0002659700394353834, + "loss": 0.0721, "step": 35150 }, { - "epoch": 0.38, - "learning_rate": 0.0002429554156661691, - "loss": 0.0623, + "epoch": 0.23, + "learning_rate": 0.00026596035808102645, + "loss": 0.0693, "step": 35160 }, { - "epoch": 0.38, - "learning_rate": 0.00024293919138166004, - "loss": 0.0752, + "epoch": 0.23, + "learning_rate": 0.00026595067672666953, + "loss": 0.0611, "step": 35170 }, { - "epoch": 0.38, - "learning_rate": 0.00024292296709715097, - "loss": 0.0652, + "epoch": 0.23, + "learning_rate": 0.0002659409953723126, + "loss": 0.0787, "step": 35180 }, { - "epoch": 0.38, - "learning_rate": 0.00024290674281264194, - "loss": 0.0629, + "epoch": 0.23, + "learning_rate": 0.0002659313140179557, + "loss": 0.0707, "step": 35190 }, { - "epoch": 0.38, - "learning_rate": 0.0002428905185281329, - "loss": 0.0643, + "epoch": 0.23, + "learning_rate": 0.0002659216326635987, + "loss": 0.0691, "step": 35200 }, { - "epoch": 0.38, - "learning_rate": 0.00024287429424362384, - "loss": 0.0667, + "epoch": 0.23, + "learning_rate": 0.0002659119513092418, + "loss": 0.0664, "step": 35210 }, { - "epoch": 0.38, - "learning_rate": 0.0002428580699591148, - "loss": 0.0639, + "epoch": 0.23, + "learning_rate": 0.0002659022699548849, + "loss": 0.0725, "step": 35220 }, { - "epoch": 0.38, - "learning_rate": 0.00024284184567460572, - "loss": 0.0648, + "epoch": 0.23, + "learning_rate": 0.00026589258860052796, + "loss": 0.078, "step": 35230 }, { - "epoch": 0.38, - "learning_rate": 0.0002428256213900967, - "loss": 0.0709, + "epoch": 0.23, + "learning_rate": 0.000265882907246171, + "loss": 0.0719, "step": 35240 }, { - "epoch": 0.38, - "learning_rate": 0.00024280939710558762, - "loss": 0.056, + "epoch": 0.23, + "learning_rate": 0.00026587322589181406, + "loss": 0.0713, "step": 35250 }, { - "epoch": 0.38, - "learning_rate": 0.0002427931728210786, - "loss": 0.0584, + "epoch": 0.23, + "learning_rate": 0.00026586354453745714, + "loss": 0.0673, "step": 35260 }, { - "epoch": 0.38, - "learning_rate": 0.00024277694853656951, - "loss": 0.0714, + "epoch": 0.23, + "learning_rate": 0.00026585386318310017, + "loss": 0.0707, "step": 35270 }, { - "epoch": 0.38, - "learning_rate": 0.0002427607242520605, - "loss": 0.0703, + "epoch": 0.23, + "learning_rate": 0.00026584418182874325, + "loss": 0.0721, "step": 35280 }, { - "epoch": 0.38, - "learning_rate": 0.00024274449996755141, - "loss": 0.0766, + "epoch": 0.23, + "learning_rate": 0.00026583450047438633, + "loss": 0.0758, "step": 35290 }, { - "epoch": 0.38, - "learning_rate": 0.00024272827568304236, - "loss": 0.0632, + "epoch": 0.23, + "learning_rate": 0.0002658248191200294, + "loss": 0.0803, "step": 35300 }, { - "epoch": 0.38, - "learning_rate": 0.00024271205139853331, - "loss": 0.0612, + "epoch": 0.23, + "learning_rate": 0.0002658151377656725, + "loss": 0.0762, "step": 35310 }, { - "epoch": 0.38, - "learning_rate": 0.00024269582711402426, - "loss": 0.0678, + "epoch": 0.23, + "learning_rate": 0.00026580545641131557, + "loss": 0.0802, "step": 35320 }, { - "epoch": 0.38, - "learning_rate": 0.0002426796028295152, - "loss": 0.0684, + "epoch": 0.23, + "learning_rate": 0.00026579577505695865, + "loss": 0.0718, "step": 35330 }, { - "epoch": 0.38, - "learning_rate": 0.00024266337854500616, - "loss": 0.0661, + "epoch": 0.23, + "learning_rate": 0.0002657860937026017, + "loss": 0.0706, "step": 35340 }, { - "epoch": 0.38, - "learning_rate": 0.00024264715426049709, - "loss": 0.0644, + "epoch": 0.23, + "learning_rate": 0.00026577641234824475, + "loss": 0.0696, "step": 35350 }, { - "epoch": 0.38, - "learning_rate": 0.00024263092997598806, - "loss": 0.0609, + "epoch": 0.23, + "learning_rate": 0.00026576673099388783, + "loss": 0.0743, "step": 35360 }, { - "epoch": 0.38, - "learning_rate": 0.00024261470569147899, - "loss": 0.0665, + "epoch": 0.23, + "learning_rate": 0.00026575704963953086, + "loss": 0.069, "step": 35370 }, { - "epoch": 0.38, - "learning_rate": 0.00024259848140696994, - "loss": 0.0688, + "epoch": 0.23, + "learning_rate": 0.00026574736828517394, + "loss": 0.0678, "step": 35380 }, { - "epoch": 0.38, - "learning_rate": 0.00024258225712246089, - "loss": 0.0707, + "epoch": 0.23, + "learning_rate": 0.000265737686930817, + "loss": 0.0687, "step": 35390 }, { - "epoch": 0.38, - "learning_rate": 0.00024256603283795183, - "loss": 0.0775, + "epoch": 0.23, + "learning_rate": 0.0002657280055764601, + "loss": 0.0753, "step": 35400 }, { - "epoch": 0.38, - "learning_rate": 0.00024254980855344276, - "loss": 0.0733, + "epoch": 0.23, + "learning_rate": 0.0002657183242221031, + "loss": 0.0664, "step": 35410 }, { - "epoch": 0.38, - "learning_rate": 0.00024253358426893373, - "loss": 0.0651, + "epoch": 0.23, + "learning_rate": 0.0002657086428677462, + "loss": 0.0692, "step": 35420 }, { - "epoch": 0.38, - "learning_rate": 0.00024251735998442466, - "loss": 0.0679, + "epoch": 0.23, + "learning_rate": 0.0002656989615133893, + "loss": 0.0692, "step": 35430 }, { - "epoch": 0.38, - "learning_rate": 0.00024250113569991563, - "loss": 0.0591, + "epoch": 0.23, + "learning_rate": 0.00026568928015903236, + "loss": 0.0674, "step": 35440 }, { - "epoch": 0.38, - "learning_rate": 0.00024248491141540656, - "loss": 0.0645, + "epoch": 0.23, + "learning_rate": 0.00026567959880467544, + "loss": 0.0687, "step": 35450 }, { - "epoch": 0.38, - "learning_rate": 0.00024246868713089753, - "loss": 0.0737, + "epoch": 0.23, + "learning_rate": 0.0002656699174503185, + "loss": 0.0638, "step": 35460 }, { - "epoch": 0.38, - "learning_rate": 0.00024245246284638846, - "loss": 0.0752, + "epoch": 0.23, + "learning_rate": 0.0002656602360959616, + "loss": 0.0661, "step": 35470 }, { - "epoch": 0.38, - "learning_rate": 0.0002424362385618794, - "loss": 0.0667, + "epoch": 0.23, + "learning_rate": 0.00026565055474160463, + "loss": 0.0815, "step": 35480 }, { - "epoch": 0.38, - "learning_rate": 0.00024242001427737036, - "loss": 0.0689, + "epoch": 0.23, + "learning_rate": 0.0002656408733872477, + "loss": 0.0685, "step": 35490 }, { - "epoch": 0.38, - "learning_rate": 0.0002424037899928613, - "loss": 0.0676, + "epoch": 0.23, + "learning_rate": 0.0002656311920328908, + "loss": 0.0733, "step": 35500 }, { - "epoch": 0.38, - "learning_rate": 0.00024238756570835223, - "loss": 0.0664, + "epoch": 0.23, + "learning_rate": 0.0002656215106785338, + "loss": 0.0767, "step": 35510 }, { - "epoch": 0.38, - "learning_rate": 0.0002423713414238432, - "loss": 0.0716, + "epoch": 0.23, + "learning_rate": 0.0002656118293241769, + "loss": 0.0743, "step": 35520 }, { - "epoch": 0.38, - "learning_rate": 0.00024235511713933413, - "loss": 0.1255, + "epoch": 0.23, + "learning_rate": 0.00026560214796981997, + "loss": 0.0693, "step": 35530 }, { - "epoch": 0.38, - "learning_rate": 0.0002423388928548251, - "loss": 0.0784, + "epoch": 0.23, + "learning_rate": 0.00026559246661546305, + "loss": 0.0794, "step": 35540 }, { - "epoch": 0.38, - "learning_rate": 0.00024232266857031603, - "loss": 0.0843, + "epoch": 0.23, + "learning_rate": 0.0002655827852611061, + "loss": 0.0741, "step": 35550 }, { - "epoch": 0.38, - "learning_rate": 0.00024230644428580698, - "loss": 0.0753, + "epoch": 0.23, + "learning_rate": 0.00026557310390674916, + "loss": 0.0789, "step": 35560 }, { - "epoch": 0.38, - "learning_rate": 0.00024229022000129793, - "loss": 0.0794, + "epoch": 0.23, + "learning_rate": 0.00026556342255239224, + "loss": 0.0699, "step": 35570 }, { - "epoch": 0.38, - "learning_rate": 0.00024227399571678888, - "loss": 0.0728, + "epoch": 0.23, + "learning_rate": 0.0002655537411980353, + "loss": 0.0716, "step": 35580 }, { - "epoch": 0.38, - "learning_rate": 0.0002422577714322798, - "loss": 0.0785, + "epoch": 0.23, + "learning_rate": 0.0002655440598436784, + "loss": 0.0715, "step": 35590 }, { - "epoch": 0.39, - "learning_rate": 0.00024224154714777078, - "loss": 0.0747, + "epoch": 0.23, + "learning_rate": 0.0002655343784893215, + "loss": 0.0766, "step": 35600 }, { - "epoch": 0.39, - "learning_rate": 0.0002422253228632617, - "loss": 0.0729, + "epoch": 0.23, + "learning_rate": 0.0002655246971349645, + "loss": 0.0732, "step": 35610 }, { - "epoch": 0.39, - "learning_rate": 0.00024220909857875268, - "loss": 0.0701, + "epoch": 0.23, + "learning_rate": 0.0002655150157806076, + "loss": 0.0639, "step": 35620 }, { - "epoch": 0.39, - "learning_rate": 0.0002421928742942436, - "loss": 0.0639, + "epoch": 0.23, + "learning_rate": 0.00026550533442625066, + "loss": 0.0953, "step": 35630 }, { - "epoch": 0.39, - "learning_rate": 0.00024217665000973458, - "loss": 0.0661, + "epoch": 0.23, + "learning_rate": 0.0002654956530718937, + "loss": 0.0673, "step": 35640 }, { - "epoch": 0.39, - "learning_rate": 0.0002421604257252255, - "loss": 0.0633, + "epoch": 0.23, + "learning_rate": 0.00026548597171753677, + "loss": 0.0686, "step": 35650 }, { - "epoch": 0.39, - "learning_rate": 0.00024214420144071645, - "loss": 0.0588, + "epoch": 0.23, + "learning_rate": 0.00026547629036317985, + "loss": 0.0749, "step": 35660 }, { - "epoch": 0.39, - "learning_rate": 0.0002421279771562074, - "loss": 0.0624, + "epoch": 0.23, + "learning_rate": 0.00026546660900882293, + "loss": 0.0723, "step": 35670 }, { - "epoch": 0.39, - "learning_rate": 0.00024211175287169835, - "loss": 0.0691, + "epoch": 0.23, + "learning_rate": 0.000265456927654466, + "loss": 0.071, "step": 35680 }, { - "epoch": 0.39, - "learning_rate": 0.00024209552858718927, - "loss": 0.0688, + "epoch": 0.23, + "learning_rate": 0.00026544724630010903, + "loss": 0.0812, "step": 35690 }, { - "epoch": 0.39, - "learning_rate": 0.00024207930430268025, - "loss": 0.0625, + "epoch": 0.23, + "learning_rate": 0.0002654375649457521, + "loss": 0.0726, "step": 35700 }, { - "epoch": 0.39, - "learning_rate": 0.00024206308001817117, - "loss": 0.0588, + "epoch": 0.23, + "learning_rate": 0.0002654278835913952, + "loss": 0.081, "step": 35710 }, { - "epoch": 0.39, - "learning_rate": 0.00024204685573366215, - "loss": 0.0689, + "epoch": 0.23, + "learning_rate": 0.00026541820223703827, + "loss": 0.068, "step": 35720 }, { - "epoch": 0.39, - "learning_rate": 0.00024203063144915307, - "loss": 0.0665, + "epoch": 0.23, + "learning_rate": 0.00026540852088268135, + "loss": 0.0722, "step": 35730 }, { - "epoch": 0.39, - "learning_rate": 0.00024201440716464402, - "loss": 0.0723, + "epoch": 0.23, + "learning_rate": 0.0002653988395283244, + "loss": 0.0686, "step": 35740 }, { - "epoch": 0.39, - "learning_rate": 0.00024199818288013497, - "loss": 0.0613, + "epoch": 0.23, + "learning_rate": 0.00026538915817396746, + "loss": 0.0772, "step": 35750 }, { - "epoch": 0.39, - "learning_rate": 0.00024198195859562592, - "loss": 0.0668, + "epoch": 0.23, + "learning_rate": 0.00026537947681961054, + "loss": 0.0747, "step": 35760 }, { - "epoch": 0.39, - "learning_rate": 0.00024196573431111687, - "loss": 0.0657, + "epoch": 0.23, + "learning_rate": 0.00026536979546525356, + "loss": 0.0794, "step": 35770 }, { - "epoch": 0.39, - "learning_rate": 0.00024194951002660782, - "loss": 0.0751, + "epoch": 0.23, + "learning_rate": 0.00026536011411089664, + "loss": 0.08, "step": 35780 }, { - "epoch": 0.39, - "learning_rate": 0.00024193328574209874, - "loss": 0.0635, + "epoch": 0.23, + "learning_rate": 0.0002653504327565397, + "loss": 0.0699, "step": 35790 }, { - "epoch": 0.39, - "learning_rate": 0.00024191706145758972, - "loss": 0.0609, + "epoch": 0.23, + "learning_rate": 0.0002653407514021828, + "loss": 0.0794, "step": 35800 }, { - "epoch": 0.39, - "learning_rate": 0.00024190083717308064, - "loss": 0.0677, + "epoch": 0.23, + "learning_rate": 0.0002653310700478259, + "loss": 0.0732, "step": 35810 }, { - "epoch": 0.39, - "learning_rate": 0.00024188461288857162, - "loss": 0.0724, + "epoch": 0.23, + "learning_rate": 0.00026532138869346896, + "loss": 0.067, "step": 35820 }, { - "epoch": 0.39, - "learning_rate": 0.00024186838860406254, - "loss": 0.0677, + "epoch": 0.23, + "learning_rate": 0.000265311707339112, + "loss": 0.0678, "step": 35830 }, { - "epoch": 0.39, - "learning_rate": 0.0002418521643195535, - "loss": 0.073, + "epoch": 0.23, + "learning_rate": 0.00026530202598475507, + "loss": 0.0724, "step": 35840 }, { - "epoch": 0.39, - "learning_rate": 0.00024183594003504444, - "loss": 0.0679, + "epoch": 0.23, + "learning_rate": 0.00026529234463039815, + "loss": 0.0719, "step": 35850 }, { - "epoch": 0.39, - "learning_rate": 0.0002418197157505354, - "loss": 0.0638, + "epoch": 0.23, + "learning_rate": 0.0002652826632760412, + "loss": 0.0765, "step": 35860 }, { - "epoch": 0.39, - "learning_rate": 0.0002418034914660263, - "loss": 0.0645, + "epoch": 0.23, + "learning_rate": 0.0002652729819216843, + "loss": 0.0824, "step": 35870 }, { - "epoch": 0.39, - "learning_rate": 0.0002417872671815173, - "loss": 0.0613, + "epoch": 0.23, + "learning_rate": 0.00026526330056732733, + "loss": 0.0712, "step": 35880 }, { - "epoch": 0.39, - "learning_rate": 0.0002417710428970082, - "loss": 0.0613, + "epoch": 0.23, + "learning_rate": 0.0002652536192129704, + "loss": 0.0734, "step": 35890 }, { - "epoch": 0.39, - "learning_rate": 0.0002417548186124992, - "loss": 0.064, + "epoch": 0.23, + "learning_rate": 0.0002652439378586135, + "loss": 0.0793, "step": 35900 }, { - "epoch": 0.39, - "learning_rate": 0.0002417385943279901, - "loss": 0.065, + "epoch": 0.23, + "learning_rate": 0.0002652342565042565, + "loss": 0.0711, "step": 35910 }, { - "epoch": 0.39, - "learning_rate": 0.00024172237004348106, - "loss": 0.0613, + "epoch": 0.23, + "learning_rate": 0.0002652245751498996, + "loss": 0.0749, "step": 35920 }, { - "epoch": 0.39, - "learning_rate": 0.000241706145758972, - "loss": 0.0653, + "epoch": 0.23, + "learning_rate": 0.0002652148937955427, + "loss": 0.066, "step": 35930 }, { - "epoch": 0.39, - "learning_rate": 0.00024168992147446296, - "loss": 0.064, + "epoch": 0.23, + "learning_rate": 0.00026520521244118576, + "loss": 0.079, "step": 35940 }, { - "epoch": 0.39, - "learning_rate": 0.0002416736971899539, - "loss": 0.0669, + "epoch": 0.23, + "learning_rate": 0.00026519553108682884, + "loss": 0.0738, "step": 35950 }, { - "epoch": 0.39, - "learning_rate": 0.00024165747290544486, - "loss": 0.0679, + "epoch": 0.23, + "learning_rate": 0.0002651858497324719, + "loss": 0.0756, "step": 35960 }, { - "epoch": 0.39, - "learning_rate": 0.00024164124862093578, - "loss": 0.0636, + "epoch": 0.23, + "learning_rate": 0.00026517616837811494, + "loss": 0.065, "step": 35970 }, { - "epoch": 0.39, - "learning_rate": 0.00024162502433642676, - "loss": 0.0739, + "epoch": 0.23, + "learning_rate": 0.000265166487023758, + "loss": 0.073, "step": 35980 }, { - "epoch": 0.39, - "learning_rate": 0.00024160880005191768, - "loss": 0.0594, + "epoch": 0.23, + "learning_rate": 0.0002651568056694011, + "loss": 0.0868, "step": 35990 }, { - "epoch": 0.39, - "learning_rate": 0.00024159257576740866, - "loss": 0.0715, + "epoch": 0.23, + "learning_rate": 0.0002651471243150442, + "loss": 0.0775, "step": 36000 }, { - "epoch": 0.39, - "eval_cer": 0.9213884486192023, - "eval_loss": 0.04401349648833275, - "eval_runtime": 119.3853, - "eval_samples_per_second": 16.752, - "eval_steps_per_second": 4.188, + "epoch": 0.23, + "eval_cer": 0.9200876737091854, + "eval_loss": 0.04887823387980461, + "eval_runtime": 120.558, + "eval_samples_per_second": 16.59, + "eval_steps_per_second": 4.147, "step": 36000 }, { - "epoch": 0.39, - "learning_rate": 0.00024157635148289958, - "loss": 0.0632, + "epoch": 0.23, + "learning_rate": 0.0002651374429606872, + "loss": 0.0742, "step": 36010 }, { - "epoch": 0.39, - "learning_rate": 0.00024156012719839053, - "loss": 0.063, + "epoch": 0.23, + "learning_rate": 0.0002651277616063303, + "loss": 0.0734, "step": 36020 }, { - "epoch": 0.39, - "learning_rate": 0.00024154390291388148, - "loss": 0.064, + "epoch": 0.23, + "learning_rate": 0.00026511808025197337, + "loss": 0.0632, "step": 36030 }, { - "epoch": 0.39, - "learning_rate": 0.00024152767862937243, - "loss": 0.0742, + "epoch": 0.23, + "learning_rate": 0.0002651083988976164, + "loss": 0.0726, "step": 36040 }, { - "epoch": 0.39, - "learning_rate": 0.00024151145434486335, - "loss": 0.0619, + "epoch": 0.23, + "learning_rate": 0.00026509871754325947, + "loss": 0.0772, "step": 36050 }, { - "epoch": 0.39, - "learning_rate": 0.00024149523006035433, - "loss": 0.0616, + "epoch": 0.23, + "learning_rate": 0.00026508903618890255, + "loss": 0.068, "step": 36060 }, { - "epoch": 0.39, - "learning_rate": 0.00024147900577584525, - "loss": 0.0732, + "epoch": 0.23, + "learning_rate": 0.00026507935483454563, + "loss": 0.0679, "step": 36070 }, { - "epoch": 0.39, - "learning_rate": 0.00024146278149133623, - "loss": 0.0619, + "epoch": 0.23, + "learning_rate": 0.0002650696734801887, + "loss": 0.0741, "step": 36080 }, { - "epoch": 0.39, - "learning_rate": 0.00024144655720682715, - "loss": 0.0638, + "epoch": 0.23, + "learning_rate": 0.0002650599921258318, + "loss": 0.0772, "step": 36090 }, { - "epoch": 0.39, - "learning_rate": 0.0002414303329223181, - "loss": 0.0623, + "epoch": 0.23, + "learning_rate": 0.00026505031077147487, + "loss": 0.0759, "step": 36100 }, { - "epoch": 0.39, - "learning_rate": 0.00024141410863780905, - "loss": 0.064, + "epoch": 0.23, + "learning_rate": 0.0002650406294171179, + "loss": 0.0621, "step": 36110 }, { - "epoch": 0.39, - "learning_rate": 0.0002413978843533, - "loss": 0.0659, + "epoch": 0.23, + "learning_rate": 0.000265030948062761, + "loss": 0.0777, "step": 36120 }, { - "epoch": 0.39, - "learning_rate": 0.00024138166006879095, - "loss": 0.0601, + "epoch": 0.23, + "learning_rate": 0.00026502126670840406, + "loss": 0.0756, "step": 36130 }, { - "epoch": 0.39, - "learning_rate": 0.0002413654357842819, - "loss": 0.0665, + "epoch": 0.23, + "learning_rate": 0.0002650115853540471, + "loss": 0.0682, "step": 36140 }, { - "epoch": 0.39, - "learning_rate": 0.00024134921149977282, - "loss": 0.0712, + "epoch": 0.23, + "learning_rate": 0.00026500190399969016, + "loss": 0.0763, "step": 36150 }, { - "epoch": 0.39, - "learning_rate": 0.0002413329872152638, - "loss": 0.0613, + "epoch": 0.23, + "learning_rate": 0.00026499222264533324, + "loss": 0.0686, "step": 36160 }, { - "epoch": 0.39, - "learning_rate": 0.00024131676293075472, - "loss": 0.059, + "epoch": 0.23, + "learning_rate": 0.0002649825412909763, + "loss": 0.0647, "step": 36170 }, { - "epoch": 0.39, - "learning_rate": 0.0002413005386462457, - "loss": 0.0641, + "epoch": 0.23, + "learning_rate": 0.00026497285993661935, + "loss": 0.0725, "step": 36180 }, { - "epoch": 0.39, - "learning_rate": 0.00024128431436173662, - "loss": 0.0625, + "epoch": 0.23, + "learning_rate": 0.0002649631785822624, + "loss": 0.0723, "step": 36190 }, { - "epoch": 0.39, - "learning_rate": 0.00024126809007722757, - "loss": 0.0622, + "epoch": 0.23, + "learning_rate": 0.0002649534972279055, + "loss": 0.0688, "step": 36200 }, { - "epoch": 0.39, - "learning_rate": 0.00024125186579271852, - "loss": 0.0683, + "epoch": 0.23, + "learning_rate": 0.0002649438158735486, + "loss": 0.0788, "step": 36210 }, { - "epoch": 0.39, - "learning_rate": 0.00024123564150820947, - "loss": 0.0627, + "epoch": 0.23, + "learning_rate": 0.00026493413451919167, + "loss": 0.0669, "step": 36220 }, { - "epoch": 0.39, - "learning_rate": 0.0002412194172237004, - "loss": 0.0614, + "epoch": 0.23, + "learning_rate": 0.00026492445316483475, + "loss": 0.0753, "step": 36230 }, { - "epoch": 0.39, - "learning_rate": 0.00024120319293919137, - "loss": 0.0585, + "epoch": 0.23, + "learning_rate": 0.0002649147718104778, + "loss": 0.0679, "step": 36240 }, { - "epoch": 0.39, - "learning_rate": 0.0002411869686546823, - "loss": 0.0675, + "epoch": 0.23, + "learning_rate": 0.00026490509045612085, + "loss": 0.0684, "step": 36250 }, { - "epoch": 0.39, - "learning_rate": 0.00024117074437017327, - "loss": 0.0625, + "epoch": 0.23, + "learning_rate": 0.00026489540910176393, + "loss": 0.0666, "step": 36260 }, { - "epoch": 0.39, - "learning_rate": 0.0002411545200856642, - "loss": 0.0648, + "epoch": 0.23, + "learning_rate": 0.000264885727747407, + "loss": 0.0681, "step": 36270 }, { - "epoch": 0.39, - "learning_rate": 0.00024113829580115514, - "loss": 0.067, + "epoch": 0.23, + "learning_rate": 0.00026487604639305004, + "loss": 0.0743, "step": 36280 }, { - "epoch": 0.39, - "learning_rate": 0.0002411220715166461, - "loss": 0.0645, + "epoch": 0.23, + "learning_rate": 0.0002648663650386931, + "loss": 0.07, "step": 36290 }, { - "epoch": 0.39, - "learning_rate": 0.00024110584723213704, - "loss": 0.06, + "epoch": 0.23, + "learning_rate": 0.0002648566836843362, + "loss": 0.0701, "step": 36300 }, { - "epoch": 0.39, - "learning_rate": 0.000241089622947628, - "loss": 0.0642, + "epoch": 0.23, + "learning_rate": 0.0002648470023299793, + "loss": 0.0695, "step": 36310 }, { - "epoch": 0.39, - "learning_rate": 0.00024107339866311894, - "loss": 0.0686, + "epoch": 0.23, + "learning_rate": 0.0002648373209756223, + "loss": 0.0727, "step": 36320 }, { - "epoch": 0.39, - "learning_rate": 0.00024105717437860987, - "loss": 0.0641, + "epoch": 0.23, + "learning_rate": 0.0002648276396212654, + "loss": 0.0774, "step": 36330 }, { - "epoch": 0.39, - "learning_rate": 0.00024104095009410084, - "loss": 0.0583, + "epoch": 0.23, + "learning_rate": 0.00026481795826690846, + "loss": 0.077, "step": 36340 }, { - "epoch": 0.39, - "learning_rate": 0.00024102472580959176, - "loss": 0.0608, + "epoch": 0.23, + "learning_rate": 0.00026480827691255154, + "loss": 0.0737, "step": 36350 }, { - "epoch": 0.39, - "learning_rate": 0.00024100850152508274, - "loss": 0.0678, + "epoch": 0.23, + "learning_rate": 0.0002647985955581946, + "loss": 0.0778, "step": 36360 }, { - "epoch": 0.39, - "learning_rate": 0.00024099227724057366, - "loss": 0.0737, + "epoch": 0.23, + "learning_rate": 0.0002647889142038377, + "loss": 0.0825, "step": 36370 }, { - "epoch": 0.39, - "learning_rate": 0.00024097605295606461, - "loss": 0.0636, + "epoch": 0.23, + "learning_rate": 0.0002647792328494807, + "loss": 0.0653, "step": 36380 }, { - "epoch": 0.39, - "learning_rate": 0.00024095982867155556, - "loss": 0.0666, + "epoch": 0.23, + "learning_rate": 0.0002647695514951238, + "loss": 0.0736, "step": 36390 }, { - "epoch": 0.39, - "learning_rate": 0.00024094360438704651, - "loss": 0.0624, + "epoch": 0.23, + "learning_rate": 0.0002647598701407669, + "loss": 0.0723, "step": 36400 }, { - "epoch": 0.39, - "learning_rate": 0.00024092738010253744, - "loss": 0.0626, + "epoch": 0.23, + "learning_rate": 0.0002647501887864099, + "loss": 0.0693, "step": 36410 }, { - "epoch": 0.39, - "learning_rate": 0.0002409111558180284, - "loss": 0.0623, + "epoch": 0.24, + "learning_rate": 0.000264740507432053, + "loss": 0.0706, "step": 36420 }, { - "epoch": 0.39, - "learning_rate": 0.00024089493153351934, - "loss": 0.0677, + "epoch": 0.24, + "learning_rate": 0.00026473082607769607, + "loss": 0.0679, "step": 36430 }, { - "epoch": 0.39, - "learning_rate": 0.0002408787072490103, - "loss": 0.0609, + "epoch": 0.24, + "learning_rate": 0.00026472114472333915, + "loss": 0.0745, "step": 36440 }, { - "epoch": 0.39, - "learning_rate": 0.00024086248296450124, - "loss": 0.0542, + "epoch": 0.24, + "learning_rate": 0.00026471146336898223, + "loss": 0.0835, "step": 36450 }, { - "epoch": 0.39, - "learning_rate": 0.0002408462586799922, - "loss": 0.0674, + "epoch": 0.24, + "learning_rate": 0.00026470178201462526, + "loss": 0.0814, "step": 36460 }, { - "epoch": 0.39, - "learning_rate": 0.00024083003439548314, - "loss": 0.0629, + "epoch": 0.24, + "learning_rate": 0.00026469210066026833, + "loss": 0.0654, "step": 36470 }, { - "epoch": 0.39, - "learning_rate": 0.00024081381011097408, - "loss": 0.0618, + "epoch": 0.24, + "learning_rate": 0.0002646824193059114, + "loss": 0.0668, "step": 36480 }, { - "epoch": 0.39, - "learning_rate": 0.00024079758582646503, - "loss": 0.0582, + "epoch": 0.24, + "learning_rate": 0.0002646727379515545, + "loss": 0.0745, "step": 36490 }, { - "epoch": 0.39, - "learning_rate": 0.00024078136154195598, - "loss": 0.0729, + "epoch": 0.24, + "learning_rate": 0.0002646630565971976, + "loss": 0.0791, "step": 36500 }, { - "epoch": 0.39, - "learning_rate": 0.0002407651372574469, - "loss": 0.0599, + "epoch": 0.24, + "learning_rate": 0.0002646533752428406, + "loss": 0.0712, "step": 36510 }, { - "epoch": 0.4, - "learning_rate": 0.00024074891297293788, - "loss": 0.0606, + "epoch": 0.24, + "learning_rate": 0.0002646436938884837, + "loss": 0.0901, "step": 36520 }, { - "epoch": 0.4, - "learning_rate": 0.0002407326886884288, - "loss": 0.0698, + "epoch": 0.24, + "learning_rate": 0.00026463401253412676, + "loss": 0.0742, "step": 36530 }, { - "epoch": 0.4, - "learning_rate": 0.00024071646440391978, - "loss": 0.0634, + "epoch": 0.24, + "learning_rate": 0.0002646243311797698, + "loss": 0.068, "step": 36540 }, { - "epoch": 0.4, - "learning_rate": 0.0002407002401194107, - "loss": 0.0578, + "epoch": 0.24, + "learning_rate": 0.00026461464982541286, + "loss": 0.0651, "step": 36550 }, { - "epoch": 0.4, - "learning_rate": 0.00024068401583490166, - "loss": 0.0672, + "epoch": 0.24, + "learning_rate": 0.00026460496847105594, + "loss": 0.0673, "step": 36560 }, { - "epoch": 0.4, - "learning_rate": 0.0002406677915503926, - "loss": 0.0603, + "epoch": 0.24, + "learning_rate": 0.000264595287116699, + "loss": 0.0717, "step": 36570 }, { - "epoch": 0.4, - "learning_rate": 0.00024065156726588356, - "loss": 0.0637, + "epoch": 0.24, + "learning_rate": 0.0002645856057623421, + "loss": 0.0666, "step": 36580 }, { - "epoch": 0.4, - "learning_rate": 0.00024063534298137448, - "loss": 0.0607, + "epoch": 0.24, + "learning_rate": 0.0002645759244079852, + "loss": 0.0729, "step": 36590 }, { - "epoch": 0.4, - "learning_rate": 0.00024061911869686545, - "loss": 0.0744, + "epoch": 0.24, + "learning_rate": 0.0002645662430536282, + "loss": 0.0708, "step": 36600 }, { - "epoch": 0.4, - "learning_rate": 0.00024060289441235638, - "loss": 0.0586, + "epoch": 0.24, + "learning_rate": 0.0002645565616992713, + "loss": 0.0678, "step": 36610 }, { - "epoch": 0.4, - "learning_rate": 0.00024058667012784735, - "loss": 0.0649, + "epoch": 0.24, + "learning_rate": 0.00026454688034491437, + "loss": 0.0795, "step": 36620 }, { - "epoch": 0.4, - "learning_rate": 0.00024057044584333828, - "loss": 0.0652, + "epoch": 0.24, + "learning_rate": 0.00026453719899055745, + "loss": 0.0684, "step": 36630 }, { - "epoch": 0.4, - "learning_rate": 0.00024055422155882925, - "loss": 0.0606, + "epoch": 0.24, + "learning_rate": 0.00026452751763620053, + "loss": 0.0773, "step": 36640 }, { - "epoch": 0.4, - "learning_rate": 0.00024053799727432018, - "loss": 0.061, + "epoch": 0.24, + "learning_rate": 0.00026451783628184355, + "loss": 0.0719, "step": 36650 }, { - "epoch": 0.4, - "learning_rate": 0.00024052177298981113, - "loss": 0.0599, + "epoch": 0.24, + "learning_rate": 0.00026450815492748663, + "loss": 0.082, "step": 36660 }, { - "epoch": 0.4, - "learning_rate": 0.00024050554870530208, - "loss": 0.0622, + "epoch": 0.24, + "learning_rate": 0.0002644984735731297, + "loss": 0.0634, "step": 36670 }, { - "epoch": 0.4, - "learning_rate": 0.00024048932442079303, - "loss": 0.0699, + "epoch": 0.24, + "learning_rate": 0.00026448879221877274, + "loss": 0.0754, "step": 36680 }, { - "epoch": 0.4, - "learning_rate": 0.00024047310013628395, - "loss": 0.0684, + "epoch": 0.24, + "learning_rate": 0.0002644791108644158, + "loss": 0.0702, "step": 36690 }, { - "epoch": 0.4, - "learning_rate": 0.00024045687585177493, - "loss": 0.0668, + "epoch": 0.24, + "learning_rate": 0.0002644694295100589, + "loss": 0.0684, "step": 36700 }, { - "epoch": 0.4, - "learning_rate": 0.00024044065156726585, - "loss": 0.0622, + "epoch": 0.24, + "learning_rate": 0.000264459748155702, + "loss": 0.0747, "step": 36710 }, { - "epoch": 0.4, - "learning_rate": 0.00024042442728275683, - "loss": 0.0668, + "epoch": 0.24, + "learning_rate": 0.00026445006680134506, + "loss": 0.0688, "step": 36720 }, { - "epoch": 0.4, - "learning_rate": 0.00024040820299824775, - "loss": 0.0672, + "epoch": 0.24, + "learning_rate": 0.00026444038544698814, + "loss": 0.0722, "step": 36730 }, { - "epoch": 0.4, - "learning_rate": 0.0002403919787137387, - "loss": 0.0691, + "epoch": 0.24, + "learning_rate": 0.00026443070409263116, + "loss": 0.0848, "step": 36740 }, { - "epoch": 0.4, - "learning_rate": 0.00024037575442922965, - "loss": 0.0788, + "epoch": 0.24, + "learning_rate": 0.00026442102273827424, + "loss": 0.0661, "step": 36750 }, { - "epoch": 0.4, - "learning_rate": 0.0002403595301447206, - "loss": 0.0772, + "epoch": 0.24, + "learning_rate": 0.0002644113413839173, + "loss": 0.0774, "step": 36760 }, { - "epoch": 0.4, - "learning_rate": 0.00024034330586021152, - "loss": 0.0601, + "epoch": 0.24, + "learning_rate": 0.0002644016600295604, + "loss": 0.0703, "step": 36770 }, { - "epoch": 0.4, - "learning_rate": 0.0002403270815757025, - "loss": 0.0638, + "epoch": 0.24, + "learning_rate": 0.00026439197867520343, + "loss": 0.0707, "step": 36780 }, { - "epoch": 0.4, - "learning_rate": 0.00024031085729119342, - "loss": 0.0567, + "epoch": 0.24, + "learning_rate": 0.0002643822973208465, + "loss": 0.07, "step": 36790 }, { - "epoch": 0.4, - "learning_rate": 0.0002402946330066844, - "loss": 0.0653, + "epoch": 0.24, + "learning_rate": 0.0002643726159664896, + "loss": 0.0724, "step": 36800 }, { - "epoch": 0.4, - "learning_rate": 0.00024027840872217532, - "loss": 0.0662, + "epoch": 0.24, + "learning_rate": 0.0002643629346121326, + "loss": 0.0811, "step": 36810 }, { - "epoch": 0.4, - "learning_rate": 0.0002402621844376663, - "loss": 0.0614, + "epoch": 0.24, + "learning_rate": 0.0002643532532577757, + "loss": 0.0744, "step": 36820 }, { - "epoch": 0.4, - "learning_rate": 0.00024024596015315722, - "loss": 0.0634, + "epoch": 0.24, + "learning_rate": 0.0002643435719034188, + "loss": 0.0711, "step": 36830 }, { - "epoch": 0.4, - "learning_rate": 0.00024022973586864817, - "loss": 0.0595, + "epoch": 0.24, + "learning_rate": 0.00026433389054906185, + "loss": 0.0675, "step": 36840 }, { - "epoch": 0.4, - "learning_rate": 0.00024021351158413912, - "loss": 0.0633, + "epoch": 0.24, + "learning_rate": 0.00026432420919470493, + "loss": 0.0692, "step": 36850 }, { - "epoch": 0.4, - "learning_rate": 0.00024019728729963007, - "loss": 0.068, + "epoch": 0.24, + "learning_rate": 0.000264314527840348, + "loss": 0.0755, "step": 36860 }, { - "epoch": 0.4, - "learning_rate": 0.000240181063015121, - "loss": 0.0731, + "epoch": 0.24, + "learning_rate": 0.0002643048464859911, + "loss": 0.0667, "step": 36870 }, { - "epoch": 0.4, - "learning_rate": 0.00024016483873061197, - "loss": 0.06, + "epoch": 0.24, + "learning_rate": 0.0002642951651316341, + "loss": 0.0677, "step": 36880 }, { - "epoch": 0.4, - "learning_rate": 0.0002401486144461029, - "loss": 0.0672, + "epoch": 0.24, + "learning_rate": 0.0002642854837772772, + "loss": 0.0728, "step": 36890 }, { - "epoch": 0.4, - "learning_rate": 0.00024013239016159387, - "loss": 0.0667, + "epoch": 0.24, + "learning_rate": 0.0002642758024229203, + "loss": 0.0687, "step": 36900 }, { - "epoch": 0.4, - "learning_rate": 0.0002401161658770848, - "loss": 0.062, + "epoch": 0.24, + "learning_rate": 0.0002642661210685633, + "loss": 0.0644, "step": 36910 }, { - "epoch": 0.4, - "learning_rate": 0.00024009994159257574, - "loss": 0.0681, + "epoch": 0.24, + "learning_rate": 0.0002642564397142064, + "loss": 0.0709, "step": 36920 }, { - "epoch": 0.4, - "learning_rate": 0.0002400837173080667, - "loss": 0.0623, + "epoch": 0.24, + "learning_rate": 0.00026424675835984946, + "loss": 0.0785, "step": 36930 }, { - "epoch": 0.4, - "learning_rate": 0.00024006749302355764, - "loss": 0.0613, + "epoch": 0.24, + "learning_rate": 0.00026423707700549254, + "loss": 0.0673, "step": 36940 }, { - "epoch": 0.4, - "learning_rate": 0.00024005126873904856, - "loss": 0.0605, + "epoch": 0.24, + "learning_rate": 0.00026422739565113557, + "loss": 0.0752, "step": 36950 }, { - "epoch": 0.4, - "learning_rate": 0.00024003504445453954, - "loss": 0.059, + "epoch": 0.24, + "learning_rate": 0.00026421771429677865, + "loss": 0.0741, "step": 36960 }, { - "epoch": 0.4, - "learning_rate": 0.00024001882017003046, - "loss": 0.0631, + "epoch": 0.24, + "learning_rate": 0.00026420803294242173, + "loss": 0.0701, "step": 36970 }, { - "epoch": 0.4, - "learning_rate": 0.00024000259588552144, - "loss": 0.0675, + "epoch": 0.24, + "learning_rate": 0.0002641983515880648, + "loss": 0.079, "step": 36980 }, { - "epoch": 0.4, - "learning_rate": 0.00023998637160101236, - "loss": 0.0718, + "epoch": 0.24, + "learning_rate": 0.0002641886702337079, + "loss": 0.066, "step": 36990 }, { - "epoch": 0.4, - "learning_rate": 0.00023997014731650334, - "loss": 0.0596, + "epoch": 0.24, + "learning_rate": 0.00026417898887935097, + "loss": 0.0772, "step": 37000 }, { - "epoch": 0.4, - "eval_cer": 0.9213601771209367, - "eval_loss": 0.044058144092559814, - "eval_runtime": 119.5428, - "eval_samples_per_second": 16.73, - "eval_steps_per_second": 4.183, + "epoch": 0.24, + "eval_cer": 0.9201798666817309, + "eval_loss": 0.048399925231933594, + "eval_runtime": 120.3324, + "eval_samples_per_second": 16.621, + "eval_steps_per_second": 4.155, "step": 37000 }, { - "epoch": 0.4, - "learning_rate": 0.00023995392303199426, - "loss": 0.061, + "epoch": 0.24, + "learning_rate": 0.00026416930752499405, + "loss": 0.0766, "step": 37010 }, { - "epoch": 0.4, - "learning_rate": 0.0002399376987474852, - "loss": 0.0701, + "epoch": 0.24, + "learning_rate": 0.00026415962617063707, + "loss": 0.0687, "step": 37020 }, { - "epoch": 0.4, - "learning_rate": 0.00023992147446297616, - "loss": 0.0673, + "epoch": 0.24, + "learning_rate": 0.00026414994481628015, + "loss": 0.0706, "step": 37030 }, { - "epoch": 0.4, - "learning_rate": 0.0002399052501784671, - "loss": 0.0661, + "epoch": 0.24, + "learning_rate": 0.00026414026346192323, + "loss": 0.0752, "step": 37040 }, { - "epoch": 0.4, - "learning_rate": 0.00023988902589395803, - "loss": 0.0634, + "epoch": 0.24, + "learning_rate": 0.00026413058210756626, + "loss": 0.0734, "step": 37050 }, { - "epoch": 0.4, - "learning_rate": 0.000239872801609449, - "loss": 0.0618, + "epoch": 0.24, + "learning_rate": 0.00026412090075320934, + "loss": 0.0706, "step": 37060 }, { - "epoch": 0.4, - "learning_rate": 0.00023985657732493993, - "loss": 0.069, + "epoch": 0.24, + "learning_rate": 0.0002641112193988524, + "loss": 0.0699, "step": 37070 }, { - "epoch": 0.4, - "learning_rate": 0.0002398403530404309, - "loss": 0.0657, + "epoch": 0.24, + "learning_rate": 0.0002641015380444955, + "loss": 0.0717, "step": 37080 }, { - "epoch": 0.4, - "learning_rate": 0.00023982412875592183, - "loss": 0.0649, + "epoch": 0.24, + "learning_rate": 0.0002640918566901385, + "loss": 0.0647, "step": 37090 }, { - "epoch": 0.4, - "learning_rate": 0.00023980790447141278, - "loss": 0.0691, + "epoch": 0.24, + "learning_rate": 0.0002640821753357816, + "loss": 0.0688, "step": 37100 }, { - "epoch": 0.4, - "learning_rate": 0.00023979168018690373, - "loss": 0.065, + "epoch": 0.24, + "learning_rate": 0.0002640724939814247, + "loss": 0.0697, "step": 37110 }, { - "epoch": 0.4, - "learning_rate": 0.00023977545590239468, - "loss": 0.0593, + "epoch": 0.24, + "learning_rate": 0.00026406281262706776, + "loss": 0.0694, "step": 37120 }, { - "epoch": 0.4, - "learning_rate": 0.0002397592316178856, - "loss": 0.0623, + "epoch": 0.24, + "learning_rate": 0.00026405313127271084, + "loss": 0.0697, "step": 37130 }, { - "epoch": 0.4, - "learning_rate": 0.00023974300733337658, - "loss": 0.0619, + "epoch": 0.24, + "learning_rate": 0.0002640434499183539, + "loss": 0.0662, "step": 37140 }, { - "epoch": 0.4, - "learning_rate": 0.0002397267830488675, - "loss": 0.0648, + "epoch": 0.24, + "learning_rate": 0.00026403376856399695, + "loss": 0.0706, "step": 37150 }, { - "epoch": 0.4, - "learning_rate": 0.00023971055876435848, - "loss": 0.0721, + "epoch": 0.24, + "learning_rate": 0.00026402408720964003, + "loss": 0.0747, "step": 37160 }, { - "epoch": 0.4, - "learning_rate": 0.0002396943344798494, - "loss": 0.0707, + "epoch": 0.24, + "learning_rate": 0.0002640144058552831, + "loss": 0.0671, "step": 37170 }, { - "epoch": 0.4, - "learning_rate": 0.00023967811019534038, - "loss": 0.0601, + "epoch": 0.24, + "learning_rate": 0.00026400472450092613, + "loss": 0.0713, "step": 37180 }, { - "epoch": 0.4, - "learning_rate": 0.0002396618859108313, - "loss": 0.0744, + "epoch": 0.24, + "learning_rate": 0.0002639950431465692, + "loss": 0.0694, "step": 37190 }, { - "epoch": 0.4, - "learning_rate": 0.00023964566162632225, - "loss": 0.0658, + "epoch": 0.24, + "learning_rate": 0.0002639853617922123, + "loss": 0.0686, "step": 37200 }, { - "epoch": 0.4, - "learning_rate": 0.0002396294373418132, - "loss": 0.0674, + "epoch": 0.24, + "learning_rate": 0.00026397568043785537, + "loss": 0.0707, "step": 37210 }, { - "epoch": 0.4, - "learning_rate": 0.00023961321305730415, - "loss": 0.0661, + "epoch": 0.24, + "learning_rate": 0.00026396599908349845, + "loss": 0.0758, "step": 37220 }, { - "epoch": 0.4, - "learning_rate": 0.00023959698877279507, - "loss": 0.0629, + "epoch": 0.24, + "learning_rate": 0.0002639563177291415, + "loss": 0.073, "step": 37230 }, { - "epoch": 0.4, - "learning_rate": 0.00023958076448828605, - "loss": 0.0627, + "epoch": 0.24, + "learning_rate": 0.00026394663637478456, + "loss": 0.0752, "step": 37240 }, { - "epoch": 0.4, - "learning_rate": 0.00023956454020377697, - "loss": 0.0639, + "epoch": 0.24, + "learning_rate": 0.00026393695502042764, + "loss": 0.0666, "step": 37250 }, { - "epoch": 0.4, - "learning_rate": 0.00023954831591926795, - "loss": 0.0617, + "epoch": 0.24, + "learning_rate": 0.0002639272736660707, + "loss": 0.0708, "step": 37260 }, { - "epoch": 0.4, - "learning_rate": 0.00023953209163475887, - "loss": 0.0644, + "epoch": 0.24, + "learning_rate": 0.0002639175923117138, + "loss": 0.0731, "step": 37270 }, { - "epoch": 0.4, - "learning_rate": 0.00023951586735024982, - "loss": 0.062, + "epoch": 0.24, + "learning_rate": 0.0002639079109573569, + "loss": 0.0709, "step": 37280 }, { - "epoch": 0.4, - "learning_rate": 0.00023949964306574077, - "loss": 0.0616, + "epoch": 0.24, + "learning_rate": 0.0002638982296029999, + "loss": 0.0761, "step": 37290 }, { - "epoch": 0.4, - "learning_rate": 0.00023948341878123172, - "loss": 0.0558, + "epoch": 0.24, + "learning_rate": 0.000263888548248643, + "loss": 0.0681, "step": 37300 }, { - "epoch": 0.4, - "learning_rate": 0.00023946719449672267, - "loss": 0.0625, + "epoch": 0.24, + "learning_rate": 0.000263878866894286, + "loss": 0.0821, "step": 37310 }, { - "epoch": 0.4, - "learning_rate": 0.00023945097021221362, - "loss": 0.0591, + "epoch": 0.24, + "learning_rate": 0.0002638691855399291, + "loss": 0.0698, "step": 37320 }, { - "epoch": 0.4, - "learning_rate": 0.00023943474592770454, - "loss": 0.0701, + "epoch": 0.24, + "learning_rate": 0.00026385950418557217, + "loss": 0.0639, "step": 37330 }, { - "epoch": 0.4, - "learning_rate": 0.00023941852164319552, - "loss": 0.0709, + "epoch": 0.24, + "learning_rate": 0.00026384982283121525, + "loss": 0.0718, "step": 37340 }, { - "epoch": 0.4, - "learning_rate": 0.00023940229735868644, - "loss": 0.0561, + "epoch": 0.24, + "learning_rate": 0.0002638401414768583, + "loss": 0.0776, "step": 37350 }, { - "epoch": 0.4, - "learning_rate": 0.00023938607307417742, - "loss": 0.0572, + "epoch": 0.24, + "learning_rate": 0.0002638304601225014, + "loss": 0.0827, "step": 37360 }, { - "epoch": 0.4, - "learning_rate": 0.00023936984878966834, - "loss": 0.06, + "epoch": 0.24, + "learning_rate": 0.00026382077876814443, + "loss": 0.0733, "step": 37370 }, { - "epoch": 0.4, - "learning_rate": 0.0002393536245051593, - "loss": 0.0688, + "epoch": 0.24, + "learning_rate": 0.0002638110974137875, + "loss": 0.0692, "step": 37380 }, { - "epoch": 0.4, - "learning_rate": 0.00023933740022065024, - "loss": 0.0641, + "epoch": 0.24, + "learning_rate": 0.0002638014160594306, + "loss": 0.0715, "step": 37390 }, { - "epoch": 0.4, - "learning_rate": 0.0002393211759361412, - "loss": 0.0628, + "epoch": 0.24, + "learning_rate": 0.00026379173470507367, + "loss": 0.0754, "step": 37400 }, { - "epoch": 0.4, - "learning_rate": 0.00023930495165163212, + "epoch": 0.24, + "learning_rate": 0.00026378205335071675, "loss": 0.0769, "step": 37410 }, { - "epoch": 0.4, - "learning_rate": 0.0002392887273671231, - "loss": 0.0669, + "epoch": 0.24, + "learning_rate": 0.0002637723719963598, + "loss": 0.0676, "step": 37420 }, { - "epoch": 0.4, - "learning_rate": 0.00023927250308261401, - "loss": 0.0598, + "epoch": 0.24, + "learning_rate": 0.00026376269064200286, + "loss": 0.0683, "step": 37430 }, { - "epoch": 0.4, - "learning_rate": 0.000239256278798105, - "loss": 0.0586, + "epoch": 0.24, + "learning_rate": 0.00026375300928764594, + "loss": 0.0628, "step": 37440 }, { - "epoch": 0.41, - "learning_rate": 0.00023924005451359591, - "loss": 0.0589, + "epoch": 0.24, + "learning_rate": 0.00026374332793328896, + "loss": 0.0672, "step": 37450 }, { - "epoch": 0.41, - "learning_rate": 0.00023922383022908686, - "loss": 0.0662, + "epoch": 0.24, + "learning_rate": 0.00026373364657893204, + "loss": 0.0678, "step": 37460 }, { - "epoch": 0.41, - "learning_rate": 0.00023920760594457781, - "loss": 0.0689, + "epoch": 0.24, + "learning_rate": 0.0002637239652245751, + "loss": 0.0676, "step": 37470 }, { - "epoch": 0.41, - "learning_rate": 0.00023919138166006876, - "loss": 0.0585, + "epoch": 0.24, + "learning_rate": 0.0002637142838702182, + "loss": 0.0809, "step": 37480 }, { - "epoch": 0.41, - "learning_rate": 0.0002391751573755597, - "loss": 0.0605, + "epoch": 0.24, + "learning_rate": 0.0002637046025158613, + "loss": 0.0708, "step": 37490 }, { - "epoch": 0.41, - "learning_rate": 0.00023915893309105066, - "loss": 0.0588, + "epoch": 0.24, + "learning_rate": 0.00026369492116150436, + "loss": 0.0773, "step": 37500 }, { - "epoch": 0.41, - "learning_rate": 0.00023914270880654159, - "loss": 0.0696, + "epoch": 0.24, + "learning_rate": 0.0002636852398071474, + "loss": 0.0691, "step": 37510 }, { - "epoch": 0.41, - "learning_rate": 0.00023912648452203256, - "loss": 0.0616, + "epoch": 0.24, + "learning_rate": 0.00026367555845279047, + "loss": 0.0788, "step": 37520 }, { - "epoch": 0.41, - "learning_rate": 0.00023911026023752349, - "loss": 0.0717, + "epoch": 0.24, + "learning_rate": 0.00026366587709843355, + "loss": 0.0674, "step": 37530 }, { - "epoch": 0.41, - "learning_rate": 0.00023909403595301446, - "loss": 0.0577, + "epoch": 0.24, + "learning_rate": 0.0002636561957440766, + "loss": 0.0729, "step": 37540 }, { - "epoch": 0.41, - "learning_rate": 0.0002390778116685054, - "loss": 0.0567, + "epoch": 0.24, + "learning_rate": 0.00026364651438971965, + "loss": 0.0685, "step": 37550 }, { - "epoch": 0.41, - "learning_rate": 0.00023906158738399633, - "loss": 0.0608, + "epoch": 0.24, + "learning_rate": 0.00026363683303536273, + "loss": 0.0739, "step": 37560 }, { - "epoch": 0.41, - "learning_rate": 0.0002390453630994873, - "loss": 0.0701, + "epoch": 0.24, + "learning_rate": 0.0002636271516810058, + "loss": 0.0667, "step": 37570 }, { - "epoch": 0.41, - "learning_rate": 0.00023902913881497823, - "loss": 0.0603, + "epoch": 0.24, + "learning_rate": 0.00026361747032664884, + "loss": 0.0703, "step": 37580 }, { - "epoch": 0.41, - "learning_rate": 0.0002390129145304692, - "loss": 0.0708, + "epoch": 0.24, + "learning_rate": 0.0002636077889722919, + "loss": 0.0676, "step": 37590 }, { - "epoch": 0.41, - "learning_rate": 0.00023899669024596013, - "loss": 0.065, + "epoch": 0.24, + "learning_rate": 0.000263598107617935, + "loss": 0.0718, "step": 37600 }, { - "epoch": 0.41, - "learning_rate": 0.00023898046596145108, - "loss": 0.0585, + "epoch": 0.24, + "learning_rate": 0.0002635884262635781, + "loss": 0.0699, "step": 37610 }, { - "epoch": 0.41, - "learning_rate": 0.00023896424167694203, - "loss": 0.0582, + "epoch": 0.24, + "learning_rate": 0.00026357874490922116, + "loss": 0.0724, "step": 37620 }, { - "epoch": 0.41, - "learning_rate": 0.00023894801739243298, - "loss": 0.0554, + "epoch": 0.24, + "learning_rate": 0.00026356906355486424, + "loss": 0.0615, "step": 37630 }, { - "epoch": 0.41, - "learning_rate": 0.0002389317931079239, - "loss": 0.0533, + "epoch": 0.24, + "learning_rate": 0.0002635593822005073, + "loss": 0.0718, "step": 37640 }, { - "epoch": 0.41, - "learning_rate": 0.00023891556882341488, - "loss": 0.0698, + "epoch": 0.24, + "learning_rate": 0.00026354970084615034, + "loss": 0.0736, "step": 37650 }, { - "epoch": 0.41, - "learning_rate": 0.0002388993445389058, - "loss": 0.0591, + "epoch": 0.24, + "learning_rate": 0.0002635400194917934, + "loss": 0.0695, "step": 37660 }, { - "epoch": 0.41, - "learning_rate": 0.00023888312025439678, - "loss": 0.0644, + "epoch": 0.24, + "learning_rate": 0.0002635303381374365, + "loss": 0.0691, "step": 37670 }, { - "epoch": 0.41, - "learning_rate": 0.0002388668959698877, - "loss": 0.0663, + "epoch": 0.24, + "learning_rate": 0.0002635206567830796, + "loss": 0.0686, "step": 37680 }, { - "epoch": 0.41, - "learning_rate": 0.00023885067168537868, - "loss": 0.071, + "epoch": 0.24, + "learning_rate": 0.0002635109754287226, + "loss": 0.0676, "step": 37690 }, { - "epoch": 0.41, - "learning_rate": 0.0002388344474008696, - "loss": 0.059, + "epoch": 0.24, + "learning_rate": 0.0002635012940743657, + "loss": 0.068, "step": 37700 }, { - "epoch": 0.41, - "learning_rate": 0.00023881822311636055, - "loss": 0.0622, + "epoch": 0.24, + "learning_rate": 0.00026349161272000877, + "loss": 0.0707, "step": 37710 }, { - "epoch": 0.41, - "learning_rate": 0.0002388019988318515, - "loss": 0.0626, + "epoch": 0.24, + "learning_rate": 0.0002634819313656518, + "loss": 0.0675, "step": 37720 }, { - "epoch": 0.41, - "learning_rate": 0.00023878577454734245, - "loss": 0.0591, + "epoch": 0.24, + "learning_rate": 0.00026347225001129487, + "loss": 0.0699, "step": 37730 }, { - "epoch": 0.41, - "learning_rate": 0.00023876955026283338, - "loss": 0.0668, + "epoch": 0.24, + "learning_rate": 0.00026346256865693795, + "loss": 0.078, "step": 37740 }, { - "epoch": 0.41, - "learning_rate": 0.00023875332597832435, - "loss": 0.0617, + "epoch": 0.24, + "learning_rate": 0.00026345288730258103, + "loss": 0.0687, "step": 37750 }, { - "epoch": 0.41, - "learning_rate": 0.00023873710169381528, - "loss": 0.0611, + "epoch": 0.24, + "learning_rate": 0.0002634432059482241, + "loss": 0.072, "step": 37760 }, { - "epoch": 0.41, - "learning_rate": 0.00023872087740930625, - "loss": 0.0682, + "epoch": 0.24, + "learning_rate": 0.0002634335245938672, + "loss": 0.076, "step": 37770 }, { - "epoch": 0.41, - "learning_rate": 0.00023870465312479718, - "loss": 0.0604, + "epoch": 0.24, + "learning_rate": 0.00026342384323951027, + "loss": 0.084, "step": 37780 }, { - "epoch": 0.41, - "learning_rate": 0.00023868842884028813, - "loss": 0.068, + "epoch": 0.24, + "learning_rate": 0.0002634141618851533, + "loss": 0.0754, "step": 37790 }, { - "epoch": 0.41, - "learning_rate": 0.00023867220455577908, - "loss": 0.0635, + "epoch": 0.24, + "learning_rate": 0.0002634044805307964, + "loss": 0.0702, "step": 37800 }, { - "epoch": 0.41, - "learning_rate": 0.00023865598027127002, - "loss": 0.0544, + "epoch": 0.24, + "learning_rate": 0.00026339479917643945, + "loss": 0.0712, "step": 37810 }, { - "epoch": 0.41, - "learning_rate": 0.00023863975598676095, - "loss": 0.0717, + "epoch": 0.24, + "learning_rate": 0.0002633851178220825, + "loss": 0.0796, "step": 37820 }, { - "epoch": 0.41, - "learning_rate": 0.00023862353170225192, - "loss": 0.0615, + "epoch": 0.24, + "learning_rate": 0.00026337543646772556, + "loss": 0.0722, "step": 37830 }, { - "epoch": 0.41, - "learning_rate": 0.00023860730741774285, - "loss": 0.0715, + "epoch": 0.24, + "learning_rate": 0.00026336575511336864, + "loss": 0.0721, "step": 37840 }, { - "epoch": 0.41, - "learning_rate": 0.00023859108313323382, - "loss": 0.0684, + "epoch": 0.24, + "learning_rate": 0.0002633560737590117, + "loss": 0.0752, "step": 37850 }, { - "epoch": 0.41, - "learning_rate": 0.00023857485884872475, - "loss": 0.0599, + "epoch": 0.24, + "learning_rate": 0.00026334639240465475, + "loss": 0.0761, "step": 37860 }, { - "epoch": 0.41, - "learning_rate": 0.00023855863456421572, - "loss": 0.0621, + "epoch": 0.24, + "learning_rate": 0.0002633367110502978, + "loss": 0.0692, "step": 37870 }, { - "epoch": 0.41, - "learning_rate": 0.00023854241027970665, - "loss": 0.0663, + "epoch": 0.24, + "learning_rate": 0.0002633270296959409, + "loss": 0.076, "step": 37880 }, { - "epoch": 0.41, - "learning_rate": 0.0002385261859951976, - "loss": 0.0618, + "epoch": 0.24, + "learning_rate": 0.000263317348341584, + "loss": 0.0737, "step": 37890 }, { - "epoch": 0.41, - "learning_rate": 0.00023850996171068855, - "loss": 0.0649, + "epoch": 0.24, + "learning_rate": 0.00026330766698722706, + "loss": 0.0772, "step": 37900 }, { - "epoch": 0.41, - "learning_rate": 0.0002384937374261795, - "loss": 0.0658, + "epoch": 0.24, + "learning_rate": 0.00026329798563287014, + "loss": 0.0726, "step": 37910 }, { - "epoch": 0.41, - "learning_rate": 0.00023847751314167042, - "loss": 0.0657, + "epoch": 0.24, + "learning_rate": 0.00026328830427851317, + "loss": 0.0741, "step": 37920 }, { - "epoch": 0.41, - "learning_rate": 0.0002384612888571614, - "loss": 0.0615, + "epoch": 0.24, + "learning_rate": 0.00026327862292415625, + "loss": 0.0724, "step": 37930 }, { - "epoch": 0.41, - "learning_rate": 0.00023844506457265232, - "loss": 0.0619, + "epoch": 0.24, + "learning_rate": 0.00026326894156979933, + "loss": 0.0675, "step": 37940 }, { - "epoch": 0.41, - "learning_rate": 0.0002384288402881433, - "loss": 0.0606, + "epoch": 0.24, + "learning_rate": 0.00026325926021544236, + "loss": 0.0645, "step": 37950 }, { - "epoch": 0.41, - "learning_rate": 0.00023841261600363422, - "loss": 0.0681, + "epoch": 0.25, + "learning_rate": 0.00026324957886108543, + "loss": 0.0759, "step": 37960 }, { - "epoch": 0.41, - "learning_rate": 0.00023839639171912517, - "loss": 0.0639, + "epoch": 0.25, + "learning_rate": 0.0002632398975067285, + "loss": 0.0757, "step": 37970 }, { - "epoch": 0.41, - "learning_rate": 0.00023838016743461612, - "loss": 0.0632, + "epoch": 0.25, + "learning_rate": 0.0002632302161523716, + "loss": 0.0709, "step": 37980 }, { - "epoch": 0.41, - "learning_rate": 0.00023836394315010707, - "loss": 0.0581, + "epoch": 0.25, + "learning_rate": 0.0002632205347980146, + "loss": 0.0755, "step": 37990 }, { - "epoch": 0.41, - "learning_rate": 0.00023834771886559802, - "loss": 0.0534, + "epoch": 0.25, + "learning_rate": 0.0002632108534436577, + "loss": 0.073, "step": 38000 }, { - "epoch": 0.41, - "eval_cer": 0.9213425074345205, - "eval_loss": 0.043030429631471634, - "eval_runtime": 119.4335, - "eval_samples_per_second": 16.746, - "eval_steps_per_second": 4.186, + "epoch": 0.25, + "eval_cer": 0.9201852897977629, + "eval_loss": 0.04867184907197952, + "eval_runtime": 120.3167, + "eval_samples_per_second": 16.623, + "eval_steps_per_second": 4.156, "step": 38000 }, { - "epoch": 0.41, - "learning_rate": 0.00023833149458108897, - "loss": 0.0569, + "epoch": 0.25, + "learning_rate": 0.0002632011720893008, + "loss": 0.0725, "step": 38010 }, { - "epoch": 0.41, - "learning_rate": 0.0002383152702965799, - "loss": 0.0576, + "epoch": 0.25, + "learning_rate": 0.00026319149073494386, + "loss": 0.0761, "step": 38020 }, { - "epoch": 0.41, - "learning_rate": 0.00023829904601207087, - "loss": 0.0664, + "epoch": 0.25, + "learning_rate": 0.00026318180938058694, + "loss": 0.0714, "step": 38030 }, { - "epoch": 0.41, - "learning_rate": 0.0002382828217275618, - "loss": 0.0648, + "epoch": 0.25, + "learning_rate": 0.00026317212802623, + "loss": 0.067, "step": 38040 }, { - "epoch": 0.41, - "learning_rate": 0.00023826659744305277, - "loss": 0.0601, + "epoch": 0.25, + "learning_rate": 0.0002631624466718731, + "loss": 0.072, "step": 38050 }, { - "epoch": 0.41, - "learning_rate": 0.0002382503731585437, - "loss": 0.0602, + "epoch": 0.25, + "learning_rate": 0.0002631527653175161, + "loss": 0.0667, "step": 38060 }, { - "epoch": 0.41, - "learning_rate": 0.00023823414887403464, - "loss": 0.0636, + "epoch": 0.25, + "learning_rate": 0.0002631430839631592, + "loss": 0.0668, "step": 38070 }, { - "epoch": 0.41, - "learning_rate": 0.0002382179245895256, - "loss": 0.0592, + "epoch": 0.25, + "learning_rate": 0.0002631334026088023, + "loss": 0.0633, "step": 38080 }, { - "epoch": 0.41, - "learning_rate": 0.00023820170030501654, - "loss": 0.0612, + "epoch": 0.25, + "learning_rate": 0.0002631237212544453, + "loss": 0.0704, "step": 38090 }, { - "epoch": 0.41, - "learning_rate": 0.00023818547602050746, - "loss": 0.0585, + "epoch": 0.25, + "learning_rate": 0.0002631140399000884, + "loss": 0.0718, "step": 38100 }, { - "epoch": 0.41, - "learning_rate": 0.00023816925173599844, - "loss": 0.0621, + "epoch": 0.25, + "learning_rate": 0.00026310435854573147, + "loss": 0.0672, "step": 38110 }, { - "epoch": 0.41, - "learning_rate": 0.00023815302745148936, - "loss": 0.0598, + "epoch": 0.25, + "learning_rate": 0.00026309467719137455, + "loss": 0.0715, "step": 38120 }, { - "epoch": 0.41, - "learning_rate": 0.00023813680316698034, - "loss": 0.0643, + "epoch": 0.25, + "learning_rate": 0.0002630849958370176, + "loss": 0.0651, "step": 38130 }, { - "epoch": 0.41, - "learning_rate": 0.00023812057888247126, - "loss": 0.0639, + "epoch": 0.25, + "learning_rate": 0.00026307531448266065, + "loss": 0.0653, "step": 38140 }, { - "epoch": 0.41, - "learning_rate": 0.0002381043545979622, - "loss": 0.0651, + "epoch": 0.25, + "learning_rate": 0.00026306563312830373, + "loss": 0.0691, "step": 38150 }, { - "epoch": 0.41, - "learning_rate": 0.00023808813031345316, - "loss": 0.0712, + "epoch": 0.25, + "learning_rate": 0.0002630559517739468, + "loss": 0.0655, "step": 38160 }, { - "epoch": 0.41, - "learning_rate": 0.0002380719060289441, - "loss": 0.063, + "epoch": 0.25, + "learning_rate": 0.0002630462704195899, + "loss": 0.0773, "step": 38170 }, { - "epoch": 0.41, - "learning_rate": 0.00023805568174443506, - "loss": 0.0596, + "epoch": 0.25, + "learning_rate": 0.000263036589065233, + "loss": 0.0783, "step": 38180 }, { - "epoch": 0.41, - "learning_rate": 0.000238039457459926, - "loss": 0.0631, + "epoch": 0.25, + "learning_rate": 0.000263026907710876, + "loss": 0.0717, "step": 38190 }, { - "epoch": 0.41, - "learning_rate": 0.00023802323317541693, - "loss": 0.0607, + "epoch": 0.25, + "learning_rate": 0.0002630172263565191, + "loss": 0.0715, "step": 38200 }, { - "epoch": 0.41, - "learning_rate": 0.0002380070088909079, - "loss": 0.0734, + "epoch": 0.25, + "learning_rate": 0.00026300754500216216, + "loss": 0.0805, "step": 38210 }, { - "epoch": 0.41, - "learning_rate": 0.00023799078460639883, - "loss": 0.0628, + "epoch": 0.25, + "learning_rate": 0.0002629978636478052, + "loss": 0.0672, "step": 38220 }, { - "epoch": 0.41, - "learning_rate": 0.0002379745603218898, - "loss": 0.0639, + "epoch": 0.25, + "learning_rate": 0.00026298818229344826, + "loss": 0.0806, "step": 38230 }, { - "epoch": 0.41, - "learning_rate": 0.00023795833603738073, - "loss": 0.068, + "epoch": 0.25, + "learning_rate": 0.00026297850093909134, + "loss": 0.0668, "step": 38240 }, { - "epoch": 0.41, - "learning_rate": 0.00023794211175287168, - "loss": 0.0592, + "epoch": 0.25, + "learning_rate": 0.0002629688195847344, + "loss": 0.0742, "step": 38250 }, { - "epoch": 0.41, - "learning_rate": 0.00023792588746836263, - "loss": 0.0685, + "epoch": 0.25, + "learning_rate": 0.0002629591382303775, + "loss": 0.0722, "step": 38260 }, { - "epoch": 0.41, - "learning_rate": 0.00023790966318385358, - "loss": 0.0647, + "epoch": 0.25, + "learning_rate": 0.00026294945687602053, + "loss": 0.0859, "step": 38270 }, { - "epoch": 0.41, - "learning_rate": 0.0002378934388993445, - "loss": 0.0667, + "epoch": 0.25, + "learning_rate": 0.0002629397755216636, + "loss": 0.0744, "step": 38280 }, { - "epoch": 0.41, - "learning_rate": 0.00023787721461483548, - "loss": 0.0528, + "epoch": 0.25, + "learning_rate": 0.0002629300941673067, + "loss": 0.0758, "step": 38290 }, { - "epoch": 0.41, - "learning_rate": 0.0002378609903303264, - "loss": 0.0583, + "epoch": 0.25, + "learning_rate": 0.00026292041281294977, + "loss": 0.0772, "step": 38300 }, { - "epoch": 0.41, - "learning_rate": 0.00023784476604581738, - "loss": 0.0592, + "epoch": 0.25, + "learning_rate": 0.00026291073145859285, + "loss": 0.068, "step": 38310 }, { - "epoch": 0.41, - "learning_rate": 0.0002378285417613083, - "loss": 0.0639, + "epoch": 0.25, + "learning_rate": 0.0002629010501042359, + "loss": 0.0693, "step": 38320 }, { - "epoch": 0.41, - "learning_rate": 0.00023781231747679925, - "loss": 0.0634, + "epoch": 0.25, + "learning_rate": 0.00026289136874987895, + "loss": 0.0714, "step": 38330 }, { - "epoch": 0.41, - "learning_rate": 0.0002377960931922902, - "loss": 0.0629, + "epoch": 0.25, + "learning_rate": 0.00026288168739552203, + "loss": 0.0769, "step": 38340 }, { - "epoch": 0.41, - "learning_rate": 0.00023777986890778115, - "loss": 0.0624, + "epoch": 0.25, + "learning_rate": 0.00026287200604116506, + "loss": 0.0692, "step": 38350 }, { - "epoch": 0.41, - "learning_rate": 0.0002377636446232721, - "loss": 0.0611, + "epoch": 0.25, + "learning_rate": 0.00026286232468680814, + "loss": 0.0671, "step": 38360 }, { - "epoch": 0.42, - "learning_rate": 0.00023774742033876305, - "loss": 0.0672, + "epoch": 0.25, + "learning_rate": 0.0002628526433324512, + "loss": 0.0676, "step": 38370 }, { - "epoch": 0.42, - "learning_rate": 0.00023773119605425397, - "loss": 0.0645, + "epoch": 0.25, + "learning_rate": 0.0002628429619780943, + "loss": 0.0744, "step": 38380 }, { - "epoch": 0.42, - "learning_rate": 0.00023771497176974495, - "loss": 0.0771, + "epoch": 0.25, + "learning_rate": 0.0002628332806237374, + "loss": 0.0661, "step": 38390 }, { - "epoch": 0.42, - "learning_rate": 0.00023769874748523587, - "loss": 0.0571, + "epoch": 0.25, + "learning_rate": 0.00026282359926938046, + "loss": 0.0743, "step": 38400 }, { - "epoch": 0.42, - "learning_rate": 0.00023768252320072685, - "loss": 0.0637, + "epoch": 0.25, + "learning_rate": 0.0002628139179150235, + "loss": 0.0728, "step": 38410 }, { - "epoch": 0.42, - "learning_rate": 0.00023766629891621777, - "loss": 0.0646, + "epoch": 0.25, + "learning_rate": 0.00026280423656066656, + "loss": 0.0728, "step": 38420 }, { - "epoch": 0.42, - "learning_rate": 0.00023765007463170872, - "loss": 0.0627, + "epoch": 0.25, + "learning_rate": 0.00026279455520630964, + "loss": 0.0676, "step": 38430 }, { - "epoch": 0.42, - "learning_rate": 0.00023763385034719967, - "loss": 0.0663, + "epoch": 0.25, + "learning_rate": 0.0002627848738519527, + "loss": 0.0721, "step": 38440 }, { - "epoch": 0.42, - "learning_rate": 0.00023761762606269062, - "loss": 0.0674, + "epoch": 0.25, + "learning_rate": 0.0002627751924975958, + "loss": 0.0768, "step": 38450 }, { - "epoch": 0.42, - "learning_rate": 0.00023760140177818154, - "loss": 0.0603, + "epoch": 0.25, + "learning_rate": 0.00026276551114323883, + "loss": 0.0751, "step": 38460 }, { - "epoch": 0.42, - "learning_rate": 0.00023758517749367252, - "loss": 0.0649, + "epoch": 0.25, + "learning_rate": 0.0002627558297888819, + "loss": 0.0768, "step": 38470 }, { - "epoch": 0.42, - "learning_rate": 0.00023756895320916344, - "loss": 0.0592, + "epoch": 0.25, + "learning_rate": 0.000262746148434525, + "loss": 0.0729, "step": 38480 }, { - "epoch": 0.42, - "learning_rate": 0.00023755272892465442, - "loss": 0.0667, + "epoch": 0.25, + "learning_rate": 0.000262736467080168, + "loss": 0.0702, "step": 38490 }, { - "epoch": 0.42, - "learning_rate": 0.00023753650464014534, - "loss": 0.0727, + "epoch": 0.25, + "learning_rate": 0.0002627267857258111, + "loss": 0.0682, "step": 38500 }, { - "epoch": 0.42, - "learning_rate": 0.0002375202803556363, - "loss": 0.0673, + "epoch": 0.25, + "learning_rate": 0.00026271710437145417, + "loss": 0.0674, "step": 38510 }, { - "epoch": 0.42, - "learning_rate": 0.00023750405607112724, - "loss": 0.0676, + "epoch": 0.25, + "learning_rate": 0.00026270742301709725, + "loss": 0.0731, "step": 38520 }, { - "epoch": 0.42, - "learning_rate": 0.0002374878317866182, - "loss": 0.0636, + "epoch": 0.25, + "learning_rate": 0.00026269774166274033, + "loss": 0.0696, "step": 38530 }, { - "epoch": 0.42, - "learning_rate": 0.00023747160750210914, - "loss": 0.0757, + "epoch": 0.25, + "learning_rate": 0.0002626880603083834, + "loss": 0.0621, "step": 38540 }, { - "epoch": 0.42, - "learning_rate": 0.0002374553832176001, - "loss": 0.0643, + "epoch": 0.25, + "learning_rate": 0.00026267837895402644, + "loss": 0.0762, "step": 38550 }, { - "epoch": 0.42, - "learning_rate": 0.00023743915893309101, - "loss": 0.0583, + "epoch": 0.25, + "learning_rate": 0.0002626686975996695, + "loss": 0.0672, "step": 38560 }, { - "epoch": 0.42, - "learning_rate": 0.000237422934648582, - "loss": 0.0708, + "epoch": 0.25, + "learning_rate": 0.0002626590162453126, + "loss": 0.0696, "step": 38570 }, { - "epoch": 0.42, - "learning_rate": 0.0002374067103640729, - "loss": 0.0608, + "epoch": 0.25, + "learning_rate": 0.0002626493348909557, + "loss": 0.0792, "step": 38580 }, { - "epoch": 0.42, - "learning_rate": 0.0002373904860795639, - "loss": 0.0648, + "epoch": 0.25, + "learning_rate": 0.0002626396535365987, + "loss": 0.0636, "step": 38590 }, { - "epoch": 0.42, - "learning_rate": 0.0002373742617950548, - "loss": 0.067, + "epoch": 0.25, + "learning_rate": 0.0002626299721822418, + "loss": 0.0707, "step": 38600 }, { - "epoch": 0.42, - "learning_rate": 0.00023735803751054576, - "loss": 0.0634, + "epoch": 0.25, + "learning_rate": 0.00026262029082788486, + "loss": 0.0725, "step": 38610 }, { - "epoch": 0.42, - "learning_rate": 0.0002373418132260367, - "loss": 0.0639, + "epoch": 0.25, + "learning_rate": 0.0002626106094735279, + "loss": 0.0743, "step": 38620 }, { - "epoch": 0.42, - "learning_rate": 0.00023732558894152766, - "loss": 0.0678, + "epoch": 0.25, + "learning_rate": 0.00026260092811917097, + "loss": 0.0726, "step": 38630 }, { - "epoch": 0.42, - "learning_rate": 0.00023730936465701858, - "loss": 0.0593, + "epoch": 0.25, + "learning_rate": 0.00026259124676481405, + "loss": 0.0691, "step": 38640 }, { - "epoch": 0.42, - "learning_rate": 0.00023729314037250956, - "loss": 0.0695, + "epoch": 0.25, + "learning_rate": 0.00026258156541045713, + "loss": 0.0754, "step": 38650 }, { - "epoch": 0.42, - "learning_rate": 0.00023727691608800048, - "loss": 0.0664, + "epoch": 0.25, + "learning_rate": 0.0002625718840561002, + "loss": 0.0714, "step": 38660 }, { - "epoch": 0.42, - "learning_rate": 0.00023726069180349146, - "loss": 0.0656, + "epoch": 0.25, + "learning_rate": 0.0002625622027017433, + "loss": 0.0675, "step": 38670 }, { - "epoch": 0.42, - "learning_rate": 0.00023724446751898238, - "loss": 0.0634, + "epoch": 0.25, + "learning_rate": 0.00026255252134738637, + "loss": 0.0712, "step": 38680 }, { - "epoch": 0.42, - "learning_rate": 0.00023722824323447336, - "loss": 0.0606, + "epoch": 0.25, + "learning_rate": 0.0002625428399930294, + "loss": 0.0644, "step": 38690 }, { - "epoch": 0.42, - "learning_rate": 0.00023721201894996428, - "loss": 0.0658, + "epoch": 0.25, + "learning_rate": 0.00026253315863867247, + "loss": 0.0717, "step": 38700 }, { - "epoch": 0.42, - "learning_rate": 0.00023719579466545523, - "loss": 0.0712, + "epoch": 0.25, + "learning_rate": 0.00026252347728431555, + "loss": 0.0642, "step": 38710 }, { - "epoch": 0.42, - "learning_rate": 0.00023717957038094618, - "loss": 0.0588, + "epoch": 0.25, + "learning_rate": 0.0002625137959299586, + "loss": 0.0692, "step": 38720 }, { - "epoch": 0.42, - "learning_rate": 0.00023716334609643713, - "loss": 0.066, + "epoch": 0.25, + "learning_rate": 0.00026250411457560166, + "loss": 0.0716, "step": 38730 }, { - "epoch": 0.42, - "learning_rate": 0.00023714712181192806, - "loss": 0.0664, + "epoch": 0.25, + "learning_rate": 0.00026249443322124474, + "loss": 0.077, "step": 38740 }, { - "epoch": 0.42, - "learning_rate": 0.00023713089752741903, - "loss": 0.0553, + "epoch": 0.25, + "learning_rate": 0.0002624847518668878, + "loss": 0.0746, "step": 38750 }, { - "epoch": 0.42, - "learning_rate": 0.00023711467324290995, - "loss": 0.0678, + "epoch": 0.25, + "learning_rate": 0.00026247507051253084, + "loss": 0.0706, "step": 38760 }, { - "epoch": 0.42, - "learning_rate": 0.00023709844895840093, - "loss": 0.0582, + "epoch": 0.25, + "learning_rate": 0.0002624653891581739, + "loss": 0.0779, "step": 38770 }, { - "epoch": 0.42, - "learning_rate": 0.00023708222467389185, - "loss": 0.0644, + "epoch": 0.25, + "learning_rate": 0.000262455707803817, + "loss": 0.0841, "step": 38780 }, { - "epoch": 0.42, - "learning_rate": 0.0002370660003893828, - "loss": 0.0615, + "epoch": 0.25, + "learning_rate": 0.0002624460264494601, + "loss": 0.0688, "step": 38790 }, { - "epoch": 0.42, - "learning_rate": 0.00023704977610487375, - "loss": 0.0699, + "epoch": 0.25, + "learning_rate": 0.00026243634509510316, + "loss": 0.0638, "step": 38800 }, { - "epoch": 0.42, - "learning_rate": 0.0002370335518203647, - "loss": 0.0701, + "epoch": 0.25, + "learning_rate": 0.00026242666374074624, + "loss": 0.0716, "step": 38810 }, { - "epoch": 0.42, - "learning_rate": 0.00023701732753585563, - "loss": 0.0721, + "epoch": 0.25, + "learning_rate": 0.0002624169823863893, + "loss": 0.0717, "step": 38820 }, { - "epoch": 0.42, - "learning_rate": 0.0002370011032513466, - "loss": 0.0662, + "epoch": 0.25, + "learning_rate": 0.00026240730103203235, + "loss": 0.08, "step": 38830 }, { - "epoch": 0.42, - "learning_rate": 0.00023698487896683753, - "loss": 0.0579, + "epoch": 0.25, + "learning_rate": 0.0002623976196776754, + "loss": 0.0915, "step": 38840 }, { - "epoch": 0.42, - "learning_rate": 0.0002369686546823285, - "loss": 0.0616, + "epoch": 0.25, + "learning_rate": 0.0002623879383233185, + "loss": 0.0671, "step": 38850 }, { - "epoch": 0.42, - "learning_rate": 0.00023695243039781943, - "loss": 0.0694, + "epoch": 0.25, + "learning_rate": 0.00026237825696896153, + "loss": 0.0744, "step": 38860 }, { - "epoch": 0.42, - "learning_rate": 0.0002369362061133104, - "loss": 0.0645, + "epoch": 0.25, + "learning_rate": 0.0002623685756146046, + "loss": 0.0759, "step": 38870 }, { - "epoch": 0.42, - "learning_rate": 0.00023691998182880133, - "loss": 0.0626, + "epoch": 0.25, + "learning_rate": 0.0002623588942602477, + "loss": 0.0671, "step": 38880 }, { - "epoch": 0.42, - "learning_rate": 0.00023690375754429227, - "loss": 0.0659, + "epoch": 0.25, + "learning_rate": 0.00026234921290589077, + "loss": 0.0693, "step": 38890 }, { - "epoch": 0.42, - "learning_rate": 0.00023688753325978322, - "loss": 0.0624, + "epoch": 0.25, + "learning_rate": 0.0002623395315515338, + "loss": 0.0708, "step": 38900 }, { - "epoch": 0.42, - "learning_rate": 0.00023687130897527417, - "loss": 0.0648, + "epoch": 0.25, + "learning_rate": 0.0002623298501971769, + "loss": 0.0661, "step": 38910 }, { - "epoch": 0.42, - "learning_rate": 0.0002368550846907651, - "loss": 0.0554, + "epoch": 0.25, + "learning_rate": 0.00026232016884281996, + "loss": 0.0711, "step": 38920 }, { - "epoch": 0.42, - "learning_rate": 0.00023683886040625607, - "loss": 0.0528, + "epoch": 0.25, + "learning_rate": 0.00026231048748846304, + "loss": 0.0744, "step": 38930 }, { - "epoch": 0.42, - "learning_rate": 0.000236822636121747, - "loss": 0.0665, + "epoch": 0.25, + "learning_rate": 0.0002623008061341061, + "loss": 0.0736, "step": 38940 }, { - "epoch": 0.42, - "learning_rate": 0.00023680641183723797, + "epoch": 0.25, + "learning_rate": 0.0002622911247797492, "loss": 0.0663, "step": 38950 }, { - "epoch": 0.42, - "learning_rate": 0.0002367901875527289, - "loss": 0.0533, + "epoch": 0.25, + "learning_rate": 0.0002622814434253922, + "loss": 0.0689, "step": 38960 }, { - "epoch": 0.42, - "learning_rate": 0.00023677396326821985, - "loss": 0.0599, + "epoch": 0.25, + "learning_rate": 0.0002622717620710353, + "loss": 0.0679, "step": 38970 }, { - "epoch": 0.42, - "learning_rate": 0.0002367577389837108, - "loss": 0.0565, + "epoch": 0.25, + "learning_rate": 0.0002622620807166784, + "loss": 0.0678, "step": 38980 }, { - "epoch": 0.42, - "learning_rate": 0.00023674151469920175, - "loss": 0.0604, + "epoch": 0.25, + "learning_rate": 0.0002622523993623214, + "loss": 0.0731, "step": 38990 }, { - "epoch": 0.42, - "learning_rate": 0.00023672529041469267, - "loss": 0.0657, + "epoch": 0.25, + "learning_rate": 0.0002622427180079645, + "loss": 0.0675, "step": 39000 }, { - "epoch": 0.42, - "eval_cer": 0.9214273219293178, - "eval_loss": 0.04273923486471176, - "eval_runtime": 119.6336, - "eval_samples_per_second": 16.718, - "eval_steps_per_second": 4.179, + "epoch": 0.25, + "eval_cer": 0.919996384589312, + "eval_loss": 0.047410257160663605, + "eval_runtime": 120.2237, + "eval_samples_per_second": 16.636, + "eval_steps_per_second": 4.159, "step": 39000 }, { - "epoch": 0.42, - "learning_rate": 0.00023670906613018364, - "loss": 0.0601, + "epoch": 0.25, + "learning_rate": 0.00026223303665360757, + "loss": 0.0729, "step": 39010 }, { - "epoch": 0.42, - "learning_rate": 0.00023669284184567457, - "loss": 0.0709, + "epoch": 0.25, + "learning_rate": 0.00026222335529925065, + "loss": 0.0711, "step": 39020 }, { - "epoch": 0.42, - "learning_rate": 0.00023667661756116554, - "loss": 0.0592, + "epoch": 0.25, + "learning_rate": 0.0002622136739448937, + "loss": 0.0652, "step": 39030 }, { - "epoch": 0.42, - "learning_rate": 0.00023666039327665647, - "loss": 0.0661, + "epoch": 0.25, + "learning_rate": 0.00026220399259053675, + "loss": 0.0658, "step": 39040 }, { - "epoch": 0.42, - "learning_rate": 0.00023664416899214744, - "loss": 0.0658, + "epoch": 0.25, + "learning_rate": 0.00026219431123617983, + "loss": 0.0686, "step": 39050 }, { - "epoch": 0.42, - "learning_rate": 0.00023662794470763837, - "loss": 0.0636, + "epoch": 0.25, + "learning_rate": 0.0002621846298818229, + "loss": 0.0653, "step": 39060 }, { - "epoch": 0.42, - "learning_rate": 0.00023661172042312932, - "loss": 0.0613, + "epoch": 0.25, + "learning_rate": 0.000262174948527466, + "loss": 0.068, "step": 39070 }, { - "epoch": 0.42, - "learning_rate": 0.00023659549613862027, - "loss": 0.0623, + "epoch": 0.25, + "learning_rate": 0.00026216526717310907, + "loss": 0.0674, "step": 39080 }, { - "epoch": 0.42, - "learning_rate": 0.00023657927185411122, - "loss": 0.0606, + "epoch": 0.25, + "learning_rate": 0.0002621555858187521, + "loss": 0.0613, "step": 39090 }, { - "epoch": 0.42, - "learning_rate": 0.00023656304756960214, - "loss": 0.0529, + "epoch": 0.25, + "learning_rate": 0.0002621459044643952, + "loss": 0.0705, "step": 39100 }, { - "epoch": 0.42, - "learning_rate": 0.00023654682328509312, - "loss": 0.0593, + "epoch": 0.25, + "learning_rate": 0.00026213622311003826, + "loss": 0.0632, "step": 39110 }, { - "epoch": 0.42, - "learning_rate": 0.00023653059900058404, - "loss": 0.0631, + "epoch": 0.25, + "learning_rate": 0.0002621265417556813, + "loss": 0.0621, "step": 39120 }, { - "epoch": 0.42, - "learning_rate": 0.00023651437471607502, - "loss": 0.0708, + "epoch": 0.25, + "learning_rate": 0.00026211686040132436, + "loss": 0.0717, "step": 39130 }, { - "epoch": 0.42, - "learning_rate": 0.00023649815043156594, - "loss": 0.0541, + "epoch": 0.25, + "learning_rate": 0.00026210717904696744, + "loss": 0.0715, "step": 39140 }, { - "epoch": 0.42, - "learning_rate": 0.0002364819261470569, - "loss": 0.0609, + "epoch": 0.25, + "learning_rate": 0.0002620974976926105, + "loss": 0.0672, "step": 39150 }, { - "epoch": 0.42, - "learning_rate": 0.00023646570186254784, - "loss": 0.0589, + "epoch": 0.25, + "learning_rate": 0.0002620878163382536, + "loss": 0.0664, "step": 39160 }, { - "epoch": 0.42, - "learning_rate": 0.0002364494775780388, - "loss": 0.0669, + "epoch": 0.25, + "learning_rate": 0.0002620781349838967, + "loss": 0.0683, "step": 39170 }, { - "epoch": 0.42, - "learning_rate": 0.0002364332532935297, - "loss": 0.0661, + "epoch": 0.25, + "learning_rate": 0.0002620684536295397, + "loss": 0.068, "step": 39180 }, { - "epoch": 0.42, - "learning_rate": 0.0002364170290090207, - "loss": 0.0788, + "epoch": 0.25, + "learning_rate": 0.0002620587722751828, + "loss": 0.0634, "step": 39190 }, { - "epoch": 0.42, - "learning_rate": 0.0002364008047245116, - "loss": 0.0594, + "epoch": 0.25, + "learning_rate": 0.00026204909092082587, + "loss": 0.068, "step": 39200 }, { - "epoch": 0.42, - "learning_rate": 0.00023638458044000259, - "loss": 0.067, + "epoch": 0.25, + "learning_rate": 0.00026203940956646895, + "loss": 0.0736, "step": 39210 }, { - "epoch": 0.42, - "learning_rate": 0.0002363683561554935, - "loss": 0.0637, + "epoch": 0.25, + "learning_rate": 0.000262029728212112, + "loss": 0.0626, "step": 39220 }, { - "epoch": 0.42, - "learning_rate": 0.00023635213187098449, - "loss": 0.0664, + "epoch": 0.25, + "learning_rate": 0.00026202004685775505, + "loss": 0.0634, "step": 39230 }, { - "epoch": 0.42, - "learning_rate": 0.0002363359075864754, - "loss": 0.0579, + "epoch": 0.25, + "learning_rate": 0.00026201036550339813, + "loss": 0.0632, "step": 39240 }, { - "epoch": 0.42, - "learning_rate": 0.00023631968330196636, - "loss": 0.0661, + "epoch": 0.25, + "learning_rate": 0.0002620006841490412, + "loss": 0.064, "step": 39250 }, { - "epoch": 0.42, - "learning_rate": 0.0002363034590174573, - "loss": 0.0808, + "epoch": 0.25, + "learning_rate": 0.00026199100279468424, + "loss": 0.063, "step": 39260 }, { - "epoch": 0.42, - "learning_rate": 0.00023628723473294826, - "loss": 0.0694, + "epoch": 0.25, + "learning_rate": 0.0002619813214403273, + "loss": 0.0707, "step": 39270 }, { - "epoch": 0.42, - "learning_rate": 0.00023627101044843918, - "loss": 0.0697, + "epoch": 0.25, + "learning_rate": 0.0002619716400859704, + "loss": 0.0661, "step": 39280 }, { - "epoch": 0.42, - "learning_rate": 0.00023625478616393016, - "loss": 0.0667, + "epoch": 0.25, + "learning_rate": 0.0002619619587316135, + "loss": 0.0609, "step": 39290 }, { - "epoch": 0.43, - "learning_rate": 0.00023623856187942108, - "loss": 0.0645, + "epoch": 0.25, + "learning_rate": 0.00026195227737725655, + "loss": 0.0663, "step": 39300 }, { - "epoch": 0.43, - "learning_rate": 0.00023622233759491206, - "loss": 0.0663, + "epoch": 0.25, + "learning_rate": 0.00026194259602289963, + "loss": 0.064, "step": 39310 }, { - "epoch": 0.43, - "learning_rate": 0.00023620611331040298, - "loss": 0.0635, + "epoch": 0.25, + "learning_rate": 0.00026193291466854266, + "loss": 0.0713, "step": 39320 }, { - "epoch": 0.43, - "learning_rate": 0.00023618988902589393, - "loss": 0.0598, + "epoch": 0.25, + "learning_rate": 0.00026192323331418574, + "loss": 0.0702, "step": 39330 }, { - "epoch": 0.43, - "learning_rate": 0.00023617366474138488, - "loss": 0.0676, + "epoch": 0.25, + "learning_rate": 0.0002619135519598288, + "loss": 0.0598, "step": 39340 }, { - "epoch": 0.43, - "learning_rate": 0.00023615744045687583, - "loss": 0.0612, + "epoch": 0.25, + "learning_rate": 0.0002619038706054719, + "loss": 0.074, "step": 39350 }, { - "epoch": 0.43, - "learning_rate": 0.00023614121617236678, - "loss": 0.0717, + "epoch": 0.25, + "learning_rate": 0.0002618941892511149, + "loss": 0.0678, "step": 39360 }, { - "epoch": 0.43, - "learning_rate": 0.00023612499188785773, - "loss": 0.0685, + "epoch": 0.25, + "learning_rate": 0.000261884507896758, + "loss": 0.0672, "step": 39370 }, { - "epoch": 0.43, - "learning_rate": 0.00023610876760334865, - "loss": 0.0662, + "epoch": 0.25, + "learning_rate": 0.0002618748265424011, + "loss": 0.0752, "step": 39380 }, { - "epoch": 0.43, - "learning_rate": 0.00023609254331883963, - "loss": 0.064, + "epoch": 0.25, + "learning_rate": 0.0002618651451880441, + "loss": 0.0799, "step": 39390 }, { - "epoch": 0.43, - "learning_rate": 0.00023607631903433055, - "loss": 0.061, + "epoch": 0.25, + "learning_rate": 0.0002618554638336872, + "loss": 0.082, "step": 39400 }, { - "epoch": 0.43, - "learning_rate": 0.00023606009474982153, - "loss": 0.0667, + "epoch": 0.25, + "learning_rate": 0.00026184578247933027, + "loss": 0.0672, "step": 39410 }, { - "epoch": 0.43, - "learning_rate": 0.00023604387046531245, - "loss": 0.0648, + "epoch": 0.25, + "learning_rate": 0.00026183610112497335, + "loss": 0.0697, "step": 39420 }, { - "epoch": 0.43, - "learning_rate": 0.0002360276461808034, - "loss": 0.0552, + "epoch": 0.25, + "learning_rate": 0.00026182641977061643, + "loss": 0.0677, "step": 39430 }, { - "epoch": 0.43, - "learning_rate": 0.00023601142189629435, - "loss": 0.0586, + "epoch": 0.25, + "learning_rate": 0.0002618167384162595, + "loss": 0.0627, "step": 39440 }, { - "epoch": 0.43, - "learning_rate": 0.0002359951976117853, - "loss": 0.0629, + "epoch": 0.25, + "learning_rate": 0.0002618070570619026, + "loss": 0.0687, "step": 39450 }, { - "epoch": 0.43, - "learning_rate": 0.00023597897332727622, - "loss": 0.059, + "epoch": 0.25, + "learning_rate": 0.0002617973757075456, + "loss": 0.0743, "step": 39460 }, { - "epoch": 0.43, - "learning_rate": 0.0002359627490427672, - "loss": 0.0616, + "epoch": 0.25, + "learning_rate": 0.0002617876943531887, + "loss": 0.0949, "step": 39470 }, { - "epoch": 0.43, - "learning_rate": 0.00023594652475825812, - "loss": 0.0719, + "epoch": 0.25, + "learning_rate": 0.0002617780129988318, + "loss": 0.0829, "step": 39480 }, { - "epoch": 0.43, - "learning_rate": 0.0002359303004737491, - "loss": 0.0652, + "epoch": 0.25, + "learning_rate": 0.0002617683316444748, + "loss": 0.0723, "step": 39490 }, { - "epoch": 0.43, - "learning_rate": 0.00023591407618924002, - "loss": 0.0674, + "epoch": 0.25, + "learning_rate": 0.0002617586502901179, + "loss": 0.083, "step": 39500 }, { - "epoch": 0.43, - "learning_rate": 0.00023589785190473097, - "loss": 0.0594, + "epoch": 0.26, + "learning_rate": 0.00026174896893576096, + "loss": 0.0666, "step": 39510 }, { - "epoch": 0.43, - "learning_rate": 0.00023588162762022192, - "loss": 0.0625, + "epoch": 0.26, + "learning_rate": 0.00026173928758140404, + "loss": 0.0693, "step": 39520 }, { - "epoch": 0.43, - "learning_rate": 0.00023586540333571287, - "loss": 0.0596, + "epoch": 0.26, + "learning_rate": 0.00026172960622704706, + "loss": 0.0681, "step": 39530 }, { - "epoch": 0.43, - "learning_rate": 0.00023584917905120382, - "loss": 0.064, + "epoch": 0.26, + "learning_rate": 0.00026171992487269014, + "loss": 0.0859, "step": 39540 }, { - "epoch": 0.43, - "learning_rate": 0.00023583295476669477, - "loss": 0.0715, + "epoch": 0.26, + "learning_rate": 0.0002617102435183332, + "loss": 0.0696, "step": 39550 }, { - "epoch": 0.43, - "learning_rate": 0.0002358167304821857, - "loss": 0.0636, + "epoch": 0.26, + "learning_rate": 0.0002617005621639763, + "loss": 0.0667, "step": 39560 }, { - "epoch": 0.43, - "learning_rate": 0.00023580050619767667, - "loss": 0.0605, + "epoch": 0.26, + "learning_rate": 0.0002616908808096194, + "loss": 0.0708, "step": 39570 }, { - "epoch": 0.43, - "learning_rate": 0.0002357842819131676, - "loss": 0.0597, + "epoch": 0.26, + "learning_rate": 0.00026168119945526246, + "loss": 0.0687, "step": 39580 }, { - "epoch": 0.43, - "learning_rate": 0.00023576805762865857, - "loss": 0.0551, + "epoch": 0.26, + "learning_rate": 0.00026167151810090554, + "loss": 0.0783, "step": 39590 }, { - "epoch": 0.43, - "learning_rate": 0.0002357518333441495, - "loss": 0.0677, + "epoch": 0.26, + "learning_rate": 0.00026166183674654857, + "loss": 0.0698, "step": 39600 }, { - "epoch": 0.43, - "learning_rate": 0.00023573560905964044, - "loss": 0.0619, + "epoch": 0.26, + "learning_rate": 0.00026165215539219165, + "loss": 0.0739, "step": 39610 }, { - "epoch": 0.43, - "learning_rate": 0.0002357193847751314, - "loss": 0.0643, + "epoch": 0.26, + "learning_rate": 0.00026164247403783473, + "loss": 0.0664, "step": 39620 }, { - "epoch": 0.43, - "learning_rate": 0.00023570316049062234, - "loss": 0.062, + "epoch": 0.26, + "learning_rate": 0.00026163279268347775, + "loss": 0.0647, "step": 39630 }, { - "epoch": 0.43, - "learning_rate": 0.00023568693620611326, - "loss": 0.0582, + "epoch": 0.26, + "learning_rate": 0.00026162311132912083, + "loss": 0.0648, "step": 39640 }, { - "epoch": 0.43, - "learning_rate": 0.00023567071192160424, - "loss": 0.0633, + "epoch": 0.26, + "learning_rate": 0.0002616134299747639, + "loss": 0.0659, "step": 39650 }, { - "epoch": 0.43, - "learning_rate": 0.00023565448763709516, - "loss": 0.0632, + "epoch": 0.26, + "learning_rate": 0.000261603748620407, + "loss": 0.0722, "step": 39660 }, { - "epoch": 0.43, - "learning_rate": 0.00023563826335258614, - "loss": 0.058, + "epoch": 0.26, + "learning_rate": 0.00026159406726605, + "loss": 0.0678, "step": 39670 }, { - "epoch": 0.43, - "learning_rate": 0.00023562203906807706, - "loss": 0.0632, + "epoch": 0.26, + "learning_rate": 0.0002615843859116931, + "loss": 0.0683, "step": 39680 }, { - "epoch": 0.43, - "learning_rate": 0.000235605814783568, - "loss": 0.0581, + "epoch": 0.26, + "learning_rate": 0.0002615747045573362, + "loss": 0.0668, "step": 39690 }, { - "epoch": 0.43, - "learning_rate": 0.00023558959049905896, - "loss": 0.0676, + "epoch": 0.26, + "learning_rate": 0.00026156502320297926, + "loss": 0.0703, "step": 39700 }, { - "epoch": 0.43, - "learning_rate": 0.0002355733662145499, - "loss": 0.0566, + "epoch": 0.26, + "learning_rate": 0.00026155534184862234, + "loss": 0.0656, "step": 39710 }, { - "epoch": 0.43, - "learning_rate": 0.00023555714193004086, - "loss": 0.0572, + "epoch": 0.26, + "learning_rate": 0.0002615456604942654, + "loss": 0.0656, "step": 39720 }, { - "epoch": 0.43, - "learning_rate": 0.0002355409176455318, - "loss": 0.058, + "epoch": 0.26, + "learning_rate": 0.00026153597913990844, + "loss": 0.0736, "step": 39730 }, { - "epoch": 0.43, - "learning_rate": 0.00023552469336102273, - "loss": 0.0553, + "epoch": 0.26, + "learning_rate": 0.0002615262977855515, + "loss": 0.0635, "step": 39740 }, { - "epoch": 0.43, - "learning_rate": 0.0002355084690765137, - "loss": 0.0608, + "epoch": 0.26, + "learning_rate": 0.0002615166164311946, + "loss": 0.0666, "step": 39750 }, { - "epoch": 0.43, - "learning_rate": 0.00023549224479200463, - "loss": 0.0594, + "epoch": 0.26, + "learning_rate": 0.00026150693507683763, + "loss": 0.0656, "step": 39760 }, { - "epoch": 0.43, - "learning_rate": 0.0002354760205074956, - "loss": 0.0537, + "epoch": 0.26, + "learning_rate": 0.0002614972537224807, + "loss": 0.0713, "step": 39770 }, { - "epoch": 0.43, - "learning_rate": 0.00023545979622298653, - "loss": 0.0557, + "epoch": 0.26, + "learning_rate": 0.0002614875723681238, + "loss": 0.0647, "step": 39780 }, { - "epoch": 0.43, - "learning_rate": 0.00023544357193847748, - "loss": 0.0595, + "epoch": 0.26, + "learning_rate": 0.00026147789101376687, + "loss": 0.0696, "step": 39790 }, { - "epoch": 0.43, - "learning_rate": 0.00023542734765396843, - "loss": 0.0621, + "epoch": 0.26, + "learning_rate": 0.00026146820965940995, + "loss": 0.0705, "step": 39800 }, { - "epoch": 0.43, - "learning_rate": 0.00023541112336945938, - "loss": 0.0588, + "epoch": 0.26, + "learning_rate": 0.000261458528305053, + "loss": 0.0796, "step": 39810 }, { - "epoch": 0.43, - "learning_rate": 0.0002353948990849503, - "loss": 0.0556, + "epoch": 0.26, + "learning_rate": 0.00026144884695069605, + "loss": 0.0673, "step": 39820 }, { - "epoch": 0.43, - "learning_rate": 0.00023537867480044128, - "loss": 0.0573, + "epoch": 0.26, + "learning_rate": 0.00026143916559633913, + "loss": 0.0744, "step": 39830 }, { - "epoch": 0.43, - "learning_rate": 0.0002353624505159322, - "loss": 0.057, + "epoch": 0.26, + "learning_rate": 0.0002614294842419822, + "loss": 0.07, "step": 39840 }, { - "epoch": 0.43, - "learning_rate": 0.00023534622623142318, + "epoch": 0.26, + "learning_rate": 0.0002614198028876253, "loss": 0.0611, "step": 39850 }, { - "epoch": 0.43, - "learning_rate": 0.0002353300019469141, - "loss": 0.0606, + "epoch": 0.26, + "learning_rate": 0.00026141012153326837, + "loss": 0.0649, "step": 39860 }, { - "epoch": 0.43, - "learning_rate": 0.00023531377766240505, - "loss": 0.0629, + "epoch": 0.26, + "learning_rate": 0.0002614004401789114, + "loss": 0.0739, "step": 39870 }, { - "epoch": 0.43, - "learning_rate": 0.000235297553377896, - "loss": 0.0668, + "epoch": 0.26, + "learning_rate": 0.0002613907588245545, + "loss": 0.0715, "step": 39880 }, { - "epoch": 0.43, - "learning_rate": 0.00023528132909338695, - "loss": 0.0569, + "epoch": 0.26, + "learning_rate": 0.00026138107747019756, + "loss": 0.069, "step": 39890 }, { - "epoch": 0.43, - "learning_rate": 0.00023526510480887793, - "loss": 0.0589, + "epoch": 0.26, + "learning_rate": 0.0002613713961158406, + "loss": 0.067, "step": 39900 }, { - "epoch": 0.43, - "learning_rate": 0.00023524888052436885, - "loss": 0.0727, + "epoch": 0.26, + "learning_rate": 0.00026136171476148366, + "loss": 0.0665, "step": 39910 }, { - "epoch": 0.43, - "learning_rate": 0.00023523265623985983, - "loss": 0.0581, + "epoch": 0.26, + "learning_rate": 0.00026135203340712674, + "loss": 0.0727, "step": 39920 }, { - "epoch": 0.43, - "learning_rate": 0.00023521643195535075, - "loss": 0.0523, + "epoch": 0.26, + "learning_rate": 0.0002613423520527698, + "loss": 0.0735, "step": 39930 }, { - "epoch": 0.43, - "learning_rate": 0.0002352002076708417, - "loss": 0.0611, + "epoch": 0.26, + "learning_rate": 0.0002613326706984129, + "loss": 0.071, "step": 39940 }, { - "epoch": 0.43, - "learning_rate": 0.00023518398338633265, - "loss": 0.0595, + "epoch": 0.26, + "learning_rate": 0.00026132298934405593, + "loss": 0.0679, "step": 39950 }, { - "epoch": 0.43, - "learning_rate": 0.0002351677591018236, - "loss": 0.0618, + "epoch": 0.26, + "learning_rate": 0.000261313307989699, + "loss": 0.0736, "step": 39960 }, { - "epoch": 0.43, - "learning_rate": 0.00023515153481731452, - "loss": 0.0594, + "epoch": 0.26, + "learning_rate": 0.0002613036266353421, + "loss": 0.0731, "step": 39970 }, { - "epoch": 0.43, - "learning_rate": 0.0002351353105328055, - "loss": 0.0565, + "epoch": 0.26, + "learning_rate": 0.00026129394528098517, + "loss": 0.0618, "step": 39980 }, { - "epoch": 0.43, - "learning_rate": 0.00023511908624829642, - "loss": 0.0584, + "epoch": 0.26, + "learning_rate": 0.00026128426392662825, + "loss": 0.0672, "step": 39990 }, { - "epoch": 0.43, - "learning_rate": 0.0002351028619637874, - "loss": 0.0643, + "epoch": 0.26, + "learning_rate": 0.0002612745825722713, + "loss": 0.0739, "step": 40000 }, { - "epoch": 0.43, - "eval_cer": 0.9211993829745504, - "eval_loss": 0.044067420065402985, - "eval_runtime": 119.3283, - "eval_samples_per_second": 16.76, - "eval_steps_per_second": 4.19, + "epoch": 0.26, + "eval_cer": 0.9201039430572817, + "eval_loss": 0.04600047320127487, + "eval_runtime": 120.2571, + "eval_samples_per_second": 16.631, + "eval_steps_per_second": 4.158, "step": 40000 }, { - "epoch": 0.43, - "learning_rate": 0.00023508663767927832, - "loss": 0.0576, + "epoch": 0.26, + "learning_rate": 0.00026126490121791435, + "loss": 0.0708, "step": 40010 }, { - "epoch": 0.43, - "learning_rate": 0.00023507041339476927, - "loss": 0.0646, + "epoch": 0.26, + "learning_rate": 0.00026125521986355743, + "loss": 0.068, "step": 40020 }, { - "epoch": 0.43, - "learning_rate": 0.00023505418911026022, - "loss": 0.0638, + "epoch": 0.26, + "learning_rate": 0.00026124553850920046, + "loss": 0.072, "step": 40030 }, { - "epoch": 0.43, - "learning_rate": 0.00023503796482575117, - "loss": 0.0573, + "epoch": 0.26, + "learning_rate": 0.00026123585715484354, + "loss": 0.0924, "step": 40040 }, { - "epoch": 0.43, - "learning_rate": 0.00023502174054124212, - "loss": 0.0609, + "epoch": 0.26, + "learning_rate": 0.0002612261758004866, + "loss": 0.0713, "step": 40050 }, { - "epoch": 0.43, - "learning_rate": 0.00023500551625673307, - "loss": 0.0646, + "epoch": 0.26, + "learning_rate": 0.0002612164944461297, + "loss": 0.079, "step": 40060 }, { - "epoch": 0.43, - "learning_rate": 0.000234989291972224, - "loss": 0.0595, + "epoch": 0.26, + "learning_rate": 0.0002612068130917728, + "loss": 0.0671, "step": 40070 }, { - "epoch": 0.43, - "learning_rate": 0.00023497306768771497, - "loss": 0.0703, + "epoch": 0.26, + "learning_rate": 0.00026119713173741586, + "loss": 0.0696, "step": 40080 }, { - "epoch": 0.43, - "learning_rate": 0.0002349568434032059, - "loss": 0.0648, + "epoch": 0.26, + "learning_rate": 0.0002611874503830589, + "loss": 0.0801, "step": 40090 }, { - "epoch": 0.43, - "learning_rate": 0.00023494061911869687, - "loss": 0.0747, + "epoch": 0.26, + "learning_rate": 0.00026117776902870196, + "loss": 0.0718, "step": 40100 }, { - "epoch": 0.43, - "learning_rate": 0.0002349243948341878, - "loss": 0.063, + "epoch": 0.26, + "learning_rate": 0.00026116808767434504, + "loss": 0.0659, "step": 40110 }, { - "epoch": 0.43, - "learning_rate": 0.00023490817054967874, - "loss": 0.0659, + "epoch": 0.26, + "learning_rate": 0.0002611584063199881, + "loss": 0.0664, "step": 40120 }, { - "epoch": 0.43, - "learning_rate": 0.0002348919462651697, - "loss": 0.0605, + "epoch": 0.26, + "learning_rate": 0.00026114872496563115, + "loss": 0.068, "step": 40130 }, { - "epoch": 0.43, - "learning_rate": 0.00023487572198066064, - "loss": 0.0635, + "epoch": 0.26, + "learning_rate": 0.00026113904361127423, + "loss": 0.0695, "step": 40140 }, { - "epoch": 0.43, - "learning_rate": 0.00023485949769615157, - "loss": 0.0654, + "epoch": 0.26, + "learning_rate": 0.0002611293622569173, + "loss": 0.073, "step": 40150 }, { - "epoch": 0.43, - "learning_rate": 0.00023484327341164254, - "loss": 0.0559, + "epoch": 0.26, + "learning_rate": 0.00026111968090256033, + "loss": 0.0678, "step": 40160 }, { - "epoch": 0.43, - "learning_rate": 0.00023482704912713347, - "loss": 0.0518, + "epoch": 0.26, + "learning_rate": 0.0002611099995482034, + "loss": 0.0737, "step": 40170 }, { - "epoch": 0.43, - "learning_rate": 0.00023481082484262444, - "loss": 0.0602, + "epoch": 0.26, + "learning_rate": 0.0002611003181938465, + "loss": 0.0772, "step": 40180 }, { - "epoch": 0.43, - "learning_rate": 0.00023479460055811537, - "loss": 0.057, + "epoch": 0.26, + "learning_rate": 0.00026109063683948957, + "loss": 0.0747, "step": 40190 }, { - "epoch": 0.43, - "learning_rate": 0.00023477837627360632, - "loss": 0.0714, + "epoch": 0.26, + "learning_rate": 0.00026108095548513265, + "loss": 0.0703, "step": 40200 }, { - "epoch": 0.43, - "learning_rate": 0.00023476215198909727, - "loss": 0.0702, + "epoch": 0.26, + "learning_rate": 0.00026107127413077573, + "loss": 0.0665, "step": 40210 }, { - "epoch": 0.44, - "learning_rate": 0.00023474592770458821, - "loss": 0.0629, + "epoch": 0.26, + "learning_rate": 0.0002610615927764188, + "loss": 0.0668, "step": 40220 }, { - "epoch": 0.44, - "learning_rate": 0.00023472970342007916, - "loss": 0.0641, + "epoch": 0.26, + "learning_rate": 0.00026105191142206184, + "loss": 0.0707, "step": 40230 }, { - "epoch": 0.44, - "learning_rate": 0.00023471347913557011, - "loss": 0.0608, + "epoch": 0.26, + "learning_rate": 0.0002610422300677049, + "loss": 0.0698, "step": 40240 }, { - "epoch": 0.44, - "learning_rate": 0.00023469725485106104, - "loss": 0.0646, + "epoch": 0.26, + "learning_rate": 0.000261032548713348, + "loss": 0.0701, "step": 40250 }, { - "epoch": 0.44, - "learning_rate": 0.00023468103056655201, - "loss": 0.0657, + "epoch": 0.26, + "learning_rate": 0.0002610228673589911, + "loss": 0.0639, "step": 40260 }, { - "epoch": 0.44, - "learning_rate": 0.00023466480628204294, - "loss": 0.0566, + "epoch": 0.26, + "learning_rate": 0.0002610131860046341, + "loss": 0.066, "step": 40270 }, { - "epoch": 0.44, - "learning_rate": 0.0002346485819975339, - "loss": 0.0621, + "epoch": 0.26, + "learning_rate": 0.0002610035046502772, + "loss": 0.0742, "step": 40280 }, { - "epoch": 0.44, - "learning_rate": 0.00023463235771302484, - "loss": 0.0627, + "epoch": 0.26, + "learning_rate": 0.00026099382329592026, + "loss": 0.0639, "step": 40290 }, { - "epoch": 0.44, - "learning_rate": 0.00023461613342851579, - "loss": 0.0564, + "epoch": 0.26, + "learning_rate": 0.0002609841419415633, + "loss": 0.0643, "step": 40300 }, { - "epoch": 0.44, - "learning_rate": 0.00023459990914400674, - "loss": 0.0583, + "epoch": 0.26, + "learning_rate": 0.00026097446058720637, + "loss": 0.0625, "step": 40310 }, { - "epoch": 0.44, - "learning_rate": 0.00023458368485949769, - "loss": 0.0666, + "epoch": 0.26, + "learning_rate": 0.00026096477923284945, + "loss": 0.0689, "step": 40320 }, { - "epoch": 0.44, - "learning_rate": 0.0002345674605749886, - "loss": 0.0594, + "epoch": 0.26, + "learning_rate": 0.0002609550978784925, + "loss": 0.0733, "step": 40330 }, { - "epoch": 0.44, - "learning_rate": 0.00023455123629047959, - "loss": 0.0526, + "epoch": 0.26, + "learning_rate": 0.0002609454165241356, + "loss": 0.0706, "step": 40340 }, { - "epoch": 0.44, - "learning_rate": 0.0002345350120059705, - "loss": 0.0762, + "epoch": 0.26, + "learning_rate": 0.0002609357351697787, + "loss": 0.0666, "step": 40350 }, { - "epoch": 0.44, - "learning_rate": 0.00023451878772146148, - "loss": 0.0638, + "epoch": 0.26, + "learning_rate": 0.00026092605381542177, + "loss": 0.0666, "step": 40360 }, { - "epoch": 0.44, - "learning_rate": 0.0002345025634369524, - "loss": 0.0652, + "epoch": 0.26, + "learning_rate": 0.0002609163724610648, + "loss": 0.0712, "step": 40370 }, { - "epoch": 0.44, - "learning_rate": 0.00023448633915244336, - "loss": 0.0548, + "epoch": 0.26, + "learning_rate": 0.00026090669110670787, + "loss": 0.0644, "step": 40380 }, { - "epoch": 0.44, - "learning_rate": 0.0002344701148679343, - "loss": 0.0602, + "epoch": 0.26, + "learning_rate": 0.00026089700975235095, + "loss": 0.0697, "step": 40390 }, { - "epoch": 0.44, - "learning_rate": 0.00023445389058342526, - "loss": 0.0606, + "epoch": 0.26, + "learning_rate": 0.000260887328397994, + "loss": 0.0684, "step": 40400 }, { - "epoch": 0.44, - "learning_rate": 0.0002344376662989162, - "loss": 0.0729, + "epoch": 0.26, + "learning_rate": 0.00026087764704363706, + "loss": 0.0702, "step": 40410 }, { - "epoch": 0.44, - "learning_rate": 0.00023442144201440716, - "loss": 0.0665, + "epoch": 0.26, + "learning_rate": 0.00026086796568928014, + "loss": 0.0698, "step": 40420 }, { - "epoch": 0.44, - "learning_rate": 0.00023440521772989808, - "loss": 0.0647, + "epoch": 0.26, + "learning_rate": 0.0002608582843349232, + "loss": 0.0655, "step": 40430 }, { - "epoch": 0.44, - "learning_rate": 0.00023438899344538906, - "loss": 0.0616, + "epoch": 0.26, + "learning_rate": 0.00026084860298056624, + "loss": 0.0614, "step": 40440 }, { - "epoch": 0.44, - "learning_rate": 0.00023437276916087998, - "loss": 0.061, + "epoch": 0.26, + "learning_rate": 0.0002608389216262093, + "loss": 0.0706, "step": 40450 }, { - "epoch": 0.44, - "learning_rate": 0.00023435654487637096, - "loss": 0.0631, + "epoch": 0.26, + "learning_rate": 0.0002608292402718524, + "loss": 0.0693, "step": 40460 }, { - "epoch": 0.44, - "learning_rate": 0.00023434032059186188, - "loss": 0.0572, + "epoch": 0.26, + "learning_rate": 0.0002608195589174955, + "loss": 0.072, "step": 40470 }, { - "epoch": 0.44, - "learning_rate": 0.00023432409630735283, - "loss": 0.0577, + "epoch": 0.26, + "learning_rate": 0.00026080987756313856, + "loss": 0.0682, "step": 40480 }, { - "epoch": 0.44, - "learning_rate": 0.00023430787202284378, - "loss": 0.0574, + "epoch": 0.26, + "learning_rate": 0.00026080019620878164, + "loss": 0.0607, "step": 40490 }, { - "epoch": 0.44, - "learning_rate": 0.00023429164773833473, - "loss": 0.055, + "epoch": 0.26, + "learning_rate": 0.00026079051485442467, + "loss": 0.0703, "step": 40500 }, { - "epoch": 0.44, - "learning_rate": 0.00023427542345382565, - "loss": 0.0564, + "epoch": 0.26, + "learning_rate": 0.00026078083350006775, + "loss": 0.0703, "step": 40510 }, { - "epoch": 0.44, - "learning_rate": 0.00023425919916931663, - "loss": 0.0746, + "epoch": 0.26, + "learning_rate": 0.0002607711521457108, + "loss": 0.0669, "step": 40520 }, { - "epoch": 0.44, - "learning_rate": 0.00023424297488480755, - "loss": 0.0664, + "epoch": 0.26, + "learning_rate": 0.00026076147079135385, + "loss": 0.0707, "step": 40530 }, { - "epoch": 0.44, - "learning_rate": 0.00023422675060029853, - "loss": 0.0575, + "epoch": 0.26, + "learning_rate": 0.00026075178943699693, + "loss": 0.0648, "step": 40540 }, { - "epoch": 0.44, - "learning_rate": 0.00023421052631578945, - "loss": 0.0622, + "epoch": 0.26, + "learning_rate": 0.00026074210808264, + "loss": 0.0741, "step": 40550 }, { - "epoch": 0.44, - "learning_rate": 0.0002341943020312804, - "loss": 0.0645, + "epoch": 0.26, + "learning_rate": 0.0002607324267282831, + "loss": 0.0701, "step": 40560 }, { - "epoch": 0.44, - "learning_rate": 0.00023417807774677135, - "loss": 0.0647, + "epoch": 0.26, + "learning_rate": 0.00026072274537392617, + "loss": 0.0689, "step": 40570 }, { - "epoch": 0.44, - "learning_rate": 0.0002341618534622623, - "loss": 0.0689, + "epoch": 0.26, + "learning_rate": 0.0002607130640195692, + "loss": 0.072, "step": 40580 }, { - "epoch": 0.44, - "learning_rate": 0.00023414562917775325, - "loss": 0.0603, + "epoch": 0.26, + "learning_rate": 0.0002607033826652123, + "loss": 0.0678, "step": 40590 }, { - "epoch": 0.44, - "learning_rate": 0.0002341294048932442, - "loss": 0.0672, + "epoch": 0.26, + "learning_rate": 0.00026069370131085536, + "loss": 0.0699, "step": 40600 }, { - "epoch": 0.44, - "learning_rate": 0.00023411318060873512, - "loss": 0.0615, + "epoch": 0.26, + "learning_rate": 0.00026068401995649844, + "loss": 0.072, "step": 40610 }, { - "epoch": 0.44, - "learning_rate": 0.0002340969563242261, - "loss": 0.0619, + "epoch": 0.26, + "learning_rate": 0.0002606743386021415, + "loss": 0.0732, "step": 40620 }, { - "epoch": 0.44, - "learning_rate": 0.00023408073203971702, - "loss": 0.0685, + "epoch": 0.26, + "learning_rate": 0.0002606646572477846, + "loss": 0.0663, "step": 40630 }, { - "epoch": 0.44, - "learning_rate": 0.000234064507755208, - "loss": 0.0694, + "epoch": 0.26, + "learning_rate": 0.0002606549758934276, + "loss": 0.0701, "step": 40640 }, { - "epoch": 0.44, - "learning_rate": 0.00023404828347069892, - "loss": 0.057, + "epoch": 0.26, + "learning_rate": 0.0002606452945390707, + "loss": 0.0681, "step": 40650 }, { - "epoch": 0.44, - "learning_rate": 0.00023403205918618987, - "loss": 0.0565, + "epoch": 0.26, + "learning_rate": 0.0002606356131847138, + "loss": 0.0659, "step": 40660 }, { - "epoch": 0.44, - "learning_rate": 0.00023401583490168082, - "loss": 0.0747, + "epoch": 0.26, + "learning_rate": 0.0002606259318303568, + "loss": 0.0775, "step": 40670 }, { - "epoch": 0.44, - "learning_rate": 0.00023399961061717177, - "loss": 0.0632, + "epoch": 0.26, + "learning_rate": 0.0002606162504759999, + "loss": 0.066, "step": 40680 }, { - "epoch": 0.44, - "learning_rate": 0.0002339833863326627, - "loss": 0.0629, + "epoch": 0.26, + "learning_rate": 0.00026060656912164297, + "loss": 0.0661, "step": 40690 }, { - "epoch": 0.44, - "learning_rate": 0.00023396716204815367, - "loss": 0.0676, + "epoch": 0.26, + "learning_rate": 0.00026059688776728605, + "loss": 0.0654, "step": 40700 }, { - "epoch": 0.44, - "learning_rate": 0.0002339509377636446, - "loss": 0.0676, + "epoch": 0.26, + "learning_rate": 0.0002605872064129291, + "loss": 0.069, "step": 40710 }, { - "epoch": 0.44, - "learning_rate": 0.00023393471347913557, - "loss": 0.0557, + "epoch": 0.26, + "learning_rate": 0.00026057752505857215, + "loss": 0.072, "step": 40720 }, { - "epoch": 0.44, - "learning_rate": 0.0002339184891946265, - "loss": 0.0611, + "epoch": 0.26, + "learning_rate": 0.00026056784370421523, + "loss": 0.0713, "step": 40730 }, { - "epoch": 0.44, - "learning_rate": 0.00023390226491011747, - "loss": 0.0596, + "epoch": 0.26, + "learning_rate": 0.0002605581623498583, + "loss": 0.076, "step": 40740 }, { - "epoch": 0.44, - "learning_rate": 0.0002338860406256084, - "loss": 0.0571, + "epoch": 0.26, + "learning_rate": 0.0002605484809955014, + "loss": 0.0733, "step": 40750 }, { - "epoch": 0.44, - "learning_rate": 0.00023386981634109934, - "loss": 0.0669, + "epoch": 0.26, + "learning_rate": 0.00026053879964114447, + "loss": 0.0712, "step": 40760 }, { - "epoch": 0.44, - "learning_rate": 0.0002338535920565903, - "loss": 0.0646, + "epoch": 0.26, + "learning_rate": 0.0002605291182867875, + "loss": 0.0769, "step": 40770 }, { - "epoch": 0.44, - "learning_rate": 0.00023383736777208124, - "loss": 0.0571, + "epoch": 0.26, + "learning_rate": 0.0002605194369324306, + "loss": 0.0643, "step": 40780 }, { - "epoch": 0.44, - "learning_rate": 0.00023382114348757216, - "loss": 0.068, + "epoch": 0.26, + "learning_rate": 0.00026050975557807365, + "loss": 0.0642, "step": 40790 }, { - "epoch": 0.44, - "learning_rate": 0.00023380491920306314, - "loss": 0.0597, + "epoch": 0.26, + "learning_rate": 0.0002605000742237167, + "loss": 0.076, "step": 40800 }, { - "epoch": 0.44, - "learning_rate": 0.00023378869491855406, - "loss": 0.0695, + "epoch": 0.26, + "learning_rate": 0.00026049039286935976, + "loss": 0.0703, "step": 40810 }, { - "epoch": 0.44, - "learning_rate": 0.00023377247063404504, - "loss": 0.0587, + "epoch": 0.26, + "learning_rate": 0.00026048071151500284, + "loss": 0.0705, "step": 40820 }, { - "epoch": 0.44, - "learning_rate": 0.00023375624634953596, - "loss": 0.0621, + "epoch": 0.26, + "learning_rate": 0.0002604710301606459, + "loss": 0.0626, "step": 40830 }, { - "epoch": 0.44, - "learning_rate": 0.0002337400220650269, - "loss": 0.0581, + "epoch": 0.26, + "learning_rate": 0.000260461348806289, + "loss": 0.0722, "step": 40840 }, { - "epoch": 0.44, - "learning_rate": 0.00023372379778051786, - "loss": 0.0562, + "epoch": 0.26, + "learning_rate": 0.0002604516674519321, + "loss": 0.0662, "step": 40850 }, { - "epoch": 0.44, - "learning_rate": 0.0002337075734960088, - "loss": 0.0557, + "epoch": 0.26, + "learning_rate": 0.0002604419860975751, + "loss": 0.0634, "step": 40860 }, { - "epoch": 0.44, - "learning_rate": 0.00023369134921149973, - "loss": 0.062, + "epoch": 0.26, + "learning_rate": 0.0002604323047432182, + "loss": 0.0699, "step": 40870 }, { - "epoch": 0.44, - "learning_rate": 0.0002336751249269907, - "loss": 0.0583, + "epoch": 0.26, + "learning_rate": 0.00026042262338886126, + "loss": 0.0636, "step": 40880 }, { - "epoch": 0.44, - "learning_rate": 0.00023365890064248163, - "loss": 0.0578, + "epoch": 0.26, + "learning_rate": 0.00026041294203450434, + "loss": 0.0742, "step": 40890 }, { - "epoch": 0.44, - "learning_rate": 0.0002336426763579726, - "loss": 0.0535, + "epoch": 0.26, + "learning_rate": 0.00026040326068014737, + "loss": 0.0734, "step": 40900 }, { - "epoch": 0.44, - "learning_rate": 0.00023362645207346353, - "loss": 0.0712, + "epoch": 0.26, + "learning_rate": 0.00026039357932579045, + "loss": 0.064, "step": 40910 }, { - "epoch": 0.44, - "learning_rate": 0.0002336102277889545, - "loss": 0.06, + "epoch": 0.26, + "learning_rate": 0.00026038389797143353, + "loss": 0.0635, "step": 40920 }, { - "epoch": 0.44, - "learning_rate": 0.00023359400350444543, - "loss": 0.0628, + "epoch": 0.26, + "learning_rate": 0.00026037421661707656, + "loss": 0.0739, "step": 40930 }, { - "epoch": 0.44, - "learning_rate": 0.00023357777921993638, - "loss": 0.059, + "epoch": 0.26, + "learning_rate": 0.00026036453526271963, + "loss": 0.0747, "step": 40940 }, { - "epoch": 0.44, - "learning_rate": 0.00023356155493542733, - "loss": 0.0554, + "epoch": 0.26, + "learning_rate": 0.0002603548539083627, + "loss": 0.075, "step": 40950 }, { - "epoch": 0.44, - "learning_rate": 0.00023354533065091828, - "loss": 0.066, + "epoch": 0.26, + "learning_rate": 0.0002603451725540058, + "loss": 0.067, "step": 40960 }, { - "epoch": 0.44, - "learning_rate": 0.0002335291063664092, - "loss": 0.0553, + "epoch": 0.26, + "learning_rate": 0.0002603354911996489, + "loss": 0.0635, "step": 40970 }, { - "epoch": 0.44, - "learning_rate": 0.00023351288208190018, - "loss": 0.0579, + "epoch": 0.26, + "learning_rate": 0.00026032580984529195, + "loss": 0.0585, "step": 40980 }, { - "epoch": 0.44, - "learning_rate": 0.0002334966577973911, - "loss": 0.0626, + "epoch": 0.26, + "learning_rate": 0.00026031612849093503, + "loss": 0.0698, "step": 40990 }, { - "epoch": 0.44, - "learning_rate": 0.00023348043351288208, - "loss": 0.0579, + "epoch": 0.26, + "learning_rate": 0.00026030644713657806, + "loss": 0.0694, "step": 41000 }, { - "epoch": 0.44, - "eval_cer": 0.9212603433926858, - "eval_loss": 0.041380371898412704, - "eval_runtime": 119.0976, - "eval_samples_per_second": 16.793, - "eval_steps_per_second": 4.198, + "epoch": 0.26, + "eval_cer": 0.9200316348435205, + "eval_loss": 0.04777882248163223, + "eval_runtime": 120.3453, + "eval_samples_per_second": 16.619, + "eval_steps_per_second": 4.155, "step": 41000 }, { - "epoch": 0.44, - "learning_rate": 0.000233464209228373, - "loss": 0.0554, + "epoch": 0.26, + "learning_rate": 0.00026029676578222114, + "loss": 0.0727, "step": 41010 }, { - "epoch": 0.44, - "learning_rate": 0.00023344798494386395, - "loss": 0.0655, + "epoch": 0.26, + "learning_rate": 0.0002602870844278642, + "loss": 0.0695, "step": 41020 }, { - "epoch": 0.44, - "learning_rate": 0.0002334317606593549, - "loss": 0.0582, + "epoch": 0.26, + "learning_rate": 0.0002602774030735073, + "loss": 0.0671, "step": 41030 }, { - "epoch": 0.44, - "learning_rate": 0.00023341553637484585, - "loss": 0.0649, + "epoch": 0.26, + "learning_rate": 0.0002602677217191503, + "loss": 0.0644, "step": 41040 }, { - "epoch": 0.44, - "learning_rate": 0.00023339931209033677, - "loss": 0.0571, + "epoch": 0.26, + "learning_rate": 0.0002602580403647934, + "loss": 0.0736, "step": 41050 }, { - "epoch": 0.44, - "learning_rate": 0.00023338308780582775, - "loss": 0.0469, + "epoch": 0.27, + "learning_rate": 0.0002602483590104365, + "loss": 0.0704, "step": 41060 }, { - "epoch": 0.44, - "learning_rate": 0.00023336686352131867, - "loss": 0.0567, + "epoch": 0.27, + "learning_rate": 0.0002602386776560795, + "loss": 0.0682, "step": 41070 }, { - "epoch": 0.44, - "learning_rate": 0.00023335063923680965, - "loss": 0.0522, + "epoch": 0.27, + "learning_rate": 0.0002602289963017226, + "loss": 0.0652, "step": 41080 }, { - "epoch": 0.44, - "learning_rate": 0.00023333441495230057, - "loss": 0.0596, + "epoch": 0.27, + "learning_rate": 0.00026021931494736567, + "loss": 0.0676, "step": 41090 }, { - "epoch": 0.44, - "learning_rate": 0.00023331819066779155, - "loss": 0.0548, + "epoch": 0.27, + "learning_rate": 0.00026020963359300875, + "loss": 0.0614, "step": 41100 }, { - "epoch": 0.44, - "learning_rate": 0.00023330196638328247, - "loss": 0.0624, + "epoch": 0.27, + "learning_rate": 0.00026019995223865183, + "loss": 0.0629, "step": 41110 }, { - "epoch": 0.44, - "learning_rate": 0.00023328574209877342, - "loss": 0.0598, + "epoch": 0.27, + "learning_rate": 0.0002601902708842949, + "loss": 0.0637, "step": 41120 }, { - "epoch": 0.44, - "learning_rate": 0.00023326951781426437, - "loss": 0.0661, + "epoch": 0.27, + "learning_rate": 0.000260180589529938, + "loss": 0.063, "step": 41130 }, { - "epoch": 0.44, - "learning_rate": 0.00023325329352975532, - "loss": 0.0587, + "epoch": 0.27, + "learning_rate": 0.000260170908175581, + "loss": 0.0634, "step": 41140 }, { - "epoch": 0.45, - "learning_rate": 0.00023323706924524625, - "loss": 0.065, + "epoch": 0.27, + "learning_rate": 0.0002601612268212241, + "loss": 0.0704, "step": 41150 }, { - "epoch": 0.45, - "learning_rate": 0.00023322084496073722, - "loss": 0.0627, + "epoch": 0.27, + "learning_rate": 0.0002601515454668672, + "loss": 0.0703, "step": 41160 }, { - "epoch": 0.45, - "learning_rate": 0.00023320462067622814, - "loss": 0.0594, + "epoch": 0.27, + "learning_rate": 0.0002601418641125102, + "loss": 0.0652, "step": 41170 }, { - "epoch": 0.45, - "learning_rate": 0.00023318839639171912, - "loss": 0.0568, + "epoch": 0.27, + "learning_rate": 0.0002601321827581533, + "loss": 0.0629, "step": 41180 }, { - "epoch": 0.45, - "learning_rate": 0.00023317217210721004, - "loss": 0.0599, + "epoch": 0.27, + "learning_rate": 0.00026012250140379636, + "loss": 0.0707, "step": 41190 }, { - "epoch": 0.45, - "learning_rate": 0.000233155947822701, - "loss": 0.0596, + "epoch": 0.27, + "learning_rate": 0.00026011282004943944, + "loss": 0.0652, "step": 41200 }, { - "epoch": 0.45, - "learning_rate": 0.00023313972353819194, - "loss": 0.068, + "epoch": 0.27, + "learning_rate": 0.00026010313869508246, + "loss": 0.0702, "step": 41210 }, { - "epoch": 0.45, - "learning_rate": 0.0002331234992536829, - "loss": 0.0569, + "epoch": 0.27, + "learning_rate": 0.00026009345734072554, + "loss": 0.0678, "step": 41220 }, { - "epoch": 0.45, - "learning_rate": 0.00023310727496917382, - "loss": 0.0695, + "epoch": 0.27, + "learning_rate": 0.0002600837759863686, + "loss": 0.0806, "step": 41230 }, { - "epoch": 0.45, - "learning_rate": 0.0002330910506846648, - "loss": 0.0571, + "epoch": 0.27, + "learning_rate": 0.0002600740946320117, + "loss": 0.0615, "step": 41240 }, { - "epoch": 0.45, - "learning_rate": 0.00023307482640015572, - "loss": 0.0612, + "epoch": 0.27, + "learning_rate": 0.0002600644132776548, + "loss": 0.0608, "step": 41250 }, { - "epoch": 0.45, - "learning_rate": 0.0002330586021156467, - "loss": 0.0619, + "epoch": 0.27, + "learning_rate": 0.00026005473192329786, + "loss": 0.0678, "step": 41260 }, { - "epoch": 0.45, - "learning_rate": 0.00023304237783113762, - "loss": 0.063, + "epoch": 0.27, + "learning_rate": 0.00026004505056894094, + "loss": 0.0691, "step": 41270 }, { - "epoch": 0.45, - "learning_rate": 0.0002330261535466286, - "loss": 0.0682, + "epoch": 0.27, + "learning_rate": 0.00026003536921458397, + "loss": 0.0641, "step": 41280 }, { - "epoch": 0.45, - "learning_rate": 0.00023300992926211952, - "loss": 0.0716, + "epoch": 0.27, + "learning_rate": 0.00026002568786022705, + "loss": 0.0669, "step": 41290 }, { - "epoch": 0.45, - "learning_rate": 0.00023299370497761046, - "loss": 0.0627, + "epoch": 0.27, + "learning_rate": 0.0002600160065058701, + "loss": 0.0662, "step": 41300 }, { - "epoch": 0.45, - "learning_rate": 0.00023297748069310141, - "loss": 0.068, + "epoch": 0.27, + "learning_rate": 0.00026000632515151315, + "loss": 0.071, "step": 41310 }, { - "epoch": 0.45, - "learning_rate": 0.00023296125640859236, - "loss": 0.0623, + "epoch": 0.27, + "learning_rate": 0.00025999664379715623, + "loss": 0.0678, "step": 41320 }, { - "epoch": 0.45, - "learning_rate": 0.0002329450321240833, - "loss": 0.0578, + "epoch": 0.27, + "learning_rate": 0.0002599869624427993, + "loss": 0.0719, "step": 41330 }, { - "epoch": 0.45, - "learning_rate": 0.00023292880783957426, - "loss": 0.0619, + "epoch": 0.27, + "learning_rate": 0.0002599772810884424, + "loss": 0.0659, "step": 41340 }, { - "epoch": 0.45, - "learning_rate": 0.0002329125835550652, - "loss": 0.0673, + "epoch": 0.27, + "learning_rate": 0.0002599675997340854, + "loss": 0.0666, "step": 41350 }, { - "epoch": 0.45, - "learning_rate": 0.00023289635927055616, - "loss": 0.0574, + "epoch": 0.27, + "learning_rate": 0.0002599579183797285, + "loss": 0.0652, "step": 41360 }, { - "epoch": 0.45, - "learning_rate": 0.00023288013498604709, - "loss": 0.0649, + "epoch": 0.27, + "learning_rate": 0.0002599482370253716, + "loss": 0.0707, "step": 41370 }, { - "epoch": 0.45, - "learning_rate": 0.00023286391070153804, - "loss": 0.0618, + "epoch": 0.27, + "learning_rate": 0.00025993855567101466, + "loss": 0.0659, "step": 41380 }, { - "epoch": 0.45, - "learning_rate": 0.00023284768641702899, - "loss": 0.056, + "epoch": 0.27, + "learning_rate": 0.00025992887431665774, + "loss": 0.0626, "step": 41390 }, { - "epoch": 0.45, - "learning_rate": 0.00023283146213251994, - "loss": 0.0589, + "epoch": 0.27, + "learning_rate": 0.0002599191929623008, + "loss": 0.0663, "step": 41400 }, { - "epoch": 0.45, - "learning_rate": 0.00023281523784801086, - "loss": 0.0565, + "epoch": 0.27, + "learning_rate": 0.00025990951160794384, + "loss": 0.0727, "step": 41410 }, { - "epoch": 0.45, - "learning_rate": 0.00023279901356350183, - "loss": 0.0613, + "epoch": 0.27, + "learning_rate": 0.0002598998302535869, + "loss": 0.0697, "step": 41420 }, { - "epoch": 0.45, - "learning_rate": 0.00023278278927899276, - "loss": 0.0674, + "epoch": 0.27, + "learning_rate": 0.00025989014889923, + "loss": 0.0757, "step": 41430 }, { - "epoch": 0.45, - "learning_rate": 0.00023276656499448373, - "loss": 0.0582, + "epoch": 0.27, + "learning_rate": 0.00025988046754487303, + "loss": 0.0724, "step": 41440 }, { - "epoch": 0.45, - "learning_rate": 0.00023275034070997466, - "loss": 0.0541, + "epoch": 0.27, + "learning_rate": 0.0002598707861905161, + "loss": 0.0649, "step": 41450 }, { - "epoch": 0.45, - "learning_rate": 0.00023273411642546563, - "loss": 0.0604, + "epoch": 0.27, + "learning_rate": 0.0002598611048361592, + "loss": 0.0701, "step": 41460 }, { - "epoch": 0.45, - "learning_rate": 0.00023271789214095656, - "loss": 0.051, + "epoch": 0.27, + "learning_rate": 0.00025985142348180227, + "loss": 0.0696, "step": 41470 }, { - "epoch": 0.45, - "learning_rate": 0.0002327016678564475, - "loss": 0.0615, + "epoch": 0.27, + "learning_rate": 0.00025984174212744535, + "loss": 0.0697, "step": 41480 }, { - "epoch": 0.45, - "learning_rate": 0.00023268544357193846, - "loss": 0.0573, + "epoch": 0.27, + "learning_rate": 0.0002598320607730884, + "loss": 0.0703, "step": 41490 }, { - "epoch": 0.45, - "learning_rate": 0.0002326692192874294, - "loss": 0.0581, + "epoch": 0.27, + "learning_rate": 0.00025982237941873145, + "loss": 0.0719, "step": 41500 }, { - "epoch": 0.45, - "learning_rate": 0.00023265299500292033, - "loss": 0.0651, + "epoch": 0.27, + "learning_rate": 0.00025981269806437453, + "loss": 0.0765, "step": 41510 }, { - "epoch": 0.45, - "learning_rate": 0.0002326367707184113, - "loss": 0.0626, + "epoch": 0.27, + "learning_rate": 0.0002598030167100176, + "loss": 0.0692, "step": 41520 }, { - "epoch": 0.45, - "learning_rate": 0.00023262054643390223, - "loss": 0.0639, + "epoch": 0.27, + "learning_rate": 0.0002597933353556607, + "loss": 0.0705, "step": 41530 }, { - "epoch": 0.45, - "learning_rate": 0.0002326043221493932, - "loss": 0.0644, + "epoch": 0.27, + "learning_rate": 0.0002597836540013037, + "loss": 0.0671, "step": 41540 }, { - "epoch": 0.45, - "learning_rate": 0.00023258809786488413, - "loss": 0.0549, + "epoch": 0.27, + "learning_rate": 0.0002597739726469468, + "loss": 0.0706, "step": 41550 }, { - "epoch": 0.45, - "learning_rate": 0.00023257187358037508, - "loss": 0.0651, + "epoch": 0.27, + "learning_rate": 0.0002597642912925899, + "loss": 0.0675, "step": 41560 }, { - "epoch": 0.45, - "learning_rate": 0.00023255564929586603, - "loss": 0.0641, + "epoch": 0.27, + "learning_rate": 0.0002597546099382329, + "loss": 0.065, "step": 41570 }, { - "epoch": 0.45, - "learning_rate": 0.00023253942501135698, - "loss": 0.0561, + "epoch": 0.27, + "learning_rate": 0.000259744928583876, + "loss": 0.0643, "step": 41580 }, { - "epoch": 0.45, - "learning_rate": 0.00023252320072684793, - "loss": 0.0548, + "epoch": 0.27, + "learning_rate": 0.00025973524722951906, + "loss": 0.0676, "step": 41590 }, { - "epoch": 0.45, - "learning_rate": 0.00023250697644233888, - "loss": 0.0596, + "epoch": 0.27, + "learning_rate": 0.00025972556587516214, + "loss": 0.069, "step": 41600 }, { - "epoch": 0.45, - "learning_rate": 0.0002324907521578298, - "loss": 0.0683, + "epoch": 0.27, + "learning_rate": 0.0002597158845208052, + "loss": 0.0713, "step": 41610 }, { - "epoch": 0.45, - "learning_rate": 0.00023247452787332078, - "loss": 0.0571, + "epoch": 0.27, + "learning_rate": 0.0002597062031664483, + "loss": 0.0787, "step": 41620 }, { - "epoch": 0.45, - "learning_rate": 0.0002324583035888117, - "loss": 0.0585, + "epoch": 0.27, + "learning_rate": 0.00025969652181209133, + "loss": 0.0734, "step": 41630 }, { - "epoch": 0.45, - "learning_rate": 0.00023244207930430268, - "loss": 0.059, + "epoch": 0.27, + "learning_rate": 0.0002596868404577344, + "loss": 0.0762, "step": 41640 }, { - "epoch": 0.45, - "learning_rate": 0.0002324258550197936, - "loss": 0.0565, + "epoch": 0.27, + "learning_rate": 0.0002596771591033775, + "loss": 0.0708, "step": 41650 }, { - "epoch": 0.45, - "learning_rate": 0.00023240963073528455, - "loss": 0.0593, + "epoch": 0.27, + "learning_rate": 0.00025966747774902057, + "loss": 0.064, "step": 41660 }, { - "epoch": 0.45, - "learning_rate": 0.0002323934064507755, - "loss": 0.0546, + "epoch": 0.27, + "learning_rate": 0.00025965779639466365, + "loss": 0.0753, "step": 41670 }, { - "epoch": 0.45, - "learning_rate": 0.00023237718216626645, - "loss": 0.0579, + "epoch": 0.27, + "learning_rate": 0.00025964811504030667, + "loss": 0.0688, "step": 41680 }, { - "epoch": 0.45, - "learning_rate": 0.00023236095788175737, - "loss": 0.0561, + "epoch": 0.27, + "learning_rate": 0.00025963843368594975, + "loss": 0.0639, "step": 41690 }, { - "epoch": 0.45, - "learning_rate": 0.00023234473359724835, - "loss": 0.0643, + "epoch": 0.27, + "learning_rate": 0.0002596287523315928, + "loss": 0.0722, "step": 41700 }, { - "epoch": 0.45, - "learning_rate": 0.00023232850931273927, - "loss": 0.0612, + "epoch": 0.27, + "learning_rate": 0.00025961907097723586, + "loss": 0.0602, "step": 41710 }, { - "epoch": 0.45, - "learning_rate": 0.00023231228502823025, - "loss": 0.0707, + "epoch": 0.27, + "learning_rate": 0.00025960938962287894, + "loss": 0.0681, "step": 41720 }, { - "epoch": 0.45, - "learning_rate": 0.00023229606074372117, - "loss": 0.0641, + "epoch": 0.27, + "learning_rate": 0.000259599708268522, + "loss": 0.0714, "step": 41730 }, { - "epoch": 0.45, - "learning_rate": 0.00023227983645921212, - "loss": 0.0617, + "epoch": 0.27, + "learning_rate": 0.0002595900269141651, + "loss": 0.0704, "step": 41740 }, { - "epoch": 0.45, - "learning_rate": 0.00023226361217470307, - "loss": 0.0677, + "epoch": 0.27, + "learning_rate": 0.0002595803455598082, + "loss": 0.0648, "step": 41750 }, { - "epoch": 0.45, - "learning_rate": 0.00023224738789019402, - "loss": 0.059, + "epoch": 0.27, + "learning_rate": 0.00025957066420545126, + "loss": 0.0592, "step": 41760 }, { - "epoch": 0.45, - "learning_rate": 0.00023223116360568497, - "loss": 0.0552, + "epoch": 0.27, + "learning_rate": 0.0002595609828510943, + "loss": 0.075, "step": 41770 }, { - "epoch": 0.45, - "learning_rate": 0.00023221493932117592, - "loss": 0.0585, + "epoch": 0.27, + "learning_rate": 0.00025955130149673736, + "loss": 0.0709, "step": 41780 }, { - "epoch": 0.45, - "learning_rate": 0.00023219871503666684, - "loss": 0.0503, + "epoch": 0.27, + "learning_rate": 0.00025954162014238044, + "loss": 0.0655, "step": 41790 }, { - "epoch": 0.45, - "learning_rate": 0.00023218249075215782, - "loss": 0.0599, + "epoch": 0.27, + "learning_rate": 0.0002595319387880235, + "loss": 0.0703, "step": 41800 }, { - "epoch": 0.45, - "learning_rate": 0.00023216626646764874, - "loss": 0.0704, + "epoch": 0.27, + "learning_rate": 0.00025952225743366655, + "loss": 0.0705, "step": 41810 }, { - "epoch": 0.45, - "learning_rate": 0.00023215004218313972, - "loss": 0.0567, + "epoch": 0.27, + "learning_rate": 0.0002595125760793096, + "loss": 0.0724, "step": 41820 }, { - "epoch": 0.45, - "learning_rate": 0.00023213381789863064, - "loss": 0.0581, + "epoch": 0.27, + "learning_rate": 0.0002595028947249527, + "loss": 0.07, "step": 41830 }, { - "epoch": 0.45, - "learning_rate": 0.0002321175936141216, - "loss": 0.0638, + "epoch": 0.27, + "learning_rate": 0.00025949321337059573, + "loss": 0.0673, "step": 41840 }, { - "epoch": 0.45, - "learning_rate": 0.00023210136932961254, - "loss": 0.0533, + "epoch": 0.27, + "learning_rate": 0.0002594835320162388, + "loss": 0.0741, "step": 41850 }, { - "epoch": 0.45, - "learning_rate": 0.0002320851450451035, - "loss": 0.0709, + "epoch": 0.27, + "learning_rate": 0.0002594738506618819, + "loss": 0.0746, "step": 41860 }, { - "epoch": 0.45, - "learning_rate": 0.0002320689207605944, - "loss": 0.0602, + "epoch": 0.27, + "learning_rate": 0.00025946416930752497, + "loss": 0.064, "step": 41870 }, { - "epoch": 0.45, - "learning_rate": 0.0002320526964760854, - "loss": 0.0534, + "epoch": 0.27, + "learning_rate": 0.00025945448795316805, + "loss": 0.0682, "step": 41880 }, { - "epoch": 0.45, - "learning_rate": 0.0002320364721915763, - "loss": 0.0646, + "epoch": 0.27, + "learning_rate": 0.00025944480659881113, + "loss": 0.0655, "step": 41890 }, { - "epoch": 0.45, - "learning_rate": 0.0002320202479070673, - "loss": 0.0695, + "epoch": 0.27, + "learning_rate": 0.0002594351252444542, + "loss": 0.0707, "step": 41900 }, { - "epoch": 0.45, - "learning_rate": 0.0002320040236225582, - "loss": 0.0645, + "epoch": 0.27, + "learning_rate": 0.00025942544389009724, + "loss": 0.0627, "step": 41910 }, { - "epoch": 0.45, - "learning_rate": 0.00023198779933804916, - "loss": 0.0585, + "epoch": 0.27, + "learning_rate": 0.0002594157625357403, + "loss": 0.06, "step": 41920 }, { - "epoch": 0.45, - "learning_rate": 0.0002319715750535401, - "loss": 0.0569, + "epoch": 0.27, + "learning_rate": 0.0002594060811813834, + "loss": 0.0646, "step": 41930 }, { - "epoch": 0.45, - "learning_rate": 0.00023195535076903106, - "loss": 0.0642, + "epoch": 0.27, + "learning_rate": 0.0002593963998270264, + "loss": 0.0585, "step": 41940 }, { - "epoch": 0.45, - "learning_rate": 0.000231939126484522, - "loss": 0.053, + "epoch": 0.27, + "learning_rate": 0.0002593867184726695, + "loss": 0.0668, "step": 41950 }, { - "epoch": 0.45, - "learning_rate": 0.00023192290220001296, - "loss": 0.0596, + "epoch": 0.27, + "learning_rate": 0.0002593770371183126, + "loss": 0.0739, "step": 41960 }, { - "epoch": 0.45, - "learning_rate": 0.00023190667791550388, - "loss": 0.0654, + "epoch": 0.27, + "learning_rate": 0.00025936735576395566, + "loss": 0.0672, "step": 41970 }, { - "epoch": 0.45, - "learning_rate": 0.00023189045363099486, - "loss": 0.0557, + "epoch": 0.27, + "learning_rate": 0.0002593576744095987, + "loss": 0.0675, "step": 41980 }, { - "epoch": 0.45, - "learning_rate": 0.00023187422934648578, - "loss": 0.0704, + "epoch": 0.27, + "learning_rate": 0.00025934799305524177, + "loss": 0.0674, "step": 41990 }, { - "epoch": 0.45, - "learning_rate": 0.00023185800506197676, - "loss": 0.0695, + "epoch": 0.27, + "learning_rate": 0.00025933831170088485, + "loss": 0.0659, "step": 42000 }, { - "epoch": 0.45, - "eval_cer": 0.9212373728003449, - "eval_loss": 0.0429798886179924, - "eval_runtime": 119.6655, - "eval_samples_per_second": 16.713, - "eval_steps_per_second": 4.178, + "epoch": 0.27, + "eval_cer": 0.9200949045305615, + "eval_loss": 0.04507534205913544, + "eval_runtime": 120.3293, + "eval_samples_per_second": 16.621, + "eval_steps_per_second": 4.155, "step": 42000 }, { - "epoch": 0.45, - "learning_rate": 0.00023184178077746768, - "loss": 0.063, + "epoch": 0.27, + "learning_rate": 0.0002593286303465279, + "loss": 0.0675, "step": 42010 }, { - "epoch": 0.45, - "learning_rate": 0.00023182555649295863, - "loss": 0.0546, + "epoch": 0.27, + "learning_rate": 0.000259318948992171, + "loss": 0.06, "step": 42020 }, { - "epoch": 0.45, - "learning_rate": 0.00023180933220844958, - "loss": 0.063, + "epoch": 0.27, + "learning_rate": 0.0002593092676378141, + "loss": 0.0757, "step": 42030 }, { - "epoch": 0.45, - "learning_rate": 0.00023179310792394053, - "loss": 0.0579, + "epoch": 0.27, + "learning_rate": 0.00025929958628345717, + "loss": 0.066, "step": 42040 }, { - "epoch": 0.45, - "learning_rate": 0.00023177688363943145, - "loss": 0.0609, + "epoch": 0.27, + "learning_rate": 0.0002592899049291002, + "loss": 0.0664, "step": 42050 }, { - "epoch": 0.45, - "learning_rate": 0.00023176065935492243, - "loss": 0.0588, + "epoch": 0.27, + "learning_rate": 0.00025928022357474327, + "loss": 0.0697, "step": 42060 }, { - "epoch": 0.46, - "learning_rate": 0.00023174443507041335, - "loss": 0.0603, + "epoch": 0.27, + "learning_rate": 0.00025927054222038635, + "loss": 0.0626, "step": 42070 }, { - "epoch": 0.46, - "learning_rate": 0.00023172821078590433, - "loss": 0.0635, + "epoch": 0.27, + "learning_rate": 0.0002592608608660294, + "loss": 0.0736, "step": 42080 }, { - "epoch": 0.46, - "learning_rate": 0.00023171198650139525, - "loss": 0.0597, + "epoch": 0.27, + "learning_rate": 0.00025925117951167246, + "loss": 0.0651, "step": 42090 }, { - "epoch": 0.46, - "learning_rate": 0.0002316957622168862, - "loss": 0.06, + "epoch": 0.27, + "learning_rate": 0.00025924149815731554, + "loss": 0.0649, "step": 42100 }, { - "epoch": 0.46, - "learning_rate": 0.00023167953793237715, - "loss": 0.0702, + "epoch": 0.27, + "learning_rate": 0.0002592318168029586, + "loss": 0.07, "step": 42110 }, { - "epoch": 0.46, - "learning_rate": 0.0002316633136478681, - "loss": 0.0601, + "epoch": 0.27, + "learning_rate": 0.00025922213544860164, + "loss": 0.0719, "step": 42120 }, { - "epoch": 0.46, - "learning_rate": 0.00023164708936335905, - "loss": 0.0583, + "epoch": 0.27, + "learning_rate": 0.0002592124540942447, + "loss": 0.0697, "step": 42130 }, { - "epoch": 0.46, - "learning_rate": 0.00023163086507885, - "loss": 0.0651, + "epoch": 0.27, + "learning_rate": 0.0002592027727398878, + "loss": 0.0721, "step": 42140 }, { - "epoch": 0.46, - "learning_rate": 0.00023161464079434092, - "loss": 0.0692, + "epoch": 0.27, + "learning_rate": 0.0002591930913855309, + "loss": 0.0765, "step": 42150 }, { - "epoch": 0.46, - "learning_rate": 0.0002315984165098319, - "loss": 0.0708, + "epoch": 0.27, + "learning_rate": 0.00025918341003117396, + "loss": 0.0751, "step": 42160 }, { - "epoch": 0.46, - "learning_rate": 0.00023158219222532282, - "loss": 0.067, + "epoch": 0.27, + "learning_rate": 0.00025917372867681704, + "loss": 0.0818, "step": 42170 }, { - "epoch": 0.46, - "learning_rate": 0.0002315659679408138, - "loss": 0.0666, + "epoch": 0.27, + "learning_rate": 0.00025916404732246007, + "loss": 0.0707, "step": 42180 }, { - "epoch": 0.46, - "learning_rate": 0.00023154974365630472, - "loss": 0.0613, + "epoch": 0.27, + "learning_rate": 0.00025915436596810315, + "loss": 0.0762, "step": 42190 }, { - "epoch": 0.46, - "learning_rate": 0.00023153351937179567, - "loss": 0.0549, + "epoch": 0.27, + "learning_rate": 0.0002591446846137462, + "loss": 0.0746, "step": 42200 }, { - "epoch": 0.46, - "learning_rate": 0.00023151729508728662, - "loss": 0.063, + "epoch": 0.27, + "learning_rate": 0.00025913500325938925, + "loss": 0.0734, "step": 42210 }, { - "epoch": 0.46, - "learning_rate": 0.00023150107080277757, - "loss": 0.0569, + "epoch": 0.27, + "learning_rate": 0.00025912532190503233, + "loss": 0.0676, "step": 42220 }, { - "epoch": 0.46, - "learning_rate": 0.0002314848465182685, - "loss": 0.057, + "epoch": 0.27, + "learning_rate": 0.0002591156405506754, + "loss": 0.0732, "step": 42230 }, { - "epoch": 0.46, - "learning_rate": 0.00023146862223375947, - "loss": 0.0575, + "epoch": 0.27, + "learning_rate": 0.0002591059591963185, + "loss": 0.0631, "step": 42240 }, { - "epoch": 0.46, - "learning_rate": 0.00023145239794925042, - "loss": 0.0622, + "epoch": 0.27, + "learning_rate": 0.00025909627784196157, + "loss": 0.0593, "step": 42250 }, { - "epoch": 0.46, - "learning_rate": 0.00023143617366474137, - "loss": 0.0616, + "epoch": 0.27, + "learning_rate": 0.0002590865964876046, + "loss": 0.0717, "step": 42260 }, { - "epoch": 0.46, - "learning_rate": 0.00023141994938023232, - "loss": 0.0592, + "epoch": 0.27, + "learning_rate": 0.0002590769151332477, + "loss": 0.0669, "step": 42270 }, { - "epoch": 0.46, - "learning_rate": 0.00023140372509572327, - "loss": 0.0557, + "epoch": 0.27, + "learning_rate": 0.00025906723377889075, + "loss": 0.0642, "step": 42280 }, { - "epoch": 0.46, - "learning_rate": 0.00023138750081121422, - "loss": 0.0586, + "epoch": 0.27, + "learning_rate": 0.00025905755242453383, + "loss": 0.0729, "step": 42290 }, { - "epoch": 0.46, - "learning_rate": 0.00023137127652670514, - "loss": 0.0527, + "epoch": 0.27, + "learning_rate": 0.0002590478710701769, + "loss": 0.0736, "step": 42300 }, { - "epoch": 0.46, - "learning_rate": 0.00023135505224219612, - "loss": 0.0574, + "epoch": 0.27, + "learning_rate": 0.00025903818971581994, + "loss": 0.0789, "step": 42310 }, { - "epoch": 0.46, - "learning_rate": 0.00023133882795768704, - "loss": 0.051, + "epoch": 0.27, + "learning_rate": 0.000259028508361463, + "loss": 0.0678, "step": 42320 }, { - "epoch": 0.46, - "learning_rate": 0.00023132260367317802, - "loss": 0.0548, + "epoch": 0.27, + "learning_rate": 0.0002590188270071061, + "loss": 0.0668, "step": 42330 }, { - "epoch": 0.46, - "learning_rate": 0.00023130637938866894, - "loss": 0.0642, + "epoch": 0.27, + "learning_rate": 0.0002590091456527491, + "loss": 0.0699, "step": 42340 }, { - "epoch": 0.46, - "learning_rate": 0.0002312901551041599, - "loss": 0.0526, + "epoch": 0.27, + "learning_rate": 0.0002589994642983922, + "loss": 0.0709, "step": 42350 }, { - "epoch": 0.46, - "learning_rate": 0.00023127393081965084, - "loss": 0.0564, + "epoch": 0.27, + "learning_rate": 0.0002589897829440353, + "loss": 0.0726, "step": 42360 }, { - "epoch": 0.46, - "learning_rate": 0.0002312577065351418, - "loss": 0.055, + "epoch": 0.27, + "learning_rate": 0.00025898010158967836, + "loss": 0.0795, "step": 42370 }, { - "epoch": 0.46, - "learning_rate": 0.00023124148225063271, - "loss": 0.0506, + "epoch": 0.27, + "learning_rate": 0.00025897042023532144, + "loss": 0.0655, "step": 42380 }, { - "epoch": 0.46, - "learning_rate": 0.0002312252579661237, - "loss": 0.0559, + "epoch": 0.27, + "learning_rate": 0.0002589607388809645, + "loss": 0.0638, "step": 42390 }, { - "epoch": 0.46, - "learning_rate": 0.00023120903368161461, - "loss": 0.0543, + "epoch": 0.27, + "learning_rate": 0.00025895105752660755, + "loss": 0.0659, "step": 42400 }, { - "epoch": 0.46, - "learning_rate": 0.0002311928093971056, - "loss": 0.0567, + "epoch": 0.27, + "learning_rate": 0.00025894137617225063, + "loss": 0.0693, "step": 42410 }, { - "epoch": 0.46, - "learning_rate": 0.00023117658511259651, - "loss": 0.0556, + "epoch": 0.27, + "learning_rate": 0.0002589316948178937, + "loss": 0.0733, "step": 42420 }, { - "epoch": 0.46, - "learning_rate": 0.00023116036082808746, - "loss": 0.0644, + "epoch": 0.27, + "learning_rate": 0.0002589220134635368, + "loss": 0.0679, "step": 42430 }, { - "epoch": 0.46, - "learning_rate": 0.0002311441365435784, - "loss": 0.055, + "epoch": 0.27, + "learning_rate": 0.00025891233210917987, + "loss": 0.0657, "step": 42440 }, { - "epoch": 0.46, - "learning_rate": 0.00023112791225906936, - "loss": 0.0532, + "epoch": 0.27, + "learning_rate": 0.0002589026507548229, + "loss": 0.0719, "step": 42450 }, { - "epoch": 0.46, - "learning_rate": 0.0002311116879745603, - "loss": 0.0589, + "epoch": 0.27, + "learning_rate": 0.000258892969400466, + "loss": 0.0639, "step": 42460 }, { - "epoch": 0.46, - "learning_rate": 0.00023109546369005126, - "loss": 0.0637, + "epoch": 0.27, + "learning_rate": 0.00025888328804610905, + "loss": 0.066, "step": 42470 }, { - "epoch": 0.46, - "learning_rate": 0.00023107923940554219, - "loss": 0.0571, + "epoch": 0.27, + "learning_rate": 0.0002588736066917521, + "loss": 0.0748, "step": 42480 }, { - "epoch": 0.46, - "learning_rate": 0.00023106301512103316, - "loss": 0.0606, + "epoch": 0.27, + "learning_rate": 0.00025886392533739516, + "loss": 0.0773, "step": 42490 }, { - "epoch": 0.46, - "learning_rate": 0.00023104679083652408, - "loss": 0.0702, + "epoch": 0.27, + "learning_rate": 0.00025885424398303824, + "loss": 0.0687, "step": 42500 }, { - "epoch": 0.46, - "learning_rate": 0.00023103056655201506, - "loss": 0.0642, + "epoch": 0.27, + "learning_rate": 0.0002588445626286813, + "loss": 0.0773, "step": 42510 }, { - "epoch": 0.46, - "learning_rate": 0.00023101434226750598, - "loss": 0.0598, + "epoch": 0.27, + "learning_rate": 0.0002588348812743244, + "loss": 0.0619, "step": 42520 }, { - "epoch": 0.46, - "learning_rate": 0.00023099811798299693, - "loss": 0.0569, + "epoch": 0.27, + "learning_rate": 0.0002588251999199675, + "loss": 0.0642, "step": 42530 }, { - "epoch": 0.46, - "learning_rate": 0.00023098189369848788, - "loss": 0.055, + "epoch": 0.27, + "learning_rate": 0.0002588155185656105, + "loss": 0.0667, "step": 42540 }, { - "epoch": 0.46, - "learning_rate": 0.00023096566941397883, - "loss": 0.0643, + "epoch": 0.27, + "learning_rate": 0.0002588058372112536, + "loss": 0.0689, "step": 42550 }, { - "epoch": 0.46, - "learning_rate": 0.00023094944512946976, - "loss": 0.0591, + "epoch": 0.27, + "learning_rate": 0.00025879615585689666, + "loss": 0.0734, "step": 42560 }, { - "epoch": 0.46, - "learning_rate": 0.00023093322084496073, - "loss": 0.0601, + "epoch": 0.27, + "learning_rate": 0.00025878647450253974, + "loss": 0.072, "step": 42570 }, { - "epoch": 0.46, - "learning_rate": 0.00023091699656045166, - "loss": 0.0601, + "epoch": 0.27, + "learning_rate": 0.00025877679314818277, + "loss": 0.0655, "step": 42580 }, { - "epoch": 0.46, - "learning_rate": 0.00023090077227594263, - "loss": 0.052, + "epoch": 0.27, + "learning_rate": 0.00025876711179382585, + "loss": 0.0717, "step": 42590 }, { - "epoch": 0.46, - "learning_rate": 0.00023088454799143356, - "loss": 0.0573, + "epoch": 0.27, + "learning_rate": 0.00025875743043946893, + "loss": 0.0726, "step": 42600 }, { - "epoch": 0.46, - "learning_rate": 0.0002308683237069245, - "loss": 0.0611, + "epoch": 0.28, + "learning_rate": 0.00025874774908511195, + "loss": 0.0665, "step": 42610 }, { - "epoch": 0.46, - "learning_rate": 0.00023085209942241546, - "loss": 0.0662, + "epoch": 0.28, + "learning_rate": 0.00025873806773075503, + "loss": 0.066, "step": 42620 }, { - "epoch": 0.46, - "learning_rate": 0.0002308358751379064, - "loss": 0.06, + "epoch": 0.28, + "learning_rate": 0.0002587283863763981, + "loss": 0.0731, "step": 42630 }, { - "epoch": 0.46, - "learning_rate": 0.00023081965085339735, - "loss": 0.0699, + "epoch": 0.28, + "learning_rate": 0.0002587187050220412, + "loss": 0.0638, "step": 42640 }, { - "epoch": 0.46, - "learning_rate": 0.0002308034265688883, - "loss": 0.0549, + "epoch": 0.28, + "learning_rate": 0.0002587090236676843, + "loss": 0.0721, "step": 42650 }, { - "epoch": 0.46, - "learning_rate": 0.00023078720228437923, - "loss": 0.0518, + "epoch": 0.28, + "learning_rate": 0.00025869934231332735, + "loss": 0.0736, "step": 42660 }, { - "epoch": 0.46, - "learning_rate": 0.0002307709779998702, - "loss": 0.0565, + "epoch": 0.28, + "learning_rate": 0.00025868966095897043, + "loss": 0.0679, "step": 42670 }, { - "epoch": 0.46, - "learning_rate": 0.00023075475371536113, - "loss": 0.0559, + "epoch": 0.28, + "learning_rate": 0.00025867997960461346, + "loss": 0.0663, "step": 42680 }, { - "epoch": 0.46, - "learning_rate": 0.0002307385294308521, - "loss": 0.0502, + "epoch": 0.28, + "learning_rate": 0.00025867029825025654, + "loss": 0.0599, "step": 42690 }, { - "epoch": 0.46, - "learning_rate": 0.00023072230514634303, - "loss": 0.0542, + "epoch": 0.28, + "learning_rate": 0.0002586606168958996, + "loss": 0.0693, "step": 42700 }, { - "epoch": 0.46, - "learning_rate": 0.00023070608086183398, - "loss": 0.0588, + "epoch": 0.28, + "learning_rate": 0.00025865093554154264, + "loss": 0.0707, "step": 42710 }, { - "epoch": 0.46, - "learning_rate": 0.00023068985657732493, - "loss": 0.0599, + "epoch": 0.28, + "learning_rate": 0.0002586412541871857, + "loss": 0.0665, "step": 42720 }, { - "epoch": 0.46, - "learning_rate": 0.00023067363229281588, - "loss": 0.0581, + "epoch": 0.28, + "learning_rate": 0.0002586315728328288, + "loss": 0.062, "step": 42730 }, { - "epoch": 0.46, - "learning_rate": 0.0002306574080083068, - "loss": 0.0614, + "epoch": 0.28, + "learning_rate": 0.0002586218914784719, + "loss": 0.058, "step": 42740 }, { - "epoch": 0.46, - "learning_rate": 0.00023064118372379778, - "loss": 0.0633, + "epoch": 0.28, + "learning_rate": 0.0002586122101241149, + "loss": 0.0599, "step": 42750 }, { - "epoch": 0.46, - "learning_rate": 0.0002306249594392887, - "loss": 0.0584, + "epoch": 0.28, + "learning_rate": 0.000258602528769758, + "loss": 0.0637, "step": 42760 }, { - "epoch": 0.46, - "learning_rate": 0.00023060873515477967, - "loss": 0.0612, + "epoch": 0.28, + "learning_rate": 0.00025859284741540107, + "loss": 0.0599, "step": 42770 }, { - "epoch": 0.46, - "learning_rate": 0.0002305925108702706, - "loss": 0.0678, + "epoch": 0.28, + "learning_rate": 0.00025858316606104415, + "loss": 0.0632, "step": 42780 }, { - "epoch": 0.46, - "learning_rate": 0.00023057628658576155, - "loss": 0.0597, + "epoch": 0.28, + "learning_rate": 0.00025857348470668723, + "loss": 0.0711, "step": 42790 }, { - "epoch": 0.46, - "learning_rate": 0.0002305600623012525, - "loss": 0.0621, + "epoch": 0.28, + "learning_rate": 0.0002585638033523303, + "loss": 0.0706, "step": 42800 }, { - "epoch": 0.46, - "learning_rate": 0.00023054383801674345, - "loss": 0.0701, + "epoch": 0.28, + "learning_rate": 0.0002585541219979734, + "loss": 0.0663, "step": 42810 }, { - "epoch": 0.46, - "learning_rate": 0.0002305276137322344, - "loss": 0.0641, + "epoch": 0.28, + "learning_rate": 0.0002585444406436164, + "loss": 0.0638, "step": 42820 }, { - "epoch": 0.46, - "learning_rate": 0.00023051138944772535, - "loss": 0.0603, + "epoch": 0.28, + "learning_rate": 0.0002585347592892595, + "loss": 0.07, "step": 42830 }, { - "epoch": 0.46, - "learning_rate": 0.00023049516516321627, - "loss": 0.0618, + "epoch": 0.28, + "learning_rate": 0.00025852507793490257, + "loss": 0.0627, "step": 42840 }, { - "epoch": 0.46, - "learning_rate": 0.00023047894087870725, - "loss": 0.0571, + "epoch": 0.28, + "learning_rate": 0.0002585153965805456, + "loss": 0.064, "step": 42850 }, { - "epoch": 0.46, - "learning_rate": 0.00023046271659419817, - "loss": 0.0618, + "epoch": 0.28, + "learning_rate": 0.0002585057152261887, + "loss": 0.0694, "step": 42860 }, { - "epoch": 0.46, - "learning_rate": 0.00023044649230968915, - "loss": 0.0679, + "epoch": 0.28, + "learning_rate": 0.00025849603387183176, + "loss": 0.0722, "step": 42870 }, { - "epoch": 0.46, - "learning_rate": 0.00023043026802518007, - "loss": 0.0514, + "epoch": 0.28, + "learning_rate": 0.00025848635251747484, + "loss": 0.0643, "step": 42880 }, { - "epoch": 0.46, - "learning_rate": 0.00023041404374067102, - "loss": 0.0523, + "epoch": 0.28, + "learning_rate": 0.00025847667116311786, + "loss": 0.0678, "step": 42890 }, { - "epoch": 0.46, - "learning_rate": 0.00023039781945616197, + "epoch": 0.28, + "learning_rate": 0.00025846698980876094, "loss": 0.0666, "step": 42900 }, { - "epoch": 0.46, - "learning_rate": 0.00023038159517165292, - "loss": 0.0629, + "epoch": 0.28, + "learning_rate": 0.000258457308454404, + "loss": 0.0571, "step": 42910 }, { - "epoch": 0.46, - "learning_rate": 0.00023036537088714384, - "loss": 0.059, + "epoch": 0.28, + "learning_rate": 0.0002584476271000471, + "loss": 0.0643, "step": 42920 }, { - "epoch": 0.46, - "learning_rate": 0.00023034914660263482, - "loss": 0.0665, + "epoch": 0.28, + "learning_rate": 0.0002584379457456902, + "loss": 0.0705, "step": 42930 }, { - "epoch": 0.46, - "learning_rate": 0.00023033292231812574, - "loss": 0.0629, + "epoch": 0.28, + "learning_rate": 0.00025842826439133326, + "loss": 0.0606, "step": 42940 }, { - "epoch": 0.46, - "learning_rate": 0.00023031669803361672, + "epoch": 0.28, + "learning_rate": 0.0002584185830369763, "loss": 0.0617, "step": 42950 }, { - "epoch": 0.46, - "learning_rate": 0.00023030047374910764, - "loss": 0.0532, + "epoch": 0.28, + "learning_rate": 0.00025840890168261937, + "loss": 0.0721, "step": 42960 }, { - "epoch": 0.46, - "learning_rate": 0.00023028424946459862, - "loss": 0.0635, + "epoch": 0.28, + "learning_rate": 0.00025839922032826245, + "loss": 0.0698, "step": 42970 }, { - "epoch": 0.46, - "learning_rate": 0.00023026802518008954, - "loss": 0.0599, + "epoch": 0.28, + "learning_rate": 0.0002583895389739055, + "loss": 0.0674, "step": 42980 }, { - "epoch": 0.46, - "learning_rate": 0.0002302518008955805, - "loss": 0.0571, + "epoch": 0.28, + "learning_rate": 0.00025837985761954855, + "loss": 0.064, "step": 42990 }, { - "epoch": 0.47, - "learning_rate": 0.00023023557661107144, - "loss": 0.0566, + "epoch": 0.28, + "learning_rate": 0.00025837017626519163, + "loss": 0.0638, "step": 43000 }, { - "epoch": 0.47, - "eval_cer": 0.9212479746121945, - "eval_loss": 0.04133139178156853, - "eval_runtime": 119.8233, - "eval_samples_per_second": 16.691, - "eval_steps_per_second": 4.173, + "epoch": 0.28, + "eval_cer": 0.9200361541068806, + "eval_loss": 0.044854536652565, + "eval_runtime": 120.1061, + "eval_samples_per_second": 16.652, + "eval_steps_per_second": 4.163, "step": 43000 }, { - "epoch": 0.47, - "learning_rate": 0.0002302193523265624, + "epoch": 0.28, + "learning_rate": 0.0002583604949108347, "loss": 0.0634, "step": 43010 }, { - "epoch": 0.47, - "learning_rate": 0.0002302031280420533, - "loss": 0.0624, + "epoch": 0.28, + "learning_rate": 0.0002583508135564778, + "loss": 0.0679, "step": 43020 }, { - "epoch": 0.47, - "learning_rate": 0.0002301869037575443, - "loss": 0.0538, + "epoch": 0.28, + "learning_rate": 0.0002583411322021208, + "loss": 0.061, "step": 43030 }, { - "epoch": 0.47, - "learning_rate": 0.0002301706794730352, - "loss": 0.0608, + "epoch": 0.28, + "learning_rate": 0.0002583314508477639, + "loss": 0.0665, "step": 43040 }, { - "epoch": 0.47, - "learning_rate": 0.0002301544551885262, - "loss": 0.062, + "epoch": 0.28, + "learning_rate": 0.000258321769493407, + "loss": 0.0691, "step": 43050 }, { - "epoch": 0.47, - "learning_rate": 0.0002301382309040171, - "loss": 0.053, + "epoch": 0.28, + "learning_rate": 0.00025831208813905006, + "loss": 0.0679, "step": 43060 }, { - "epoch": 0.47, - "learning_rate": 0.00023012200661950806, - "loss": 0.0575, + "epoch": 0.28, + "learning_rate": 0.00025830240678469314, + "loss": 0.0695, "step": 43070 }, { - "epoch": 0.47, - "learning_rate": 0.000230105782334999, - "loss": 0.0583, + "epoch": 0.28, + "learning_rate": 0.00025829272543033616, + "loss": 0.0698, "step": 43080 }, { - "epoch": 0.47, - "learning_rate": 0.00023008955805048996, - "loss": 0.0628, + "epoch": 0.28, + "learning_rate": 0.00025828304407597924, + "loss": 0.0669, "step": 43090 }, { - "epoch": 0.47, - "learning_rate": 0.00023007333376598088, - "loss": 0.0675, + "epoch": 0.28, + "learning_rate": 0.0002582733627216223, + "loss": 0.0676, "step": 43100 }, { - "epoch": 0.47, - "learning_rate": 0.00023005710948147186, - "loss": 0.0588, + "epoch": 0.28, + "learning_rate": 0.00025826368136726535, + "loss": 0.0623, "step": 43110 }, { - "epoch": 0.47, - "learning_rate": 0.00023004088519696278, - "loss": 0.0595, + "epoch": 0.28, + "learning_rate": 0.00025825400001290843, + "loss": 0.0647, "step": 43120 }, { - "epoch": 0.47, - "learning_rate": 0.00023002466091245376, - "loss": 0.0685, + "epoch": 0.28, + "learning_rate": 0.0002582443186585515, + "loss": 0.0647, "step": 43130 }, { - "epoch": 0.47, - "learning_rate": 0.00023000843662794468, - "loss": 0.0537, + "epoch": 0.28, + "learning_rate": 0.0002582346373041946, + "loss": 0.0593, "step": 43140 }, { - "epoch": 0.47, - "learning_rate": 0.00022999221234343566, - "loss": 0.0659, + "epoch": 0.28, + "learning_rate": 0.00025822495594983767, + "loss": 0.0584, "step": 43150 }, { - "epoch": 0.47, - "learning_rate": 0.00022997598805892658, - "loss": 0.062, + "epoch": 0.28, + "learning_rate": 0.00025821527459548075, + "loss": 0.064, "step": 43160 }, { - "epoch": 0.47, - "learning_rate": 0.00022995976377441753, - "loss": 0.0597, + "epoch": 0.28, + "learning_rate": 0.00025820559324112377, + "loss": 0.0621, "step": 43170 }, { - "epoch": 0.47, - "learning_rate": 0.00022994353948990848, - "loss": 0.0625, + "epoch": 0.28, + "learning_rate": 0.00025819591188676685, + "loss": 0.0697, "step": 43180 }, { - "epoch": 0.47, - "learning_rate": 0.00022992731520539943, - "loss": 0.0603, + "epoch": 0.28, + "learning_rate": 0.00025818623053240993, + "loss": 0.0664, "step": 43190 }, { - "epoch": 0.47, - "learning_rate": 0.00022991109092089035, - "loss": 0.0741, + "epoch": 0.28, + "learning_rate": 0.000258176549178053, + "loss": 0.0676, "step": 43200 }, { - "epoch": 0.47, - "learning_rate": 0.00022989486663638133, - "loss": 0.0714, + "epoch": 0.28, + "learning_rate": 0.0002581668678236961, + "loss": 0.0649, "step": 43210 }, { - "epoch": 0.47, - "learning_rate": 0.00022987864235187225, - "loss": 0.0617, + "epoch": 0.28, + "learning_rate": 0.0002581571864693391, + "loss": 0.0621, "step": 43220 }, { - "epoch": 0.47, - "learning_rate": 0.00022986241806736323, - "loss": 0.0597, + "epoch": 0.28, + "learning_rate": 0.0002581475051149822, + "loss": 0.068, "step": 43230 }, { - "epoch": 0.47, - "learning_rate": 0.00022984619378285415, - "loss": 0.0636, + "epoch": 0.28, + "learning_rate": 0.0002581378237606253, + "loss": 0.069, "step": 43240 }, { - "epoch": 0.47, - "learning_rate": 0.0002298299694983451, - "loss": 0.0645, + "epoch": 0.28, + "learning_rate": 0.0002581281424062683, + "loss": 0.0682, "step": 43250 }, { - "epoch": 0.47, - "learning_rate": 0.00022981374521383605, - "loss": 0.0578, + "epoch": 0.28, + "learning_rate": 0.0002581184610519114, + "loss": 0.0636, "step": 43260 }, { - "epoch": 0.47, - "learning_rate": 0.000229797520929327, - "loss": 0.058, + "epoch": 0.28, + "learning_rate": 0.00025810877969755446, + "loss": 0.0679, "step": 43270 }, { - "epoch": 0.47, - "learning_rate": 0.00022978129664481792, - "loss": 0.0614, + "epoch": 0.28, + "learning_rate": 0.00025809909834319754, + "loss": 0.0626, "step": 43280 }, { - "epoch": 0.47, - "learning_rate": 0.0002297650723603089, - "loss": 0.0588, + "epoch": 0.28, + "learning_rate": 0.0002580894169888406, + "loss": 0.0705, "step": 43290 }, { - "epoch": 0.47, - "learning_rate": 0.00022974884807579982, - "loss": 0.0638, + "epoch": 0.28, + "learning_rate": 0.0002580797356344837, + "loss": 0.0707, "step": 43300 }, { - "epoch": 0.47, - "learning_rate": 0.0002297326237912908, - "loss": 0.0632, + "epoch": 0.28, + "learning_rate": 0.0002580700542801267, + "loss": 0.0657, "step": 43310 }, { - "epoch": 0.47, - "learning_rate": 0.00022971639950678172, - "loss": 0.0538, + "epoch": 0.28, + "learning_rate": 0.0002580603729257698, + "loss": 0.0676, "step": 43320 }, { - "epoch": 0.47, - "learning_rate": 0.0002297001752222727, - "loss": 0.0596, + "epoch": 0.28, + "learning_rate": 0.0002580506915714129, + "loss": 0.0658, "step": 43330 }, { - "epoch": 0.47, - "learning_rate": 0.00022968395093776362, - "loss": 0.0509, + "epoch": 0.28, + "learning_rate": 0.00025804101021705597, + "loss": 0.0627, "step": 43340 }, { - "epoch": 0.47, - "learning_rate": 0.00022966772665325457, - "loss": 0.0584, + "epoch": 0.28, + "learning_rate": 0.000258031328862699, + "loss": 0.066, "step": 43350 }, { - "epoch": 0.47, - "learning_rate": 0.00022965150236874552, - "loss": 0.0617, + "epoch": 0.28, + "learning_rate": 0.00025802164750834207, + "loss": 0.0736, "step": 43360 }, { - "epoch": 0.47, - "learning_rate": 0.00022963527808423647, - "loss": 0.0591, + "epoch": 0.28, + "learning_rate": 0.00025801196615398515, + "loss": 0.0653, "step": 43370 }, { - "epoch": 0.47, - "learning_rate": 0.0002296190537997274, - "loss": 0.0542, + "epoch": 0.28, + "learning_rate": 0.0002580022847996282, + "loss": 0.0691, "step": 43380 }, { - "epoch": 0.47, - "learning_rate": 0.00022960282951521837, - "loss": 0.0597, + "epoch": 0.28, + "learning_rate": 0.00025799260344527126, + "loss": 0.0647, "step": 43390 }, { - "epoch": 0.47, - "learning_rate": 0.0002295866052307093, - "loss": 0.0623, + "epoch": 0.28, + "learning_rate": 0.00025798292209091434, + "loss": 0.0686, "step": 43400 }, { - "epoch": 0.47, - "learning_rate": 0.00022957038094620027, - "loss": 0.0675, + "epoch": 0.28, + "learning_rate": 0.0002579732407365574, + "loss": 0.0666, "step": 43410 }, { - "epoch": 0.47, - "learning_rate": 0.0002295541566616912, - "loss": 0.0531, + "epoch": 0.28, + "learning_rate": 0.0002579635593822005, + "loss": 0.067, "step": 43420 }, { - "epoch": 0.47, - "learning_rate": 0.00022953793237718214, - "loss": 0.0548, + "epoch": 0.28, + "learning_rate": 0.0002579538780278436, + "loss": 0.0644, "step": 43430 }, { - "epoch": 0.47, - "learning_rate": 0.0002295217080926731, - "loss": 0.0624, + "epoch": 0.28, + "learning_rate": 0.00025794419667348666, + "loss": 0.0601, "step": 43440 }, { - "epoch": 0.47, - "learning_rate": 0.00022950548380816404, - "loss": 0.0574, + "epoch": 0.28, + "learning_rate": 0.0002579345153191297, + "loss": 0.0704, "step": 43450 }, { - "epoch": 0.47, - "learning_rate": 0.00022948925952365496, - "loss": 0.0574, + "epoch": 0.28, + "learning_rate": 0.00025792483396477276, + "loss": 0.0679, "step": 43460 }, { - "epoch": 0.47, - "learning_rate": 0.00022947303523914594, - "loss": 0.0598, + "epoch": 0.28, + "learning_rate": 0.00025791515261041584, + "loss": 0.065, "step": 43470 }, { - "epoch": 0.47, - "learning_rate": 0.00022945681095463686, - "loss": 0.0609, + "epoch": 0.28, + "learning_rate": 0.00025790547125605887, + "loss": 0.0641, "step": 43480 }, { - "epoch": 0.47, - "learning_rate": 0.00022944058667012784, - "loss": 0.0584, + "epoch": 0.28, + "learning_rate": 0.00025789578990170195, + "loss": 0.0638, "step": 43490 }, { - "epoch": 0.47, - "learning_rate": 0.00022942436238561876, - "loss": 0.0567, + "epoch": 0.28, + "learning_rate": 0.000257886108547345, + "loss": 0.0617, "step": 43500 }, { - "epoch": 0.47, - "learning_rate": 0.00022940813810110974, - "loss": 0.0603, + "epoch": 0.28, + "learning_rate": 0.0002578764271929881, + "loss": 0.0637, "step": 43510 }, { - "epoch": 0.47, - "learning_rate": 0.00022939191381660066, - "loss": 0.0544, + "epoch": 0.28, + "learning_rate": 0.00025786674583863113, + "loss": 0.069, "step": 43520 }, { - "epoch": 0.47, - "learning_rate": 0.0002293756895320916, - "loss": 0.059, + "epoch": 0.28, + "learning_rate": 0.0002578570644842742, + "loss": 0.0656, "step": 43530 }, { - "epoch": 0.47, - "learning_rate": 0.00022935946524758256, - "loss": 0.0694, + "epoch": 0.28, + "learning_rate": 0.0002578473831299173, + "loss": 0.0619, "step": 43540 }, { - "epoch": 0.47, - "learning_rate": 0.0002293432409630735, - "loss": 0.0664, + "epoch": 0.28, + "learning_rate": 0.00025783770177556037, + "loss": 0.0649, "step": 43550 }, { - "epoch": 0.47, - "learning_rate": 0.00022932701667856444, - "loss": 0.055, + "epoch": 0.28, + "learning_rate": 0.00025782802042120345, + "loss": 0.0707, "step": 43560 }, { - "epoch": 0.47, - "learning_rate": 0.0002293107923940554, - "loss": 0.0722, + "epoch": 0.28, + "learning_rate": 0.00025781833906684653, + "loss": 0.0626, "step": 43570 }, { - "epoch": 0.47, - "learning_rate": 0.00022929456810954633, - "loss": 0.0544, + "epoch": 0.28, + "learning_rate": 0.0002578086577124896, + "loss": 0.0678, "step": 43580 }, { - "epoch": 0.47, - "learning_rate": 0.0002292783438250373, - "loss": 0.06, + "epoch": 0.28, + "learning_rate": 0.00025779897635813264, + "loss": 0.072, "step": 43590 }, { - "epoch": 0.47, - "learning_rate": 0.00022926211954052823, - "loss": 0.0704, + "epoch": 0.28, + "learning_rate": 0.0002577892950037757, + "loss": 0.0651, "step": 43600 }, { - "epoch": 0.47, - "learning_rate": 0.00022924589525601918, - "loss": 0.0598, + "epoch": 0.28, + "learning_rate": 0.0002577796136494188, + "loss": 0.0721, "step": 43610 }, { - "epoch": 0.47, - "learning_rate": 0.00022922967097151013, - "loss": 0.0644, + "epoch": 0.28, + "learning_rate": 0.0002577699322950618, + "loss": 0.067, "step": 43620 }, { - "epoch": 0.47, - "learning_rate": 0.00022921344668700108, - "loss": 0.0606, + "epoch": 0.28, + "learning_rate": 0.0002577602509407049, + "loss": 0.0599, "step": 43630 }, { - "epoch": 0.47, - "learning_rate": 0.00022919722240249203, - "loss": 0.0567, + "epoch": 0.28, + "learning_rate": 0.000257750569586348, + "loss": 0.0743, "step": 43640 }, { - "epoch": 0.47, - "learning_rate": 0.00022918099811798298, - "loss": 0.0612, + "epoch": 0.28, + "learning_rate": 0.00025774088823199106, + "loss": 0.069, "step": 43650 }, { - "epoch": 0.47, - "learning_rate": 0.0002291647738334739, - "loss": 0.0541, + "epoch": 0.28, + "learning_rate": 0.0002577312068776341, + "loss": 0.0663, "step": 43660 }, { - "epoch": 0.47, - "learning_rate": 0.00022914854954896488, - "loss": 0.0607, + "epoch": 0.28, + "learning_rate": 0.00025772152552327717, + "loss": 0.0718, "step": 43670 }, { - "epoch": 0.47, - "learning_rate": 0.0002291323252644558, - "loss": 0.0599, + "epoch": 0.28, + "learning_rate": 0.00025771184416892025, + "loss": 0.0682, "step": 43680 }, { - "epoch": 0.47, - "learning_rate": 0.00022911610097994678, - "loss": 0.0592, + "epoch": 0.28, + "learning_rate": 0.0002577021628145633, + "loss": 0.0674, "step": 43690 }, { - "epoch": 0.47, - "learning_rate": 0.0002290998766954377, - "loss": 0.0594, + "epoch": 0.28, + "learning_rate": 0.0002576924814602064, + "loss": 0.0757, "step": 43700 }, { - "epoch": 0.47, - "learning_rate": 0.00022908365241092865, - "loss": 0.0608, + "epoch": 0.28, + "learning_rate": 0.0002576828001058495, + "loss": 0.0659, "step": 43710 }, { - "epoch": 0.47, - "learning_rate": 0.0002290674281264196, - "loss": 0.068, + "epoch": 0.28, + "learning_rate": 0.0002576731187514925, + "loss": 0.0625, "step": 43720 }, { - "epoch": 0.47, - "learning_rate": 0.00022905120384191055, - "loss": 0.0529, + "epoch": 0.28, + "learning_rate": 0.0002576634373971356, + "loss": 0.069, "step": 43730 }, { - "epoch": 0.47, - "learning_rate": 0.00022903497955740148, - "loss": 0.0599, + "epoch": 0.28, + "learning_rate": 0.00025765375604277867, + "loss": 0.0681, "step": 43740 }, { - "epoch": 0.47, - "learning_rate": 0.00022901875527289245, - "loss": 0.0593, + "epoch": 0.28, + "learning_rate": 0.0002576440746884217, + "loss": 0.079, "step": 43750 }, { - "epoch": 0.47, - "learning_rate": 0.00022900253098838338, - "loss": 0.0605, + "epoch": 0.28, + "learning_rate": 0.0002576343933340648, + "loss": 0.0718, "step": 43760 }, { - "epoch": 0.47, - "learning_rate": 0.00022898630670387435, - "loss": 0.0622, + "epoch": 0.28, + "learning_rate": 0.00025762471197970785, + "loss": 0.0668, "step": 43770 }, { - "epoch": 0.47, - "learning_rate": 0.00022897008241936528, - "loss": 0.0628, + "epoch": 0.28, + "learning_rate": 0.00025761503062535093, + "loss": 0.0715, "step": 43780 }, { - "epoch": 0.47, - "learning_rate": 0.00022895385813485623, - "loss": 0.0534, + "epoch": 0.28, + "learning_rate": 0.000257605349270994, + "loss": 0.0653, "step": 43790 }, { - "epoch": 0.47, - "learning_rate": 0.00022893763385034718, - "loss": 0.0609, + "epoch": 0.28, + "learning_rate": 0.00025759566791663704, + "loss": 0.0731, "step": 43800 }, { - "epoch": 0.47, - "learning_rate": 0.00022892140956583813, - "loss": 0.055, + "epoch": 0.28, + "learning_rate": 0.0002575859865622801, + "loss": 0.0694, "step": 43810 }, { - "epoch": 0.47, - "learning_rate": 0.00022890518528132908, - "loss": 0.0574, + "epoch": 0.28, + "learning_rate": 0.0002575763052079232, + "loss": 0.0651, "step": 43820 }, { - "epoch": 0.47, - "learning_rate": 0.00022888896099682002, - "loss": 0.0606, + "epoch": 0.28, + "learning_rate": 0.0002575666238535663, + "loss": 0.0669, "step": 43830 }, { - "epoch": 0.47, - "learning_rate": 0.00022887273671231095, - "loss": 0.0586, + "epoch": 0.28, + "learning_rate": 0.00025755694249920936, + "loss": 0.0777, "step": 43840 }, { - "epoch": 0.47, - "learning_rate": 0.00022885651242780192, - "loss": 0.0597, + "epoch": 0.28, + "learning_rate": 0.00025754726114485244, + "loss": 0.0674, "step": 43850 }, { - "epoch": 0.47, - "learning_rate": 0.00022884028814329285, - "loss": 0.0575, + "epoch": 0.28, + "learning_rate": 0.00025753757979049546, + "loss": 0.0695, "step": 43860 }, { - "epoch": 0.47, - "learning_rate": 0.00022882406385878382, - "loss": 0.0499, + "epoch": 0.28, + "learning_rate": 0.00025752789843613854, + "loss": 0.0701, "step": 43870 }, { - "epoch": 0.47, - "learning_rate": 0.00022880783957427475, - "loss": 0.0562, + "epoch": 0.28, + "learning_rate": 0.00025751821708178157, + "loss": 0.0765, "step": 43880 }, { - "epoch": 0.47, - "learning_rate": 0.0002287916152897657, - "loss": 0.0583, + "epoch": 0.28, + "learning_rate": 0.00025750853572742465, + "loss": 0.0755, "step": 43890 }, { - "epoch": 0.47, - "learning_rate": 0.00022877539100525665, - "loss": 0.0554, + "epoch": 0.28, + "learning_rate": 0.00025749885437306773, + "loss": 0.0706, "step": 43900 }, { - "epoch": 0.47, - "learning_rate": 0.0002287591667207476, - "loss": 0.0542, + "epoch": 0.28, + "learning_rate": 0.0002574891730187108, + "loss": 0.0673, "step": 43910 }, { - "epoch": 0.48, - "learning_rate": 0.00022874294243623852, - "loss": 0.0552, + "epoch": 0.28, + "learning_rate": 0.0002574794916643539, + "loss": 0.0667, "step": 43920 }, { - "epoch": 0.48, - "learning_rate": 0.0002287267181517295, - "loss": 0.0528, + "epoch": 0.28, + "learning_rate": 0.00025746981030999697, + "loss": 0.065, "step": 43930 }, { - "epoch": 0.48, - "learning_rate": 0.00022871049386722042, - "loss": 0.054, - "step": 43940 + "epoch": 0.28, + "learning_rate": 0.00025746012895564, + "loss": 0.0613, + "step": 43940 }, { - "epoch": 0.48, - "learning_rate": 0.0002286942695827114, - "loss": 0.0533, + "epoch": 0.28, + "learning_rate": 0.0002574504476012831, + "loss": 0.0638, "step": 43950 }, { - "epoch": 0.48, - "learning_rate": 0.00022867804529820232, - "loss": 0.0619, + "epoch": 0.28, + "learning_rate": 0.00025744076624692615, + "loss": 0.0672, "step": 43960 }, { - "epoch": 0.48, - "learning_rate": 0.00022866182101369327, - "loss": 0.0711, + "epoch": 0.28, + "learning_rate": 0.00025743108489256923, + "loss": 0.0698, "step": 43970 }, { - "epoch": 0.48, - "learning_rate": 0.00022864559672918422, - "loss": 0.0574, + "epoch": 0.28, + "learning_rate": 0.0002574214035382123, + "loss": 0.0609, "step": 43980 }, { - "epoch": 0.48, - "learning_rate": 0.00022862937244467517, - "loss": 0.0641, + "epoch": 0.28, + "learning_rate": 0.00025741172218385534, + "loss": 0.0668, "step": 43990 }, { - "epoch": 0.48, - "learning_rate": 0.00022861314816016612, - "loss": 0.0646, + "epoch": 0.28, + "learning_rate": 0.0002574020408294984, + "loss": 0.0704, "step": 44000 }, { - "epoch": 0.48, - "eval_cer": 0.9212983332184804, - "eval_loss": 0.04152320697903633, - "eval_runtime": 119.4692, - "eval_samples_per_second": 16.741, - "eval_steps_per_second": 4.185, + "epoch": 0.28, + "eval_cer": 0.920119308552706, + "eval_loss": 0.044700879603624344, + "eval_runtime": 120.2434, + "eval_samples_per_second": 16.633, + "eval_steps_per_second": 4.158, "step": 44000 }, { - "epoch": 0.48, - "learning_rate": 0.00022859692387565707, - "loss": 0.0692, + "epoch": 0.28, + "learning_rate": 0.0002573923594751415, + "loss": 0.0653, "step": 44010 }, { - "epoch": 0.48, - "learning_rate": 0.000228580699591148, - "loss": 0.0594, + "epoch": 0.28, + "learning_rate": 0.0002573826781207845, + "loss": 0.0601, "step": 44020 }, { - "epoch": 0.48, - "learning_rate": 0.00022856447530663897, - "loss": 0.0546, + "epoch": 0.28, + "learning_rate": 0.0002573729967664276, + "loss": 0.0725, "step": 44030 }, { - "epoch": 0.48, - "learning_rate": 0.0002285482510221299, - "loss": 0.0525, + "epoch": 0.28, + "learning_rate": 0.0002573633154120707, + "loss": 0.0705, "step": 44040 }, { - "epoch": 0.48, - "learning_rate": 0.00022853202673762087, - "loss": 0.0617, + "epoch": 0.28, + "learning_rate": 0.00025735363405771376, + "loss": 0.0642, "step": 44050 }, { - "epoch": 0.48, - "learning_rate": 0.0002285158024531118, - "loss": 0.0605, + "epoch": 0.28, + "learning_rate": 0.00025734395270335684, + "loss": 0.0669, "step": 44060 }, { - "epoch": 0.48, - "learning_rate": 0.00022849957816860274, - "loss": 0.063, + "epoch": 0.28, + "learning_rate": 0.0002573342713489999, + "loss": 0.069, "step": 44070 }, { - "epoch": 0.48, - "learning_rate": 0.0002284833538840937, - "loss": 0.0547, + "epoch": 0.28, + "learning_rate": 0.00025732458999464295, + "loss": 0.0664, "step": 44080 }, { - "epoch": 0.48, - "learning_rate": 0.00022846712959958464, - "loss": 0.0528, + "epoch": 0.28, + "learning_rate": 0.00025731490864028603, + "loss": 0.0616, "step": 44090 }, { - "epoch": 0.48, - "learning_rate": 0.00022845090531507556, - "loss": 0.0695, + "epoch": 0.28, + "learning_rate": 0.0002573052272859291, + "loss": 0.0682, "step": 44100 }, { - "epoch": 0.48, - "learning_rate": 0.00022843468103056654, - "loss": 0.0571, + "epoch": 0.28, + "learning_rate": 0.0002572955459315722, + "loss": 0.0655, "step": 44110 }, { - "epoch": 0.48, - "learning_rate": 0.00022841845674605746, - "loss": 0.0633, + "epoch": 0.28, + "learning_rate": 0.0002572858645772152, + "loss": 0.0676, "step": 44120 }, { - "epoch": 0.48, - "learning_rate": 0.00022840223246154844, - "loss": 0.0603, + "epoch": 0.28, + "learning_rate": 0.0002572761832228583, + "loss": 0.0642, "step": 44130 }, { - "epoch": 0.48, - "learning_rate": 0.00022838600817703936, - "loss": 0.0666, + "epoch": 0.28, + "learning_rate": 0.0002572665018685014, + "loss": 0.063, "step": 44140 }, { - "epoch": 0.48, - "learning_rate": 0.0002283697838925303, - "loss": 0.0553, + "epoch": 0.28, + "learning_rate": 0.0002572568205141444, + "loss": 0.0589, "step": 44150 }, { - "epoch": 0.48, - "learning_rate": 0.00022835355960802126, - "loss": 0.0656, + "epoch": 0.29, + "learning_rate": 0.0002572471391597875, + "loss": 0.0619, "step": 44160 }, { - "epoch": 0.48, - "learning_rate": 0.0002283373353235122, - "loss": 0.0548, + "epoch": 0.29, + "learning_rate": 0.00025723745780543056, + "loss": 0.0692, "step": 44170 }, { - "epoch": 0.48, - "learning_rate": 0.00022832111103900316, - "loss": 0.0663, + "epoch": 0.29, + "learning_rate": 0.00025722777645107364, + "loss": 0.0621, "step": 44180 }, { - "epoch": 0.48, - "learning_rate": 0.0002283048867544941, - "loss": 0.0641, + "epoch": 0.29, + "learning_rate": 0.0002572180950967167, + "loss": 0.0697, "step": 44190 }, { - "epoch": 0.48, - "learning_rate": 0.00022828866246998503, - "loss": 0.0615, + "epoch": 0.29, + "learning_rate": 0.0002572084137423598, + "loss": 0.0644, "step": 44200 }, { - "epoch": 0.48, - "learning_rate": 0.000228272438185476, - "loss": 0.0589, + "epoch": 0.29, + "learning_rate": 0.0002571987323880029, + "loss": 0.0616, "step": 44210 }, { - "epoch": 0.48, - "learning_rate": 0.00022825621390096693, - "loss": 0.0566, + "epoch": 0.29, + "learning_rate": 0.0002571890510336459, + "loss": 0.0723, "step": 44220 }, { - "epoch": 0.48, - "learning_rate": 0.0002282399896164579, - "loss": 0.0513, + "epoch": 0.29, + "learning_rate": 0.000257179369679289, + "loss": 0.0644, "step": 44230 }, { - "epoch": 0.48, - "learning_rate": 0.00022822376533194883, - "loss": 0.0559, + "epoch": 0.29, + "learning_rate": 0.00025716968832493206, + "loss": 0.0705, "step": 44240 }, { - "epoch": 0.48, - "learning_rate": 0.00022820754104743978, - "loss": 0.067, + "epoch": 0.29, + "learning_rate": 0.00025716000697057514, + "loss": 0.0706, "step": 44250 }, { - "epoch": 0.48, - "learning_rate": 0.00022819131676293073, - "loss": 0.0593, + "epoch": 0.29, + "learning_rate": 0.00025715032561621817, + "loss": 0.0756, "step": 44260 }, { - "epoch": 0.48, - "learning_rate": 0.00022817509247842168, - "loss": 0.0666, + "epoch": 0.29, + "learning_rate": 0.00025714064426186125, + "loss": 0.0716, "step": 44270 }, { - "epoch": 0.48, - "learning_rate": 0.0002281588681939126, - "loss": 0.0577, + "epoch": 0.29, + "learning_rate": 0.00025713096290750433, + "loss": 0.0763, "step": 44280 }, { - "epoch": 0.48, - "learning_rate": 0.00022814264390940358, - "loss": 0.0674, + "epoch": 0.29, + "learning_rate": 0.00025712128155314735, + "loss": 0.0647, "step": 44290 }, { - "epoch": 0.48, - "learning_rate": 0.0002281264196248945, - "loss": 0.055, + "epoch": 0.29, + "learning_rate": 0.00025711160019879043, + "loss": 0.0632, "step": 44300 }, { - "epoch": 0.48, - "learning_rate": 0.00022811019534038548, - "loss": 0.0592, + "epoch": 0.29, + "learning_rate": 0.0002571019188444335, + "loss": 0.0652, "step": 44310 }, { - "epoch": 0.48, - "learning_rate": 0.0002280939710558764, - "loss": 0.0641, + "epoch": 0.29, + "learning_rate": 0.0002570922374900766, + "loss": 0.0643, "step": 44320 }, { - "epoch": 0.48, - "learning_rate": 0.00022807774677136738, - "loss": 0.0627, + "epoch": 0.29, + "learning_rate": 0.00025708255613571967, + "loss": 0.0671, "step": 44330 }, { - "epoch": 0.48, - "learning_rate": 0.0002280615224868583, - "loss": 0.0587, + "epoch": 0.29, + "learning_rate": 0.00025707287478136275, + "loss": 0.0691, "step": 44340 }, { - "epoch": 0.48, - "learning_rate": 0.00022804529820234925, - "loss": 0.0643, + "epoch": 0.29, + "learning_rate": 0.00025706319342700583, + "loss": 0.0661, "step": 44350 }, { - "epoch": 0.48, - "learning_rate": 0.0002280290739178402, - "loss": 0.063, + "epoch": 0.29, + "learning_rate": 0.00025705351207264886, + "loss": 0.0646, "step": 44360 }, { - "epoch": 0.48, - "learning_rate": 0.00022801284963333115, - "loss": 0.0563, + "epoch": 0.29, + "learning_rate": 0.00025704383071829194, + "loss": 0.0625, "step": 44370 }, { - "epoch": 0.48, - "learning_rate": 0.00022799662534882207, - "loss": 0.0621, + "epoch": 0.29, + "learning_rate": 0.000257034149363935, + "loss": 0.0648, "step": 44380 }, { - "epoch": 0.48, - "learning_rate": 0.00022798040106431305, - "loss": 0.0621, + "epoch": 0.29, + "learning_rate": 0.00025702446800957804, + "loss": 0.0709, "step": 44390 }, { - "epoch": 0.48, - "learning_rate": 0.00022796417677980397, - "loss": 0.0538, + "epoch": 0.29, + "learning_rate": 0.0002570147866552211, + "loss": 0.0663, "step": 44400 }, { - "epoch": 0.48, - "learning_rate": 0.00022794795249529495, - "loss": 0.057, + "epoch": 0.29, + "learning_rate": 0.0002570051053008642, + "loss": 0.0609, "step": 44410 }, { - "epoch": 0.48, - "learning_rate": 0.00022793172821078587, - "loss": 0.0582, + "epoch": 0.29, + "learning_rate": 0.0002569954239465073, + "loss": 0.0613, "step": 44420 }, { - "epoch": 0.48, - "learning_rate": 0.00022791550392627682, - "loss": 0.0557, + "epoch": 0.29, + "learning_rate": 0.0002569857425921503, + "loss": 0.0673, "step": 44430 }, { - "epoch": 0.48, - "learning_rate": 0.00022789927964176777, - "loss": 0.0556, + "epoch": 0.29, + "learning_rate": 0.0002569760612377934, + "loss": 0.0679, "step": 44440 }, { - "epoch": 0.48, - "learning_rate": 0.00022788305535725872, - "loss": 0.0547, + "epoch": 0.29, + "learning_rate": 0.00025696637988343647, + "loss": 0.065, "step": 44450 }, { - "epoch": 0.48, - "learning_rate": 0.00022786683107274964, - "loss": 0.0612, + "epoch": 0.29, + "learning_rate": 0.00025695669852907955, + "loss": 0.0717, "step": 44460 }, { - "epoch": 0.48, - "learning_rate": 0.00022785060678824062, - "loss": 0.0502, + "epoch": 0.29, + "learning_rate": 0.00025694701717472263, + "loss": 0.0729, "step": 44470 }, { - "epoch": 0.48, - "learning_rate": 0.00022783438250373154, - "loss": 0.0536, + "epoch": 0.29, + "learning_rate": 0.0002569373358203657, + "loss": 0.0653, "step": 44480 }, { - "epoch": 0.48, - "learning_rate": 0.00022781815821922252, - "loss": 0.0637, + "epoch": 0.29, + "learning_rate": 0.00025692765446600873, + "loss": 0.0746, "step": 44490 }, { - "epoch": 0.48, - "learning_rate": 0.00022780193393471344, - "loss": 0.0636, + "epoch": 0.29, + "learning_rate": 0.0002569179731116518, + "loss": 0.0721, "step": 44500 }, { - "epoch": 0.48, - "learning_rate": 0.00022778570965020442, - "loss": 0.0673, + "epoch": 0.29, + "learning_rate": 0.0002569082917572949, + "loss": 0.0773, "step": 44510 }, { - "epoch": 0.48, - "learning_rate": 0.00022776948536569534, - "loss": 0.0545, + "epoch": 0.29, + "learning_rate": 0.0002568986104029379, + "loss": 0.0734, "step": 44520 }, { - "epoch": 0.48, - "learning_rate": 0.0002277532610811863, - "loss": 0.0635, + "epoch": 0.29, + "learning_rate": 0.000256888929048581, + "loss": 0.0738, "step": 44530 }, { - "epoch": 0.48, - "learning_rate": 0.00022773703679667724, - "loss": 0.0629, + "epoch": 0.29, + "learning_rate": 0.0002568792476942241, + "loss": 0.0617, "step": 44540 }, { - "epoch": 0.48, - "learning_rate": 0.0002277208125121682, - "loss": 0.0557, + "epoch": 0.29, + "learning_rate": 0.00025686956633986716, + "loss": 0.0606, "step": 44550 }, { - "epoch": 0.48, - "learning_rate": 0.00022770458822765911, - "loss": 0.0589, + "epoch": 0.29, + "learning_rate": 0.00025685988498551024, + "loss": 0.0709, "step": 44560 }, { - "epoch": 0.48, - "learning_rate": 0.0002276883639431501, - "loss": 0.0587, + "epoch": 0.29, + "learning_rate": 0.00025685020363115326, + "loss": 0.0705, "step": 44570 }, { - "epoch": 0.48, - "learning_rate": 0.00022767213965864101, - "loss": 0.057, + "epoch": 0.29, + "learning_rate": 0.00025684052227679634, + "loss": 0.0686, "step": 44580 }, { - "epoch": 0.48, - "learning_rate": 0.000227655915374132, - "loss": 0.0548, + "epoch": 0.29, + "learning_rate": 0.0002568308409224394, + "loss": 0.0762, "step": 44590 }, { - "epoch": 0.48, - "learning_rate": 0.00022763969108962294, - "loss": 0.0556, + "epoch": 0.29, + "learning_rate": 0.0002568211595680825, + "loss": 0.0704, "step": 44600 }, { - "epoch": 0.48, - "learning_rate": 0.00022762346680511386, - "loss": 0.0543, + "epoch": 0.29, + "learning_rate": 0.0002568114782137256, + "loss": 0.0646, "step": 44610 }, { - "epoch": 0.48, - "learning_rate": 0.00022760724252060484, - "loss": 0.0619, + "epoch": 0.29, + "learning_rate": 0.00025680179685936866, + "loss": 0.0696, "step": 44620 }, { - "epoch": 0.48, - "learning_rate": 0.00022759101823609576, - "loss": 0.0582, + "epoch": 0.29, + "learning_rate": 0.0002567921155050117, + "loss": 0.0622, "step": 44630 }, { - "epoch": 0.48, - "learning_rate": 0.00022757479395158674, - "loss": 0.0581, + "epoch": 0.29, + "learning_rate": 0.00025678243415065477, + "loss": 0.0643, "step": 44640 }, { - "epoch": 0.48, - "learning_rate": 0.00022755856966707766, - "loss": 0.0629, + "epoch": 0.29, + "learning_rate": 0.00025677275279629785, + "loss": 0.0595, "step": 44650 }, { - "epoch": 0.48, - "learning_rate": 0.0002275423453825686, - "loss": 0.0588, + "epoch": 0.29, + "learning_rate": 0.00025676307144194087, + "loss": 0.0645, "step": 44660 }, { - "epoch": 0.48, - "learning_rate": 0.00022752612109805956, - "loss": 0.0585, + "epoch": 0.29, + "learning_rate": 0.00025675339008758395, + "loss": 0.0689, "step": 44670 }, { - "epoch": 0.48, - "learning_rate": 0.0002275098968135505, - "loss": 0.0593, + "epoch": 0.29, + "learning_rate": 0.00025674370873322703, + "loss": 0.0639, "step": 44680 }, { - "epoch": 0.48, - "learning_rate": 0.00022749367252904146, - "loss": 0.0607, + "epoch": 0.29, + "learning_rate": 0.0002567340273788701, + "loss": 0.0678, "step": 44690 }, { - "epoch": 0.48, - "learning_rate": 0.0002274774482445324, - "loss": 0.0575, + "epoch": 0.29, + "learning_rate": 0.0002567243460245132, + "loss": 0.0649, "step": 44700 }, { - "epoch": 0.48, - "learning_rate": 0.00022746122396002333, - "loss": 0.0594, + "epoch": 0.29, + "learning_rate": 0.0002567146646701562, + "loss": 0.0597, "step": 44710 }, { - "epoch": 0.48, - "learning_rate": 0.0002274449996755143, - "loss": 0.0662, + "epoch": 0.29, + "learning_rate": 0.0002567049833157993, + "loss": 0.0617, "step": 44720 }, { - "epoch": 0.48, - "learning_rate": 0.00022742877539100523, - "loss": 0.0617, + "epoch": 0.29, + "learning_rate": 0.0002566953019614424, + "loss": 0.0679, "step": 44730 }, { - "epoch": 0.48, - "learning_rate": 0.0002274125511064962, - "loss": 0.0561, + "epoch": 0.29, + "learning_rate": 0.00025668562060708546, + "loss": 0.0602, "step": 44740 }, { - "epoch": 0.48, - "learning_rate": 0.00022739632682198713, - "loss": 0.0562, + "epoch": 0.29, + "learning_rate": 0.00025667593925272854, + "loss": 0.0671, "step": 44750 }, { - "epoch": 0.48, - "learning_rate": 0.00022738010253747808, - "loss": 0.0631, + "epoch": 0.29, + "learning_rate": 0.00025666625789837156, + "loss": 0.0603, "step": 44760 }, { - "epoch": 0.48, - "learning_rate": 0.00022736387825296903, - "loss": 0.0552, + "epoch": 0.29, + "learning_rate": 0.00025665657654401464, + "loss": 0.0555, "step": 44770 }, { - "epoch": 0.48, - "learning_rate": 0.00022734765396845998, - "loss": 0.0618, + "epoch": 0.29, + "learning_rate": 0.0002566468951896577, + "loss": 0.0689, "step": 44780 }, { - "epoch": 0.48, - "learning_rate": 0.0002273314296839509, - "loss": 0.0632, + "epoch": 0.29, + "learning_rate": 0.00025663721383530075, + "loss": 0.0605, "step": 44790 }, { - "epoch": 0.48, - "learning_rate": 0.00022731520539944188, - "loss": 0.0598, + "epoch": 0.29, + "learning_rate": 0.0002566275324809438, + "loss": 0.0686, "step": 44800 }, { - "epoch": 0.48, - "learning_rate": 0.0002272989811149328, - "loss": 0.0556, + "epoch": 0.29, + "learning_rate": 0.0002566178511265869, + "loss": 0.0647, "step": 44810 }, { - "epoch": 0.48, - "learning_rate": 0.00022728275683042378, - "loss": 0.0537, + "epoch": 0.29, + "learning_rate": 0.00025660816977223, + "loss": 0.0639, "step": 44820 }, { - "epoch": 0.48, - "learning_rate": 0.0002272665325459147, - "loss": 0.0639, + "epoch": 0.29, + "learning_rate": 0.00025659848841787307, + "loss": 0.0689, "step": 44830 }, { - "epoch": 0.48, - "learning_rate": 0.00022725030826140565, - "loss": 0.0556, + "epoch": 0.29, + "learning_rate": 0.0002565888070635161, + "loss": 0.0701, "step": 44840 }, { - "epoch": 0.49, - "learning_rate": 0.0002272340839768966, - "loss": 0.0622, + "epoch": 0.29, + "learning_rate": 0.00025657912570915917, + "loss": 0.0795, "step": 44850 }, { - "epoch": 0.49, - "learning_rate": 0.00022721785969238755, - "loss": 0.0573, + "epoch": 0.29, + "learning_rate": 0.00025656944435480225, + "loss": 0.0622, "step": 44860 }, { - "epoch": 0.49, - "learning_rate": 0.0002272016354078785, - "loss": 0.0563, + "epoch": 0.29, + "learning_rate": 0.00025655976300044533, + "loss": 0.0654, "step": 44870 }, { - "epoch": 0.49, - "learning_rate": 0.00022718541112336945, - "loss": 0.0581, + "epoch": 0.29, + "learning_rate": 0.0002565500816460884, + "loss": 0.0756, "step": 44880 }, { - "epoch": 0.49, - "learning_rate": 0.00022716918683886038, - "loss": 0.0623, + "epoch": 0.29, + "learning_rate": 0.00025654040029173144, + "loss": 0.0748, "step": 44890 }, { - "epoch": 0.49, - "learning_rate": 0.00022715296255435135, - "loss": 0.0554, + "epoch": 0.29, + "learning_rate": 0.0002565307189373745, + "loss": 0.0676, "step": 44900 }, { - "epoch": 0.49, - "learning_rate": 0.00022713673826984227, - "loss": 0.0621, + "epoch": 0.29, + "learning_rate": 0.0002565210375830176, + "loss": 0.0689, "step": 44910 }, { - "epoch": 0.49, - "learning_rate": 0.00022712051398533325, - "loss": 0.0666, + "epoch": 0.29, + "learning_rate": 0.0002565113562286606, + "loss": 0.0657, "step": 44920 }, { - "epoch": 0.49, - "learning_rate": 0.00022710428970082417, - "loss": 0.0529, + "epoch": 0.29, + "learning_rate": 0.0002565016748743037, + "loss": 0.0706, "step": 44930 }, { - "epoch": 0.49, - "learning_rate": 0.00022708806541631512, - "loss": 0.0579, + "epoch": 0.29, + "learning_rate": 0.0002564919935199468, + "loss": 0.0619, "step": 44940 }, { - "epoch": 0.49, - "learning_rate": 0.00022707184113180607, - "loss": 0.0558, + "epoch": 0.29, + "learning_rate": 0.00025648231216558986, + "loss": 0.0735, "step": 44950 }, { - "epoch": 0.49, - "learning_rate": 0.00022705561684729702, - "loss": 0.0586, + "epoch": 0.29, + "learning_rate": 0.00025647263081123294, + "loss": 0.0783, "step": 44960 }, { - "epoch": 0.49, - "learning_rate": 0.00022703939256278795, - "loss": 0.0546, + "epoch": 0.29, + "learning_rate": 0.000256462949456876, + "loss": 0.0677, "step": 44970 }, { - "epoch": 0.49, - "learning_rate": 0.00022702316827827892, - "loss": 0.0526, + "epoch": 0.29, + "learning_rate": 0.00025645326810251905, + "loss": 0.0649, "step": 44980 }, { - "epoch": 0.49, - "learning_rate": 0.00022700694399376985, - "loss": 0.0475, + "epoch": 0.29, + "learning_rate": 0.0002564435867481621, + "loss": 0.0676, "step": 44990 }, { - "epoch": 0.49, - "learning_rate": 0.00022699071970926082, - "loss": 0.0573, + "epoch": 0.29, + "learning_rate": 0.0002564339053938052, + "loss": 0.0657, "step": 45000 }, { - "epoch": 0.49, - "eval_cer": 0.921223237051212, - "eval_loss": 0.04102905094623566, - "eval_runtime": 119.3665, - "eval_samples_per_second": 16.755, - "eval_steps_per_second": 4.189, + "epoch": 0.29, + "eval_cer": 0.920057846571009, + "eval_loss": 0.0462675541639328, + "eval_runtime": 120.4879, + "eval_samples_per_second": 16.599, + "eval_steps_per_second": 4.15, "step": 45000 }, { - "epoch": 0.49, - "learning_rate": 0.00022697449542475175, - "loss": 0.0619, + "epoch": 0.29, + "learning_rate": 0.0002564242240394483, + "loss": 0.0645, "step": 45010 }, { - "epoch": 0.49, - "learning_rate": 0.00022695827114024272, - "loss": 0.0551, + "epoch": 0.29, + "learning_rate": 0.00025641454268509137, + "loss": 0.0675, "step": 45020 }, { - "epoch": 0.49, - "learning_rate": 0.00022694204685573365, - "loss": 0.067, + "epoch": 0.29, + "learning_rate": 0.0002564048613307344, + "loss": 0.0607, "step": 45030 }, { - "epoch": 0.49, - "learning_rate": 0.0002269258225712246, - "loss": 0.0573, + "epoch": 0.29, + "learning_rate": 0.00025639517997637747, + "loss": 0.0618, "step": 45040 }, { - "epoch": 0.49, - "learning_rate": 0.00022690959828671554, - "loss": 0.0523, + "epoch": 0.29, + "learning_rate": 0.00025638549862202055, + "loss": 0.078, "step": 45050 }, { - "epoch": 0.49, - "learning_rate": 0.0002268933740022065, - "loss": 0.0555, + "epoch": 0.29, + "learning_rate": 0.0002563758172676636, + "loss": 0.0671, "step": 45060 }, { - "epoch": 0.49, - "learning_rate": 0.00022687714971769742, - "loss": 0.0566, + "epoch": 0.29, + "learning_rate": 0.00025636613591330666, + "loss": 0.0702, "step": 45070 }, { - "epoch": 0.49, - "learning_rate": 0.0002268609254331884, - "loss": 0.0598, + "epoch": 0.29, + "learning_rate": 0.00025635645455894974, + "loss": 0.066, "step": 45080 }, { - "epoch": 0.49, - "learning_rate": 0.00022684470114867932, - "loss": 0.0642, + "epoch": 0.29, + "learning_rate": 0.0002563467732045928, + "loss": 0.0788, "step": 45090 }, { - "epoch": 0.49, - "learning_rate": 0.0002268284768641703, - "loss": 0.0545, + "epoch": 0.29, + "learning_rate": 0.0002563370918502359, + "loss": 0.0636, "step": 45100 }, { - "epoch": 0.49, - "learning_rate": 0.00022681225257966122, - "loss": 0.0649, + "epoch": 0.29, + "learning_rate": 0.000256327410495879, + "loss": 0.0667, "step": 45110 }, { - "epoch": 0.49, - "learning_rate": 0.00022679602829515217, - "loss": 0.0571, + "epoch": 0.29, + "learning_rate": 0.000256317729141522, + "loss": 0.0676, "step": 45120 }, { - "epoch": 0.49, - "learning_rate": 0.00022677980401064312, - "loss": 0.0747, + "epoch": 0.29, + "learning_rate": 0.0002563080477871651, + "loss": 0.0787, "step": 45130 }, { - "epoch": 0.49, - "learning_rate": 0.00022676357972613407, - "loss": 0.0539, + "epoch": 0.29, + "learning_rate": 0.00025629836643280816, + "loss": 0.0548, "step": 45140 }, { - "epoch": 0.49, - "learning_rate": 0.000226747355441625, - "loss": 0.0608, + "epoch": 0.29, + "learning_rate": 0.00025628868507845124, + "loss": 0.0644, "step": 45150 }, { - "epoch": 0.49, - "learning_rate": 0.00022673113115711597, - "loss": 0.0712, + "epoch": 0.29, + "learning_rate": 0.00025627900372409427, + "loss": 0.0636, "step": 45160 }, { - "epoch": 0.49, - "learning_rate": 0.0002267149068726069, - "loss": 0.0687, + "epoch": 0.29, + "learning_rate": 0.00025626932236973735, + "loss": 0.0734, "step": 45170 }, { - "epoch": 0.49, - "learning_rate": 0.00022669868258809786, - "loss": 0.0618, + "epoch": 0.29, + "learning_rate": 0.0002562596410153804, + "loss": 0.075, "step": 45180 }, { - "epoch": 0.49, - "learning_rate": 0.0002266824583035888, - "loss": 0.0587, + "epoch": 0.29, + "learning_rate": 0.00025624995966102345, + "loss": 0.0622, "step": 45190 }, { - "epoch": 0.49, - "learning_rate": 0.00022666623401907976, - "loss": 0.0525, + "epoch": 0.29, + "learning_rate": 0.00025624027830666653, + "loss": 0.0602, "step": 45200 }, { - "epoch": 0.49, - "learning_rate": 0.0002266500097345707, - "loss": 0.0601, + "epoch": 0.29, + "learning_rate": 0.0002562305969523096, + "loss": 0.0619, "step": 45210 }, { - "epoch": 0.49, - "learning_rate": 0.00022663378545006164, - "loss": 0.0585, + "epoch": 0.29, + "learning_rate": 0.0002562209155979527, + "loss": 0.0645, "step": 45220 }, { - "epoch": 0.49, - "learning_rate": 0.00022661756116555259, - "loss": 0.0603, + "epoch": 0.29, + "learning_rate": 0.00025621123424359577, + "loss": 0.0652, "step": 45230 }, { - "epoch": 0.49, - "learning_rate": 0.00022660133688104354, - "loss": 0.0639, + "epoch": 0.29, + "learning_rate": 0.00025620155288923885, + "loss": 0.06, "step": 45240 }, { - "epoch": 0.49, - "learning_rate": 0.00022658511259653446, - "loss": 0.0596, + "epoch": 0.29, + "learning_rate": 0.00025619187153488193, + "loss": 0.0673, "step": 45250 }, { - "epoch": 0.49, - "learning_rate": 0.00022656888831202544, - "loss": 0.058, + "epoch": 0.29, + "learning_rate": 0.00025618219018052495, + "loss": 0.0605, "step": 45260 }, { - "epoch": 0.49, - "learning_rate": 0.00022655266402751636, - "loss": 0.0544, + "epoch": 0.29, + "learning_rate": 0.00025617250882616803, + "loss": 0.0762, "step": 45270 }, { - "epoch": 0.49, - "learning_rate": 0.00022653643974300734, - "loss": 0.0665, + "epoch": 0.29, + "learning_rate": 0.0002561628274718111, + "loss": 0.0688, "step": 45280 }, { - "epoch": 0.49, - "learning_rate": 0.00022652021545849826, - "loss": 0.05, + "epoch": 0.29, + "learning_rate": 0.00025615314611745414, + "loss": 0.0673, "step": 45290 }, { - "epoch": 0.49, - "learning_rate": 0.0002265039911739892, - "loss": 0.0696, + "epoch": 0.29, + "learning_rate": 0.0002561434647630972, + "loss": 0.0794, "step": 45300 }, { - "epoch": 0.49, - "learning_rate": 0.00022648776688948016, - "loss": 0.0535, + "epoch": 0.29, + "learning_rate": 0.0002561337834087403, + "loss": 0.0654, "step": 45310 }, { - "epoch": 0.49, - "learning_rate": 0.0002264715426049711, - "loss": 0.0585, + "epoch": 0.29, + "learning_rate": 0.0002561241020543834, + "loss": 0.0693, "step": 45320 }, { - "epoch": 0.49, - "learning_rate": 0.00022645531832046203, - "loss": 0.0529, + "epoch": 0.29, + "learning_rate": 0.0002561144207000264, + "loss": 0.0638, "step": 45330 }, { - "epoch": 0.49, - "learning_rate": 0.000226439094035953, - "loss": 0.0756, + "epoch": 0.29, + "learning_rate": 0.0002561047393456695, + "loss": 0.06, "step": 45340 }, { - "epoch": 0.49, - "learning_rate": 0.00022642286975144393, - "loss": 0.0517, + "epoch": 0.29, + "learning_rate": 0.00025609505799131256, + "loss": 0.0642, "step": 45350 }, { - "epoch": 0.49, - "learning_rate": 0.0002264066454669349, - "loss": 0.0509, + "epoch": 0.29, + "learning_rate": 0.00025608537663695564, + "loss": 0.0681, "step": 45360 }, { - "epoch": 0.49, - "learning_rate": 0.00022639042118242583, - "loss": 0.0532, + "epoch": 0.29, + "learning_rate": 0.0002560756952825987, + "loss": 0.0674, "step": 45370 }, { - "epoch": 0.49, - "learning_rate": 0.0002263741968979168, - "loss": 0.0589, + "epoch": 0.29, + "learning_rate": 0.0002560660139282418, + "loss": 0.0648, "step": 45380 }, { - "epoch": 0.49, - "learning_rate": 0.00022635797261340773, - "loss": 0.0548, + "epoch": 0.29, + "learning_rate": 0.0002560563325738849, + "loss": 0.0665, "step": 45390 }, { - "epoch": 0.49, - "learning_rate": 0.00022634174832889868, - "loss": 0.0626, + "epoch": 0.29, + "learning_rate": 0.0002560466512195279, + "loss": 0.0688, "step": 45400 }, { - "epoch": 0.49, - "learning_rate": 0.00022632552404438963, - "loss": 0.0557, + "epoch": 0.29, + "learning_rate": 0.000256036969865171, + "loss": 0.0669, "step": 45410 }, { - "epoch": 0.49, - "learning_rate": 0.00022630929975988058, - "loss": 0.0613, + "epoch": 0.29, + "learning_rate": 0.00025602728851081407, + "loss": 0.0691, "step": 45420 }, { - "epoch": 0.49, - "learning_rate": 0.0002262930754753715, - "loss": 0.0539, + "epoch": 0.29, + "learning_rate": 0.0002560176071564571, + "loss": 0.0633, "step": 45430 }, { - "epoch": 0.49, - "learning_rate": 0.00022627685119086248, - "loss": 0.0616, + "epoch": 0.29, + "learning_rate": 0.0002560079258021002, + "loss": 0.0652, "step": 45440 }, { - "epoch": 0.49, - "learning_rate": 0.0002262606269063534, - "loss": 0.0511, + "epoch": 0.29, + "learning_rate": 0.00025599824444774325, + "loss": 0.0664, "step": 45450 }, { - "epoch": 0.49, - "learning_rate": 0.00022624440262184438, - "loss": 0.0628, + "epoch": 0.29, + "learning_rate": 0.00025598856309338633, + "loss": 0.0576, "step": 45460 }, { - "epoch": 0.49, - "learning_rate": 0.0002262281783373353, - "loss": 0.062, + "epoch": 0.29, + "learning_rate": 0.00025597888173902936, + "loss": 0.0624, "step": 45470 }, { - "epoch": 0.49, - "learning_rate": 0.00022621195405282625, - "loss": 0.0596, + "epoch": 0.29, + "learning_rate": 0.00025596920038467244, + "loss": 0.0687, "step": 45480 }, { - "epoch": 0.49, - "learning_rate": 0.0002261957297683172, - "loss": 0.0569, + "epoch": 0.29, + "learning_rate": 0.0002559595190303155, + "loss": 0.0691, "step": 45490 }, { - "epoch": 0.49, - "learning_rate": 0.00022617950548380815, - "loss": 0.0564, + "epoch": 0.29, + "learning_rate": 0.0002559498376759586, + "loss": 0.0665, "step": 45500 }, { - "epoch": 0.49, - "learning_rate": 0.00022616328119929907, - "loss": 0.0622, + "epoch": 0.29, + "learning_rate": 0.0002559401563216017, + "loss": 0.0639, "step": 45510 }, { - "epoch": 0.49, - "learning_rate": 0.00022614705691479005, - "loss": 0.0592, + "epoch": 0.29, + "learning_rate": 0.00025593047496724476, + "loss": 0.0681, "step": 45520 }, { - "epoch": 0.49, - "learning_rate": 0.00022613083263028097, - "loss": 0.0565, + "epoch": 0.29, + "learning_rate": 0.0002559207936128878, + "loss": 0.0714, "step": 45530 }, { - "epoch": 0.49, - "learning_rate": 0.00022611460834577195, - "loss": 0.0599, + "epoch": 0.29, + "learning_rate": 0.00025591111225853086, + "loss": 0.0622, "step": 45540 }, { - "epoch": 0.49, - "learning_rate": 0.00022609838406126287, - "loss": 0.0632, + "epoch": 0.29, + "learning_rate": 0.00025590143090417394, + "loss": 0.068, "step": 45550 }, { - "epoch": 0.49, - "learning_rate": 0.00022608215977675385, - "loss": 0.0645, + "epoch": 0.29, + "learning_rate": 0.00025589174954981697, + "loss": 0.0679, "step": 45560 }, { - "epoch": 0.49, - "learning_rate": 0.00022606593549224477, - "loss": 0.0616, + "epoch": 0.29, + "learning_rate": 0.00025588206819546005, + "loss": 0.0748, "step": 45570 }, { - "epoch": 0.49, - "learning_rate": 0.00022604971120773572, - "loss": 0.0637, + "epoch": 0.29, + "learning_rate": 0.00025587238684110313, + "loss": 0.0667, "step": 45580 }, { - "epoch": 0.49, - "learning_rate": 0.00022603348692322667, - "loss": 0.0583, + "epoch": 0.29, + "learning_rate": 0.0002558627054867462, + "loss": 0.0679, "step": 45590 }, { - "epoch": 0.49, - "learning_rate": 0.00022601726263871762, - "loss": 0.0597, + "epoch": 0.29, + "learning_rate": 0.0002558530241323893, + "loss": 0.07, "step": 45600 }, { - "epoch": 0.49, - "learning_rate": 0.00022600103835420854, - "loss": 0.0583, + "epoch": 0.29, + "learning_rate": 0.0002558433427780323, + "loss": 0.0647, "step": 45610 }, { - "epoch": 0.49, - "learning_rate": 0.00022598481406969952, - "loss": 0.0537, + "epoch": 0.29, + "learning_rate": 0.0002558336614236754, + "loss": 0.07, "step": 45620 }, { - "epoch": 0.49, - "learning_rate": 0.00022596858978519044, - "loss": 0.0534, + "epoch": 0.29, + "learning_rate": 0.0002558239800693185, + "loss": 0.0591, "step": 45630 }, { - "epoch": 0.49, - "learning_rate": 0.00022595236550068142, - "loss": 0.0566, + "epoch": 0.29, + "learning_rate": 0.00025581429871496155, + "loss": 0.0748, "step": 45640 }, { - "epoch": 0.49, - "learning_rate": 0.00022593614121617234, - "loss": 0.0546, + "epoch": 0.29, + "learning_rate": 0.00025580461736060463, + "loss": 0.0684, "step": 45650 }, { - "epoch": 0.49, - "learning_rate": 0.0002259199169316633, - "loss": 0.0556, + "epoch": 0.29, + "learning_rate": 0.0002557949360062477, + "loss": 0.0585, "step": 45660 }, { - "epoch": 0.49, - "learning_rate": 0.00022590369264715424, - "loss": 0.0588, + "epoch": 0.29, + "learning_rate": 0.00025578525465189074, + "loss": 0.068, "step": 45670 }, { - "epoch": 0.49, - "learning_rate": 0.0002258874683626452, - "loss": 0.0523, + "epoch": 0.29, + "learning_rate": 0.0002557755732975338, + "loss": 0.067, "step": 45680 }, { - "epoch": 0.49, - "learning_rate": 0.0002258712440781361, - "loss": 0.0586, + "epoch": 0.29, + "learning_rate": 0.00025576589194317684, + "loss": 0.0695, "step": 45690 }, { - "epoch": 0.49, - "learning_rate": 0.0002258550197936271, - "loss": 0.0612, + "epoch": 0.29, + "learning_rate": 0.0002557562105888199, + "loss": 0.0614, "step": 45700 }, { - "epoch": 0.49, - "learning_rate": 0.000225838795509118, - "loss": 0.0657, + "epoch": 0.3, + "learning_rate": 0.000255746529234463, + "loss": 0.0618, "step": 45710 }, { - "epoch": 0.49, - "learning_rate": 0.000225822571224609, - "loss": 0.0649, + "epoch": 0.3, + "learning_rate": 0.0002557368478801061, + "loss": 0.065, "step": 45720 }, { - "epoch": 0.49, - "learning_rate": 0.0002258063469400999, - "loss": 0.06, + "epoch": 0.3, + "learning_rate": 0.00025572716652574916, + "loss": 0.0662, "step": 45730 }, { - "epoch": 0.49, - "learning_rate": 0.0002257901226555909, - "loss": 0.0573, + "epoch": 0.3, + "learning_rate": 0.00025571748517139224, + "loss": 0.0653, "step": 45740 }, { - "epoch": 0.49, - "learning_rate": 0.0002257738983710818, - "loss": 0.0549, + "epoch": 0.3, + "learning_rate": 0.00025570780381703527, + "loss": 0.0651, "step": 45750 }, { - "epoch": 0.49, - "learning_rate": 0.00022575767408657276, - "loss": 0.0636, + "epoch": 0.3, + "learning_rate": 0.00025569812246267835, + "loss": 0.0618, "step": 45760 }, { - "epoch": 0.5, - "learning_rate": 0.0002257414498020637, - "loss": 0.0504, + "epoch": 0.3, + "learning_rate": 0.00025568844110832143, + "loss": 0.0706, "step": 45770 }, { - "epoch": 0.5, - "learning_rate": 0.00022572522551755466, - "loss": 0.0651, + "epoch": 0.3, + "learning_rate": 0.0002556787597539645, + "loss": 0.0779, "step": 45780 }, { - "epoch": 0.5, - "learning_rate": 0.00022570900123304558, - "loss": 0.0619, + "epoch": 0.3, + "learning_rate": 0.0002556690783996076, + "loss": 0.0739, "step": 45790 }, { - "epoch": 0.5, - "learning_rate": 0.00022569277694853656, - "loss": 0.0563, + "epoch": 0.3, + "learning_rate": 0.0002556593970452506, + "loss": 0.0755, "step": 45800 }, { - "epoch": 0.5, - "learning_rate": 0.00022567655266402748, - "loss": 0.0649, + "epoch": 0.3, + "learning_rate": 0.0002556497156908937, + "loss": 0.0684, "step": 45810 }, { - "epoch": 0.5, - "learning_rate": 0.00022566032837951846, - "loss": 0.0564, + "epoch": 0.3, + "learning_rate": 0.00025564003433653677, + "loss": 0.0649, "step": 45820 }, { - "epoch": 0.5, - "learning_rate": 0.00022564410409500938, - "loss": 0.0535, + "epoch": 0.3, + "learning_rate": 0.0002556303529821798, + "loss": 0.0682, "step": 45830 }, { - "epoch": 0.5, - "learning_rate": 0.00022562787981050033, - "loss": 0.0529, + "epoch": 0.3, + "learning_rate": 0.0002556206716278229, + "loss": 0.0622, "step": 45840 }, { - "epoch": 0.5, - "learning_rate": 0.00022561165552599128, - "loss": 0.0581, + "epoch": 0.3, + "learning_rate": 0.00025561099027346596, + "loss": 0.0626, "step": 45850 }, { - "epoch": 0.5, - "learning_rate": 0.00022559543124148223, - "loss": 0.0559, + "epoch": 0.3, + "learning_rate": 0.00025560130891910904, + "loss": 0.0741, "step": 45860 }, { - "epoch": 0.5, - "learning_rate": 0.00022557920695697318, - "loss": 0.0594, + "epoch": 0.3, + "learning_rate": 0.0002555916275647521, + "loss": 0.0659, "step": 45870 }, { - "epoch": 0.5, - "learning_rate": 0.00022556298267246413, - "loss": 0.059, + "epoch": 0.3, + "learning_rate": 0.0002555819462103952, + "loss": 0.0723, "step": 45880 }, { - "epoch": 0.5, - "learning_rate": 0.00022554675838795505, - "loss": 0.0537, + "epoch": 0.3, + "learning_rate": 0.0002555722648560382, + "loss": 0.0642, "step": 45890 }, { - "epoch": 0.5, - "learning_rate": 0.00022553053410344603, - "loss": 0.056, + "epoch": 0.3, + "learning_rate": 0.0002555625835016813, + "loss": 0.071, "step": 45900 }, { - "epoch": 0.5, - "learning_rate": 0.00022551430981893695, - "loss": 0.0528, + "epoch": 0.3, + "learning_rate": 0.0002555529021473244, + "loss": 0.064, "step": 45910 }, { - "epoch": 0.5, - "learning_rate": 0.00022549808553442793, - "loss": 0.0603, + "epoch": 0.3, + "learning_rate": 0.00025554322079296746, + "loss": 0.0663, "step": 45920 }, { - "epoch": 0.5, - "learning_rate": 0.00022548186124991885, - "loss": 0.0608, + "epoch": 0.3, + "learning_rate": 0.0002555335394386105, + "loss": 0.0715, "step": 45930 }, { - "epoch": 0.5, - "learning_rate": 0.0002254656369654098, - "loss": 0.049, + "epoch": 0.3, + "learning_rate": 0.00025552385808425357, + "loss": 0.0687, "step": 45940 }, { - "epoch": 0.5, - "learning_rate": 0.00022544941268090075, - "loss": 0.0693, + "epoch": 0.3, + "learning_rate": 0.00025551417672989665, + "loss": 0.0753, "step": 45950 }, { - "epoch": 0.5, - "learning_rate": 0.0002254331883963917, - "loss": 0.0605, + "epoch": 0.3, + "learning_rate": 0.0002555044953755397, + "loss": 0.068, "step": 45960 }, { - "epoch": 0.5, - "learning_rate": 0.00022541696411188263, - "loss": 0.06, + "epoch": 0.3, + "learning_rate": 0.00025549481402118275, + "loss": 0.0648, "step": 45970 }, { - "epoch": 0.5, - "learning_rate": 0.0002254007398273736, - "loss": 0.0544, + "epoch": 0.3, + "learning_rate": 0.00025548513266682583, + "loss": 0.0669, "step": 45980 }, { - "epoch": 0.5, - "learning_rate": 0.00022538451554286452, - "loss": 0.0604, + "epoch": 0.3, + "learning_rate": 0.0002554754513124689, + "loss": 0.0662, "step": 45990 }, { - "epoch": 0.5, - "learning_rate": 0.0002253682912583555, - "loss": 0.0568, + "epoch": 0.3, + "learning_rate": 0.000255465769958112, + "loss": 0.0649, "step": 46000 }, { - "epoch": 0.5, - "eval_cer": 0.9213001001871219, - "eval_loss": 0.04061218351125717, - "eval_runtime": 119.4072, - "eval_samples_per_second": 16.749, - "eval_steps_per_second": 4.187, + "epoch": 0.3, + "eval_cer": 0.9200388656648967, + "eval_loss": 0.04449348524212837, + "eval_runtime": 120.161, + "eval_samples_per_second": 16.644, + "eval_steps_per_second": 4.161, "step": 46000 }, { - "epoch": 0.5, - "learning_rate": 0.00022535206697384642, - "loss": 0.0701, + "epoch": 0.3, + "learning_rate": 0.00025545608860375507, + "loss": 0.0767, "step": 46010 }, { - "epoch": 0.5, - "learning_rate": 0.00022533584268933737, - "loss": 0.0643, + "epoch": 0.3, + "learning_rate": 0.00025544640724939815, + "loss": 0.0647, "step": 46020 }, { - "epoch": 0.5, - "learning_rate": 0.00022531961840482832, - "loss": 0.0602, + "epoch": 0.3, + "learning_rate": 0.0002554367258950412, + "loss": 0.0625, "step": 46030 }, { - "epoch": 0.5, - "learning_rate": 0.00022530339412031927, - "loss": 0.0661, + "epoch": 0.3, + "learning_rate": 0.00025542704454068426, + "loss": 0.0721, "step": 46040 }, { - "epoch": 0.5, - "learning_rate": 0.00022528716983581022, - "loss": 0.0646, + "epoch": 0.3, + "learning_rate": 0.00025541736318632734, + "loss": 0.0633, "step": 46050 }, { - "epoch": 0.5, - "learning_rate": 0.00022527094555130117, - "loss": 0.0544, + "epoch": 0.3, + "learning_rate": 0.0002554076818319704, + "loss": 0.0611, "step": 46060 }, { - "epoch": 0.5, - "learning_rate": 0.0002252547212667921, - "loss": 0.0629, + "epoch": 0.3, + "learning_rate": 0.00025539800047761344, + "loss": 0.0655, "step": 46070 }, { - "epoch": 0.5, - "learning_rate": 0.00022523849698228307, - "loss": 0.0583, + "epoch": 0.3, + "learning_rate": 0.0002553883191232565, + "loss": 0.0611, "step": 46080 }, { - "epoch": 0.5, - "learning_rate": 0.000225222272697774, - "loss": 0.0652, + "epoch": 0.3, + "learning_rate": 0.0002553786377688996, + "loss": 0.0644, "step": 46090 }, { - "epoch": 0.5, - "learning_rate": 0.00022520604841326497, - "loss": 0.0565, + "epoch": 0.3, + "learning_rate": 0.00025536895641454263, + "loss": 0.0626, "step": 46100 }, { - "epoch": 0.5, - "learning_rate": 0.0002251898241287559, - "loss": 0.067, + "epoch": 0.3, + "learning_rate": 0.0002553592750601857, + "loss": 0.0716, "step": 46110 }, { - "epoch": 0.5, - "learning_rate": 0.00022517359984424684, - "loss": 0.0571, + "epoch": 0.3, + "learning_rate": 0.0002553495937058288, + "loss": 0.0608, "step": 46120 }, { - "epoch": 0.5, - "learning_rate": 0.0002251573755597378, - "loss": 0.0558, + "epoch": 0.3, + "learning_rate": 0.00025533991235147187, + "loss": 0.0611, "step": 46130 }, { - "epoch": 0.5, - "learning_rate": 0.00022514115127522874, - "loss": 0.0572, + "epoch": 0.3, + "learning_rate": 0.00025533023099711495, + "loss": 0.0703, "step": 46140 }, { - "epoch": 0.5, - "learning_rate": 0.00022512492699071967, - "loss": 0.0574, + "epoch": 0.3, + "learning_rate": 0.000255320549642758, + "loss": 0.0652, "step": 46150 }, { - "epoch": 0.5, - "learning_rate": 0.00022510870270621064, - "loss": 0.0546, + "epoch": 0.3, + "learning_rate": 0.0002553108682884011, + "loss": 0.0652, "step": 46160 }, { - "epoch": 0.5, - "learning_rate": 0.00022509247842170157, - "loss": 0.0577, + "epoch": 0.3, + "learning_rate": 0.00025530118693404413, + "loss": 0.0731, "step": 46170 }, { - "epoch": 0.5, - "learning_rate": 0.00022507625413719254, - "loss": 0.0572, + "epoch": 0.3, + "learning_rate": 0.0002552915055796872, + "loss": 0.0669, "step": 46180 }, { - "epoch": 0.5, - "learning_rate": 0.00022506002985268347, - "loss": 0.0626, + "epoch": 0.3, + "learning_rate": 0.0002552818242253303, + "loss": 0.0674, "step": 46190 }, { - "epoch": 0.5, - "learning_rate": 0.00022504380556817442, - "loss": 0.056, + "epoch": 0.3, + "learning_rate": 0.0002552721428709733, + "loss": 0.0676, "step": 46200 }, { - "epoch": 0.5, - "learning_rate": 0.00022502758128366537, - "loss": 0.0598, + "epoch": 0.3, + "learning_rate": 0.0002552624615166164, + "loss": 0.0677, "step": 46210 }, { - "epoch": 0.5, - "learning_rate": 0.00022501135699915632, - "loss": 0.0547, + "epoch": 0.3, + "learning_rate": 0.0002552527801622595, + "loss": 0.0591, "step": 46220 }, { - "epoch": 0.5, - "learning_rate": 0.00022499513271464727, - "loss": 0.0537, + "epoch": 0.3, + "learning_rate": 0.00025524309880790256, + "loss": 0.0644, "step": 46230 }, { - "epoch": 0.5, - "learning_rate": 0.00022497890843013821, - "loss": 0.0598, + "epoch": 0.3, + "learning_rate": 0.0002552334174535456, + "loss": 0.0715, "step": 46240 }, { - "epoch": 0.5, - "learning_rate": 0.00022496268414562914, - "loss": 0.072, + "epoch": 0.3, + "learning_rate": 0.00025522373609918866, + "loss": 0.0703, "step": 46250 }, { - "epoch": 0.5, - "learning_rate": 0.00022494645986112011, - "loss": 0.0643, + "epoch": 0.3, + "learning_rate": 0.00025521405474483174, + "loss": 0.0733, "step": 46260 }, { - "epoch": 0.5, - "learning_rate": 0.00022493023557661104, - "loss": 0.0568, + "epoch": 0.3, + "learning_rate": 0.0002552043733904748, + "loss": 0.0597, "step": 46270 }, { - "epoch": 0.5, - "learning_rate": 0.00022491401129210201, - "loss": 0.0617, + "epoch": 0.3, + "learning_rate": 0.0002551946920361179, + "loss": 0.0608, "step": 46280 }, { - "epoch": 0.5, - "learning_rate": 0.00022489778700759294, - "loss": 0.0552, + "epoch": 0.3, + "learning_rate": 0.000255185010681761, + "loss": 0.0695, "step": 46290 }, { - "epoch": 0.5, - "learning_rate": 0.0002248815627230839, - "loss": 0.0511, + "epoch": 0.3, + "learning_rate": 0.000255175329327404, + "loss": 0.0592, "step": 46300 }, { - "epoch": 0.5, - "learning_rate": 0.00022486533843857484, - "loss": 0.0587, + "epoch": 0.3, + "learning_rate": 0.0002551656479730471, + "loss": 0.0541, "step": 46310 }, { - "epoch": 0.5, - "learning_rate": 0.00022484911415406579, - "loss": 0.0575, + "epoch": 0.3, + "learning_rate": 0.00025515596661869017, + "loss": 0.0623, "step": 46320 }, { - "epoch": 0.5, - "learning_rate": 0.0002248328898695567, - "loss": 0.0603, + "epoch": 0.3, + "learning_rate": 0.0002551462852643332, + "loss": 0.0727, "step": 46330 }, { - "epoch": 0.5, - "learning_rate": 0.00022481666558504769, - "loss": 0.0648, + "epoch": 0.3, + "learning_rate": 0.00025513660390997627, + "loss": 0.0663, "step": 46340 }, { - "epoch": 0.5, - "learning_rate": 0.0002248004413005386, - "loss": 0.053, + "epoch": 0.3, + "learning_rate": 0.00025512692255561935, + "loss": 0.0573, "step": 46350 }, { - "epoch": 0.5, - "learning_rate": 0.00022478421701602959, - "loss": 0.0564, + "epoch": 0.3, + "learning_rate": 0.00025511724120126243, + "loss": 0.0562, "step": 46360 }, { - "epoch": 0.5, - "learning_rate": 0.0002247679927315205, - "loss": 0.0584, + "epoch": 0.3, + "learning_rate": 0.0002551075598469055, + "loss": 0.062, "step": 46370 }, { - "epoch": 0.5, - "learning_rate": 0.00022475176844701146, - "loss": 0.0566, + "epoch": 0.3, + "learning_rate": 0.00025509787849254854, + "loss": 0.0649, "step": 46380 }, { - "epoch": 0.5, - "learning_rate": 0.0002247355441625024, - "loss": 0.0552, + "epoch": 0.3, + "learning_rate": 0.0002550881971381916, + "loss": 0.0702, "step": 46390 }, { - "epoch": 0.5, - "learning_rate": 0.00022471931987799336, - "loss": 0.0519, + "epoch": 0.3, + "learning_rate": 0.0002550785157838347, + "loss": 0.0658, "step": 46400 }, { - "epoch": 0.5, - "learning_rate": 0.0002247030955934843, - "loss": 0.0553, + "epoch": 0.3, + "learning_rate": 0.0002550688344294778, + "loss": 0.0727, "step": 46410 }, { - "epoch": 0.5, - "learning_rate": 0.00022468687130897526, - "loss": 0.0532, + "epoch": 0.3, + "learning_rate": 0.00025505915307512086, + "loss": 0.074, "step": 46420 }, { - "epoch": 0.5, - "learning_rate": 0.00022467064702446618, - "loss": 0.0528, + "epoch": 0.3, + "learning_rate": 0.00025504947172076394, + "loss": 0.0668, "step": 46430 }, { - "epoch": 0.5, - "learning_rate": 0.00022465442273995716, - "loss": 0.0631, + "epoch": 0.3, + "learning_rate": 0.00025503979036640696, + "loss": 0.0767, "step": 46440 }, { - "epoch": 0.5, - "learning_rate": 0.00022463819845544808, - "loss": 0.059, + "epoch": 0.3, + "learning_rate": 0.00025503010901205004, + "loss": 0.067, "step": 46450 }, { - "epoch": 0.5, - "learning_rate": 0.00022462197417093906, - "loss": 0.0609, + "epoch": 0.3, + "learning_rate": 0.0002550204276576931, + "loss": 0.0807, "step": 46460 }, { - "epoch": 0.5, - "learning_rate": 0.00022460574988642998, - "loss": 0.0574, + "epoch": 0.3, + "learning_rate": 0.00025501074630333615, + "loss": 0.0659, "step": 46470 }, { - "epoch": 0.5, - "learning_rate": 0.00022458952560192093, - "loss": 0.0635, - "step": 46480 + "epoch": 0.3, + "learning_rate": 0.0002550010649489792, + "loss": 0.0657, + "step": 46480 }, { - "epoch": 0.5, - "learning_rate": 0.00022457330131741188, - "loss": 0.0585, + "epoch": 0.3, + "learning_rate": 0.0002549913835946223, + "loss": 0.0723, "step": 46490 }, { - "epoch": 0.5, - "learning_rate": 0.00022455707703290283, - "loss": 0.0558, + "epoch": 0.3, + "learning_rate": 0.0002549817022402654, + "loss": 0.0594, "step": 46500 }, { - "epoch": 0.5, - "learning_rate": 0.00022454085274839375, - "loss": 0.0624, + "epoch": 0.3, + "learning_rate": 0.00025497202088590847, + "loss": 0.0629, "step": 46510 }, { - "epoch": 0.5, - "learning_rate": 0.00022452462846388473, - "loss": 0.0598, + "epoch": 0.3, + "learning_rate": 0.0002549623395315515, + "loss": 0.0661, "step": 46520 }, { - "epoch": 0.5, - "learning_rate": 0.00022450840417937565, - "loss": 0.0645, + "epoch": 0.3, + "learning_rate": 0.00025495265817719457, + "loss": 0.066, "step": 46530 }, { - "epoch": 0.5, - "learning_rate": 0.00022449217989486663, - "loss": 0.0605, + "epoch": 0.3, + "learning_rate": 0.00025494297682283765, + "loss": 0.0602, "step": 46540 }, { - "epoch": 0.5, - "learning_rate": 0.00022447595561035755, - "loss": 0.0602, + "epoch": 0.3, + "learning_rate": 0.00025493329546848073, + "loss": 0.0605, "step": 46550 }, { - "epoch": 0.5, - "learning_rate": 0.00022445973132584853, - "loss": 0.0576, + "epoch": 0.3, + "learning_rate": 0.0002549236141141238, + "loss": 0.0713, "step": 46560 }, { - "epoch": 0.5, - "learning_rate": 0.00022444350704133945, - "loss": 0.054, + "epoch": 0.3, + "learning_rate": 0.00025491393275976684, + "loss": 0.0715, "step": 46570 }, { - "epoch": 0.5, - "learning_rate": 0.0002244272827568304, - "loss": 0.0521, + "epoch": 0.3, + "learning_rate": 0.0002549042514054099, + "loss": 0.0682, "step": 46580 }, { - "epoch": 0.5, - "learning_rate": 0.00022441105847232135, - "loss": 0.062, + "epoch": 0.3, + "learning_rate": 0.000254894570051053, + "loss": 0.0737, "step": 46590 }, { - "epoch": 0.5, - "learning_rate": 0.0002243948341878123, - "loss": 0.0625, + "epoch": 0.3, + "learning_rate": 0.000254884888696696, + "loss": 0.0627, "step": 46600 }, { - "epoch": 0.5, - "learning_rate": 0.00022437860990330322, - "loss": 0.0602, + "epoch": 0.3, + "learning_rate": 0.0002548752073423391, + "loss": 0.0646, "step": 46610 }, { - "epoch": 0.5, - "learning_rate": 0.0002243623856187942, - "loss": 0.0647, + "epoch": 0.3, + "learning_rate": 0.0002548655259879822, + "loss": 0.0604, "step": 46620 }, { - "epoch": 0.5, - "learning_rate": 0.00022434616133428512, - "loss": 0.0676, + "epoch": 0.3, + "learning_rate": 0.00025485584463362526, + "loss": 0.0631, "step": 46630 }, { - "epoch": 0.5, - "learning_rate": 0.0002243299370497761, - "loss": 0.0584, + "epoch": 0.3, + "learning_rate": 0.00025484616327926834, + "loss": 0.066, "step": 46640 }, { - "epoch": 0.5, - "learning_rate": 0.00022431371276526702, - "loss": 0.0533, + "epoch": 0.3, + "learning_rate": 0.0002548364819249114, + "loss": 0.0631, "step": 46650 }, { - "epoch": 0.5, - "learning_rate": 0.00022429748848075797, - "loss": 0.0577, + "epoch": 0.3, + "learning_rate": 0.00025482680057055445, + "loss": 0.0655, "step": 46660 }, { - "epoch": 0.5, - "learning_rate": 0.00022428126419624892, - "loss": 0.0538, + "epoch": 0.3, + "learning_rate": 0.0002548171192161975, + "loss": 0.063, "step": 46670 }, { - "epoch": 0.5, - "learning_rate": 0.00022426503991173987, - "loss": 0.0585, + "epoch": 0.3, + "learning_rate": 0.0002548074378618406, + "loss": 0.0702, "step": 46680 }, { - "epoch": 0.51, - "learning_rate": 0.0002242488156272308, - "loss": 0.0557, + "epoch": 0.3, + "learning_rate": 0.0002547977565074837, + "loss": 0.0603, "step": 46690 }, { - "epoch": 0.51, - "learning_rate": 0.00022423259134272177, - "loss": 0.0643, + "epoch": 0.3, + "learning_rate": 0.0002547880751531267, + "loss": 0.0612, "step": 46700 }, { - "epoch": 0.51, - "learning_rate": 0.0002242163670582127, - "loss": 0.0528, + "epoch": 0.3, + "learning_rate": 0.0002547783937987698, + "loss": 0.0783, "step": 46710 }, { - "epoch": 0.51, - "learning_rate": 0.00022420014277370367, - "loss": 0.0582, + "epoch": 0.3, + "learning_rate": 0.00025476871244441287, + "loss": 0.0734, "step": 46720 }, { - "epoch": 0.51, - "learning_rate": 0.0002241839184891946, - "loss": 0.0607, + "epoch": 0.3, + "learning_rate": 0.0002547590310900559, + "loss": 0.0591, "step": 46730 }, { - "epoch": 0.51, - "learning_rate": 0.00022416769420468557, - "loss": 0.0525, + "epoch": 0.3, + "learning_rate": 0.000254749349735699, + "loss": 0.0668, "step": 46740 }, { - "epoch": 0.51, - "learning_rate": 0.0002241514699201765, - "loss": 0.0562, + "epoch": 0.3, + "learning_rate": 0.00025473966838134205, + "loss": 0.0613, "step": 46750 }, { - "epoch": 0.51, - "learning_rate": 0.00022413524563566744, - "loss": 0.0685, + "epoch": 0.3, + "learning_rate": 0.00025472998702698513, + "loss": 0.0617, "step": 46760 }, { - "epoch": 0.51, - "learning_rate": 0.0002241190213511584, - "loss": 0.0594, + "epoch": 0.3, + "learning_rate": 0.0002547203056726282, + "loss": 0.0716, "step": 46770 }, { - "epoch": 0.51, - "learning_rate": 0.00022410279706664934, - "loss": 0.0578, + "epoch": 0.3, + "learning_rate": 0.0002547106243182713, + "loss": 0.0663, "step": 46780 }, { - "epoch": 0.51, - "learning_rate": 0.00022408657278214026, - "loss": 0.0592, + "epoch": 0.3, + "learning_rate": 0.0002547009429639144, + "loss": 0.075, "step": 46790 }, { - "epoch": 0.51, - "learning_rate": 0.00022407034849763124, - "loss": 0.0584, + "epoch": 0.3, + "learning_rate": 0.0002546912616095574, + "loss": 0.0644, "step": 46800 }, { - "epoch": 0.51, - "learning_rate": 0.00022405412421312216, - "loss": 0.0501, + "epoch": 0.3, + "learning_rate": 0.0002546815802552005, + "loss": 0.0695, "step": 46810 }, { - "epoch": 0.51, - "learning_rate": 0.00022403789992861314, - "loss": 0.0568, + "epoch": 0.3, + "learning_rate": 0.00025467189890084356, + "loss": 0.0636, "step": 46820 }, { - "epoch": 0.51, - "learning_rate": 0.00022402167564410406, - "loss": 0.0597, + "epoch": 0.3, + "learning_rate": 0.00025466221754648664, + "loss": 0.0619, "step": 46830 }, { - "epoch": 0.51, - "learning_rate": 0.000224005451359595, - "loss": 0.0621, + "epoch": 0.3, + "learning_rate": 0.00025465253619212966, + "loss": 0.0599, "step": 46840 }, { - "epoch": 0.51, - "learning_rate": 0.00022398922707508596, - "loss": 0.0609, + "epoch": 0.3, + "learning_rate": 0.00025464285483777274, + "loss": 0.0679, "step": 46850 }, { - "epoch": 0.51, - "learning_rate": 0.0002239730027905769, - "loss": 0.0686, + "epoch": 0.3, + "learning_rate": 0.0002546331734834158, + "loss": 0.0606, "step": 46860 }, { - "epoch": 0.51, - "learning_rate": 0.00022395677850606783, - "loss": 0.0559, + "epoch": 0.3, + "learning_rate": 0.00025462349212905885, + "loss": 0.0703, "step": 46870 }, { - "epoch": 0.51, - "learning_rate": 0.0002239405542215588, - "loss": 0.0589, + "epoch": 0.3, + "learning_rate": 0.00025461381077470193, + "loss": 0.0722, "step": 46880 }, { - "epoch": 0.51, - "learning_rate": 0.00022392432993704973, - "loss": 0.0553, + "epoch": 0.3, + "learning_rate": 0.000254604129420345, + "loss": 0.0653, "step": 46890 }, { - "epoch": 0.51, - "learning_rate": 0.0002239081056525407, - "loss": 0.0544, + "epoch": 0.3, + "learning_rate": 0.0002545944480659881, + "loss": 0.0623, "step": 46900 }, { - "epoch": 0.51, - "learning_rate": 0.00022389188136803163, - "loss": 0.0555, + "epoch": 0.3, + "learning_rate": 0.00025458476671163117, + "loss": 0.0648, "step": 46910 }, { - "epoch": 0.51, - "learning_rate": 0.0002238756570835226, - "loss": 0.0653, + "epoch": 0.3, + "learning_rate": 0.00025457508535727425, + "loss": 0.0675, "step": 46920 }, { - "epoch": 0.51, - "learning_rate": 0.00022385943279901353, - "loss": 0.1099, + "epoch": 0.3, + "learning_rate": 0.00025456540400291733, + "loss": 0.0837, "step": 46930 }, { - "epoch": 0.51, - "learning_rate": 0.00022384320851450448, - "loss": 0.0579, + "epoch": 0.3, + "learning_rate": 0.00025455572264856035, + "loss": 0.0673, "step": 46940 }, { - "epoch": 0.51, - "learning_rate": 0.00022382698422999546, - "loss": 0.0602, + "epoch": 0.3, + "learning_rate": 0.00025454604129420343, + "loss": 0.0734, "step": 46950 }, { - "epoch": 0.51, - "learning_rate": 0.00022381075994548638, - "loss": 0.0657, + "epoch": 0.3, + "learning_rate": 0.0002545363599398465, + "loss": 0.0666, "step": 46960 }, { - "epoch": 0.51, - "learning_rate": 0.00022379453566097736, - "loss": 0.0706, + "epoch": 0.3, + "learning_rate": 0.00025452667858548954, + "loss": 0.0684, "step": 46970 }, { - "epoch": 0.51, - "learning_rate": 0.00022377831137646828, - "loss": 0.0613, + "epoch": 0.3, + "learning_rate": 0.0002545169972311326, + "loss": 0.0692, "step": 46980 }, { - "epoch": 0.51, - "learning_rate": 0.00022376208709195923, - "loss": 0.0523, + "epoch": 0.3, + "learning_rate": 0.0002545073158767757, + "loss": 0.0638, "step": 46990 }, { - "epoch": 0.51, - "learning_rate": 0.00022374586280745018, - "loss": 0.065, + "epoch": 0.3, + "learning_rate": 0.0002544976345224188, + "loss": 0.069, "step": 47000 }, { - "epoch": 0.51, - "eval_cer": 0.9212912653439139, - "eval_loss": 0.04054510220885277, - "eval_runtime": 119.1798, - "eval_samples_per_second": 16.781, - "eval_steps_per_second": 4.195, + "epoch": 0.3, + "eval_cer": 0.9200750197717772, + "eval_loss": 0.04444407671689987, + "eval_runtime": 120.1079, + "eval_samples_per_second": 16.652, + "eval_steps_per_second": 4.163, "step": 47000 }, { - "epoch": 0.51, - "learning_rate": 0.00022372963852294113, - "loss": 0.058, + "epoch": 0.3, + "learning_rate": 0.0002544879531680618, + "loss": 0.0689, "step": 47010 }, { - "epoch": 0.51, - "learning_rate": 0.00022371341423843205, - "loss": 0.0654, + "epoch": 0.3, + "learning_rate": 0.0002544782718137049, + "loss": 0.0668, "step": 47020 }, { - "epoch": 0.51, - "learning_rate": 0.00022369718995392303, - "loss": 0.049, + "epoch": 0.3, + "learning_rate": 0.00025446859045934796, + "loss": 0.0648, "step": 47030 }, { - "epoch": 0.51, - "learning_rate": 0.00022368096566941395, - "loss": 0.0644, + "epoch": 0.3, + "learning_rate": 0.00025445890910499104, + "loss": 0.0723, "step": 47040 }, { - "epoch": 0.51, - "learning_rate": 0.00022366474138490493, - "loss": 0.0546, + "epoch": 0.3, + "learning_rate": 0.0002544492277506341, + "loss": 0.0617, "step": 47050 }, { - "epoch": 0.51, - "learning_rate": 0.00022364851710039585, - "loss": 0.0584, + "epoch": 0.3, + "learning_rate": 0.0002544395463962772, + "loss": 0.0603, "step": 47060 }, { - "epoch": 0.51, - "learning_rate": 0.0002236322928158868, - "loss": 0.0656, + "epoch": 0.3, + "learning_rate": 0.00025442986504192023, + "loss": 0.063, "step": 47070 }, { - "epoch": 0.51, - "learning_rate": 0.00022361606853137775, - "loss": 0.0478, + "epoch": 0.3, + "learning_rate": 0.0002544201836875633, + "loss": 0.0666, "step": 47080 }, { - "epoch": 0.51, - "learning_rate": 0.0002235998442468687, - "loss": 0.0578, + "epoch": 0.3, + "learning_rate": 0.0002544105023332064, + "loss": 0.0681, "step": 47090 }, { - "epoch": 0.51, - "learning_rate": 0.00022358361996235965, - "loss": 0.0645, + "epoch": 0.3, + "learning_rate": 0.0002544008209788494, + "loss": 0.0644, "step": 47100 }, { - "epoch": 0.51, - "learning_rate": 0.0002235673956778506, - "loss": 0.0568, + "epoch": 0.3, + "learning_rate": 0.0002543911396244925, + "loss": 0.0732, "step": 47110 }, { - "epoch": 0.51, - "learning_rate": 0.00022355117139334152, - "loss": 0.0586, + "epoch": 0.3, + "learning_rate": 0.0002543814582701356, + "loss": 0.0647, "step": 47120 }, { - "epoch": 0.51, - "learning_rate": 0.0002235349471088325, - "loss": 0.051, + "epoch": 0.3, + "learning_rate": 0.00025437177691577865, + "loss": 0.062, "step": 47130 }, { - "epoch": 0.51, - "learning_rate": 0.00022351872282432342, - "loss": 0.0635, + "epoch": 0.3, + "learning_rate": 0.00025436209556142173, + "loss": 0.0628, "step": 47140 }, { - "epoch": 0.51, - "learning_rate": 0.0002235024985398144, - "loss": 0.0533, + "epoch": 0.3, + "learning_rate": 0.00025435241420706476, + "loss": 0.0571, "step": 47150 }, { - "epoch": 0.51, - "learning_rate": 0.00022348627425530532, - "loss": 0.0498, + "epoch": 0.3, + "learning_rate": 0.00025434273285270784, + "loss": 0.0671, "step": 47160 }, { - "epoch": 0.51, - "learning_rate": 0.00022347004997079627, - "loss": 0.0672, + "epoch": 0.3, + "learning_rate": 0.0002543330514983509, + "loss": 0.0713, "step": 47170 }, { - "epoch": 0.51, - "learning_rate": 0.00022345382568628722, - "loss": 0.0584, + "epoch": 0.3, + "learning_rate": 0.000254323370143994, + "loss": 0.0651, "step": 47180 }, { - "epoch": 0.51, - "learning_rate": 0.00022343760140177817, - "loss": 0.0564, + "epoch": 0.3, + "learning_rate": 0.0002543136887896371, + "loss": 0.0639, "step": 47190 }, { - "epoch": 0.51, - "learning_rate": 0.0002234213771172691, - "loss": 0.0548, + "epoch": 0.3, + "learning_rate": 0.00025430400743528016, + "loss": 0.0611, "step": 47200 }, { - "epoch": 0.51, - "learning_rate": 0.00022340515283276007, - "loss": 0.0581, + "epoch": 0.3, + "learning_rate": 0.0002542943260809232, + "loss": 0.0634, "step": 47210 }, { - "epoch": 0.51, - "learning_rate": 0.000223388928548251, - "loss": 0.0673, + "epoch": 0.3, + "learning_rate": 0.00025428464472656626, + "loss": 0.0589, "step": 47220 }, { - "epoch": 0.51, - "learning_rate": 0.00022337270426374197, - "loss": 0.0537, + "epoch": 0.3, + "learning_rate": 0.00025427496337220934, + "loss": 0.0645, "step": 47230 }, { - "epoch": 0.51, - "learning_rate": 0.0002233564799792329, - "loss": 0.0515, + "epoch": 0.3, + "learning_rate": 0.00025426528201785237, + "loss": 0.0743, "step": 47240 }, { - "epoch": 0.51, - "learning_rate": 0.00022334025569472387, - "loss": 0.058, + "epoch": 0.3, + "learning_rate": 0.00025425560066349545, + "loss": 0.072, "step": 47250 }, { - "epoch": 0.51, - "learning_rate": 0.0002233240314102148, - "loss": 0.0581, + "epoch": 0.31, + "learning_rate": 0.00025424591930913853, + "loss": 0.066, "step": 47260 }, { - "epoch": 0.51, - "learning_rate": 0.00022330780712570574, - "loss": 0.0687, + "epoch": 0.31, + "learning_rate": 0.0002542362379547816, + "loss": 0.062, "step": 47270 }, { - "epoch": 0.51, - "learning_rate": 0.0002232915828411967, - "loss": 0.055, + "epoch": 0.31, + "learning_rate": 0.0002542265566004247, + "loss": 0.0658, "step": 47280 }, { - "epoch": 0.51, - "learning_rate": 0.00022327535855668764, - "loss": 0.0572, + "epoch": 0.31, + "learning_rate": 0.0002542168752460677, + "loss": 0.0617, "step": 47290 }, { - "epoch": 0.51, - "learning_rate": 0.00022325913427217857, - "loss": 0.0564, + "epoch": 0.31, + "learning_rate": 0.0002542071938917108, + "loss": 0.0633, "step": 47300 }, { - "epoch": 0.51, - "learning_rate": 0.00022324290998766954, - "loss": 0.0461, + "epoch": 0.31, + "learning_rate": 0.00025419751253735387, + "loss": 0.0649, "step": 47310 }, { - "epoch": 0.51, - "learning_rate": 0.00022322668570316046, - "loss": 0.0542, + "epoch": 0.31, + "learning_rate": 0.00025418783118299695, + "loss": 0.0664, "step": 47320 }, { - "epoch": 0.51, - "learning_rate": 0.00022321046141865144, - "loss": 0.0521, + "epoch": 0.31, + "learning_rate": 0.00025417814982864003, + "loss": 0.0677, "step": 47330 }, { - "epoch": 0.51, - "learning_rate": 0.00022319423713414236, - "loss": 0.0633, + "epoch": 0.31, + "learning_rate": 0.00025416846847428306, + "loss": 0.0754, "step": 47340 }, { - "epoch": 0.51, - "learning_rate": 0.00022317801284963331, - "loss": 0.056, + "epoch": 0.31, + "learning_rate": 0.00025415878711992614, + "loss": 0.0712, "step": 47350 }, { - "epoch": 0.51, - "learning_rate": 0.00022316178856512426, - "loss": 0.0607, + "epoch": 0.31, + "learning_rate": 0.0002541491057655692, + "loss": 0.0717, "step": 47360 }, { - "epoch": 0.51, - "learning_rate": 0.00022314556428061521, - "loss": 0.0563, + "epoch": 0.31, + "learning_rate": 0.00025413942441121224, + "loss": 0.0749, "step": 47370 }, { - "epoch": 0.51, - "learning_rate": 0.00022312933999610614, - "loss": 0.0543, + "epoch": 0.31, + "learning_rate": 0.0002541297430568553, + "loss": 0.0669, "step": 47380 }, { - "epoch": 0.51, - "learning_rate": 0.0002231131157115971, - "loss": 0.0637, + "epoch": 0.31, + "learning_rate": 0.0002541200617024984, + "loss": 0.078, "step": 47390 }, { - "epoch": 0.51, - "learning_rate": 0.00022309689142708804, - "loss": 0.0579, + "epoch": 0.31, + "learning_rate": 0.0002541103803481415, + "loss": 0.0703, "step": 47400 }, { - "epoch": 0.51, - "learning_rate": 0.000223080667142579, - "loss": 0.0556, + "epoch": 0.31, + "learning_rate": 0.00025410069899378456, + "loss": 0.065, "step": 47410 }, { - "epoch": 0.51, - "learning_rate": 0.00022306444285806994, - "loss": 0.0584, + "epoch": 0.31, + "learning_rate": 0.00025409101763942764, + "loss": 0.0667, "step": 47420 }, { - "epoch": 0.51, - "learning_rate": 0.0002230482185735609, - "loss": 0.0583, + "epoch": 0.31, + "learning_rate": 0.00025408133628507067, + "loss": 0.0589, "step": 47430 }, { - "epoch": 0.51, - "learning_rate": 0.00022303199428905184, - "loss": 0.0539, + "epoch": 0.31, + "learning_rate": 0.00025407165493071375, + "loss": 0.0701, "step": 47440 }, { - "epoch": 0.51, - "learning_rate": 0.00022301577000454278, - "loss": 0.056, + "epoch": 0.31, + "learning_rate": 0.00025406197357635683, + "loss": 0.066, "step": 47450 }, { - "epoch": 0.51, - "learning_rate": 0.00022299954572003373, - "loss": 0.0554, + "epoch": 0.31, + "learning_rate": 0.0002540522922219999, + "loss": 0.0632, "step": 47460 }, { - "epoch": 0.51, - "learning_rate": 0.00022298332143552468, - "loss": 0.0521, + "epoch": 0.31, + "learning_rate": 0.00025404261086764293, + "loss": 0.0676, "step": 47470 }, { - "epoch": 0.51, - "learning_rate": 0.0002229670971510156, - "loss": 0.0559, + "epoch": 0.31, + "learning_rate": 0.000254032929513286, + "loss": 0.0624, "step": 47480 }, { - "epoch": 0.51, - "learning_rate": 0.00022295087286650658, - "loss": 0.0557, + "epoch": 0.31, + "learning_rate": 0.0002540232481589291, + "loss": 0.0627, "step": 47490 }, { - "epoch": 0.51, - "learning_rate": 0.0002229346485819975, - "loss": 0.0581, + "epoch": 0.31, + "learning_rate": 0.0002540135668045721, + "loss": 0.061, "step": 47500 }, { - "epoch": 0.51, - "learning_rate": 0.00022291842429748848, - "loss": 0.0573, + "epoch": 0.31, + "learning_rate": 0.0002540038854502152, + "loss": 0.07, "step": 47510 }, { - "epoch": 0.51, - "learning_rate": 0.0002229022000129794, - "loss": 0.0539, + "epoch": 0.31, + "learning_rate": 0.0002539942040958583, + "loss": 0.0615, "step": 47520 }, { - "epoch": 0.51, - "learning_rate": 0.00022288597572847036, - "loss": 0.0643, + "epoch": 0.31, + "learning_rate": 0.00025398452274150136, + "loss": 0.0609, "step": 47530 }, { - "epoch": 0.51, - "learning_rate": 0.0002228697514439613, - "loss": 0.0562, + "epoch": 0.31, + "learning_rate": 0.00025397484138714444, + "loss": 0.0671, "step": 47540 }, { - "epoch": 0.51, - "learning_rate": 0.00022285352715945226, - "loss": 0.0511, + "epoch": 0.31, + "learning_rate": 0.0002539651600327875, + "loss": 0.0684, "step": 47550 }, { - "epoch": 0.51, - "learning_rate": 0.00022283730287494318, - "loss": 0.0619, + "epoch": 0.31, + "learning_rate": 0.0002539554786784306, + "loss": 0.0678, "step": 47560 }, { - "epoch": 0.51, - "learning_rate": 0.00022282107859043416, - "loss": 0.0568, + "epoch": 0.31, + "learning_rate": 0.0002539457973240736, + "loss": 0.0583, "step": 47570 }, { - "epoch": 0.51, - "learning_rate": 0.00022280485430592508, - "loss": 0.0533, + "epoch": 0.31, + "learning_rate": 0.0002539361159697167, + "loss": 0.0624, "step": 47580 }, { - "epoch": 0.51, - "learning_rate": 0.00022278863002141605, - "loss": 0.0593, + "epoch": 0.31, + "learning_rate": 0.0002539264346153598, + "loss": 0.0639, "step": 47590 }, { - "epoch": 0.51, - "learning_rate": 0.00022277240573690698, - "loss": 0.0578, + "epoch": 0.31, + "learning_rate": 0.00025391675326100286, + "loss": 0.063, "step": 47600 }, { - "epoch": 0.51, - "learning_rate": 0.00022275618145239795, - "loss": 0.0546, + "epoch": 0.31, + "learning_rate": 0.0002539070719066459, + "loss": 0.0684, "step": 47610 }, { - "epoch": 0.52, - "learning_rate": 0.00022273995716788888, - "loss": 0.0627, + "epoch": 0.31, + "learning_rate": 0.00025389739055228897, + "loss": 0.0678, "step": 47620 }, { - "epoch": 0.52, - "learning_rate": 0.00022272373288337983, - "loss": 0.0587, + "epoch": 0.31, + "learning_rate": 0.00025388770919793205, + "loss": 0.0648, "step": 47630 }, { - "epoch": 0.52, - "learning_rate": 0.00022270750859887078, - "loss": 0.0581, + "epoch": 0.31, + "learning_rate": 0.00025387802784357507, + "loss": 0.0697, "step": 47640 }, { - "epoch": 0.52, - "learning_rate": 0.00022269128431436173, - "loss": 0.0584, + "epoch": 0.31, + "learning_rate": 0.00025386834648921815, + "loss": 0.0725, "step": 47650 }, { - "epoch": 0.52, - "learning_rate": 0.00022267506002985265, - "loss": 0.0712, + "epoch": 0.31, + "learning_rate": 0.00025385866513486123, + "loss": 0.0628, "step": 47660 }, { - "epoch": 0.52, - "learning_rate": 0.00022265883574534363, - "loss": 0.0641, + "epoch": 0.31, + "learning_rate": 0.0002538489837805043, + "loss": 0.0628, "step": 47670 }, { - "epoch": 0.52, - "learning_rate": 0.00022264261146083455, - "loss": 0.0536, + "epoch": 0.31, + "learning_rate": 0.0002538393024261474, + "loss": 0.0591, "step": 47680 }, { - "epoch": 0.52, - "learning_rate": 0.00022262638717632553, - "loss": 0.0553, + "epoch": 0.31, + "learning_rate": 0.00025382962107179047, + "loss": 0.0637, "step": 47690 }, { - "epoch": 0.52, - "learning_rate": 0.00022261016289181645, - "loss": 0.0506, + "epoch": 0.31, + "learning_rate": 0.00025381993971743355, + "loss": 0.0723, "step": 47700 }, { - "epoch": 0.52, - "learning_rate": 0.0002225939386073074, - "loss": 0.0614, + "epoch": 0.31, + "learning_rate": 0.0002538102583630766, + "loss": 0.0576, "step": 47710 }, { - "epoch": 0.52, - "learning_rate": 0.00022257771432279835, - "loss": 0.0519, + "epoch": 0.31, + "learning_rate": 0.00025380057700871966, + "loss": 0.0602, "step": 47720 }, { - "epoch": 0.52, - "learning_rate": 0.0002225614900382893, - "loss": 0.0718, + "epoch": 0.31, + "learning_rate": 0.00025379089565436274, + "loss": 0.0605, "step": 47730 }, { - "epoch": 0.52, - "learning_rate": 0.00022254526575378022, - "loss": 0.0513, + "epoch": 0.31, + "learning_rate": 0.00025378121430000576, + "loss": 0.0669, "step": 47740 }, { - "epoch": 0.52, - "learning_rate": 0.0002225290414692712, - "loss": 0.0513, - "step": 47750 + "epoch": 0.31, + "learning_rate": 0.00025377153294564884, + "loss": 0.0639, + "step": 47750 }, { - "epoch": 0.52, - "learning_rate": 0.00022251281718476212, - "loss": 0.0537, + "epoch": 0.31, + "learning_rate": 0.0002537618515912919, + "loss": 0.0623, "step": 47760 }, { - "epoch": 0.52, - "learning_rate": 0.0002224965929002531, - "loss": 0.0645, + "epoch": 0.31, + "learning_rate": 0.000253752170236935, + "loss": 0.0622, "step": 47770 }, { - "epoch": 0.52, - "learning_rate": 0.00022248036861574402, - "loss": 0.0563, + "epoch": 0.31, + "learning_rate": 0.000253742488882578, + "loss": 0.0635, "step": 47780 }, { - "epoch": 0.52, - "learning_rate": 0.000222464144331235, - "loss": 0.0511, + "epoch": 0.31, + "learning_rate": 0.0002537328075282211, + "loss": 0.0647, "step": 47790 }, { - "epoch": 0.52, - "learning_rate": 0.00022244792004672592, - "loss": 0.0524, + "epoch": 0.31, + "learning_rate": 0.0002537231261738642, + "loss": 0.0568, "step": 47800 }, { - "epoch": 0.52, - "learning_rate": 0.00022243169576221687, - "loss": 0.0606, + "epoch": 0.31, + "learning_rate": 0.00025371344481950727, + "loss": 0.061, "step": 47810 }, { - "epoch": 0.52, - "learning_rate": 0.00022241547147770782, - "loss": 0.0595, + "epoch": 0.31, + "learning_rate": 0.00025370376346515035, + "loss": 0.0626, "step": 47820 }, { - "epoch": 0.52, - "learning_rate": 0.00022239924719319877, - "loss": 0.0516, + "epoch": 0.31, + "learning_rate": 0.0002536940821107934, + "loss": 0.0632, "step": 47830 }, { - "epoch": 0.52, - "learning_rate": 0.0002223830229086897, - "loss": 0.0528, + "epoch": 0.31, + "learning_rate": 0.0002536844007564365, + "loss": 0.0648, "step": 47840 }, { - "epoch": 0.52, - "learning_rate": 0.00022236679862418067, - "loss": 0.0539, + "epoch": 0.31, + "learning_rate": 0.00025367471940207953, + "loss": 0.0839, "step": 47850 }, { - "epoch": 0.52, - "learning_rate": 0.0002223505743396716, - "loss": 0.0604, + "epoch": 0.31, + "learning_rate": 0.0002536650380477226, + "loss": 0.0665, "step": 47860 }, { - "epoch": 0.52, - "learning_rate": 0.00022233435005516257, - "loss": 0.055, + "epoch": 0.31, + "learning_rate": 0.00025365535669336564, + "loss": 0.0616, "step": 47870 }, { - "epoch": 0.52, - "learning_rate": 0.0002223181257706535, - "loss": 0.0556, + "epoch": 0.31, + "learning_rate": 0.0002536456753390087, + "loss": 0.0705, "step": 47880 }, { - "epoch": 0.52, - "learning_rate": 0.00022230190148614444, - "loss": 0.0496, + "epoch": 0.31, + "learning_rate": 0.0002536359939846518, + "loss": 0.0654, "step": 47890 }, { - "epoch": 0.52, - "learning_rate": 0.0002222856772016354, - "loss": 0.0578, + "epoch": 0.31, + "learning_rate": 0.0002536263126302949, + "loss": 0.0675, "step": 47900 }, { - "epoch": 0.52, - "learning_rate": 0.00022226945291712634, - "loss": 0.0532, + "epoch": 0.31, + "learning_rate": 0.00025361663127593796, + "loss": 0.0669, "step": 47910 }, { - "epoch": 0.52, - "learning_rate": 0.0002222532286326173, - "loss": 0.0592, + "epoch": 0.31, + "learning_rate": 0.000253606949921581, + "loss": 0.0687, "step": 47920 }, { - "epoch": 0.52, - "learning_rate": 0.00022223700434810824, - "loss": 0.0615, + "epoch": 0.31, + "learning_rate": 0.00025359726856722406, + "loss": 0.0632, "step": 47930 }, { - "epoch": 0.52, - "learning_rate": 0.00022222078006359916, - "loss": 0.0516, + "epoch": 0.31, + "learning_rate": 0.00025358758721286714, + "loss": 0.0637, "step": 47940 }, { - "epoch": 0.52, - "learning_rate": 0.00022220455577909014, - "loss": 0.0593, + "epoch": 0.31, + "learning_rate": 0.0002535779058585102, + "loss": 0.0687, "step": 47950 }, { - "epoch": 0.52, - "learning_rate": 0.00022218833149458106, - "loss": 0.0564, + "epoch": 0.31, + "learning_rate": 0.0002535682245041533, + "loss": 0.0601, "step": 47960 }, { - "epoch": 0.52, - "learning_rate": 0.00022217210721007204, - "loss": 0.0553, + "epoch": 0.31, + "learning_rate": 0.0002535585431497964, + "loss": 0.0672, "step": 47970 }, { - "epoch": 0.52, - "learning_rate": 0.00022215588292556296, - "loss": 0.0612, + "epoch": 0.31, + "learning_rate": 0.0002535488617954394, + "loss": 0.056, "step": 47980 }, { - "epoch": 0.52, - "learning_rate": 0.0002221396586410539, - "loss": 0.0676, + "epoch": 0.31, + "learning_rate": 0.0002535391804410825, + "loss": 0.0616, "step": 47990 }, { - "epoch": 0.52, - "learning_rate": 0.00022212343435654486, - "loss": 0.063, + "epoch": 0.31, + "learning_rate": 0.00025352949908672557, + "loss": 0.0655, "step": 48000 }, { - "epoch": 0.52, - "eval_cer": 0.9213018671557636, - "eval_loss": 0.03959682583808899, - "eval_runtime": 119.1605, - "eval_samples_per_second": 16.784, - "eval_steps_per_second": 4.196, + "epoch": 0.31, + "eval_cer": 0.9200316348435205, + "eval_loss": 0.043291497975587845, + "eval_runtime": 120.1252, + "eval_samples_per_second": 16.649, + "eval_steps_per_second": 4.162, "step": 48000 }, { - "epoch": 0.52, - "learning_rate": 0.0002221072100720358, - "loss": 0.063, + "epoch": 0.31, + "learning_rate": 0.0002535198177323686, + "loss": 0.059, "step": 48010 }, { - "epoch": 0.52, - "learning_rate": 0.00022209098578752673, - "loss": 0.0617, + "epoch": 0.31, + "learning_rate": 0.00025351013637801167, + "loss": 0.0606, "step": 48020 }, { - "epoch": 0.52, - "learning_rate": 0.0002220747615030177, - "loss": 0.0587, + "epoch": 0.31, + "learning_rate": 0.00025350045502365475, + "loss": 0.0655, "step": 48030 }, { - "epoch": 0.52, - "learning_rate": 0.00022205853721850863, - "loss": 0.0557, + "epoch": 0.31, + "learning_rate": 0.00025349077366929783, + "loss": 0.0566, "step": 48040 }, { - "epoch": 0.52, - "learning_rate": 0.0002220423129339996, - "loss": 0.0607, + "epoch": 0.31, + "learning_rate": 0.0002534810923149409, + "loss": 0.0613, "step": 48050 }, { - "epoch": 0.52, - "learning_rate": 0.00022202608864949053, - "loss": 0.0564, + "epoch": 0.31, + "learning_rate": 0.00025347141096058394, + "loss": 0.0607, "step": 48060 }, { - "epoch": 0.52, - "learning_rate": 0.00022200986436498148, - "loss": 0.0577, + "epoch": 0.31, + "learning_rate": 0.000253461729606227, + "loss": 0.0685, "step": 48070 }, { - "epoch": 0.52, - "learning_rate": 0.00022199364008047243, - "loss": 0.0569, + "epoch": 0.31, + "learning_rate": 0.0002534520482518701, + "loss": 0.0636, "step": 48080 }, { - "epoch": 0.52, - "learning_rate": 0.00022197741579596338, - "loss": 0.0663, + "epoch": 0.31, + "learning_rate": 0.0002534423668975132, + "loss": 0.0621, "step": 48090 }, { - "epoch": 0.52, - "learning_rate": 0.00022196119151145433, - "loss": 0.0574, + "epoch": 0.31, + "learning_rate": 0.00025343268554315625, + "loss": 0.0653, "step": 48100 }, { - "epoch": 0.52, - "learning_rate": 0.00022194496722694528, - "loss": 0.0582, + "epoch": 0.31, + "learning_rate": 0.0002534230041887993, + "loss": 0.0652, "step": 48110 }, { - "epoch": 0.52, - "learning_rate": 0.0002219287429424362, - "loss": 0.0498, + "epoch": 0.31, + "learning_rate": 0.00025341332283444236, + "loss": 0.0637, "step": 48120 }, { - "epoch": 0.52, - "learning_rate": 0.00022191251865792718, - "loss": 0.0608, + "epoch": 0.31, + "learning_rate": 0.00025340364148008544, + "loss": 0.074, "step": 48130 }, { - "epoch": 0.52, - "learning_rate": 0.0002218962943734181, - "loss": 0.0633, + "epoch": 0.31, + "learning_rate": 0.00025339396012572847, + "loss": 0.0688, "step": 48140 }, { - "epoch": 0.52, - "learning_rate": 0.00022188007008890908, - "loss": 0.0591, + "epoch": 0.31, + "learning_rate": 0.00025338427877137155, + "loss": 0.0654, "step": 48150 }, { - "epoch": 0.52, - "learning_rate": 0.0002218638458044, - "loss": 0.0507, + "epoch": 0.31, + "learning_rate": 0.0002533745974170146, + "loss": 0.0652, "step": 48160 }, { - "epoch": 0.52, - "learning_rate": 0.00022184762151989095, - "loss": 0.0612, + "epoch": 0.31, + "learning_rate": 0.0002533649160626577, + "loss": 0.0709, "step": 48170 }, { - "epoch": 0.52, - "learning_rate": 0.0002218313972353819, - "loss": 0.0615, + "epoch": 0.31, + "learning_rate": 0.0002533552347083008, + "loss": 0.057, "step": 48180 }, { - "epoch": 0.52, - "learning_rate": 0.00022181517295087285, - "loss": 0.0636, + "epoch": 0.31, + "learning_rate": 0.00025334555335394386, + "loss": 0.0617, "step": 48190 }, { - "epoch": 0.52, - "learning_rate": 0.00022179894866636377, - "loss": 0.0554, + "epoch": 0.31, + "learning_rate": 0.0002533358719995869, + "loss": 0.0739, "step": 48200 }, { - "epoch": 0.52, - "learning_rate": 0.00022178272438185475, - "loss": 0.0549, + "epoch": 0.31, + "learning_rate": 0.00025332619064522997, + "loss": 0.0703, "step": 48210 }, { - "epoch": 0.52, - "learning_rate": 0.00022176650009734567, - "loss": 0.0595, + "epoch": 0.31, + "learning_rate": 0.00025331650929087305, + "loss": 0.0711, "step": 48220 }, { - "epoch": 0.52, - "learning_rate": 0.00022175027581283665, - "loss": 0.0549, + "epoch": 0.31, + "learning_rate": 0.00025330682793651613, + "loss": 0.0656, "step": 48230 }, { - "epoch": 0.52, - "learning_rate": 0.00022173405152832757, - "loss": 0.06, + "epoch": 0.31, + "learning_rate": 0.0002532971465821592, + "loss": 0.0709, "step": 48240 }, { - "epoch": 0.52, - "learning_rate": 0.00022171782724381852, - "loss": 0.056, + "epoch": 0.31, + "learning_rate": 0.00025328746522780223, + "loss": 0.0664, "step": 48250 }, { - "epoch": 0.52, - "learning_rate": 0.00022170160295930947, - "loss": 0.0646, + "epoch": 0.31, + "learning_rate": 0.0002532777838734453, + "loss": 0.0576, "step": 48260 }, { - "epoch": 0.52, - "learning_rate": 0.00022168537867480042, - "loss": 0.059, + "epoch": 0.31, + "learning_rate": 0.00025326810251908834, + "loss": 0.0598, "step": 48270 }, { - "epoch": 0.52, - "learning_rate": 0.00022166915439029137, - "loss": 0.0608, + "epoch": 0.31, + "learning_rate": 0.0002532584211647314, + "loss": 0.0579, "step": 48280 }, { - "epoch": 0.52, - "learning_rate": 0.00022165293010578232, - "loss": 0.0701, + "epoch": 0.31, + "learning_rate": 0.0002532487398103745, + "loss": 0.0584, "step": 48290 }, { - "epoch": 0.52, - "learning_rate": 0.00022163670582127324, - "loss": 0.0574, + "epoch": 0.31, + "learning_rate": 0.0002532390584560176, + "loss": 0.0717, "step": 48300 }, { - "epoch": 0.52, - "learning_rate": 0.00022162048153676422, - "loss": 0.0549, + "epoch": 0.31, + "learning_rate": 0.00025322937710166066, + "loss": 0.0635, "step": 48310 }, { - "epoch": 0.52, - "learning_rate": 0.00022160425725225514, - "loss": 0.052, + "epoch": 0.31, + "learning_rate": 0.00025321969574730374, + "loss": 0.0675, "step": 48320 }, { - "epoch": 0.52, - "learning_rate": 0.00022158803296774612, - "loss": 0.058, + "epoch": 0.31, + "learning_rate": 0.0002532100143929468, + "loss": 0.0682, "step": 48330 }, { - "epoch": 0.52, - "learning_rate": 0.00022157180868323704, - "loss": 0.0543, + "epoch": 0.31, + "learning_rate": 0.00025320033303858984, + "loss": 0.0581, "step": 48340 }, { - "epoch": 0.52, - "learning_rate": 0.000221555584398728, - "loss": 0.0544, + "epoch": 0.31, + "learning_rate": 0.0002531906516842329, + "loss": 0.0626, "step": 48350 }, { - "epoch": 0.52, - "learning_rate": 0.00022153936011421894, - "loss": 0.0593, + "epoch": 0.31, + "learning_rate": 0.000253180970329876, + "loss": 0.0534, "step": 48360 }, { - "epoch": 0.52, - "learning_rate": 0.0002215231358297099, - "loss": 0.0589, + "epoch": 0.31, + "learning_rate": 0.0002531712889755191, + "loss": 0.063, "step": 48370 }, { - "epoch": 0.52, - "learning_rate": 0.00022150691154520082, - "loss": 0.0544, + "epoch": 0.31, + "learning_rate": 0.0002531616076211621, + "loss": 0.062, "step": 48380 }, { - "epoch": 0.52, - "learning_rate": 0.0002214906872606918, - "loss": 0.0557, + "epoch": 0.31, + "learning_rate": 0.0002531519262668052, + "loss": 0.0688, "step": 48390 }, { - "epoch": 0.52, - "learning_rate": 0.00022147446297618271, - "loss": 0.0544, + "epoch": 0.31, + "learning_rate": 0.00025314224491244827, + "loss": 0.069, "step": 48400 }, { - "epoch": 0.52, - "learning_rate": 0.0002214582386916737, - "loss": 0.0567, + "epoch": 0.31, + "learning_rate": 0.0002531325635580913, + "loss": 0.0714, "step": 48410 }, { - "epoch": 0.52, - "learning_rate": 0.00022144201440716461, - "loss": 0.0523, + "epoch": 0.31, + "learning_rate": 0.0002531228822037344, + "loss": 0.0657, "step": 48420 }, { - "epoch": 0.52, - "learning_rate": 0.00022142579012265556, - "loss": 0.0556, + "epoch": 0.31, + "learning_rate": 0.00025311320084937745, + "loss": 0.0691, "step": 48430 }, { - "epoch": 0.52, - "learning_rate": 0.00022140956583814651, - "loss": 0.058, + "epoch": 0.31, + "learning_rate": 0.00025310351949502053, + "loss": 0.0593, "step": 48440 }, { - "epoch": 0.52, - "learning_rate": 0.00022139334155363746, - "loss": 0.0574, + "epoch": 0.31, + "learning_rate": 0.0002530938381406636, + "loss": 0.061, "step": 48450 }, { - "epoch": 0.52, - "learning_rate": 0.00022137711726912841, - "loss": 0.0693, + "epoch": 0.31, + "learning_rate": 0.0002530841567863067, + "loss": 0.073, "step": 48460 }, { - "epoch": 0.52, - "learning_rate": 0.00022136089298461936, - "loss": 0.0557, + "epoch": 0.31, + "learning_rate": 0.0002530744754319498, + "loss": 0.0719, "step": 48470 }, { - "epoch": 0.52, - "learning_rate": 0.00022134466870011029, - "loss": 0.0627, + "epoch": 0.31, + "learning_rate": 0.0002530647940775928, + "loss": 0.0629, "step": 48480 }, { - "epoch": 0.52, - "learning_rate": 0.00022132844441560126, - "loss": 0.0611, + "epoch": 0.31, + "learning_rate": 0.0002530551127232359, + "loss": 0.069, "step": 48490 }, { - "epoch": 0.52, - "learning_rate": 0.00022131222013109219, - "loss": 0.0551, + "epoch": 0.31, + "learning_rate": 0.00025304543136887896, + "loss": 0.067, "step": 48500 }, { - "epoch": 0.52, - "learning_rate": 0.00022129599584658316, - "loss": 0.061, + "epoch": 0.31, + "learning_rate": 0.000253035750014522, + "loss": 0.0707, "step": 48510 }, { - "epoch": 0.52, - "learning_rate": 0.00022127977156207409, - "loss": 0.0622, + "epoch": 0.31, + "learning_rate": 0.00025302606866016506, + "loss": 0.0651, "step": 48520 }, { - "epoch": 0.52, - "learning_rate": 0.00022126354727756503, - "loss": 0.056, + "epoch": 0.31, + "learning_rate": 0.00025301638730580814, + "loss": 0.0644, "step": 48530 }, { - "epoch": 0.53, - "learning_rate": 0.00022124732299305598, - "loss": 0.0578, + "epoch": 0.31, + "learning_rate": 0.0002530067059514512, + "loss": 0.0626, "step": 48540 }, { - "epoch": 0.53, - "learning_rate": 0.00022123109870854693, - "loss": 0.0606, + "epoch": 0.31, + "learning_rate": 0.00025299702459709425, + "loss": 0.0572, "step": 48550 }, { - "epoch": 0.53, - "learning_rate": 0.00022121487442403786, - "loss": 0.0595, + "epoch": 0.31, + "learning_rate": 0.00025298734324273733, + "loss": 0.0598, "step": 48560 }, { - "epoch": 0.53, - "learning_rate": 0.00022119865013952883, - "loss": 0.0612, + "epoch": 0.31, + "learning_rate": 0.0002529776618883804, + "loss": 0.0613, "step": 48570 }, { - "epoch": 0.53, - "learning_rate": 0.00022118242585501976, - "loss": 0.0517, + "epoch": 0.31, + "learning_rate": 0.0002529679805340235, + "loss": 0.0669, "step": 48580 }, { - "epoch": 0.53, - "learning_rate": 0.00022116620157051073, - "loss": 0.0541, + "epoch": 0.31, + "learning_rate": 0.00025295829917966657, + "loss": 0.0673, "step": 48590 }, { - "epoch": 0.53, - "learning_rate": 0.00022114997728600166, - "loss": 0.0553, + "epoch": 0.31, + "learning_rate": 0.00025294861782530965, + "loss": 0.0653, "step": 48600 }, { - "epoch": 0.53, - "learning_rate": 0.00022113375300149263, - "loss": 0.0546, + "epoch": 0.31, + "learning_rate": 0.00025293893647095273, + "loss": 0.0609, "step": 48610 }, { - "epoch": 0.53, - "learning_rate": 0.00022111752871698356, - "loss": 0.0597, + "epoch": 0.31, + "learning_rate": 0.00025292925511659575, + "loss": 0.0621, "step": 48620 }, { - "epoch": 0.53, - "learning_rate": 0.0002211013044324745, - "loss": 0.0505, + "epoch": 0.31, + "learning_rate": 0.00025291957376223883, + "loss": 0.0724, "step": 48630 }, { - "epoch": 0.53, - "learning_rate": 0.00022108508014796546, - "loss": 0.0508, + "epoch": 0.31, + "learning_rate": 0.0002529098924078819, + "loss": 0.0593, "step": 48640 }, { - "epoch": 0.53, - "learning_rate": 0.0002210688558634564, - "loss": 0.0576, + "epoch": 0.31, + "learning_rate": 0.00025290021105352494, + "loss": 0.0646, "step": 48650 }, { - "epoch": 0.53, - "learning_rate": 0.00022105263157894733, - "loss": 0.0607, + "epoch": 0.31, + "learning_rate": 0.000252890529699168, + "loss": 0.0641, "step": 48660 }, { - "epoch": 0.53, - "learning_rate": 0.0002210364072944383, - "loss": 0.0513, + "epoch": 0.31, + "learning_rate": 0.0002528808483448111, + "loss": 0.0627, "step": 48670 }, { - "epoch": 0.53, - "learning_rate": 0.00022102018300992923, - "loss": 0.0574, + "epoch": 0.31, + "learning_rate": 0.0002528711669904542, + "loss": 0.0634, "step": 48680 }, { - "epoch": 0.53, - "learning_rate": 0.0002210039587254202, - "loss": 0.0534, + "epoch": 0.31, + "learning_rate": 0.0002528614856360972, + "loss": 0.0627, "step": 48690 }, { - "epoch": 0.53, - "learning_rate": 0.00022098773444091113, - "loss": 0.0609, + "epoch": 0.31, + "learning_rate": 0.0002528518042817403, + "loss": 0.0674, "step": 48700 }, { - "epoch": 0.53, - "learning_rate": 0.00022097151015640208, - "loss": 0.0575, + "epoch": 0.31, + "learning_rate": 0.00025284212292738336, + "loss": 0.0664, "step": 48710 }, { - "epoch": 0.53, - "learning_rate": 0.00022095528587189303, - "loss": 0.0555, + "epoch": 0.31, + "learning_rate": 0.00025283244157302644, + "loss": 0.0734, "step": 48720 }, { - "epoch": 0.53, - "learning_rate": 0.00022093906158738398, - "loss": 0.0591, + "epoch": 0.31, + "learning_rate": 0.0002528227602186695, + "loss": 0.0677, "step": 48730 }, { - "epoch": 0.53, - "learning_rate": 0.0002209228373028749, - "loss": 0.0605, + "epoch": 0.31, + "learning_rate": 0.0002528130788643126, + "loss": 0.0643, "step": 48740 }, { - "epoch": 0.53, - "learning_rate": 0.00022090661301836588, - "loss": 0.059, + "epoch": 0.31, + "learning_rate": 0.00025280339750995563, + "loss": 0.0596, "step": 48750 }, { - "epoch": 0.53, - "learning_rate": 0.0002208903887338568, - "loss": 0.0567, + "epoch": 0.31, + "learning_rate": 0.0002527937161555987, + "loss": 0.0657, "step": 48760 }, { - "epoch": 0.53, - "learning_rate": 0.00022087416444934778, - "loss": 0.0571, + "epoch": 0.31, + "learning_rate": 0.0002527840348012418, + "loss": 0.0642, "step": 48770 }, { - "epoch": 0.53, - "learning_rate": 0.0002208579401648387, - "loss": 0.0569, + "epoch": 0.31, + "learning_rate": 0.0002527743534468848, + "loss": 0.0554, "step": 48780 }, { - "epoch": 0.53, - "learning_rate": 0.00022084171588032967, - "loss": 0.0549, + "epoch": 0.31, + "learning_rate": 0.0002527646720925279, + "loss": 0.0611, "step": 48790 }, { - "epoch": 0.53, - "learning_rate": 0.0002208254915958206, - "loss": 0.0724, + "epoch": 0.31, + "learning_rate": 0.00025275499073817097, + "loss": 0.0719, "step": 48800 }, { - "epoch": 0.53, - "learning_rate": 0.00022080926731131155, - "loss": 0.0529, + "epoch": 0.32, + "learning_rate": 0.00025274530938381405, + "loss": 0.0605, "step": 48810 }, { - "epoch": 0.53, - "learning_rate": 0.0002207930430268025, - "loss": 0.0534, + "epoch": 0.32, + "learning_rate": 0.00025273562802945713, + "loss": 0.0646, "step": 48820 }, { - "epoch": 0.53, - "learning_rate": 0.00022077681874229345, - "loss": 0.062, + "epoch": 0.32, + "learning_rate": 0.00025272594667510016, + "loss": 0.0666, "step": 48830 }, { - "epoch": 0.53, - "learning_rate": 0.00022076059445778437, - "loss": 0.0611, + "epoch": 0.32, + "learning_rate": 0.00025271626532074324, + "loss": 0.0676, "step": 48840 }, { - "epoch": 0.53, - "learning_rate": 0.00022074437017327535, - "loss": 0.0579, + "epoch": 0.32, + "learning_rate": 0.0002527065839663863, + "loss": 0.0585, "step": 48850 }, { - "epoch": 0.53, - "learning_rate": 0.00022072814588876627, - "loss": 0.0533, + "epoch": 0.32, + "learning_rate": 0.0002526969026120294, + "loss": 0.0649, "step": 48860 }, { - "epoch": 0.53, - "learning_rate": 0.00022071192160425725, - "loss": 0.0598, + "epoch": 0.32, + "learning_rate": 0.0002526872212576725, + "loss": 0.0564, "step": 48870 }, { - "epoch": 0.53, - "learning_rate": 0.00022069569731974817, - "loss": 0.07, + "epoch": 0.32, + "learning_rate": 0.0002526775399033155, + "loss": 0.0644, "step": 48880 }, { - "epoch": 0.53, - "learning_rate": 0.00022067947303523912, - "loss": 0.0535, + "epoch": 0.32, + "learning_rate": 0.0002526678585489586, + "loss": 0.0618, "step": 48890 }, { - "epoch": 0.53, - "learning_rate": 0.00022066324875073007, - "loss": 0.0688, + "epoch": 0.32, + "learning_rate": 0.00025265817719460166, + "loss": 0.0748, "step": 48900 }, { - "epoch": 0.53, - "learning_rate": 0.00022064702446622102, - "loss": 0.0561, + "epoch": 0.32, + "learning_rate": 0.0002526484958402447, + "loss": 0.0634, "step": 48910 }, { - "epoch": 0.53, - "learning_rate": 0.00022063080018171194, - "loss": 0.0578, + "epoch": 0.32, + "learning_rate": 0.00025263881448588777, + "loss": 0.0665, "step": 48920 }, { - "epoch": 0.53, - "learning_rate": 0.00022061457589720292, - "loss": 0.0618, + "epoch": 0.32, + "learning_rate": 0.00025262913313153085, + "loss": 0.0609, "step": 48930 }, { - "epoch": 0.53, - "learning_rate": 0.00022059835161269384, - "loss": 0.0563, + "epoch": 0.32, + "learning_rate": 0.00025261945177717393, + "loss": 0.0608, "step": 48940 }, { - "epoch": 0.53, - "learning_rate": 0.00022058212732818482, - "loss": 0.0558, + "epoch": 0.32, + "learning_rate": 0.000252609770422817, + "loss": 0.0623, "step": 48950 }, { - "epoch": 0.53, - "learning_rate": 0.00022056590304367574, - "loss": 0.0511, + "epoch": 0.32, + "learning_rate": 0.0002526000890684601, + "loss": 0.0561, "step": 48960 }, { - "epoch": 0.53, - "learning_rate": 0.00022054967875916672, - "loss": 0.0646, + "epoch": 0.32, + "learning_rate": 0.0002525904077141031, + "loss": 0.0576, "step": 48970 }, { - "epoch": 0.53, - "learning_rate": 0.00022053345447465764, - "loss": 0.0543, + "epoch": 0.32, + "learning_rate": 0.0002525807263597462, + "loss": 0.0609, "step": 48980 }, { - "epoch": 0.53, - "learning_rate": 0.0002205172301901486, - "loss": 0.0664, + "epoch": 0.32, + "learning_rate": 0.00025257104500538927, + "loss": 0.0618, "step": 48990 }, { - "epoch": 0.53, - "learning_rate": 0.00022050100590563954, - "loss": 0.0654, + "epoch": 0.32, + "learning_rate": 0.00025256136365103235, + "loss": 0.0592, "step": 49000 }, { - "epoch": 0.53, - "eval_cer": 0.9212894983752723, - "eval_loss": 0.039697159081697464, - "eval_runtime": 119.1948, - "eval_samples_per_second": 16.779, - "eval_steps_per_second": 4.195, + "epoch": 0.32, + "eval_cer": 0.9200677889504011, + "eval_loss": 0.043937765061855316, + "eval_runtime": 120.4874, + "eval_samples_per_second": 16.599, + "eval_steps_per_second": 4.15, "step": 49000 }, { - "epoch": 0.53, - "learning_rate": 0.0002204847816211305, - "loss": 0.0538, + "epoch": 0.32, + "learning_rate": 0.00025255168229667543, + "loss": 0.054, "step": 49010 }, { - "epoch": 0.53, - "learning_rate": 0.0002204685573366214, - "loss": 0.0576, + "epoch": 0.32, + "learning_rate": 0.00025254200094231846, + "loss": 0.0639, "step": 49020 }, { - "epoch": 0.53, - "learning_rate": 0.0002204523330521124, - "loss": 0.0571, + "epoch": 0.32, + "learning_rate": 0.00025253231958796154, + "loss": 0.0631, "step": 49030 }, { - "epoch": 0.53, - "learning_rate": 0.0002204361087676033, - "loss": 0.0612, + "epoch": 0.32, + "learning_rate": 0.0002525226382336046, + "loss": 0.0657, "step": 49040 }, { - "epoch": 0.53, - "learning_rate": 0.0002204198844830943, - "loss": 0.061, + "epoch": 0.32, + "learning_rate": 0.00025251295687924764, + "loss": 0.0623, "step": 49050 }, { - "epoch": 0.53, - "learning_rate": 0.0002204036601985852, - "loss": 0.0546, + "epoch": 0.32, + "learning_rate": 0.0002525032755248907, + "loss": 0.0639, "step": 49060 }, { - "epoch": 0.53, - "learning_rate": 0.00022038743591407616, - "loss": 0.0615, + "epoch": 0.32, + "learning_rate": 0.0002524935941705338, + "loss": 0.0629, "step": 49070 }, { - "epoch": 0.53, - "learning_rate": 0.0002203712116295671, - "loss": 0.0505, + "epoch": 0.32, + "learning_rate": 0.0002524839128161769, + "loss": 0.0662, "step": 49080 }, { - "epoch": 0.53, - "learning_rate": 0.00022035498734505806, - "loss": 0.0497, + "epoch": 0.32, + "learning_rate": 0.00025247423146181996, + "loss": 0.0804, "step": 49090 }, { - "epoch": 0.53, - "learning_rate": 0.00022033876306054898, - "loss": 0.0535, + "epoch": 0.32, + "learning_rate": 0.00025246455010746304, + "loss": 0.0634, "step": 49100 }, { - "epoch": 0.53, - "learning_rate": 0.00022032253877603996, - "loss": 0.058, + "epoch": 0.32, + "learning_rate": 0.00025245486875310607, + "loss": 0.0745, "step": 49110 }, { - "epoch": 0.53, - "learning_rate": 0.00022030631449153088, - "loss": 0.0539, + "epoch": 0.32, + "learning_rate": 0.00025244518739874915, + "loss": 0.066, "step": 49120 }, { - "epoch": 0.53, - "learning_rate": 0.00022029009020702186, - "loss": 0.0479, + "epoch": 0.32, + "learning_rate": 0.0002524355060443922, + "loss": 0.0619, "step": 49130 }, { - "epoch": 0.53, - "learning_rate": 0.00022027386592251278, - "loss": 0.0519, + "epoch": 0.32, + "learning_rate": 0.0002524258246900353, + "loss": 0.0704, "step": 49140 }, { - "epoch": 0.53, - "learning_rate": 0.00022025764163800376, - "loss": 0.0564, + "epoch": 0.32, + "learning_rate": 0.00025241614333567833, + "loss": 0.0674, "step": 49150 }, { - "epoch": 0.53, - "learning_rate": 0.00022024141735349468, - "loss": 0.0583, + "epoch": 0.32, + "learning_rate": 0.0002524064619813214, + "loss": 0.0701, "step": 49160 }, { - "epoch": 0.53, - "learning_rate": 0.00022022519306898563, - "loss": 0.0523, + "epoch": 0.32, + "learning_rate": 0.0002523967806269645, + "loss": 0.0715, "step": 49170 }, { - "epoch": 0.53, - "learning_rate": 0.00022020896878447658, - "loss": 0.0533, + "epoch": 0.32, + "learning_rate": 0.0002523870992726075, + "loss": 0.0618, "step": 49180 }, { - "epoch": 0.53, - "learning_rate": 0.00022019274449996753, - "loss": 0.0622, + "epoch": 0.32, + "learning_rate": 0.0002523774179182506, + "loss": 0.0729, "step": 49190 }, { - "epoch": 0.53, - "learning_rate": 0.00022017652021545845, - "loss": 0.0665, + "epoch": 0.32, + "learning_rate": 0.0002523677365638937, + "loss": 0.0673, "step": 49200 }, { - "epoch": 0.53, - "learning_rate": 0.00022016029593094943, - "loss": 0.0528, + "epoch": 0.32, + "learning_rate": 0.00025235805520953676, + "loss": 0.068, "step": 49210 }, { - "epoch": 0.53, - "learning_rate": 0.00022014407164644035, - "loss": 0.0563, + "epoch": 0.32, + "learning_rate": 0.00025234837385517984, + "loss": 0.0676, "step": 49220 }, { - "epoch": 0.53, - "learning_rate": 0.00022012784736193133, - "loss": 0.0518, + "epoch": 0.32, + "learning_rate": 0.0002523386925008229, + "loss": 0.0772, "step": 49230 }, { - "epoch": 0.53, - "learning_rate": 0.00022011162307742225, - "loss": 0.0512, + "epoch": 0.32, + "learning_rate": 0.000252329011146466, + "loss": 0.0683, "step": 49240 }, { - "epoch": 0.53, - "learning_rate": 0.0002200953987929132, - "loss": 0.0578, + "epoch": 0.32, + "learning_rate": 0.000252319329792109, + "loss": 0.0655, "step": 49250 }, { - "epoch": 0.53, - "learning_rate": 0.00022007917450840415, - "loss": 0.048, + "epoch": 0.32, + "learning_rate": 0.0002523096484377521, + "loss": 0.0726, "step": 49260 }, { - "epoch": 0.53, - "learning_rate": 0.0002200629502238951, - "loss": 0.057, + "epoch": 0.32, + "learning_rate": 0.0002522999670833952, + "loss": 0.0646, "step": 49270 }, { - "epoch": 0.53, - "learning_rate": 0.00022004672593938608, - "loss": 0.05, + "epoch": 0.32, + "learning_rate": 0.0002522902857290382, + "loss": 0.0651, "step": 49280 }, { - "epoch": 0.53, - "learning_rate": 0.000220030501654877, - "loss": 0.0505, + "epoch": 0.32, + "learning_rate": 0.0002522806043746813, + "loss": 0.065, "step": 49290 }, { - "epoch": 0.53, - "learning_rate": 0.00022001427737036798, - "loss": 0.054, + "epoch": 0.32, + "learning_rate": 0.00025227092302032437, + "loss": 0.062, "step": 49300 }, { - "epoch": 0.53, - "learning_rate": 0.0002199980530858589, - "loss": 0.0442, + "epoch": 0.32, + "learning_rate": 0.00025226124166596745, + "loss": 0.0701, "step": 49310 }, { - "epoch": 0.53, - "learning_rate": 0.00021998182880134985, - "loss": 0.0513, + "epoch": 0.32, + "learning_rate": 0.00025225156031161047, + "loss": 0.0597, "step": 49320 }, { - "epoch": 0.53, - "learning_rate": 0.0002199656045168408, - "loss": 0.0514, + "epoch": 0.32, + "learning_rate": 0.00025224187895725355, + "loss": 0.0638, "step": 49330 }, { - "epoch": 0.53, - "learning_rate": 0.00021994938023233175, - "loss": 0.0621, + "epoch": 0.32, + "learning_rate": 0.00025223219760289663, + "loss": 0.0632, "step": 49340 }, { - "epoch": 0.53, - "learning_rate": 0.00021993315594782267, - "loss": 0.057, + "epoch": 0.32, + "learning_rate": 0.0002522225162485397, + "loss": 0.0652, "step": 49350 }, { - "epoch": 0.53, - "learning_rate": 0.00021991693166331365, - "loss": 0.0578, + "epoch": 0.32, + "learning_rate": 0.0002522128348941828, + "loss": 0.0734, "step": 49360 }, { - "epoch": 0.53, - "learning_rate": 0.00021990070737880457, - "loss": 0.058, + "epoch": 0.32, + "learning_rate": 0.00025220315353982587, + "loss": 0.0601, "step": 49370 }, { - "epoch": 0.53, - "learning_rate": 0.00021988448309429555, - "loss": 0.0586, + "epoch": 0.32, + "learning_rate": 0.00025219347218546895, + "loss": 0.0684, "step": 49380 }, { - "epoch": 0.53, - "learning_rate": 0.00021986825880978647, - "loss": 0.0519, + "epoch": 0.32, + "learning_rate": 0.000252183790831112, + "loss": 0.0769, "step": 49390 }, { - "epoch": 0.53, - "learning_rate": 0.00021985203452527742, - "loss": 0.0541, + "epoch": 0.32, + "learning_rate": 0.00025217410947675506, + "loss": 0.062, "step": 49400 }, { - "epoch": 0.53, - "learning_rate": 0.00021983581024076837, - "loss": 0.0537, + "epoch": 0.32, + "learning_rate": 0.00025216442812239814, + "loss": 0.0587, "step": 49410 }, { - "epoch": 0.53, - "learning_rate": 0.00021981958595625932, - "loss": 0.0517, + "epoch": 0.32, + "learning_rate": 0.00025215474676804116, + "loss": 0.0608, "step": 49420 }, { - "epoch": 0.53, - "learning_rate": 0.00021980336167175024, - "loss": 0.062, + "epoch": 0.32, + "learning_rate": 0.00025214506541368424, + "loss": 0.0688, "step": 49430 }, { - "epoch": 0.53, - "learning_rate": 0.00021978713738724122, - "loss": 0.0464, + "epoch": 0.32, + "learning_rate": 0.0002521353840593273, + "loss": 0.0632, "step": 49440 }, { - "epoch": 0.53, - "learning_rate": 0.00021977091310273214, - "loss": 0.0486, + "epoch": 0.32, + "learning_rate": 0.0002521257027049704, + "loss": 0.064, "step": 49450 }, { - "epoch": 0.53, - "learning_rate": 0.00021975468881822312, - "loss": 0.0538, + "epoch": 0.32, + "learning_rate": 0.0002521160213506134, + "loss": 0.0635, "step": 49460 }, { - "epoch": 0.54, - "learning_rate": 0.00021973846453371404, - "loss": 0.0547, + "epoch": 0.32, + "learning_rate": 0.0002521063399962565, + "loss": 0.0687, "step": 49470 }, { - "epoch": 0.54, - "learning_rate": 0.00021972224024920502, - "loss": 0.0547, + "epoch": 0.32, + "learning_rate": 0.0002520966586418996, + "loss": 0.0636, "step": 49480 }, { - "epoch": 0.54, - "learning_rate": 0.00021970601596469594, - "loss": 0.0553, + "epoch": 0.32, + "learning_rate": 0.00025208697728754267, + "loss": 0.0727, "step": 49490 }, { - "epoch": 0.54, - "learning_rate": 0.0002196897916801869, - "loss": 0.0752, + "epoch": 0.32, + "learning_rate": 0.00025207729593318575, + "loss": 0.0598, "step": 49500 }, { - "epoch": 0.54, - "learning_rate": 0.00021967356739567784, - "loss": 0.0533, + "epoch": 0.32, + "learning_rate": 0.0002520676145788288, + "loss": 0.066, "step": 49510 }, { - "epoch": 0.54, - "learning_rate": 0.0002196573431111688, - "loss": 0.0539, + "epoch": 0.32, + "learning_rate": 0.00025205793322447185, + "loss": 0.0593, "step": 49520 }, { - "epoch": 0.54, - "learning_rate": 0.00021964111882665971, - "loss": 0.0568, + "epoch": 0.32, + "learning_rate": 0.00025204825187011493, + "loss": 0.0714, "step": 49530 }, { - "epoch": 0.54, - "learning_rate": 0.0002196248945421507, - "loss": 0.0581, + "epoch": 0.32, + "learning_rate": 0.000252038570515758, + "loss": 0.0651, "step": 49540 }, { - "epoch": 0.54, - "learning_rate": 0.0002196086702576416, - "loss": 0.0578, + "epoch": 0.32, + "learning_rate": 0.00025202888916140104, + "loss": 0.0601, "step": 49550 }, { - "epoch": 0.54, - "learning_rate": 0.0002195924459731326, - "loss": 0.0527, + "epoch": 0.32, + "learning_rate": 0.0002520192078070441, + "loss": 0.0562, "step": 49560 }, { - "epoch": 0.54, - "learning_rate": 0.0002195762216886235, - "loss": 0.0677, + "epoch": 0.32, + "learning_rate": 0.0002520095264526872, + "loss": 0.0702, "step": 49570 }, { - "epoch": 0.54, - "learning_rate": 0.00021955999740411446, - "loss": 0.0646, + "epoch": 0.32, + "learning_rate": 0.0002519998450983303, + "loss": 0.065, "step": 49580 }, { - "epoch": 0.54, - "learning_rate": 0.0002195437731196054, - "loss": 0.0552, + "epoch": 0.32, + "learning_rate": 0.00025199016374397335, + "loss": 0.0666, "step": 49590 }, { - "epoch": 0.54, - "learning_rate": 0.00021952754883509636, - "loss": 0.0632, + "epoch": 0.32, + "learning_rate": 0.0002519804823896164, + "loss": 0.0646, "step": 49600 }, { - "epoch": 0.54, - "learning_rate": 0.00021951132455058728, - "loss": 0.0645, + "epoch": 0.32, + "learning_rate": 0.00025197080103525946, + "loss": 0.0604, "step": 49610 }, { - "epoch": 0.54, - "learning_rate": 0.00021949510026607826, - "loss": 0.0567, + "epoch": 0.32, + "learning_rate": 0.00025196111968090254, + "loss": 0.0618, "step": 49620 }, { - "epoch": 0.54, - "learning_rate": 0.00021947887598156918, - "loss": 0.0587, + "epoch": 0.32, + "learning_rate": 0.0002519514383265456, + "loss": 0.0662, "step": 49630 }, { - "epoch": 0.54, - "learning_rate": 0.00021946265169706016, - "loss": 0.0583, + "epoch": 0.32, + "learning_rate": 0.0002519417569721887, + "loss": 0.0632, "step": 49640 }, { - "epoch": 0.54, - "learning_rate": 0.00021944642741255108, - "loss": 0.0536, + "epoch": 0.32, + "learning_rate": 0.0002519320756178318, + "loss": 0.0699, "step": 49650 }, { - "epoch": 0.54, - "learning_rate": 0.00021943020312804206, - "loss": 0.0671, + "epoch": 0.32, + "learning_rate": 0.0002519223942634748, + "loss": 0.0527, "step": 49660 }, { - "epoch": 0.54, - "learning_rate": 0.00021941397884353298, - "loss": 0.0566, + "epoch": 0.32, + "learning_rate": 0.0002519127129091179, + "loss": 0.0599, "step": 49670 }, { - "epoch": 0.54, - "learning_rate": 0.00021939775455902393, - "loss": 0.0619, + "epoch": 0.32, + "learning_rate": 0.0002519030315547609, + "loss": 0.0631, "step": 49680 }, { - "epoch": 0.54, - "learning_rate": 0.00021938153027451488, - "loss": 0.0624, + "epoch": 0.32, + "learning_rate": 0.000251893350200404, + "loss": 0.0606, "step": 49690 }, { - "epoch": 0.54, - "learning_rate": 0.00021936530599000583, - "loss": 0.0565, + "epoch": 0.32, + "learning_rate": 0.00025188366884604707, + "loss": 0.0614, "step": 49700 }, { - "epoch": 0.54, - "learning_rate": 0.00021934908170549676, - "loss": 0.058, + "epoch": 0.32, + "learning_rate": 0.00025187398749169015, + "loss": 0.0608, "step": 49710 }, { - "epoch": 0.54, - "learning_rate": 0.00021933285742098773, - "loss": 0.0627, + "epoch": 0.32, + "learning_rate": 0.00025186430613733323, + "loss": 0.0557, "step": 49720 }, { - "epoch": 0.54, - "learning_rate": 0.00021931663313647865, - "loss": 0.0548, + "epoch": 0.32, + "learning_rate": 0.0002518546247829763, + "loss": 0.0692, "step": 49730 }, { - "epoch": 0.54, - "learning_rate": 0.00021930040885196963, - "loss": 0.0569, + "epoch": 0.32, + "learning_rate": 0.00025184494342861933, + "loss": 0.0602, "step": 49740 }, { - "epoch": 0.54, - "learning_rate": 0.00021928418456746055, - "loss": 0.0638, + "epoch": 0.32, + "learning_rate": 0.0002518352620742624, + "loss": 0.0648, "step": 49750 }, { - "epoch": 0.54, - "learning_rate": 0.0002192679602829515, - "loss": 0.0594, + "epoch": 0.32, + "learning_rate": 0.0002518255807199055, + "loss": 0.0581, "step": 49760 }, { - "epoch": 0.54, - "learning_rate": 0.00021925173599844245, - "loss": 0.0557, + "epoch": 0.32, + "learning_rate": 0.0002518158993655486, + "loss": 0.0623, "step": 49770 }, { - "epoch": 0.54, - "learning_rate": 0.0002192355117139334, - "loss": 0.0535, + "epoch": 0.32, + "learning_rate": 0.00025180621801119165, + "loss": 0.0551, "step": 49780 }, { - "epoch": 0.54, - "learning_rate": 0.00021921928742942433, - "loss": 0.0552, + "epoch": 0.32, + "learning_rate": 0.0002517965366568347, + "loss": 0.0624, "step": 49790 }, { - "epoch": 0.54, - "learning_rate": 0.0002192030631449153, - "loss": 0.0679, + "epoch": 0.32, + "learning_rate": 0.00025178685530247776, + "loss": 0.0643, "step": 49800 }, { - "epoch": 0.54, - "learning_rate": 0.00021918683886040623, - "loss": 0.0513, + "epoch": 0.32, + "learning_rate": 0.00025177717394812084, + "loss": 0.0681, "step": 49810 }, { - "epoch": 0.54, - "learning_rate": 0.0002191706145758972, - "loss": 0.0603, + "epoch": 0.32, + "learning_rate": 0.00025176749259376386, + "loss": 0.0652, "step": 49820 }, { - "epoch": 0.54, - "learning_rate": 0.00021915439029138813, - "loss": 0.0569, + "epoch": 0.32, + "learning_rate": 0.00025175781123940694, + "loss": 0.0594, "step": 49830 }, { - "epoch": 0.54, - "learning_rate": 0.0002191381660068791, - "loss": 0.0516, + "epoch": 0.32, + "learning_rate": 0.00025174812988505, + "loss": 0.0647, "step": 49840 }, { - "epoch": 0.54, - "learning_rate": 0.00021912194172237003, - "loss": 0.0508, + "epoch": 0.32, + "learning_rate": 0.0002517384485306931, + "loss": 0.0604, "step": 49850 }, { - "epoch": 0.54, - "learning_rate": 0.00021910571743786097, - "loss": 0.0496, + "epoch": 0.32, + "learning_rate": 0.0002517287671763362, + "loss": 0.0611, "step": 49860 }, { - "epoch": 0.54, - "learning_rate": 0.00021908949315335192, - "loss": 0.054, + "epoch": 0.32, + "learning_rate": 0.00025171908582197926, + "loss": 0.0628, "step": 49870 }, { - "epoch": 0.54, - "learning_rate": 0.00021907326886884287, - "loss": 0.0563, + "epoch": 0.32, + "learning_rate": 0.0002517094044676223, + "loss": 0.059, "step": 49880 }, { - "epoch": 0.54, - "learning_rate": 0.0002190570445843338, - "loss": 0.0623, + "epoch": 0.32, + "learning_rate": 0.00025169972311326537, + "loss": 0.0569, "step": 49890 }, { - "epoch": 0.54, - "learning_rate": 0.00021904082029982477, - "loss": 0.0605, + "epoch": 0.32, + "learning_rate": 0.00025169004175890845, + "loss": 0.0595, "step": 49900 }, { - "epoch": 0.54, - "learning_rate": 0.0002190245960153157, - "loss": 0.0589, + "epoch": 0.32, + "learning_rate": 0.00025168036040455153, + "loss": 0.0629, "step": 49910 }, { - "epoch": 0.54, - "learning_rate": 0.00021900837173080667, - "loss": 0.0557, + "epoch": 0.32, + "learning_rate": 0.00025167067905019455, + "loss": 0.0659, "step": 49920 }, { - "epoch": 0.54, - "learning_rate": 0.0002189921474462976, - "loss": 0.0621, + "epoch": 0.32, + "learning_rate": 0.00025166099769583763, + "loss": 0.0661, "step": 49930 }, { - "epoch": 0.54, - "learning_rate": 0.00021897592316178855, - "loss": 0.0504, + "epoch": 0.32, + "learning_rate": 0.0002516513163414807, + "loss": 0.0669, "step": 49940 }, { - "epoch": 0.54, - "learning_rate": 0.0002189596988772795, - "loss": 0.0553, + "epoch": 0.32, + "learning_rate": 0.00025164163498712374, + "loss": 0.0602, "step": 49950 }, { - "epoch": 0.54, - "learning_rate": 0.00021894347459277045, - "loss": 0.0502, + "epoch": 0.32, + "learning_rate": 0.0002516319536327668, + "loss": 0.0668, "step": 49960 }, { - "epoch": 0.54, - "learning_rate": 0.00021892725030826137, - "loss": 0.0562, + "epoch": 0.32, + "learning_rate": 0.0002516222722784099, + "loss": 0.0655, "step": 49970 }, { - "epoch": 0.54, - "learning_rate": 0.00021891102602375235, - "loss": 0.0537, + "epoch": 0.32, + "learning_rate": 0.000251612590924053, + "loss": 0.0634, "step": 49980 }, { - "epoch": 0.54, - "learning_rate": 0.00021889480173924327, - "loss": 0.0494, + "epoch": 0.32, + "learning_rate": 0.00025160290956969606, + "loss": 0.0629, "step": 49990 }, { - "epoch": 0.54, - "learning_rate": 0.00021887857745473424, - "loss": 0.0506, + "epoch": 0.32, + "learning_rate": 0.00025159322821533914, + "loss": 0.0623, "step": 50000 }, { - "epoch": 0.54, - "eval_cer": 0.9212108682707209, - "eval_loss": 0.03913816064596176, - "eval_runtime": 119.3899, - "eval_samples_per_second": 16.752, - "eval_steps_per_second": 4.188, + "epoch": 0.32, + "eval_cer": 0.9200958083832336, + "eval_loss": 0.043299414217472076, + "eval_runtime": 120.2242, + "eval_samples_per_second": 16.636, + "eval_steps_per_second": 4.159, "step": 50000 }, { - "epoch": 0.54, - "learning_rate": 0.00021886235317022517, - "loss": 0.062, + "epoch": 0.32, + "learning_rate": 0.0002515835468609822, + "loss": 0.0586, "step": 50010 }, { - "epoch": 0.54, - "learning_rate": 0.00021884612888571614, - "loss": 0.0557, + "epoch": 0.32, + "learning_rate": 0.00025157386550662524, + "loss": 0.066, "step": 50020 }, { - "epoch": 0.54, - "learning_rate": 0.00021882990460120707, - "loss": 0.0551, + "epoch": 0.32, + "learning_rate": 0.0002515641841522683, + "loss": 0.0684, "step": 50030 }, { - "epoch": 0.54, - "learning_rate": 0.00021881368031669802, - "loss": 0.0598, + "epoch": 0.32, + "learning_rate": 0.0002515545027979114, + "loss": 0.0709, "step": 50040 }, { - "epoch": 0.54, - "learning_rate": 0.00021879745603218897, - "loss": 0.0486, + "epoch": 0.32, + "learning_rate": 0.0002515448214435545, + "loss": 0.0642, "step": 50050 }, { - "epoch": 0.54, - "learning_rate": 0.00021878123174767992, - "loss": 0.0495, + "epoch": 0.32, + "learning_rate": 0.0002515351400891975, + "loss": 0.0642, "step": 50060 }, { - "epoch": 0.54, - "learning_rate": 0.00021876500746317084, - "loss": 0.0511, + "epoch": 0.32, + "learning_rate": 0.0002515254587348406, + "loss": 0.0642, "step": 50070 }, { - "epoch": 0.54, - "learning_rate": 0.00021874878317866182, - "loss": 0.0512, + "epoch": 0.32, + "learning_rate": 0.00025151577738048367, + "loss": 0.0681, "step": 50080 }, { - "epoch": 0.54, - "learning_rate": 0.00021873255889415274, - "loss": 0.0543, + "epoch": 0.32, + "learning_rate": 0.0002515060960261267, + "loss": 0.0626, "step": 50090 }, { - "epoch": 0.54, - "learning_rate": 0.00021871633460964372, - "loss": 0.0563, + "epoch": 0.32, + "learning_rate": 0.0002514964146717698, + "loss": 0.0633, "step": 50100 }, { - "epoch": 0.54, - "learning_rate": 0.00021870011032513464, - "loss": 0.0657, + "epoch": 0.32, + "learning_rate": 0.00025148673331741285, + "loss": 0.0702, "step": 50110 }, { - "epoch": 0.54, - "learning_rate": 0.0002186838860406256, - "loss": 0.0474, + "epoch": 0.32, + "learning_rate": 0.00025147705196305593, + "loss": 0.0651, "step": 50120 }, { - "epoch": 0.54, - "learning_rate": 0.00021866766175611654, - "loss": 0.0527, + "epoch": 0.32, + "learning_rate": 0.000251467370608699, + "loss": 0.063, "step": 50130 }, { - "epoch": 0.54, - "learning_rate": 0.0002186514374716075, - "loss": 0.0625, + "epoch": 0.32, + "learning_rate": 0.0002514576892543421, + "loss": 0.0668, "step": 50140 }, { - "epoch": 0.54, - "learning_rate": 0.00021863521318709844, - "loss": 0.0532, + "epoch": 0.32, + "learning_rate": 0.00025144800789998517, + "loss": 0.0661, "step": 50150 }, { - "epoch": 0.54, - "learning_rate": 0.0002186189889025894, - "loss": 0.0544, + "epoch": 0.32, + "learning_rate": 0.0002514383265456282, + "loss": 0.0735, "step": 50160 }, { - "epoch": 0.54, - "learning_rate": 0.0002186027646180803, - "loss": 0.0629, + "epoch": 0.32, + "learning_rate": 0.0002514286451912713, + "loss": 0.058, "step": 50170 }, { - "epoch": 0.54, - "learning_rate": 0.00021858654033357129, - "loss": 0.0583, + "epoch": 0.32, + "learning_rate": 0.00025141896383691436, + "loss": 0.0576, "step": 50180 }, { - "epoch": 0.54, - "learning_rate": 0.0002185703160490622, - "loss": 0.0598, + "epoch": 0.32, + "learning_rate": 0.0002514092824825574, + "loss": 0.0683, "step": 50190 }, { - "epoch": 0.54, - "learning_rate": 0.00021855409176455319, - "loss": 0.0599, + "epoch": 0.32, + "learning_rate": 0.00025139960112820046, + "loss": 0.056, "step": 50200 }, { - "epoch": 0.54, - "learning_rate": 0.0002185378674800441, - "loss": 0.0544, + "epoch": 0.32, + "learning_rate": 0.00025138991977384354, + "loss": 0.0637, "step": 50210 }, { - "epoch": 0.54, - "learning_rate": 0.00021852164319553506, - "loss": 0.0527, + "epoch": 0.32, + "learning_rate": 0.0002513802384194866, + "loss": 0.0689, "step": 50220 }, { - "epoch": 0.54, - "learning_rate": 0.000218505418911026, - "loss": 0.0548, + "epoch": 0.32, + "learning_rate": 0.00025137055706512965, + "loss": 0.0652, "step": 50230 }, { - "epoch": 0.54, - "learning_rate": 0.00021848919462651696, - "loss": 0.05, + "epoch": 0.32, + "learning_rate": 0.00025136087571077273, + "loss": 0.0631, "step": 50240 }, { - "epoch": 0.54, - "learning_rate": 0.00021847297034200788, - "loss": 0.0543, + "epoch": 0.32, + "learning_rate": 0.0002513511943564158, + "loss": 0.059, "step": 50250 }, { - "epoch": 0.54, - "learning_rate": 0.00021845674605749886, - "loss": 0.0511, + "epoch": 0.32, + "learning_rate": 0.0002513415130020589, + "loss": 0.0645, "step": 50260 }, { - "epoch": 0.54, - "learning_rate": 0.00021844052177298978, - "loss": 0.0589, + "epoch": 0.32, + "learning_rate": 0.00025133183164770197, + "loss": 0.0637, "step": 50270 }, { - "epoch": 0.54, - "learning_rate": 0.00021842429748848076, - "loss": 0.0582, + "epoch": 0.32, + "learning_rate": 0.00025132215029334505, + "loss": 0.0662, "step": 50280 }, { - "epoch": 0.54, - "learning_rate": 0.00021840807320397168, - "loss": 0.0559, - "step": 50290 + "epoch": 0.32, + "learning_rate": 0.00025131246893898807, + "loss": 0.0668, + "step": 50290 }, { - "epoch": 0.54, - "learning_rate": 0.00021839184891946263, - "loss": 0.0493, + "epoch": 0.32, + "learning_rate": 0.00025130278758463115, + "loss": 0.0601, "step": 50300 }, { - "epoch": 0.54, - "learning_rate": 0.00021837562463495358, - "loss": 0.0572, + "epoch": 0.32, + "learning_rate": 0.00025129310623027423, + "loss": 0.0634, "step": 50310 }, { - "epoch": 0.54, - "learning_rate": 0.00021835940035044453, - "loss": 0.0536, + "epoch": 0.32, + "learning_rate": 0.00025128342487591726, + "loss": 0.0582, "step": 50320 }, { - "epoch": 0.54, - "learning_rate": 0.00021834317606593548, - "loss": 0.0548, + "epoch": 0.32, + "learning_rate": 0.00025127374352156034, + "loss": 0.0703, "step": 50330 }, { - "epoch": 0.54, - "learning_rate": 0.00021832695178142643, - "loss": 0.0565, + "epoch": 0.32, + "learning_rate": 0.0002512640621672034, + "loss": 0.061, "step": 50340 }, { - "epoch": 0.54, - "learning_rate": 0.00021831072749691735, - "loss": 0.058, + "epoch": 0.32, + "learning_rate": 0.0002512543808128465, + "loss": 0.0616, "step": 50350 }, { - "epoch": 0.54, - "learning_rate": 0.00021829450321240833, - "loss": 0.0629, + "epoch": 0.33, + "learning_rate": 0.0002512446994584896, + "loss": 0.0611, "step": 50360 }, { - "epoch": 0.54, - "learning_rate": 0.00021827827892789925, - "loss": 0.0546, + "epoch": 0.33, + "learning_rate": 0.0002512350181041326, + "loss": 0.0572, "step": 50370 }, { - "epoch": 0.54, - "learning_rate": 0.00021826205464339023, - "loss": 0.0524, + "epoch": 0.33, + "learning_rate": 0.0002512253367497757, + "loss": 0.0607, "step": 50380 }, { - "epoch": 0.55, - "learning_rate": 0.00021824583035888115, - "loss": 0.0672, + "epoch": 0.33, + "learning_rate": 0.00025121565539541876, + "loss": 0.0632, "step": 50390 }, { - "epoch": 0.55, - "learning_rate": 0.0002182296060743721, - "loss": 0.0599, + "epoch": 0.33, + "learning_rate": 0.00025120597404106184, + "loss": 0.0669, "step": 50400 }, { - "epoch": 0.55, - "learning_rate": 0.00021821338178986305, - "loss": 0.0578, + "epoch": 0.33, + "learning_rate": 0.0002511962926867049, + "loss": 0.0575, "step": 50410 }, { - "epoch": 0.55, - "learning_rate": 0.000218197157505354, - "loss": 0.0625, + "epoch": 0.33, + "learning_rate": 0.000251186611332348, + "loss": 0.0697, "step": 50420 }, { - "epoch": 0.55, - "learning_rate": 0.00021818093322084492, - "loss": 0.0603, + "epoch": 0.33, + "learning_rate": 0.00025117692997799103, + "loss": 0.0564, "step": 50430 }, { - "epoch": 0.55, - "learning_rate": 0.0002181647089363359, - "loss": 0.0577, + "epoch": 0.33, + "learning_rate": 0.0002511672486236341, + "loss": 0.0661, "step": 50440 }, { - "epoch": 0.55, - "learning_rate": 0.00021814848465182682, - "loss": 0.0555, + "epoch": 0.33, + "learning_rate": 0.0002511575672692772, + "loss": 0.0575, "step": 50450 }, { - "epoch": 0.55, - "learning_rate": 0.0002181322603673178, - "loss": 0.0726, + "epoch": 0.33, + "learning_rate": 0.0002511478859149202, + "loss": 0.0548, "step": 50460 }, { - "epoch": 0.55, - "learning_rate": 0.00021811603608280872, - "loss": 0.0569, + "epoch": 0.33, + "learning_rate": 0.0002511382045605633, + "loss": 0.0705, "step": 50470 }, { - "epoch": 0.55, - "learning_rate": 0.00021809981179829967, - "loss": 0.0589, + "epoch": 0.33, + "learning_rate": 0.00025112852320620637, + "loss": 0.0636, "step": 50480 }, { - "epoch": 0.55, - "learning_rate": 0.00021808358751379062, - "loss": 0.0564, + "epoch": 0.33, + "learning_rate": 0.00025111884185184945, + "loss": 0.065, "step": 50490 }, { - "epoch": 0.55, - "learning_rate": 0.00021806736322928157, - "loss": 0.0561, + "epoch": 0.33, + "learning_rate": 0.00025110916049749253, + "loss": 0.0564, "step": 50500 }, { - "epoch": 0.55, - "learning_rate": 0.00021805113894477252, - "loss": 0.0672, + "epoch": 0.33, + "learning_rate": 0.00025109947914313556, + "loss": 0.068, "step": 50510 }, { - "epoch": 0.55, - "learning_rate": 0.00021803491466026347, - "loss": 0.0562, + "epoch": 0.33, + "learning_rate": 0.00025108979778877864, + "loss": 0.0638, "step": 50520 }, { - "epoch": 0.55, - "learning_rate": 0.0002180186903757544, - "loss": 0.0622, + "epoch": 0.33, + "learning_rate": 0.0002510801164344217, + "loss": 0.0649, "step": 50530 }, { - "epoch": 0.55, - "learning_rate": 0.00021800246609124537, - "loss": 0.0637, + "epoch": 0.33, + "learning_rate": 0.0002510704350800648, + "loss": 0.059, "step": 50540 }, { - "epoch": 0.55, - "learning_rate": 0.0002179862418067363, - "loss": 0.0528, + "epoch": 0.33, + "learning_rate": 0.0002510607537257079, + "loss": 0.0582, "step": 50550 }, { - "epoch": 0.55, - "learning_rate": 0.00021797001752222727, - "loss": 0.0637, + "epoch": 0.33, + "learning_rate": 0.0002510510723713509, + "loss": 0.0571, "step": 50560 }, { - "epoch": 0.55, - "learning_rate": 0.0002179537932377182, - "loss": 0.0683, + "epoch": 0.33, + "learning_rate": 0.000251041391016994, + "loss": 0.0545, "step": 50570 }, { - "epoch": 0.55, - "learning_rate": 0.00021793756895320914, - "loss": 0.0613, + "epoch": 0.33, + "learning_rate": 0.00025103170966263706, + "loss": 0.0661, "step": 50580 }, { - "epoch": 0.55, - "learning_rate": 0.0002179213446687001, - "loss": 0.0576, + "epoch": 0.33, + "learning_rate": 0.0002510220283082801, + "loss": 0.0638, "step": 50590 }, { - "epoch": 0.55, - "learning_rate": 0.00021790512038419104, - "loss": 0.0521, + "epoch": 0.33, + "learning_rate": 0.00025101234695392317, + "loss": 0.056, "step": 50600 }, { - "epoch": 0.55, - "learning_rate": 0.00021788889609968196, - "loss": 0.0604, + "epoch": 0.33, + "learning_rate": 0.00025100266559956625, + "loss": 0.0667, "step": 50610 }, { - "epoch": 0.55, - "learning_rate": 0.00021787267181517294, - "loss": 0.0625, + "epoch": 0.33, + "learning_rate": 0.0002509929842452093, + "loss": 0.0644, "step": 50620 }, { - "epoch": 0.55, - "learning_rate": 0.00021785644753066386, - "loss": 0.0606, + "epoch": 0.33, + "learning_rate": 0.0002509833028908524, + "loss": 0.0611, "step": 50630 }, { - "epoch": 0.55, - "learning_rate": 0.00021784022324615484, - "loss": 0.0564, + "epoch": 0.33, + "learning_rate": 0.0002509736215364955, + "loss": 0.061, "step": 50640 }, { - "epoch": 0.55, - "learning_rate": 0.00021782399896164576, - "loss": 0.0565, + "epoch": 0.33, + "learning_rate": 0.0002509639401821385, + "loss": 0.0659, "step": 50650 }, { - "epoch": 0.55, - "learning_rate": 0.0002178077746771367, - "loss": 0.0625, + "epoch": 0.33, + "learning_rate": 0.0002509542588277816, + "loss": 0.0656, "step": 50660 }, { - "epoch": 0.55, - "learning_rate": 0.00021779155039262766, - "loss": 0.0614, + "epoch": 0.33, + "learning_rate": 0.00025094457747342467, + "loss": 0.0627, "step": 50670 }, { - "epoch": 0.55, - "learning_rate": 0.0002177753261081186, - "loss": 0.0548, + "epoch": 0.33, + "learning_rate": 0.00025093489611906775, + "loss": 0.062, "step": 50680 }, { - "epoch": 0.55, - "learning_rate": 0.00021775910182360956, - "loss": 0.0614, + "epoch": 0.33, + "learning_rate": 0.0002509252147647108, + "loss": 0.0613, "step": 50690 }, { - "epoch": 0.55, - "learning_rate": 0.0002177428775391005, - "loss": 0.0572, + "epoch": 0.33, + "learning_rate": 0.00025091553341035386, + "loss": 0.065, "step": 50700 }, { - "epoch": 0.55, - "learning_rate": 0.00021772665325459143, - "loss": 0.0518, + "epoch": 0.33, + "learning_rate": 0.00025090585205599694, + "loss": 0.0651, "step": 50710 }, { - "epoch": 0.55, - "learning_rate": 0.0002177104289700824, - "loss": 0.0572, + "epoch": 0.33, + "learning_rate": 0.00025089617070163996, + "loss": 0.0655, "step": 50720 }, { - "epoch": 0.55, - "learning_rate": 0.00021769420468557333, - "loss": 0.0615, + "epoch": 0.33, + "learning_rate": 0.00025088648934728304, + "loss": 0.0596, "step": 50730 }, { - "epoch": 0.55, - "learning_rate": 0.0002176779804010643, - "loss": 0.0517, + "epoch": 0.33, + "learning_rate": 0.0002508768079929261, + "loss": 0.0735, "step": 50740 }, { - "epoch": 0.55, - "learning_rate": 0.00021766175611655523, - "loss": 0.0688, + "epoch": 0.33, + "learning_rate": 0.0002508671266385692, + "loss": 0.0616, "step": 50750 }, { - "epoch": 0.55, - "learning_rate": 0.00021764553183204618, - "loss": 0.0614, + "epoch": 0.33, + "learning_rate": 0.0002508574452842123, + "loss": 0.0613, "step": 50760 }, { - "epoch": 0.55, - "learning_rate": 0.00021762930754753713, - "loss": 0.0529, + "epoch": 0.33, + "learning_rate": 0.00025084776392985536, + "loss": 0.0579, "step": 50770 }, { - "epoch": 0.55, - "learning_rate": 0.00021761308326302808, - "loss": 0.0558, + "epoch": 0.33, + "learning_rate": 0.00025083808257549844, + "loss": 0.0551, "step": 50780 }, { - "epoch": 0.55, - "learning_rate": 0.000217596858978519, - "loss": 0.0581, + "epoch": 0.33, + "learning_rate": 0.00025082840122114147, + "loss": 0.0683, "step": 50790 }, { - "epoch": 0.55, - "learning_rate": 0.00021758063469400998, - "loss": 0.0574, + "epoch": 0.33, + "learning_rate": 0.00025081871986678455, + "loss": 0.0612, "step": 50800 }, { - "epoch": 0.55, - "learning_rate": 0.0002175644104095009, - "loss": 0.0669, + "epoch": 0.33, + "learning_rate": 0.0002508090385124276, + "loss": 0.0648, "step": 50810 }, { - "epoch": 0.55, - "learning_rate": 0.00021754818612499188, - "loss": 0.0532, + "epoch": 0.33, + "learning_rate": 0.0002507993571580707, + "loss": 0.0672, "step": 50820 }, { - "epoch": 0.55, - "learning_rate": 0.0002175319618404828, - "loss": 0.0628, + "epoch": 0.33, + "learning_rate": 0.00025078967580371373, + "loss": 0.0621, "step": 50830 }, { - "epoch": 0.55, - "learning_rate": 0.00021751573755597378, - "loss": 0.0557, + "epoch": 0.33, + "learning_rate": 0.0002507799944493568, + "loss": 0.0627, "step": 50840 }, { - "epoch": 0.55, - "learning_rate": 0.0002174995132714647, - "loss": 0.0582, + "epoch": 0.33, + "learning_rate": 0.0002507703130949999, + "loss": 0.0631, "step": 50850 }, { - "epoch": 0.55, - "learning_rate": 0.00021748328898695565, - "loss": 0.0637, + "epoch": 0.33, + "learning_rate": 0.0002507606317406429, + "loss": 0.0646, "step": 50860 }, { - "epoch": 0.55, - "learning_rate": 0.0002174670647024466, - "loss": 0.0548, + "epoch": 0.33, + "learning_rate": 0.000250750950386286, + "loss": 0.057, "step": 50870 }, { - "epoch": 0.55, - "learning_rate": 0.00021745084041793755, - "loss": 0.0516, + "epoch": 0.33, + "learning_rate": 0.0002507412690319291, + "loss": 0.0646, "step": 50880 }, { - "epoch": 0.55, - "learning_rate": 0.00021743461613342848, - "loss": 0.0582, + "epoch": 0.33, + "learning_rate": 0.00025073158767757216, + "loss": 0.0665, "step": 50890 }, { - "epoch": 0.55, - "learning_rate": 0.00021741839184891945, - "loss": 0.0555, + "epoch": 0.33, + "learning_rate": 0.00025072190632321524, + "loss": 0.0632, "step": 50900 }, { - "epoch": 0.55, - "learning_rate": 0.00021740216756441038, - "loss": 0.0488, + "epoch": 0.33, + "learning_rate": 0.0002507122249688583, + "loss": 0.0647, "step": 50910 }, { - "epoch": 0.55, - "learning_rate": 0.00021738594327990135, - "loss": 0.0514, + "epoch": 0.33, + "learning_rate": 0.0002507025436145014, + "loss": 0.0592, "step": 50920 }, { - "epoch": 0.55, - "learning_rate": 0.00021736971899539228, - "loss": 0.0516, + "epoch": 0.33, + "learning_rate": 0.0002506928622601444, + "loss": 0.0751, "step": 50930 }, { - "epoch": 0.55, - "learning_rate": 0.00021735349471088322, - "loss": 0.0583, + "epoch": 0.33, + "learning_rate": 0.0002506831809057875, + "loss": 0.0639, "step": 50940 }, { - "epoch": 0.55, - "learning_rate": 0.00021733727042637417, - "loss": 0.0579, + "epoch": 0.33, + "learning_rate": 0.0002506734995514306, + "loss": 0.0594, "step": 50950 }, { - "epoch": 0.55, - "learning_rate": 0.00021732104614186512, - "loss": 0.049, + "epoch": 0.33, + "learning_rate": 0.0002506638181970736, + "loss": 0.0649, "step": 50960 }, { - "epoch": 0.55, - "learning_rate": 0.00021730482185735605, - "loss": 0.0531, + "epoch": 0.33, + "learning_rate": 0.0002506541368427167, + "loss": 0.0653, "step": 50970 }, { - "epoch": 0.55, - "learning_rate": 0.00021728859757284702, - "loss": 0.0532, + "epoch": 0.33, + "learning_rate": 0.00025064445548835977, + "loss": 0.0619, "step": 50980 }, { - "epoch": 0.55, - "learning_rate": 0.00021727237328833795, - "loss": 0.047, + "epoch": 0.33, + "learning_rate": 0.00025063477413400285, + "loss": 0.0611, "step": 50990 }, { - "epoch": 0.55, - "learning_rate": 0.00021725614900382892, - "loss": 0.0573, + "epoch": 0.33, + "learning_rate": 0.00025062509277964587, + "loss": 0.074, "step": 51000 }, { - "epoch": 0.55, - "eval_cer": 0.9212629938456482, - "eval_loss": 0.0382036492228508, - "eval_runtime": 119.2652, - "eval_samples_per_second": 16.769, - "eval_steps_per_second": 4.192, + "epoch": 0.33, + "eval_cer": 0.9201572703649306, + "eval_loss": 0.04186994954943657, + "eval_runtime": 120.029, + "eval_samples_per_second": 16.663, + "eval_steps_per_second": 4.166, "step": 51000 }, { - "epoch": 0.55, - "learning_rate": 0.00021723992471931985, - "loss": 0.0594, + "epoch": 0.33, + "learning_rate": 0.00025061541142528895, + "loss": 0.0675, "step": 51010 }, { - "epoch": 0.55, - "learning_rate": 0.00021722370043481082, - "loss": 0.0586, + "epoch": 0.33, + "learning_rate": 0.00025060573007093203, + "loss": 0.0638, "step": 51020 }, { - "epoch": 0.55, - "learning_rate": 0.00021720747615030175, - "loss": 0.0542, + "epoch": 0.33, + "learning_rate": 0.0002505960487165751, + "loss": 0.0624, "step": 51030 }, { - "epoch": 0.55, - "learning_rate": 0.0002171912518657927, - "loss": 0.0547, + "epoch": 0.33, + "learning_rate": 0.0002505863673622182, + "loss": 0.065, "step": 51040 }, { - "epoch": 0.55, - "learning_rate": 0.00021717502758128365, - "loss": 0.047, + "epoch": 0.33, + "learning_rate": 0.00025057668600786127, + "loss": 0.0603, "step": 51050 }, { - "epoch": 0.55, - "learning_rate": 0.0002171588032967746, - "loss": 0.0505, + "epoch": 0.33, + "learning_rate": 0.0002505670046535043, + "loss": 0.059, "step": 51060 }, { - "epoch": 0.55, - "learning_rate": 0.00021714257901226552, - "loss": 0.0557, + "epoch": 0.33, + "learning_rate": 0.0002505573232991474, + "loss": 0.0636, "step": 51070 }, { - "epoch": 0.55, - "learning_rate": 0.0002171263547277565, - "loss": 0.049, + "epoch": 0.33, + "learning_rate": 0.00025054764194479045, + "loss": 0.06, "step": 51080 }, { - "epoch": 0.55, - "learning_rate": 0.00021711013044324742, - "loss": 0.0565, + "epoch": 0.33, + "learning_rate": 0.0002505379605904335, + "loss": 0.0596, "step": 51090 }, { - "epoch": 0.55, - "learning_rate": 0.0002170939061587384, - "loss": 0.0563, + "epoch": 0.33, + "learning_rate": 0.00025052827923607656, + "loss": 0.0594, "step": 51100 }, { - "epoch": 0.55, - "learning_rate": 0.00021707768187422932, - "loss": 0.0475, + "epoch": 0.33, + "learning_rate": 0.00025051859788171964, + "loss": 0.0575, "step": 51110 }, { - "epoch": 0.55, - "learning_rate": 0.00021706145758972027, - "loss": 0.0643, + "epoch": 0.33, + "learning_rate": 0.0002505089165273627, + "loss": 0.0663, "step": 51120 }, { - "epoch": 0.55, - "learning_rate": 0.00021704523330521122, - "loss": 0.0556, + "epoch": 0.33, + "learning_rate": 0.0002504992351730058, + "loss": 0.0614, "step": 51130 }, { - "epoch": 0.55, - "learning_rate": 0.00021702900902070217, - "loss": 0.0583, + "epoch": 0.33, + "learning_rate": 0.0002504895538186488, + "loss": 0.0693, "step": 51140 }, { - "epoch": 0.55, - "learning_rate": 0.0002170127847361931, - "loss": 0.0505, + "epoch": 0.33, + "learning_rate": 0.0002504798724642919, + "loss": 0.0624, "step": 51150 }, { - "epoch": 0.55, - "learning_rate": 0.00021699656045168407, - "loss": 0.0573, + "epoch": 0.33, + "learning_rate": 0.000250470191109935, + "loss": 0.0651, "step": 51160 }, { - "epoch": 0.55, - "learning_rate": 0.000216980336167175, - "loss": 0.0599, + "epoch": 0.33, + "learning_rate": 0.00025046050975557806, + "loss": 0.0582, "step": 51170 }, { - "epoch": 0.55, - "learning_rate": 0.00021696411188266597, - "loss": 0.0577, + "epoch": 0.33, + "learning_rate": 0.00025045082840122114, + "loss": 0.0652, "step": 51180 }, { - "epoch": 0.55, - "learning_rate": 0.0002169478875981569, - "loss": 0.0529, + "epoch": 0.33, + "learning_rate": 0.0002504411470468642, + "loss": 0.0625, "step": 51190 }, { - "epoch": 0.55, - "learning_rate": 0.00021693166331364786, - "loss": 0.0584, + "epoch": 0.33, + "learning_rate": 0.00025043146569250725, + "loss": 0.0611, "step": 51200 }, { - "epoch": 0.55, - "learning_rate": 0.0002169154390291388, - "loss": 0.0583, + "epoch": 0.33, + "learning_rate": 0.00025042178433815033, + "loss": 0.0564, "step": 51210 }, { - "epoch": 0.55, - "learning_rate": 0.00021689921474462974, - "loss": 0.0567, + "epoch": 0.33, + "learning_rate": 0.0002504121029837934, + "loss": 0.0596, "step": 51220 }, { - "epoch": 0.55, - "learning_rate": 0.0002168829904601207, - "loss": 0.0561, + "epoch": 0.33, + "learning_rate": 0.00025040242162943643, + "loss": 0.0715, "step": 51230 }, { - "epoch": 0.55, - "learning_rate": 0.00021686676617561164, - "loss": 0.0564, + "epoch": 0.33, + "learning_rate": 0.0002503927402750795, + "loss": 0.0616, "step": 51240 }, { - "epoch": 0.55, - "learning_rate": 0.00021685054189110256, - "loss": 0.0546, + "epoch": 0.33, + "learning_rate": 0.0002503830589207226, + "loss": 0.0692, "step": 51250 }, { - "epoch": 0.55, - "learning_rate": 0.00021683431760659354, - "loss": 0.0484, + "epoch": 0.33, + "learning_rate": 0.0002503733775663657, + "loss": 0.0689, "step": 51260 }, { - "epoch": 0.55, - "learning_rate": 0.00021681809332208446, - "loss": 0.0557, + "epoch": 0.33, + "learning_rate": 0.00025036369621200875, + "loss": 0.0568, "step": 51270 }, { - "epoch": 0.55, - "learning_rate": 0.00021680186903757544, - "loss": 0.0606, + "epoch": 0.33, + "learning_rate": 0.0002503540148576518, + "loss": 0.0659, "step": 51280 }, { - "epoch": 0.55, - "learning_rate": 0.00021678564475306636, - "loss": 0.0563, + "epoch": 0.33, + "learning_rate": 0.00025034433350329486, + "loss": 0.0706, "step": 51290 }, { - "epoch": 0.55, - "learning_rate": 0.0002167694204685573, - "loss": 0.0591, + "epoch": 0.33, + "learning_rate": 0.00025033465214893794, + "loss": 0.0621, "step": 51300 }, { - "epoch": 0.55, - "learning_rate": 0.00021675319618404826, - "loss": 0.0523, + "epoch": 0.33, + "learning_rate": 0.000250324970794581, + "loss": 0.0577, "step": 51310 }, { - "epoch": 0.56, - "learning_rate": 0.0002167369718995392, - "loss": 0.0535, + "epoch": 0.33, + "learning_rate": 0.0002503152894402241, + "loss": 0.0581, "step": 51320 }, { - "epoch": 0.56, - "learning_rate": 0.00021672074761503013, - "loss": 0.0543, + "epoch": 0.33, + "learning_rate": 0.0002503056080858671, + "loss": 0.0585, "step": 51330 }, { - "epoch": 0.56, - "learning_rate": 0.0002167045233305211, - "loss": 0.0583, + "epoch": 0.33, + "learning_rate": 0.0002502959267315102, + "loss": 0.0574, "step": 51340 }, { - "epoch": 0.56, - "learning_rate": 0.00021668829904601203, - "loss": 0.0521, + "epoch": 0.33, + "learning_rate": 0.0002502862453771533, + "loss": 0.0698, "step": 51350 }, { - "epoch": 0.56, - "learning_rate": 0.000216672074761503, - "loss": 0.0516, + "epoch": 0.33, + "learning_rate": 0.0002502765640227963, + "loss": 0.0624, "step": 51360 }, { - "epoch": 0.56, - "learning_rate": 0.00021665585047699393, - "loss": 0.0515, + "epoch": 0.33, + "learning_rate": 0.0002502668826684394, + "loss": 0.0607, "step": 51370 }, { - "epoch": 0.56, - "learning_rate": 0.0002166396261924849, - "loss": 0.0524, + "epoch": 0.33, + "learning_rate": 0.00025025720131408247, + "loss": 0.0629, "step": 51380 }, { - "epoch": 0.56, - "learning_rate": 0.00021662340190797583, - "loss": 0.0547, + "epoch": 0.33, + "learning_rate": 0.00025024751995972555, + "loss": 0.0582, "step": 51390 }, { - "epoch": 0.56, - "learning_rate": 0.00021660717762346678, - "loss": 0.0517, + "epoch": 0.33, + "learning_rate": 0.00025023783860536863, + "loss": 0.0712, "step": 51400 }, { - "epoch": 0.56, - "learning_rate": 0.00021659095333895773, - "loss": 0.055, + "epoch": 0.33, + "learning_rate": 0.0002502281572510117, + "loss": 0.0763, "step": 51410 }, { - "epoch": 0.56, - "learning_rate": 0.00021657472905444868, - "loss": 0.0505, + "epoch": 0.33, + "learning_rate": 0.00025021847589665473, + "loss": 0.063, "step": 51420 }, { - "epoch": 0.56, - "learning_rate": 0.0002165585047699396, - "loss": 0.0704, + "epoch": 0.33, + "learning_rate": 0.0002502087945422978, + "loss": 0.0688, "step": 51430 }, { - "epoch": 0.56, - "learning_rate": 0.00021654228048543058, - "loss": 0.0604, + "epoch": 0.33, + "learning_rate": 0.0002501991131879409, + "loss": 0.062, "step": 51440 }, { - "epoch": 0.56, - "learning_rate": 0.0002165260562009215, - "loss": 0.0572, + "epoch": 0.33, + "learning_rate": 0.000250189431833584, + "loss": 0.0583, "step": 51450 }, { - "epoch": 0.56, - "learning_rate": 0.00021650983191641248, - "loss": 0.0518, + "epoch": 0.33, + "learning_rate": 0.000250179750479227, + "loss": 0.0603, "step": 51460 }, { - "epoch": 0.56, - "learning_rate": 0.0002164936076319034, - "loss": 0.0526, + "epoch": 0.33, + "learning_rate": 0.0002501700691248701, + "loss": 0.0642, "step": 51470 }, { - "epoch": 0.56, - "learning_rate": 0.00021647738334739435, - "loss": 0.0596, + "epoch": 0.33, + "learning_rate": 0.00025016038777051316, + "loss": 0.0559, "step": 51480 }, { - "epoch": 0.56, - "learning_rate": 0.0002164611590628853, - "loss": 0.0522, + "epoch": 0.33, + "learning_rate": 0.0002501507064161562, + "loss": 0.0589, "step": 51490 }, { - "epoch": 0.56, - "learning_rate": 0.00021644493477837625, - "loss": 0.0545, + "epoch": 0.33, + "learning_rate": 0.00025014102506179926, + "loss": 0.0579, "step": 51500 }, { - "epoch": 0.56, - "learning_rate": 0.0002164287104938672, - "loss": 0.0546, + "epoch": 0.33, + "learning_rate": 0.00025013134370744234, + "loss": 0.07, "step": 51510 }, { - "epoch": 0.56, - "learning_rate": 0.00021641248620935815, - "loss": 0.0465, + "epoch": 0.33, + "learning_rate": 0.0002501216623530854, + "loss": 0.0624, "step": 51520 }, { - "epoch": 0.56, - "learning_rate": 0.00021639626192484907, - "loss": 0.0576, + "epoch": 0.33, + "learning_rate": 0.0002501119809987285, + "loss": 0.0623, "step": 51530 }, { - "epoch": 0.56, - "learning_rate": 0.00021638003764034005, - "loss": 0.0598, + "epoch": 0.33, + "learning_rate": 0.0002501022996443716, + "loss": 0.0615, "step": 51540 }, { - "epoch": 0.56, - "learning_rate": 0.00021636381335583097, - "loss": 0.0567, + "epoch": 0.33, + "learning_rate": 0.00025009261829001466, + "loss": 0.0666, "step": 51550 }, { - "epoch": 0.56, - "learning_rate": 0.00021634758907132195, - "loss": 0.0585, - "step": 51560 + "epoch": 0.33, + "learning_rate": 0.0002500829369356577, + "loss": 0.0566, + "step": 51560 }, { - "epoch": 0.56, - "learning_rate": 0.00021633136478681287, - "loss": 0.0471, + "epoch": 0.33, + "learning_rate": 0.00025007325558130077, + "loss": 0.0629, "step": 51570 }, { - "epoch": 0.56, - "learning_rate": 0.00021631514050230382, - "loss": 0.0538, + "epoch": 0.33, + "learning_rate": 0.00025006357422694385, + "loss": 0.0574, "step": 51580 }, { - "epoch": 0.56, - "learning_rate": 0.00021629891621779477, - "loss": 0.0498, + "epoch": 0.33, + "learning_rate": 0.00025005389287258693, + "loss": 0.0648, "step": 51590 }, { - "epoch": 0.56, - "learning_rate": 0.00021628269193328572, - "loss": 0.0595, + "epoch": 0.33, + "learning_rate": 0.00025004421151822995, + "loss": 0.0571, "step": 51600 }, { - "epoch": 0.56, - "learning_rate": 0.00021626646764877664, - "loss": 0.0536, + "epoch": 0.33, + "learning_rate": 0.00025003453016387303, + "loss": 0.0684, "step": 51610 }, { - "epoch": 0.56, - "learning_rate": 0.00021625024336426762, - "loss": 0.0609, + "epoch": 0.33, + "learning_rate": 0.0002500248488095161, + "loss": 0.0597, "step": 51620 }, { - "epoch": 0.56, - "learning_rate": 0.00021623401907975857, - "loss": 0.0572, + "epoch": 0.33, + "learning_rate": 0.00025001516745515914, + "loss": 0.058, "step": 51630 }, { - "epoch": 0.56, - "learning_rate": 0.00021621779479524952, - "loss": 0.0614, + "epoch": 0.33, + "learning_rate": 0.0002500054861008022, + "loss": 0.0705, "step": 51640 }, { - "epoch": 0.56, - "learning_rate": 0.00021620157051074047, - "loss": 0.0594, + "epoch": 0.33, + "learning_rate": 0.0002499958047464453, + "loss": 0.0575, "step": 51650 }, { - "epoch": 0.56, - "learning_rate": 0.0002161853462262314, - "loss": 0.0534, + "epoch": 0.33, + "learning_rate": 0.0002499861233920884, + "loss": 0.0678, "step": 51660 }, { - "epoch": 0.56, - "learning_rate": 0.00021616912194172237, - "loss": 0.0588, + "epoch": 0.33, + "learning_rate": 0.00024997644203773146, + "loss": 0.0749, "step": 51670 }, { - "epoch": 0.56, - "learning_rate": 0.0002161528976572133, - "loss": 0.0488, + "epoch": 0.33, + "learning_rate": 0.00024996676068337454, + "loss": 0.0607, "step": 51680 }, { - "epoch": 0.56, - "learning_rate": 0.00021613667337270427, - "loss": 0.0488, + "epoch": 0.33, + "learning_rate": 0.00024995707932901756, + "loss": 0.0674, "step": 51690 }, { - "epoch": 0.56, - "learning_rate": 0.0002161204490881952, - "loss": 0.0566, + "epoch": 0.33, + "learning_rate": 0.00024994739797466064, + "loss": 0.0631, "step": 51700 }, { - "epoch": 0.56, - "learning_rate": 0.00021610422480368617, - "loss": 0.0564, + "epoch": 0.33, + "learning_rate": 0.0002499377166203037, + "loss": 0.0595, "step": 51710 }, { - "epoch": 0.56, - "learning_rate": 0.0002160880005191771, - "loss": 0.0598, + "epoch": 0.33, + "learning_rate": 0.0002499280352659468, + "loss": 0.0622, "step": 51720 }, { - "epoch": 0.56, - "learning_rate": 0.00021607177623466804, - "loss": 0.0521, + "epoch": 0.33, + "learning_rate": 0.00024991835391158983, + "loss": 0.0632, "step": 51730 }, { - "epoch": 0.56, - "learning_rate": 0.000216055551950159, - "loss": 0.0562, + "epoch": 0.33, + "learning_rate": 0.0002499086725572329, + "loss": 0.0603, "step": 51740 }, { - "epoch": 0.56, - "learning_rate": 0.00021603932766564994, - "loss": 0.058, + "epoch": 0.33, + "learning_rate": 0.000249898991202876, + "loss": 0.065, "step": 51750 }, { - "epoch": 0.56, - "learning_rate": 0.00021602310338114086, - "loss": 0.0595, + "epoch": 0.33, + "learning_rate": 0.000249889309848519, + "loss": 0.0608, "step": 51760 }, { - "epoch": 0.56, - "learning_rate": 0.00021600687909663184, - "loss": 0.0577, + "epoch": 0.33, + "learning_rate": 0.0002498796284941621, + "loss": 0.0613, "step": 51770 }, { - "epoch": 0.56, - "learning_rate": 0.00021599065481212276, - "loss": 0.0572, + "epoch": 0.33, + "learning_rate": 0.00024986994713980517, + "loss": 0.0627, "step": 51780 }, { - "epoch": 0.56, - "learning_rate": 0.00021597443052761374, - "loss": 0.0602, + "epoch": 0.33, + "learning_rate": 0.00024986026578544825, + "loss": 0.0622, "step": 51790 }, { - "epoch": 0.56, - "learning_rate": 0.00021595820624310466, - "loss": 0.0557, + "epoch": 0.33, + "learning_rate": 0.00024985058443109133, + "loss": 0.07, "step": 51800 }, { - "epoch": 0.56, - "learning_rate": 0.0002159419819585956, - "loss": 0.0521, + "epoch": 0.33, + "learning_rate": 0.0002498409030767344, + "loss": 0.0534, "step": 51810 }, { - "epoch": 0.56, - "learning_rate": 0.00021592575767408656, - "loss": 0.0516, + "epoch": 0.33, + "learning_rate": 0.0002498312217223775, + "loss": 0.0588, "step": 51820 }, { - "epoch": 0.56, - "learning_rate": 0.0002159095333895775, - "loss": 0.05, + "epoch": 0.33, + "learning_rate": 0.0002498215403680205, + "loss": 0.0647, "step": 51830 }, { - "epoch": 0.56, - "learning_rate": 0.00021589330910506843, - "loss": 0.0567, + "epoch": 0.33, + "learning_rate": 0.0002498118590136636, + "loss": 0.0699, "step": 51840 }, { - "epoch": 0.56, - "learning_rate": 0.0002158770848205594, - "loss": 0.0594, + "epoch": 0.33, + "learning_rate": 0.0002498021776593067, + "loss": 0.0678, "step": 51850 }, { - "epoch": 0.56, - "learning_rate": 0.00021586086053605033, - "loss": 0.0523, + "epoch": 0.33, + "learning_rate": 0.0002497924963049497, + "loss": 0.0578, "step": 51860 }, { - "epoch": 0.56, - "learning_rate": 0.0002158446362515413, - "loss": 0.0589, + "epoch": 0.33, + "learning_rate": 0.0002497828149505928, + "loss": 0.0592, "step": 51870 }, { - "epoch": 0.56, - "learning_rate": 0.00021582841196703223, - "loss": 0.0577, + "epoch": 0.33, + "learning_rate": 0.00024977313359623586, + "loss": 0.0738, "step": 51880 }, { - "epoch": 0.56, - "learning_rate": 0.0002158121876825232, - "loss": 0.0548, + "epoch": 0.33, + "learning_rate": 0.00024976345224187894, + "loss": 0.0621, "step": 51890 }, { - "epoch": 0.56, - "learning_rate": 0.00021579596339801413, - "loss": 0.0554, + "epoch": 0.33, + "learning_rate": 0.00024975377088752197, + "loss": 0.0603, "step": 51900 }, { - "epoch": 0.56, - "learning_rate": 0.00021577973911350508, - "loss": 0.0502, + "epoch": 0.34, + "learning_rate": 0.00024974408953316505, + "loss": 0.0614, "step": 51910 }, { - "epoch": 0.56, - "learning_rate": 0.00021576351482899603, - "loss": 0.0595, + "epoch": 0.34, + "learning_rate": 0.00024973440817880813, + "loss": 0.0588, "step": 51920 }, { - "epoch": 0.56, - "learning_rate": 0.00021574729054448698, - "loss": 0.057, + "epoch": 0.34, + "learning_rate": 0.0002497247268244512, + "loss": 0.0674, "step": 51930 }, { - "epoch": 0.56, - "learning_rate": 0.0002157310662599779, - "loss": 0.0492, + "epoch": 0.34, + "learning_rate": 0.0002497150454700943, + "loss": 0.0591, "step": 51940 }, { - "epoch": 0.56, - "learning_rate": 0.00021571484197546888, - "loss": 0.0599, + "epoch": 0.34, + "learning_rate": 0.00024970536411573737, + "loss": 0.0638, "step": 51950 }, { - "epoch": 0.56, - "learning_rate": 0.0002156986176909598, - "loss": 0.0705, + "epoch": 0.34, + "learning_rate": 0.00024969568276138045, + "loss": 0.0645, "step": 51960 }, { - "epoch": 0.56, - "learning_rate": 0.00021568239340645078, - "loss": 0.0587, + "epoch": 0.34, + "learning_rate": 0.00024968600140702347, + "loss": 0.0638, "step": 51970 }, { - "epoch": 0.56, - "learning_rate": 0.0002156661691219417, - "loss": 0.0496, + "epoch": 0.34, + "learning_rate": 0.00024967632005266655, + "loss": 0.0657, "step": 51980 }, { - "epoch": 0.56, - "learning_rate": 0.00021564994483743265, - "loss": 0.0636, + "epoch": 0.34, + "learning_rate": 0.00024966663869830963, + "loss": 0.0654, "step": 51990 }, { - "epoch": 0.56, - "learning_rate": 0.0002156337205529236, - "loss": 0.0569, + "epoch": 0.34, + "learning_rate": 0.00024965695734395266, + "loss": 0.0602, "step": 52000 }, { - "epoch": 0.56, - "eval_cer": 0.9214423411627714, - "eval_loss": 0.03814411908388138, - "eval_runtime": 119.3539, - "eval_samples_per_second": 16.757, - "eval_steps_per_second": 4.189, + "epoch": 0.34, + "eval_cer": 0.9201572703649306, + "eval_loss": 0.040952201932668686, + "eval_runtime": 120.0447, + "eval_samples_per_second": 16.66, + "eval_steps_per_second": 4.165, "step": 52000 }, { - "epoch": 0.56, - "learning_rate": 0.00021561749626841455, - "loss": 0.0516, + "epoch": 0.34, + "learning_rate": 0.00024964727598959574, + "loss": 0.0582, "step": 52010 }, { - "epoch": 0.56, - "learning_rate": 0.00021560127198390547, - "loss": 0.0593, + "epoch": 0.34, + "learning_rate": 0.0002496375946352388, + "loss": 0.0636, "step": 52020 }, { - "epoch": 0.56, - "learning_rate": 0.00021558504769939645, - "loss": 0.0558, + "epoch": 0.34, + "learning_rate": 0.0002496279132808819, + "loss": 0.0618, "step": 52030 }, { - "epoch": 0.56, - "learning_rate": 0.00021556882341488737, - "loss": 0.0511, + "epoch": 0.34, + "learning_rate": 0.0002496182319265249, + "loss": 0.0594, "step": 52040 }, { - "epoch": 0.56, - "learning_rate": 0.00021555259913037835, - "loss": 0.0514, + "epoch": 0.34, + "learning_rate": 0.000249608550572168, + "loss": 0.0545, "step": 52050 }, { - "epoch": 0.56, - "learning_rate": 0.00021553637484586927, - "loss": 0.0625, + "epoch": 0.34, + "learning_rate": 0.0002495988692178111, + "loss": 0.0647, "step": 52060 }, { - "epoch": 0.56, - "learning_rate": 0.00021552015056136025, - "loss": 0.0567, + "epoch": 0.34, + "learning_rate": 0.00024958918786345416, + "loss": 0.0549, "step": 52070 }, { - "epoch": 0.56, - "learning_rate": 0.00021550392627685117, - "loss": 0.0589, + "epoch": 0.34, + "learning_rate": 0.00024957950650909724, + "loss": 0.0639, "step": 52080 }, { - "epoch": 0.56, - "learning_rate": 0.00021548770199234212, - "loss": 0.054, + "epoch": 0.34, + "learning_rate": 0.0002495698251547403, + "loss": 0.0636, "step": 52090 }, { - "epoch": 0.56, - "learning_rate": 0.00021547147770783307, - "loss": 0.0573, + "epoch": 0.34, + "learning_rate": 0.00024956014380038335, + "loss": 0.0581, "step": 52100 }, { - "epoch": 0.56, - "learning_rate": 0.00021545525342332402, - "loss": 0.0528, + "epoch": 0.34, + "learning_rate": 0.0002495504624460264, + "loss": 0.0681, "step": 52110 }, { - "epoch": 0.56, - "learning_rate": 0.00021543902913881495, - "loss": 0.0503, + "epoch": 0.34, + "learning_rate": 0.0002495407810916695, + "loss": 0.059, "step": 52120 }, { - "epoch": 0.56, - "learning_rate": 0.00021542280485430592, - "loss": 0.066, + "epoch": 0.34, + "learning_rate": 0.00024953109973731253, + "loss": 0.0626, "step": 52130 }, { - "epoch": 0.56, - "learning_rate": 0.00021540658056979684, - "loss": 0.0532, + "epoch": 0.34, + "learning_rate": 0.0002495214183829556, + "loss": 0.0619, "step": 52140 }, { - "epoch": 0.56, - "learning_rate": 0.00021539035628528782, - "loss": 0.0556, + "epoch": 0.34, + "learning_rate": 0.0002495117370285987, + "loss": 0.0641, "step": 52150 }, { - "epoch": 0.56, - "learning_rate": 0.00021537413200077874, - "loss": 0.0543, + "epoch": 0.34, + "learning_rate": 0.00024950205567424177, + "loss": 0.0691, "step": 52160 }, { - "epoch": 0.56, - "learning_rate": 0.0002153579077162697, - "loss": 0.054, + "epoch": 0.34, + "learning_rate": 0.00024949237431988485, + "loss": 0.0593, "step": 52170 }, { - "epoch": 0.56, - "learning_rate": 0.00021534168343176064, - "loss": 0.0603, + "epoch": 0.34, + "learning_rate": 0.0002494826929655279, + "loss": 0.0672, "step": 52180 }, { - "epoch": 0.56, - "learning_rate": 0.0002153254591472516, - "loss": 0.0565, + "epoch": 0.34, + "learning_rate": 0.00024947301161117096, + "loss": 0.0692, "step": 52190 }, { - "epoch": 0.56, - "learning_rate": 0.00021530923486274254, - "loss": 0.0688, + "epoch": 0.34, + "learning_rate": 0.00024946333025681404, + "loss": 0.0603, "step": 52200 }, { - "epoch": 0.56, - "learning_rate": 0.0002152930105782335, - "loss": 0.0551, + "epoch": 0.34, + "learning_rate": 0.0002494536489024571, + "loss": 0.0603, "step": 52210 }, { - "epoch": 0.56, - "learning_rate": 0.00021527678629372442, - "loss": 0.0536, + "epoch": 0.34, + "learning_rate": 0.0002494439675481002, + "loss": 0.067, "step": 52220 }, { - "epoch": 0.56, - "learning_rate": 0.0002152605620092154, - "loss": 0.0684, + "epoch": 0.34, + "learning_rate": 0.0002494342861937433, + "loss": 0.0678, "step": 52230 }, { - "epoch": 0.57, - "learning_rate": 0.00021524433772470632, - "loss": 0.0524, + "epoch": 0.34, + "learning_rate": 0.0002494246048393863, + "loss": 0.0654, "step": 52240 }, { - "epoch": 0.57, - "learning_rate": 0.0002152281134401973, - "loss": 0.0532, + "epoch": 0.34, + "learning_rate": 0.0002494149234850294, + "loss": 0.0684, "step": 52250 }, { - "epoch": 0.57, - "learning_rate": 0.00021521188915568822, - "loss": 0.0561, + "epoch": 0.34, + "learning_rate": 0.0002494052421306724, + "loss": 0.0568, "step": 52260 }, { - "epoch": 0.57, - "learning_rate": 0.00021519566487117916, - "loss": 0.055, + "epoch": 0.34, + "learning_rate": 0.0002493955607763155, + "loss": 0.0671, "step": 52270 }, { - "epoch": 0.57, - "learning_rate": 0.00021517944058667011, - "loss": 0.0607, + "epoch": 0.34, + "learning_rate": 0.00024938587942195857, + "loss": 0.0662, "step": 52280 }, { - "epoch": 0.57, - "learning_rate": 0.00021516321630216106, - "loss": 0.0509, + "epoch": 0.34, + "learning_rate": 0.00024937619806760165, + "loss": 0.0617, "step": 52290 }, { - "epoch": 0.57, - "learning_rate": 0.000215146992017652, - "loss": 0.0633, + "epoch": 0.34, + "learning_rate": 0.0002493665167132447, + "loss": 0.0585, "step": 52300 }, { - "epoch": 0.57, - "learning_rate": 0.00021513076773314296, - "loss": 0.058, + "epoch": 0.34, + "learning_rate": 0.0002493568353588878, + "loss": 0.068, "step": 52310 }, { - "epoch": 0.57, - "learning_rate": 0.0002151145434486339, - "loss": 0.0549, + "epoch": 0.34, + "learning_rate": 0.00024934715400453083, + "loss": 0.0613, "step": 52320 }, { - "epoch": 0.57, - "learning_rate": 0.00021509831916412486, - "loss": 0.0497, + "epoch": 0.34, + "learning_rate": 0.0002493374726501739, + "loss": 0.0667, "step": 52330 }, { - "epoch": 0.57, - "learning_rate": 0.00021508209487961579, - "loss": 0.0589, + "epoch": 0.34, + "learning_rate": 0.000249327791295817, + "loss": 0.0623, "step": 52340 }, { - "epoch": 0.57, - "learning_rate": 0.00021506587059510674, - "loss": 0.0466, + "epoch": 0.34, + "learning_rate": 0.00024931810994146007, + "loss": 0.0634, "step": 52350 }, { - "epoch": 0.57, - "learning_rate": 0.00021504964631059769, - "loss": 0.0561, + "epoch": 0.34, + "learning_rate": 0.00024930842858710315, + "loss": 0.0579, "step": 52360 }, { - "epoch": 0.57, - "learning_rate": 0.00021503342202608864, - "loss": 0.058, + "epoch": 0.34, + "learning_rate": 0.0002492987472327462, + "loss": 0.0732, "step": 52370 }, { - "epoch": 0.57, - "learning_rate": 0.00021501719774157959, - "loss": 0.0664, + "epoch": 0.34, + "learning_rate": 0.00024928906587838926, + "loss": 0.0671, "step": 52380 }, { - "epoch": 0.57, - "learning_rate": 0.00021500097345707054, - "loss": 0.0534, + "epoch": 0.34, + "learning_rate": 0.00024927938452403234, + "loss": 0.0605, "step": 52390 }, { - "epoch": 0.57, - "learning_rate": 0.00021498474917256146, - "loss": 0.0541, + "epoch": 0.34, + "learning_rate": 0.00024926970316967536, + "loss": 0.075, "step": 52400 }, { - "epoch": 0.57, - "learning_rate": 0.00021496852488805243, - "loss": 0.0662, + "epoch": 0.34, + "learning_rate": 0.00024926002181531844, + "loss": 0.0734, "step": 52410 }, { - "epoch": 0.57, - "learning_rate": 0.00021495230060354336, - "loss": 0.0522, + "epoch": 0.34, + "learning_rate": 0.0002492503404609615, + "loss": 0.0573, "step": 52420 }, { - "epoch": 0.57, - "learning_rate": 0.00021493607631903433, - "loss": 0.0564, + "epoch": 0.34, + "learning_rate": 0.0002492406591066046, + "loss": 0.0726, "step": 52430 }, { - "epoch": 0.57, - "learning_rate": 0.00021491985203452526, - "loss": 0.0599, + "epoch": 0.34, + "learning_rate": 0.0002492309777522477, + "loss": 0.0688, "step": 52440 }, { - "epoch": 0.57, - "learning_rate": 0.0002149036277500162, - "loss": 0.053, + "epoch": 0.34, + "learning_rate": 0.00024922129639789076, + "loss": 0.0613, "step": 52450 }, { - "epoch": 0.57, - "learning_rate": 0.00021488740346550716, - "loss": 0.0476, + "epoch": 0.34, + "learning_rate": 0.0002492116150435338, + "loss": 0.0611, "step": 52460 }, { - "epoch": 0.57, - "learning_rate": 0.0002148711791809981, - "loss": 0.0512, + "epoch": 0.34, + "learning_rate": 0.00024920193368917687, + "loss": 0.0659, "step": 52470 }, { - "epoch": 0.57, - "learning_rate": 0.00021485495489648903, - "loss": 0.0569, + "epoch": 0.34, + "learning_rate": 0.00024919225233481995, + "loss": 0.0575, "step": 52480 }, { - "epoch": 0.57, - "learning_rate": 0.00021483873061198, - "loss": 0.0612, + "epoch": 0.34, + "learning_rate": 0.000249182570980463, + "loss": 0.0661, "step": 52490 }, { - "epoch": 0.57, - "learning_rate": 0.00021482250632747093, - "loss": 0.0545, + "epoch": 0.34, + "learning_rate": 0.00024917288962610605, + "loss": 0.0612, "step": 52500 }, { - "epoch": 0.57, - "learning_rate": 0.0002148062820429619, - "loss": 0.0583, + "epoch": 0.34, + "learning_rate": 0.00024916320827174913, + "loss": 0.0628, "step": 52510 }, { - "epoch": 0.57, - "learning_rate": 0.00021479005775845283, - "loss": 0.0544, + "epoch": 0.34, + "learning_rate": 0.0002491535269173922, + "loss": 0.0585, "step": 52520 }, { - "epoch": 0.57, - "learning_rate": 0.00021477383347394378, - "loss": 0.0624, + "epoch": 0.34, + "learning_rate": 0.00024914384556303524, + "loss": 0.057, "step": 52530 }, { - "epoch": 0.57, - "learning_rate": 0.00021475760918943473, - "loss": 0.0583, + "epoch": 0.34, + "learning_rate": 0.0002491341642086783, + "loss": 0.06, "step": 52540 }, { - "epoch": 0.57, - "learning_rate": 0.00021474138490492568, - "loss": 0.0533, + "epoch": 0.34, + "learning_rate": 0.0002491244828543214, + "loss": 0.0564, "step": 52550 }, { - "epoch": 0.57, - "learning_rate": 0.00021472516062041663, - "loss": 0.0571, + "epoch": 0.34, + "learning_rate": 0.0002491148014999645, + "loss": 0.0609, "step": 52560 }, { - "epoch": 0.57, - "learning_rate": 0.00021470893633590758, - "loss": 0.052, + "epoch": 0.34, + "learning_rate": 0.00024910512014560755, + "loss": 0.0643, "step": 52570 }, { - "epoch": 0.57, - "learning_rate": 0.0002146927120513985, - "loss": 0.0469, + "epoch": 0.34, + "learning_rate": 0.00024909543879125063, + "loss": 0.0581, "step": 52580 }, { - "epoch": 0.57, - "learning_rate": 0.00021467648776688948, - "loss": 0.0617, + "epoch": 0.34, + "learning_rate": 0.0002490857574368937, + "loss": 0.0524, "step": 52590 }, { - "epoch": 0.57, - "learning_rate": 0.0002146602634823804, - "loss": 0.0475, + "epoch": 0.34, + "learning_rate": 0.00024907607608253674, + "loss": 0.0565, "step": 52600 }, { - "epoch": 0.57, - "learning_rate": 0.00021464403919787138, - "loss": 0.0562, + "epoch": 0.34, + "learning_rate": 0.0002490663947281798, + "loss": 0.0687, "step": 52610 }, { - "epoch": 0.57, - "learning_rate": 0.0002146278149133623, - "loss": 0.0514, + "epoch": 0.34, + "learning_rate": 0.0002490567133738229, + "loss": 0.0582, "step": 52620 }, { - "epoch": 0.57, - "learning_rate": 0.00021461159062885325, - "loss": 0.0594, + "epoch": 0.34, + "learning_rate": 0.000249047032019466, + "loss": 0.0578, "step": 52630 }, { - "epoch": 0.57, - "learning_rate": 0.0002145953663443442, - "loss": 0.0576, + "epoch": 0.34, + "learning_rate": 0.000249037350665109, + "loss": 0.0788, "step": 52640 }, { - "epoch": 0.57, - "learning_rate": 0.00021457914205983515, - "loss": 0.055, + "epoch": 0.34, + "learning_rate": 0.0002490276693107521, + "loss": 0.063, "step": 52650 }, { - "epoch": 0.57, - "learning_rate": 0.00021456291777532607, - "loss": 0.0555, + "epoch": 0.34, + "learning_rate": 0.00024901798795639516, + "loss": 0.068, "step": 52660 }, { - "epoch": 0.57, - "learning_rate": 0.00021454669349081705, - "loss": 0.0571, + "epoch": 0.34, + "learning_rate": 0.0002490083066020382, + "loss": 0.0653, "step": 52670 }, { - "epoch": 0.57, - "learning_rate": 0.00021453046920630797, - "loss": 0.0567, + "epoch": 0.34, + "learning_rate": 0.00024899862524768127, + "loss": 0.0631, "step": 52680 }, { - "epoch": 0.57, - "learning_rate": 0.00021451424492179895, - "loss": 0.0613, + "epoch": 0.34, + "learning_rate": 0.00024898894389332435, + "loss": 0.0571, "step": 52690 }, { - "epoch": 0.57, - "learning_rate": 0.00021449802063728987, - "loss": 0.0596, + "epoch": 0.34, + "learning_rate": 0.00024897926253896743, + "loss": 0.0595, "step": 52700 }, { - "epoch": 0.57, - "learning_rate": 0.00021448179635278082, - "loss": 0.0613, + "epoch": 0.34, + "learning_rate": 0.0002489695811846105, + "loss": 0.0592, "step": 52710 }, { - "epoch": 0.57, - "learning_rate": 0.00021446557206827177, - "loss": 0.0552, + "epoch": 0.34, + "learning_rate": 0.0002489598998302536, + "loss": 0.06, "step": 52720 }, { - "epoch": 0.57, - "learning_rate": 0.00021444934778376272, - "loss": 0.0546, + "epoch": 0.34, + "learning_rate": 0.00024895021847589667, + "loss": 0.0586, "step": 52730 }, { - "epoch": 0.57, - "learning_rate": 0.00021443312349925367, - "loss": 0.0545, + "epoch": 0.34, + "learning_rate": 0.0002489405371215397, + "loss": 0.0651, "step": 52740 }, { - "epoch": 0.57, - "learning_rate": 0.00021441689921474462, - "loss": 0.0542, + "epoch": 0.34, + "learning_rate": 0.0002489308557671828, + "loss": 0.0694, "step": 52750 }, { - "epoch": 0.57, - "learning_rate": 0.00021440067493023554, - "loss": 0.0524, + "epoch": 0.34, + "learning_rate": 0.00024892117441282585, + "loss": 0.0581, "step": 52760 }, { - "epoch": 0.57, - "learning_rate": 0.00021438445064572652, - "loss": 0.0531, + "epoch": 0.34, + "learning_rate": 0.0002489114930584689, + "loss": 0.0562, "step": 52770 }, { - "epoch": 0.57, - "learning_rate": 0.00021436822636121744, - "loss": 0.0568, + "epoch": 0.34, + "learning_rate": 0.00024890181170411196, + "loss": 0.0589, "step": 52780 }, { - "epoch": 0.57, - "learning_rate": 0.00021435200207670842, - "loss": 0.0544, + "epoch": 0.34, + "learning_rate": 0.00024889213034975504, + "loss": 0.0569, "step": 52790 }, { - "epoch": 0.57, - "learning_rate": 0.00021433577779219934, - "loss": 0.0516, + "epoch": 0.34, + "learning_rate": 0.0002488824489953981, + "loss": 0.0637, "step": 52800 }, { - "epoch": 0.57, - "learning_rate": 0.0002143195535076903, - "loss": 0.0532, + "epoch": 0.34, + "learning_rate": 0.00024887276764104114, + "loss": 0.0654, "step": 52810 }, { - "epoch": 0.57, - "learning_rate": 0.00021430332922318124, - "loss": 0.0476, + "epoch": 0.34, + "learning_rate": 0.0002488630862866842, + "loss": 0.065, "step": 52820 }, { - "epoch": 0.57, - "learning_rate": 0.0002142871049386722, - "loss": 0.0543, - "step": 52830 + "epoch": 0.34, + "learning_rate": 0.0002488534049323273, + "loss": 0.0582, + "step": 52830 }, { - "epoch": 0.57, - "learning_rate": 0.0002142708806541631, - "loss": 0.0505, + "epoch": 0.34, + "learning_rate": 0.0002488437235779704, + "loss": 0.0569, "step": 52840 }, { - "epoch": 0.57, - "learning_rate": 0.0002142546563696541, - "loss": 0.0516, + "epoch": 0.34, + "learning_rate": 0.00024883404222361346, + "loss": 0.0593, "step": 52850 }, { - "epoch": 0.57, - "learning_rate": 0.000214238432085145, - "loss": 0.0554, + "epoch": 0.34, + "learning_rate": 0.00024882436086925654, + "loss": 0.0559, "step": 52860 }, { - "epoch": 0.57, - "learning_rate": 0.000214222207800636, - "loss": 0.061, + "epoch": 0.34, + "learning_rate": 0.00024881467951489957, + "loss": 0.0614, "step": 52870 }, { - "epoch": 0.57, - "learning_rate": 0.0002142059835161269, - "loss": 0.0475, + "epoch": 0.34, + "learning_rate": 0.00024880499816054265, + "loss": 0.0683, "step": 52880 }, { - "epoch": 0.57, - "learning_rate": 0.0002141897592316179, - "loss": 0.0528, + "epoch": 0.34, + "learning_rate": 0.00024879531680618573, + "loss": 0.0662, "step": 52890 }, { - "epoch": 0.57, - "learning_rate": 0.0002141735349471088, - "loss": 0.0472, + "epoch": 0.34, + "learning_rate": 0.00024878563545182875, + "loss": 0.0639, "step": 52900 }, { - "epoch": 0.57, - "learning_rate": 0.00021415731066259976, - "loss": 0.0507, + "epoch": 0.34, + "learning_rate": 0.00024877595409747183, + "loss": 0.0541, "step": 52910 }, { - "epoch": 0.57, - "learning_rate": 0.0002141410863780907, - "loss": 0.0496, + "epoch": 0.34, + "learning_rate": 0.0002487662727431149, + "loss": 0.0611, "step": 52920 }, { - "epoch": 0.57, - "learning_rate": 0.00021412486209358166, - "loss": 0.0512, + "epoch": 0.34, + "learning_rate": 0.000248756591388758, + "loss": 0.059, "step": 52930 }, { - "epoch": 0.57, - "learning_rate": 0.00021410863780907258, - "loss": 0.0577, + "epoch": 0.34, + "learning_rate": 0.0002487469100344011, + "loss": 0.0683, "step": 52940 }, { - "epoch": 0.57, - "learning_rate": 0.00021409241352456356, - "loss": 0.0522, + "epoch": 0.34, + "learning_rate": 0.0002487372286800441, + "loss": 0.053, "step": 52950 }, { - "epoch": 0.57, - "learning_rate": 0.00021407618924005448, - "loss": 0.0466, + "epoch": 0.34, + "learning_rate": 0.0002487275473256872, + "loss": 0.0587, "step": 52960 }, { - "epoch": 0.57, - "learning_rate": 0.00021405996495554546, - "loss": 0.0616, + "epoch": 0.34, + "learning_rate": 0.00024871786597133026, + "loss": 0.0614, "step": 52970 }, { - "epoch": 0.57, - "learning_rate": 0.00021404374067103638, - "loss": 0.0539, + "epoch": 0.34, + "learning_rate": 0.00024870818461697334, + "loss": 0.0611, "step": 52980 }, { - "epoch": 0.57, - "learning_rate": 0.00021402751638652733, - "loss": 0.0517, + "epoch": 0.34, + "learning_rate": 0.0002486985032626164, + "loss": 0.0595, "step": 52990 }, { - "epoch": 0.57, - "learning_rate": 0.00021401129210201828, - "loss": 0.0597, + "epoch": 0.34, + "learning_rate": 0.0002486888219082595, + "loss": 0.0672, "step": 53000 }, { - "epoch": 0.57, - "eval_cer": 0.9212497415808362, - "eval_loss": 0.038132600486278534, - "eval_runtime": 118.9435, - "eval_samples_per_second": 16.815, - "eval_steps_per_second": 4.204, + "epoch": 0.34, + "eval_cer": 0.9201590780702745, + "eval_loss": 0.041813936084508896, + "eval_runtime": 120.1824, + "eval_samples_per_second": 16.641, + "eval_steps_per_second": 4.16, "step": 53000 }, { - "epoch": 0.57, - "learning_rate": 0.00021399506781750923, - "loss": 0.0518, + "epoch": 0.34, + "learning_rate": 0.0002486791405539025, + "loss": 0.0609, "step": 53010 }, { - "epoch": 0.57, - "learning_rate": 0.00021397884353300015, - "loss": 0.0567, + "epoch": 0.34, + "learning_rate": 0.0002486694591995456, + "loss": 0.0576, "step": 53020 }, { - "epoch": 0.57, - "learning_rate": 0.00021396261924849113, - "loss": 0.0498, + "epoch": 0.34, + "learning_rate": 0.0002486597778451887, + "loss": 0.0647, "step": 53030 }, { - "epoch": 0.57, - "learning_rate": 0.00021394639496398205, - "loss": 0.0563, + "epoch": 0.34, + "learning_rate": 0.0002486500964908317, + "loss": 0.0553, "step": 53040 }, { - "epoch": 0.57, - "learning_rate": 0.00021393017067947303, - "loss": 0.0501, + "epoch": 0.34, + "learning_rate": 0.0002486404151364748, + "loss": 0.0677, "step": 53050 }, { - "epoch": 0.57, - "learning_rate": 0.00021391394639496395, - "loss": 0.0492, + "epoch": 0.34, + "learning_rate": 0.00024863073378211787, + "loss": 0.0665, "step": 53060 }, { - "epoch": 0.57, - "learning_rate": 0.00021389772211045493, - "loss": 0.0581, + "epoch": 0.34, + "learning_rate": 0.00024862105242776095, + "loss": 0.0554, "step": 53070 }, { - "epoch": 0.57, - "learning_rate": 0.00021388149782594585, - "loss": 0.052, + "epoch": 0.34, + "learning_rate": 0.00024861137107340403, + "loss": 0.0621, "step": 53080 }, { - "epoch": 0.57, - "learning_rate": 0.0002138652735414368, - "loss": 0.0548, + "epoch": 0.34, + "learning_rate": 0.00024860168971904705, + "loss": 0.0654, "step": 53090 }, { - "epoch": 0.57, - "learning_rate": 0.00021384904925692775, - "loss": 0.0609, + "epoch": 0.34, + "learning_rate": 0.00024859200836469013, + "loss": 0.0627, "step": 53100 }, { - "epoch": 0.57, - "learning_rate": 0.0002138328249724187, - "loss": 0.0613, + "epoch": 0.34, + "learning_rate": 0.0002485823270103332, + "loss": 0.0671, "step": 53110 }, { - "epoch": 0.57, - "learning_rate": 0.00021381660068790962, - "loss": 0.0548, + "epoch": 0.34, + "learning_rate": 0.0002485726456559763, + "loss": 0.0691, "step": 53120 }, { - "epoch": 0.57, - "learning_rate": 0.0002138003764034006, - "loss": 0.0525, + "epoch": 0.34, + "learning_rate": 0.00024856296430161937, + "loss": 0.06, "step": 53130 }, { - "epoch": 0.57, - "learning_rate": 0.00021378415211889152, - "loss": 0.0456, + "epoch": 0.34, + "learning_rate": 0.0002485532829472624, + "loss": 0.0622, "step": 53140 }, { - "epoch": 0.57, - "learning_rate": 0.0002137679278343825, - "loss": 0.0448, + "epoch": 0.34, + "learning_rate": 0.0002485436015929055, + "loss": 0.0616, "step": 53150 }, { - "epoch": 0.57, - "learning_rate": 0.00021375170354987342, - "loss": 0.0517, + "epoch": 0.34, + "learning_rate": 0.00024853392023854856, + "loss": 0.0606, "step": 53160 }, { - "epoch": 0.58, - "learning_rate": 0.00021373547926536437, - "loss": 0.0488, + "epoch": 0.34, + "learning_rate": 0.0002485242388841916, + "loss": 0.0595, "step": 53170 }, { - "epoch": 0.58, - "learning_rate": 0.00021371925498085532, - "loss": 0.05, + "epoch": 0.34, + "learning_rate": 0.00024851455752983466, + "loss": 0.0599, "step": 53180 }, { - "epoch": 0.58, - "learning_rate": 0.00021370303069634627, - "loss": 0.0547, + "epoch": 0.34, + "learning_rate": 0.00024850487617547774, + "loss": 0.0713, "step": 53190 }, { - "epoch": 0.58, - "learning_rate": 0.0002136868064118372, - "loss": 0.0484, + "epoch": 0.34, + "learning_rate": 0.0002484951948211208, + "loss": 0.0687, "step": 53200 }, { - "epoch": 0.58, - "learning_rate": 0.00021367058212732817, - "loss": 0.054, + "epoch": 0.34, + "learning_rate": 0.0002484855134667639, + "loss": 0.0619, "step": 53210 }, { - "epoch": 0.58, - "learning_rate": 0.0002136543578428191, - "loss": 0.0595, + "epoch": 0.34, + "learning_rate": 0.000248475832112407, + "loss": 0.0604, "step": 53220 }, { - "epoch": 0.58, - "learning_rate": 0.00021363813355831007, - "loss": 0.0536, + "epoch": 0.34, + "learning_rate": 0.00024846615075805, + "loss": 0.0609, "step": 53230 }, { - "epoch": 0.58, - "learning_rate": 0.000213621909273801, - "loss": 0.0577, + "epoch": 0.34, + "learning_rate": 0.0002484564694036931, + "loss": 0.0579, "step": 53240 }, { - "epoch": 0.58, - "learning_rate": 0.00021360568498929197, - "loss": 0.0567, + "epoch": 0.34, + "learning_rate": 0.00024844678804933617, + "loss": 0.0616, "step": 53250 }, { - "epoch": 0.58, - "learning_rate": 0.0002135894607047829, - "loss": 0.057, + "epoch": 0.34, + "learning_rate": 0.00024843710669497925, + "loss": 0.063, "step": 53260 }, { - "epoch": 0.58, - "learning_rate": 0.00021357323642027384, - "loss": 0.0488, + "epoch": 0.34, + "learning_rate": 0.0002484274253406223, + "loss": 0.0532, "step": 53270 }, { - "epoch": 0.58, - "learning_rate": 0.0002135570121357648, - "loss": 0.0505, + "epoch": 0.34, + "learning_rate": 0.00024841774398626535, + "loss": 0.0561, "step": 53280 }, { - "epoch": 0.58, - "learning_rate": 0.00021354078785125574, - "loss": 0.0561, + "epoch": 0.34, + "learning_rate": 0.00024840806263190843, + "loss": 0.0582, "step": 53290 }, { - "epoch": 0.58, - "learning_rate": 0.00021352456356674667, - "loss": 0.0484, + "epoch": 0.34, + "learning_rate": 0.00024839838127755146, + "loss": 0.0715, "step": 53300 }, { - "epoch": 0.58, - "learning_rate": 0.00021350833928223764, - "loss": 0.0584, + "epoch": 0.34, + "learning_rate": 0.00024838869992319454, + "loss": 0.0604, "step": 53310 }, { - "epoch": 0.58, - "learning_rate": 0.00021349211499772857, - "loss": 0.0574, + "epoch": 0.34, + "learning_rate": 0.0002483790185688376, + "loss": 0.063, "step": 53320 }, { - "epoch": 0.58, - "learning_rate": 0.00021347589071321954, - "loss": 0.0525, + "epoch": 0.34, + "learning_rate": 0.0002483693372144807, + "loss": 0.0607, "step": 53330 }, { - "epoch": 0.58, - "learning_rate": 0.00021345966642871047, - "loss": 0.053, + "epoch": 0.34, + "learning_rate": 0.0002483596558601238, + "loss": 0.0637, "step": 53340 }, { - "epoch": 0.58, - "learning_rate": 0.00021344344214420141, - "loss": 0.0579, + "epoch": 0.34, + "learning_rate": 0.00024834997450576686, + "loss": 0.0576, "step": 53350 }, { - "epoch": 0.58, - "learning_rate": 0.00021342721785969236, - "loss": 0.0559, + "epoch": 0.34, + "learning_rate": 0.00024834029315140994, + "loss": 0.0593, "step": 53360 }, { - "epoch": 0.58, - "learning_rate": 0.00021341099357518331, - "loss": 0.0519, + "epoch": 0.34, + "learning_rate": 0.00024833061179705296, + "loss": 0.057, "step": 53370 }, { - "epoch": 0.58, - "learning_rate": 0.00021339476929067424, - "loss": 0.0536, + "epoch": 0.34, + "learning_rate": 0.00024832093044269604, + "loss": 0.0639, "step": 53380 }, { - "epoch": 0.58, - "learning_rate": 0.00021337854500616521, - "loss": 0.055, + "epoch": 0.34, + "learning_rate": 0.0002483112490883391, + "loss": 0.0597, "step": 53390 }, { - "epoch": 0.58, - "learning_rate": 0.00021336232072165614, - "loss": 0.0653, + "epoch": 0.34, + "learning_rate": 0.0002483015677339822, + "loss": 0.0599, "step": 53400 }, { - "epoch": 0.58, - "learning_rate": 0.0002133460964371471, - "loss": 0.0539, + "epoch": 0.34, + "learning_rate": 0.00024829188637962523, + "loss": 0.0676, "step": 53410 }, { - "epoch": 0.58, - "learning_rate": 0.00021332987215263804, - "loss": 0.0566, + "epoch": 0.34, + "learning_rate": 0.0002482822050252683, + "loss": 0.0592, "step": 53420 }, { - "epoch": 0.58, - "learning_rate": 0.000213313647868129, - "loss": 0.0552, + "epoch": 0.34, + "learning_rate": 0.0002482725236709114, + "loss": 0.0688, "step": 53430 }, { - "epoch": 0.58, - "learning_rate": 0.00021329742358361994, - "loss": 0.0574, + "epoch": 0.34, + "learning_rate": 0.0002482628423165544, + "loss": 0.0701, "step": 53440 }, { - "epoch": 0.58, - "learning_rate": 0.00021328119929911089, - "loss": 0.0509, + "epoch": 0.34, + "learning_rate": 0.0002482531609621975, + "loss": 0.0662, "step": 53450 }, { - "epoch": 0.58, - "learning_rate": 0.00021326497501460184, - "loss": 0.0516, + "epoch": 0.35, + "learning_rate": 0.00024824347960784057, + "loss": 0.0562, "step": 53460 }, { - "epoch": 0.58, - "learning_rate": 0.00021324875073009278, - "loss": 0.055, + "epoch": 0.35, + "learning_rate": 0.00024823379825348365, + "loss": 0.0546, "step": 53470 }, { - "epoch": 0.58, - "learning_rate": 0.0002132325264455837, - "loss": 0.0662, + "epoch": 0.35, + "learning_rate": 0.00024822411689912673, + "loss": 0.0614, "step": 53480 }, { - "epoch": 0.58, - "learning_rate": 0.00021321630216107468, - "loss": 0.0498, + "epoch": 0.35, + "learning_rate": 0.0002482144355447698, + "loss": 0.0595, "step": 53490 }, { - "epoch": 0.58, - "learning_rate": 0.0002132000778765656, - "loss": 0.0626, + "epoch": 0.35, + "learning_rate": 0.0002482047541904129, + "loss": 0.0692, "step": 53500 }, { - "epoch": 0.58, - "learning_rate": 0.00021318385359205658, - "loss": 0.0667, + "epoch": 0.35, + "learning_rate": 0.0002481950728360559, + "loss": 0.0597, "step": 53510 }, { - "epoch": 0.58, - "learning_rate": 0.0002131676293075475, - "loss": 0.0574, + "epoch": 0.35, + "learning_rate": 0.000248185391481699, + "loss": 0.0641, "step": 53520 }, { - "epoch": 0.58, - "learning_rate": 0.00021315140502303846, - "loss": 0.055, + "epoch": 0.35, + "learning_rate": 0.0002481757101273421, + "loss": 0.0631, "step": 53530 }, { - "epoch": 0.58, - "learning_rate": 0.0002131351807385294, - "loss": 0.0575, + "epoch": 0.35, + "learning_rate": 0.0002481660287729851, + "loss": 0.0573, "step": 53540 }, { - "epoch": 0.58, - "learning_rate": 0.00021311895645402036, - "loss": 0.0543, + "epoch": 0.35, + "learning_rate": 0.0002481563474186282, + "loss": 0.0568, "step": 53550 }, { - "epoch": 0.58, - "learning_rate": 0.00021310273216951128, - "loss": 0.0521, + "epoch": 0.35, + "learning_rate": 0.00024814666606427126, + "loss": 0.0674, "step": 53560 }, { - "epoch": 0.58, - "learning_rate": 0.00021308650788500226, - "loss": 0.0457, + "epoch": 0.35, + "learning_rate": 0.00024813698470991434, + "loss": 0.065, "step": 53570 }, { - "epoch": 0.58, - "learning_rate": 0.00021307028360049318, - "loss": 0.0477, + "epoch": 0.35, + "learning_rate": 0.00024812730335555737, + "loss": 0.0566, "step": 53580 }, { - "epoch": 0.58, - "learning_rate": 0.00021305405931598416, - "loss": 0.0499, + "epoch": 0.35, + "learning_rate": 0.00024811762200120045, + "loss": 0.0597, "step": 53590 }, { - "epoch": 0.58, - "learning_rate": 0.00021303783503147508, - "loss": 0.0511, + "epoch": 0.35, + "learning_rate": 0.0002481079406468435, + "loss": 0.0627, "step": 53600 }, { - "epoch": 0.58, - "learning_rate": 0.00021302161074696605, - "loss": 0.0473, + "epoch": 0.35, + "learning_rate": 0.0002480982592924866, + "loss": 0.0641, "step": 53610 }, { - "epoch": 0.58, - "learning_rate": 0.00021300538646245698, - "loss": 0.0498, + "epoch": 0.35, + "learning_rate": 0.0002480885779381297, + "loss": 0.0587, "step": 53620 }, { - "epoch": 0.58, - "learning_rate": 0.00021298916217794793, - "loss": 0.0516, + "epoch": 0.35, + "learning_rate": 0.00024807889658377277, + "loss": 0.0661, "step": 53630 }, { - "epoch": 0.58, - "learning_rate": 0.00021297293789343888, - "loss": 0.0517, + "epoch": 0.35, + "learning_rate": 0.0002480692152294158, + "loss": 0.0667, "step": 53640 }, { - "epoch": 0.58, - "learning_rate": 0.00021295671360892983, - "loss": 0.0554, + "epoch": 0.35, + "learning_rate": 0.00024805953387505887, + "loss": 0.0653, "step": 53650 }, { - "epoch": 0.58, - "learning_rate": 0.00021294048932442075, - "loss": 0.0492, + "epoch": 0.35, + "learning_rate": 0.00024804985252070195, + "loss": 0.0643, "step": 53660 }, { - "epoch": 0.58, - "learning_rate": 0.00021292426503991173, - "loss": 0.0542, + "epoch": 0.35, + "learning_rate": 0.000248040171166345, + "loss": 0.0702, "step": 53670 }, { - "epoch": 0.58, - "learning_rate": 0.00021290804075540265, - "loss": 0.0632, + "epoch": 0.35, + "learning_rate": 0.00024803048981198806, + "loss": 0.0675, "step": 53680 }, { - "epoch": 0.58, - "learning_rate": 0.00021289181647089363, - "loss": 0.0632, + "epoch": 0.35, + "learning_rate": 0.00024802080845763114, + "loss": 0.0685, "step": 53690 }, { - "epoch": 0.58, - "learning_rate": 0.00021287559218638455, - "loss": 0.0544, + "epoch": 0.35, + "learning_rate": 0.0002480111271032742, + "loss": 0.0707, "step": 53700 }, { - "epoch": 0.58, - "learning_rate": 0.0002128593679018755, - "loss": 0.0576, + "epoch": 0.35, + "learning_rate": 0.0002480014457489173, + "loss": 0.0573, "step": 53710 }, { - "epoch": 0.58, - "learning_rate": 0.00021284314361736645, - "loss": 0.0595, + "epoch": 0.35, + "learning_rate": 0.0002479917643945603, + "loss": 0.0641, "step": 53720 }, { - "epoch": 0.58, - "learning_rate": 0.0002128269193328574, - "loss": 0.0531, + "epoch": 0.35, + "learning_rate": 0.0002479820830402034, + "loss": 0.0652, "step": 53730 }, { - "epoch": 0.58, - "learning_rate": 0.00021281069504834835, - "loss": 0.0577, + "epoch": 0.35, + "learning_rate": 0.0002479724016858465, + "loss": 0.0592, "step": 53740 }, { - "epoch": 0.58, - "learning_rate": 0.0002127944707638393, - "loss": 0.0589, + "epoch": 0.35, + "learning_rate": 0.00024796272033148956, + "loss": 0.0588, "step": 53750 }, { - "epoch": 0.58, - "learning_rate": 0.00021277824647933022, - "loss": 0.0576, + "epoch": 0.35, + "learning_rate": 0.00024795303897713264, + "loss": 0.0608, "step": 53760 }, { - "epoch": 0.58, - "learning_rate": 0.0002127620221948212, - "loss": 0.054, + "epoch": 0.35, + "learning_rate": 0.0002479433576227757, + "loss": 0.0579, "step": 53770 }, { - "epoch": 0.58, - "learning_rate": 0.00021274579791031212, - "loss": 0.0479, + "epoch": 0.35, + "learning_rate": 0.00024793367626841875, + "loss": 0.0632, "step": 53780 }, { - "epoch": 0.58, - "learning_rate": 0.0002127295736258031, - "loss": 0.0527, + "epoch": 0.35, + "learning_rate": 0.0002479239949140618, + "loss": 0.0566, "step": 53790 }, { - "epoch": 0.58, - "learning_rate": 0.00021271334934129402, - "loss": 0.0533, + "epoch": 0.35, + "learning_rate": 0.0002479143135597049, + "loss": 0.0641, "step": 53800 }, { - "epoch": 0.58, - "learning_rate": 0.00021269712505678497, - "loss": 0.0472, + "epoch": 0.35, + "learning_rate": 0.00024790463220534793, + "loss": 0.0738, "step": 53810 }, { - "epoch": 0.58, - "learning_rate": 0.00021268090077227592, - "loss": 0.0498, + "epoch": 0.35, + "learning_rate": 0.000247894950850991, + "loss": 0.0672, "step": 53820 }, { - "epoch": 0.58, - "learning_rate": 0.00021266467648776687, - "loss": 0.055, + "epoch": 0.35, + "learning_rate": 0.0002478852694966341, + "loss": 0.061, "step": 53830 }, { - "epoch": 0.58, - "learning_rate": 0.0002126484522032578, - "loss": 0.0568, + "epoch": 0.35, + "learning_rate": 0.00024787558814227717, + "loss": 0.0635, "step": 53840 }, { - "epoch": 0.58, - "learning_rate": 0.00021263222791874877, - "loss": 0.0622, + "epoch": 0.35, + "learning_rate": 0.00024786590678792025, + "loss": 0.0609, "step": 53850 }, { - "epoch": 0.58, - "learning_rate": 0.0002126160036342397, - "loss": 0.0619, + "epoch": 0.35, + "learning_rate": 0.0002478562254335633, + "loss": 0.0658, "step": 53860 }, { - "epoch": 0.58, - "learning_rate": 0.00021259977934973067, - "loss": 0.0611, + "epoch": 0.35, + "learning_rate": 0.00024784654407920636, + "loss": 0.0699, "step": 53870 }, { - "epoch": 0.58, - "learning_rate": 0.0002125835550652216, - "loss": 0.0559, + "epoch": 0.35, + "learning_rate": 0.00024783686272484944, + "loss": 0.0606, "step": 53880 }, { - "epoch": 0.58, - "learning_rate": 0.00021256733078071254, - "loss": 0.0603, + "epoch": 0.35, + "learning_rate": 0.0002478271813704925, + "loss": 0.0643, "step": 53890 }, { - "epoch": 0.58, - "learning_rate": 0.0002125511064962035, - "loss": 0.0566, + "epoch": 0.35, + "learning_rate": 0.0002478175000161356, + "loss": 0.0577, "step": 53900 }, { - "epoch": 0.58, - "learning_rate": 0.00021253488221169444, - "loss": 0.0494, + "epoch": 0.35, + "learning_rate": 0.0002478078186617786, + "loss": 0.0632, "step": 53910 }, { - "epoch": 0.58, - "learning_rate": 0.0002125186579271854, - "loss": 0.0603, + "epoch": 0.35, + "learning_rate": 0.0002477981373074217, + "loss": 0.0582, "step": 53920 }, { - "epoch": 0.58, - "learning_rate": 0.00021250243364267634, - "loss": 0.0514, + "epoch": 0.35, + "learning_rate": 0.0002477884559530648, + "loss": 0.0655, "step": 53930 }, { - "epoch": 0.58, - "learning_rate": 0.00021248620935816726, - "loss": 0.0581, + "epoch": 0.35, + "learning_rate": 0.0002477787745987078, + "loss": 0.0689, "step": 53940 }, { - "epoch": 0.58, - "learning_rate": 0.00021246998507365824, - "loss": 0.0595, + "epoch": 0.35, + "learning_rate": 0.0002477690932443509, + "loss": 0.0773, "step": 53950 }, { - "epoch": 0.58, - "learning_rate": 0.00021245376078914916, - "loss": 0.0561, + "epoch": 0.35, + "learning_rate": 0.00024775941188999397, + "loss": 0.0687, "step": 53960 }, { - "epoch": 0.58, - "learning_rate": 0.00021243753650464014, - "loss": 0.0521, + "epoch": 0.35, + "learning_rate": 0.00024774973053563705, + "loss": 0.0621, "step": 53970 }, { - "epoch": 0.58, - "learning_rate": 0.0002124213122201311, - "loss": 0.0503, + "epoch": 0.35, + "learning_rate": 0.0002477400491812801, + "loss": 0.0618, "step": 53980 }, { - "epoch": 0.58, - "learning_rate": 0.000212405087935622, - "loss": 0.0501, + "epoch": 0.35, + "learning_rate": 0.0002477303678269232, + "loss": 0.065, "step": 53990 }, { - "epoch": 0.58, - "learning_rate": 0.000212388863651113, - "loss": 0.0543, + "epoch": 0.35, + "learning_rate": 0.00024772068647256623, + "loss": 0.063, "step": 54000 }, { - "epoch": 0.58, - "eval_cer": 0.9212833139850267, - "eval_loss": 0.03740408644080162, - "eval_runtime": 119.0069, - "eval_samples_per_second": 16.806, - "eval_steps_per_second": 4.201, + "epoch": 0.35, + "eval_cer": 0.9200108462320642, + "eval_loss": 0.04245748743414879, + "eval_runtime": 120.2121, + "eval_samples_per_second": 16.637, + "eval_steps_per_second": 4.159, "step": 54000 }, { - "epoch": 0.58, - "learning_rate": 0.0002123726393666039, - "loss": 0.0556, + "epoch": 0.35, + "learning_rate": 0.0002477110051182093, + "loss": 0.0614, "step": 54010 }, { - "epoch": 0.58, - "learning_rate": 0.0002123564150820949, - "loss": 0.0547, + "epoch": 0.35, + "learning_rate": 0.0002477013237638524, + "loss": 0.0582, "step": 54020 }, { - "epoch": 0.58, - "learning_rate": 0.0002123401907975858, - "loss": 0.0543, + "epoch": 0.35, + "learning_rate": 0.00024769164240949547, + "loss": 0.0706, "step": 54030 }, { - "epoch": 0.58, - "learning_rate": 0.00021232396651307676, - "loss": 0.0632, + "epoch": 0.35, + "learning_rate": 0.00024768196105513855, + "loss": 0.0636, "step": 54040 }, { - "epoch": 0.58, - "learning_rate": 0.0002123077422285677, - "loss": 0.059, + "epoch": 0.35, + "learning_rate": 0.0002476722797007816, + "loss": 0.0647, "step": 54050 }, { - "epoch": 0.58, - "learning_rate": 0.00021229151794405866, - "loss": 0.0502, + "epoch": 0.35, + "learning_rate": 0.00024766259834642465, + "loss": 0.0565, "step": 54060 }, { - "epoch": 0.58, - "learning_rate": 0.00021227529365954958, - "loss": 0.0607, + "epoch": 0.35, + "learning_rate": 0.0002476529169920677, + "loss": 0.0747, "step": 54070 }, { - "epoch": 0.58, - "learning_rate": 0.00021225906937504056, - "loss": 0.0612, + "epoch": 0.35, + "learning_rate": 0.00024764323563771076, + "loss": 0.0598, "step": 54080 }, { - "epoch": 0.59, - "learning_rate": 0.00021224284509053148, - "loss": 0.0535, + "epoch": 0.35, + "learning_rate": 0.00024763355428335384, + "loss": 0.0644, "step": 54090 }, { - "epoch": 0.59, - "learning_rate": 0.00021222662080602246, - "loss": 0.0558, + "epoch": 0.35, + "learning_rate": 0.0002476238729289969, + "loss": 0.0645, "step": 54100 }, { - "epoch": 0.59, - "learning_rate": 0.00021221039652151338, - "loss": 0.0584, + "epoch": 0.35, + "learning_rate": 0.00024761419157464, + "loss": 0.0626, "step": 54110 }, { - "epoch": 0.59, - "learning_rate": 0.00021219417223700436, - "loss": 0.0544, + "epoch": 0.35, + "learning_rate": 0.0002476045102202831, + "loss": 0.0685, "step": 54120 }, { - "epoch": 0.59, - "learning_rate": 0.00021217794795249528, - "loss": 0.0532, + "epoch": 0.35, + "learning_rate": 0.00024759482886592616, + "loss": 0.0626, "step": 54130 }, { - "epoch": 0.59, - "learning_rate": 0.00021216172366798623, - "loss": 0.0553, + "epoch": 0.35, + "learning_rate": 0.0002475851475115692, + "loss": 0.0631, "step": 54140 }, { - "epoch": 0.59, - "learning_rate": 0.00021214549938347718, - "loss": 0.0577, + "epoch": 0.35, + "learning_rate": 0.00024757546615721226, + "loss": 0.0558, "step": 54150 }, { - "epoch": 0.59, - "learning_rate": 0.00021212927509896813, - "loss": 0.0537, + "epoch": 0.35, + "learning_rate": 0.00024756578480285534, + "loss": 0.0654, "step": 54160 }, { - "epoch": 0.59, - "learning_rate": 0.00021211305081445905, - "loss": 0.0606, + "epoch": 0.35, + "learning_rate": 0.0002475561034484984, + "loss": 0.0623, "step": 54170 }, { - "epoch": 0.59, - "learning_rate": 0.00021209682652995003, - "loss": 0.0529, + "epoch": 0.35, + "learning_rate": 0.00024754642209414145, + "loss": 0.0648, "step": 54180 }, { - "epoch": 0.59, - "learning_rate": 0.00021208060224544095, - "loss": 0.0512, + "epoch": 0.35, + "learning_rate": 0.00024753674073978453, + "loss": 0.0601, "step": 54190 }, { - "epoch": 0.59, - "learning_rate": 0.00021206437796093193, - "loss": 0.0554, + "epoch": 0.35, + "learning_rate": 0.0002475270593854276, + "loss": 0.0704, "step": 54200 }, { - "epoch": 0.59, - "learning_rate": 0.00021204815367642285, - "loss": 0.053, + "epoch": 0.35, + "learning_rate": 0.00024751737803107063, + "loss": 0.0617, "step": 54210 }, { - "epoch": 0.59, - "learning_rate": 0.0002120319293919138, - "loss": 0.0616, + "epoch": 0.35, + "learning_rate": 0.0002475076966767137, + "loss": 0.0598, "step": 54220 }, { - "epoch": 0.59, - "learning_rate": 0.00021201570510740475, - "loss": 0.0585, + "epoch": 0.35, + "learning_rate": 0.0002474980153223568, + "loss": 0.0737, "step": 54230 }, { - "epoch": 0.59, - "learning_rate": 0.0002119994808228957, - "loss": 0.0513, + "epoch": 0.35, + "learning_rate": 0.0002474883339679999, + "loss": 0.0679, "step": 54240 }, { - "epoch": 0.59, - "learning_rate": 0.00021198325653838662, - "loss": 0.0555, + "epoch": 0.35, + "learning_rate": 0.00024747865261364295, + "loss": 0.0599, "step": 54250 }, { - "epoch": 0.59, - "learning_rate": 0.0002119670322538776, - "loss": 0.0467, + "epoch": 0.35, + "learning_rate": 0.00024746897125928603, + "loss": 0.0668, "step": 54260 }, { - "epoch": 0.59, - "learning_rate": 0.00021195080796936852, - "loss": 0.0631, + "epoch": 0.35, + "learning_rate": 0.0002474592899049291, + "loss": 0.0756, "step": 54270 }, { - "epoch": 0.59, - "learning_rate": 0.0002119345836848595, - "loss": 0.0574, + "epoch": 0.35, + "learning_rate": 0.00024744960855057214, + "loss": 0.0591, "step": 54280 }, { - "epoch": 0.59, - "learning_rate": 0.00021191835940035042, - "loss": 0.0691, + "epoch": 0.35, + "learning_rate": 0.0002474399271962152, + "loss": 0.0665, "step": 54290 }, { - "epoch": 0.59, - "learning_rate": 0.0002119021351158414, - "loss": 0.0533, + "epoch": 0.35, + "learning_rate": 0.0002474302458418583, + "loss": 0.0601, "step": 54300 }, { - "epoch": 0.59, - "learning_rate": 0.00021188591083133232, - "loss": 0.057, + "epoch": 0.35, + "learning_rate": 0.0002474205644875013, + "loss": 0.0611, "step": 54310 }, { - "epoch": 0.59, - "learning_rate": 0.00021186968654682327, - "loss": 0.0618, + "epoch": 0.35, + "learning_rate": 0.0002474108831331444, + "loss": 0.0614, "step": 54320 }, { - "epoch": 0.59, - "learning_rate": 0.00021185346226231422, - "loss": 0.0493, + "epoch": 0.35, + "learning_rate": 0.0002474012017787875, + "loss": 0.0575, "step": 54330 }, { - "epoch": 0.59, - "learning_rate": 0.00021183723797780517, - "loss": 0.0521, + "epoch": 0.35, + "learning_rate": 0.00024739152042443056, + "loss": 0.0589, "step": 54340 }, { - "epoch": 0.59, - "learning_rate": 0.0002118210136932961, - "loss": 0.0552, + "epoch": 0.35, + "learning_rate": 0.0002473818390700736, + "loss": 0.0555, "step": 54350 }, { - "epoch": 0.59, - "learning_rate": 0.00021180478940878707, - "loss": 0.0683, + "epoch": 0.35, + "learning_rate": 0.00024737215771571667, + "loss": 0.0617, "step": 54360 }, { - "epoch": 0.59, - "learning_rate": 0.000211788565124278, - "loss": 0.0689, + "epoch": 0.35, + "learning_rate": 0.00024736247636135975, + "loss": 0.059, "step": 54370 }, { - "epoch": 0.59, - "learning_rate": 0.00021177234083976897, - "loss": 0.0579, + "epoch": 0.35, + "learning_rate": 0.00024735279500700283, + "loss": 0.0524, "step": 54380 }, { - "epoch": 0.59, - "learning_rate": 0.0002117561165552599, - "loss": 0.0505, + "epoch": 0.35, + "learning_rate": 0.0002473431136526459, + "loss": 0.0599, "step": 54390 }, { - "epoch": 0.59, - "learning_rate": 0.00021173989227075084, - "loss": 0.0526, + "epoch": 0.35, + "learning_rate": 0.000247333432298289, + "loss": 0.0573, "step": 54400 }, { - "epoch": 0.59, - "learning_rate": 0.0002117236679862418, - "loss": 0.053, + "epoch": 0.35, + "learning_rate": 0.00024732375094393207, + "loss": 0.065, "step": 54410 }, { - "epoch": 0.59, - "learning_rate": 0.00021170744370173274, - "loss": 0.0565, + "epoch": 0.35, + "learning_rate": 0.0002473140695895751, + "loss": 0.0596, "step": 54420 }, { - "epoch": 0.59, - "learning_rate": 0.0002116912194172237, - "loss": 0.049, + "epoch": 0.35, + "learning_rate": 0.0002473043882352182, + "loss": 0.0616, "step": 54430 }, { - "epoch": 0.59, - "learning_rate": 0.00021167499513271464, - "loss": 0.0522, + "epoch": 0.35, + "learning_rate": 0.00024729470688086125, + "loss": 0.0634, "step": 54440 }, { - "epoch": 0.59, - "learning_rate": 0.00021165877084820556, - "loss": 0.051, + "epoch": 0.35, + "learning_rate": 0.0002472850255265043, + "loss": 0.0579, "step": 54450 }, { - "epoch": 0.59, - "learning_rate": 0.00021164254656369654, - "loss": 0.0616, + "epoch": 0.35, + "learning_rate": 0.00024727534417214736, + "loss": 0.0522, "step": 54460 }, { - "epoch": 0.59, - "learning_rate": 0.00021162632227918746, - "loss": 0.0538, + "epoch": 0.35, + "learning_rate": 0.00024726566281779044, + "loss": 0.0575, "step": 54470 }, { - "epoch": 0.59, - "learning_rate": 0.00021161009799467844, - "loss": 0.0589, + "epoch": 0.35, + "learning_rate": 0.0002472559814634335, + "loss": 0.0719, "step": 54480 }, { - "epoch": 0.59, - "learning_rate": 0.00021159387371016936, - "loss": 0.0571, + "epoch": 0.35, + "learning_rate": 0.00024724630010907654, + "loss": 0.0574, "step": 54490 }, { - "epoch": 0.59, - "learning_rate": 0.0002115776494256603, - "loss": 0.0561, + "epoch": 0.35, + "learning_rate": 0.0002472366187547196, + "loss": 0.0618, "step": 54500 }, { - "epoch": 0.59, - "learning_rate": 0.00021156142514115126, - "loss": 0.0569, + "epoch": 0.35, + "learning_rate": 0.0002472269374003627, + "loss": 0.0615, "step": 54510 }, { - "epoch": 0.59, - "learning_rate": 0.0002115452008566422, - "loss": 0.0582, + "epoch": 0.35, + "learning_rate": 0.0002472172560460058, + "loss": 0.0593, "step": 54520 }, { - "epoch": 0.59, - "learning_rate": 0.00021152897657213314, - "loss": 0.0544, + "epoch": 0.35, + "learning_rate": 0.00024720757469164886, + "loss": 0.0568, "step": 54530 }, { - "epoch": 0.59, - "learning_rate": 0.0002115127522876241, - "loss": 0.0595, + "epoch": 0.35, + "learning_rate": 0.00024719789333729194, + "loss": 0.058, "step": 54540 }, { - "epoch": 0.59, - "learning_rate": 0.00021149652800311503, - "loss": 0.063, + "epoch": 0.35, + "learning_rate": 0.00024718821198293497, + "loss": 0.0584, "step": 54550 }, { - "epoch": 0.59, - "learning_rate": 0.000211480303718606, - "loss": 0.0584, + "epoch": 0.35, + "learning_rate": 0.00024717853062857805, + "loss": 0.0571, "step": 54560 }, { - "epoch": 0.59, - "learning_rate": 0.00021146407943409693, - "loss": 0.0529, + "epoch": 0.35, + "learning_rate": 0.00024716884927422113, + "loss": 0.0675, "step": 54570 }, { - "epoch": 0.59, - "learning_rate": 0.00021144785514958788, - "loss": 0.0522, + "epoch": 0.35, + "learning_rate": 0.00024715916791986415, + "loss": 0.0639, "step": 54580 }, { - "epoch": 0.59, - "learning_rate": 0.00021143163086507883, - "loss": 0.0567, + "epoch": 0.35, + "learning_rate": 0.00024714948656550723, + "loss": 0.0569, "step": 54590 }, { - "epoch": 0.59, - "learning_rate": 0.00021141540658056978, - "loss": 0.0505, + "epoch": 0.35, + "learning_rate": 0.0002471398052111503, + "loss": 0.0589, "step": 54600 }, { - "epoch": 0.59, - "learning_rate": 0.00021139918229606073, - "loss": 0.0552, + "epoch": 0.35, + "learning_rate": 0.0002471301238567934, + "loss": 0.0643, "step": 54610 }, { - "epoch": 0.59, - "learning_rate": 0.00021138295801155168, - "loss": 0.0516, + "epoch": 0.35, + "learning_rate": 0.00024712044250243647, + "loss": 0.0577, "step": 54620 }, { - "epoch": 0.59, - "learning_rate": 0.0002113667337270426, - "loss": 0.0523, + "epoch": 0.35, + "learning_rate": 0.0002471107611480795, + "loss": 0.0568, "step": 54630 }, { - "epoch": 0.59, - "learning_rate": 0.00021135050944253358, - "loss": 0.0554, + "epoch": 0.35, + "learning_rate": 0.0002471010797937226, + "loss": 0.0642, "step": 54640 }, { - "epoch": 0.59, - "learning_rate": 0.0002113342851580245, - "loss": 0.0567, + "epoch": 0.35, + "learning_rate": 0.00024709139843936566, + "loss": 0.0691, "step": 54650 }, { - "epoch": 0.59, - "learning_rate": 0.00021131806087351548, - "loss": 0.0602, + "epoch": 0.35, + "learning_rate": 0.00024708171708500874, + "loss": 0.0626, "step": 54660 }, { - "epoch": 0.59, - "learning_rate": 0.0002113018365890064, - "loss": 0.056, + "epoch": 0.35, + "learning_rate": 0.0002470720357306518, + "loss": 0.0605, "step": 54670 }, { - "epoch": 0.59, - "learning_rate": 0.00021128561230449735, - "loss": 0.056, + "epoch": 0.35, + "learning_rate": 0.00024706235437629484, + "loss": 0.0518, "step": 54680 }, { - "epoch": 0.59, - "learning_rate": 0.0002112693880199883, - "loss": 0.0619, + "epoch": 0.35, + "learning_rate": 0.0002470526730219379, + "loss": 0.0657, "step": 54690 }, { - "epoch": 0.59, - "learning_rate": 0.00021125316373547925, - "loss": 0.0581, + "epoch": 0.35, + "learning_rate": 0.000247042991667581, + "loss": 0.0607, "step": 54700 }, { - "epoch": 0.59, - "learning_rate": 0.00021123693945097018, - "loss": 0.0522, + "epoch": 0.35, + "learning_rate": 0.00024703331031322403, + "loss": 0.0664, "step": 54710 }, { - "epoch": 0.59, - "learning_rate": 0.00021122071516646115, - "loss": 0.0587, + "epoch": 0.35, + "learning_rate": 0.0002470236289588671, + "loss": 0.0607, "step": 54720 }, { - "epoch": 0.59, - "learning_rate": 0.00021120449088195208, - "loss": 0.0565, + "epoch": 0.35, + "learning_rate": 0.0002470139476045102, + "loss": 0.0661, "step": 54730 }, { - "epoch": 0.59, - "learning_rate": 0.00021118826659744305, - "loss": 0.0523, + "epoch": 0.35, + "learning_rate": 0.00024700426625015327, + "loss": 0.0556, "step": 54740 }, { - "epoch": 0.59, - "learning_rate": 0.00021117204231293398, - "loss": 0.0493, + "epoch": 0.35, + "learning_rate": 0.00024699458489579635, + "loss": 0.0604, "step": 54750 }, { - "epoch": 0.59, - "learning_rate": 0.00021115581802842493, - "loss": 0.0518, + "epoch": 0.35, + "learning_rate": 0.00024698490354143943, + "loss": 0.0633, "step": 54760 }, { - "epoch": 0.59, - "learning_rate": 0.00021113959374391588, - "loss": 0.0678, + "epoch": 0.35, + "learning_rate": 0.00024697522218708245, + "loss": 0.0655, "step": 54770 }, { - "epoch": 0.59, - "learning_rate": 0.00021112336945940683, - "loss": 0.0498, + "epoch": 0.35, + "learning_rate": 0.00024696554083272553, + "loss": 0.0582, "step": 54780 }, { - "epoch": 0.59, - "learning_rate": 0.00021110714517489778, - "loss": 0.0609, + "epoch": 0.35, + "learning_rate": 0.0002469558594783686, + "loss": 0.058, "step": 54790 }, { - "epoch": 0.59, - "learning_rate": 0.00021109092089038873, - "loss": 0.0535, + "epoch": 0.35, + "learning_rate": 0.0002469461781240117, + "loss": 0.0594, "step": 54800 }, { - "epoch": 0.59, - "learning_rate": 0.00021107469660587965, - "loss": 0.0514, + "epoch": 0.35, + "learning_rate": 0.00024693649676965477, + "loss": 0.0613, "step": 54810 }, { - "epoch": 0.59, - "learning_rate": 0.00021105847232137062, - "loss": 0.045, + "epoch": 0.35, + "learning_rate": 0.0002469268154152978, + "loss": 0.0592, "step": 54820 }, { - "epoch": 0.59, - "learning_rate": 0.00021104224803686155, - "loss": 0.0495, + "epoch": 0.35, + "learning_rate": 0.0002469171340609409, + "loss": 0.067, "step": 54830 }, { - "epoch": 0.59, - "learning_rate": 0.00021102602375235252, - "loss": 0.0597, + "epoch": 0.35, + "learning_rate": 0.00024690745270658396, + "loss": 0.0618, "step": 54840 }, { - "epoch": 0.59, - "learning_rate": 0.00021100979946784345, - "loss": 0.0476, + "epoch": 0.35, + "learning_rate": 0.000246897771352227, + "loss": 0.0542, "step": 54850 }, { - "epoch": 0.59, - "learning_rate": 0.0002109935751833344, - "loss": 0.065, + "epoch": 0.35, + "learning_rate": 0.00024688808999787006, + "loss": 0.0672, "step": 54860 }, { - "epoch": 0.59, - "learning_rate": 0.00021097735089882535, - "loss": 0.057, + "epoch": 0.35, + "learning_rate": 0.00024687840864351314, + "loss": 0.0657, "step": 54870 }, { - "epoch": 0.59, - "learning_rate": 0.0002109611266143163, - "loss": 0.0443, + "epoch": 0.35, + "learning_rate": 0.0002468687272891562, + "loss": 0.0579, "step": 54880 }, { - "epoch": 0.59, - "learning_rate": 0.00021094490232980722, - "loss": 0.0544, + "epoch": 0.35, + "learning_rate": 0.0002468590459347993, + "loss": 0.0589, "step": 54890 }, { - "epoch": 0.59, - "learning_rate": 0.0002109286780452982, - "loss": 0.0524, + "epoch": 0.35, + "learning_rate": 0.0002468493645804424, + "loss": 0.0579, "step": 54900 }, { - "epoch": 0.59, - "learning_rate": 0.00021091245376078912, - "loss": 0.0492, + "epoch": 0.35, + "learning_rate": 0.0002468396832260854, + "loss": 0.069, "step": 54910 }, { - "epoch": 0.59, - "learning_rate": 0.0002108962294762801, - "loss": 0.0579, + "epoch": 0.35, + "learning_rate": 0.0002468300018717285, + "loss": 0.059, "step": 54920 }, { - "epoch": 0.59, - "learning_rate": 0.00021088000519177102, - "loss": 0.0584, + "epoch": 0.35, + "learning_rate": 0.00024682032051737157, + "loss": 0.0694, "step": 54930 }, { - "epoch": 0.59, - "learning_rate": 0.00021086378090726197, - "loss": 0.0634, + "epoch": 0.35, + "learning_rate": 0.00024681063916301465, + "loss": 0.0635, "step": 54940 }, { - "epoch": 0.59, - "learning_rate": 0.00021084755662275292, - "loss": 0.0608, + "epoch": 0.35, + "learning_rate": 0.00024680095780865767, + "loss": 0.0582, "step": 54950 }, { - "epoch": 0.59, - "learning_rate": 0.00021083133233824387, - "loss": 0.0481, + "epoch": 0.35, + "learning_rate": 0.00024679127645430075, + "loss": 0.0607, "step": 54960 }, { - "epoch": 0.59, - "learning_rate": 0.00021081510805373482, - "loss": 0.0594, + "epoch": 0.35, + "learning_rate": 0.00024678159509994383, + "loss": 0.0653, "step": 54970 }, { - "epoch": 0.59, - "learning_rate": 0.00021079888376922577, - "loss": 0.0535, + "epoch": 0.35, + "learning_rate": 0.00024677191374558686, + "loss": 0.069, "step": 54980 }, { - "epoch": 0.59, - "learning_rate": 0.0002107826594847167, - "loss": 0.0567, + "epoch": 0.35, + "learning_rate": 0.00024676223239122994, + "loss": 0.067, "step": 54990 }, { - "epoch": 0.59, - "learning_rate": 0.00021076643520020767, - "loss": 0.057, + "epoch": 0.35, + "learning_rate": 0.000246752551036873, + "loss": 0.0609, "step": 55000 }, { - "epoch": 0.59, - "eval_cer": 0.9212850809536683, - "eval_loss": 0.03805334493517876, - "eval_runtime": 119.0163, - "eval_samples_per_second": 16.804, - "eval_steps_per_second": 4.201, + "epoch": 0.35, + "eval_cer": 0.9199882499152638, + "eval_loss": 0.040658190846443176, + "eval_runtime": 120.0185, + "eval_samples_per_second": 16.664, + "eval_steps_per_second": 4.166, "step": 55000 }, { - "epoch": 0.59, - "learning_rate": 0.0002107502109156986, - "loss": 0.0533, + "epoch": 0.36, + "learning_rate": 0.0002467428696825161, + "loss": 0.0668, "step": 55010 }, { - "epoch": 0.6, - "learning_rate": 0.00021073398663118957, - "loss": 0.0511, + "epoch": 0.36, + "learning_rate": 0.0002467331883281592, + "loss": 0.0648, "step": 55020 }, { - "epoch": 0.6, - "learning_rate": 0.0002107177623466805, - "loss": 0.059, + "epoch": 0.36, + "learning_rate": 0.00024672350697380226, + "loss": 0.0599, "step": 55030 }, { - "epoch": 0.6, - "learning_rate": 0.00021070153806217144, - "loss": 0.0578, + "epoch": 0.36, + "learning_rate": 0.00024671382561944534, + "loss": 0.06, "step": 55040 }, { - "epoch": 0.6, - "learning_rate": 0.0002106853137776624, - "loss": 0.0554, + "epoch": 0.36, + "learning_rate": 0.00024670414426508836, + "loss": 0.0602, "step": 55050 }, { - "epoch": 0.6, - "learning_rate": 0.00021066908949315334, - "loss": 0.056, + "epoch": 0.36, + "learning_rate": 0.00024669446291073144, + "loss": 0.0638, "step": 55060 }, { - "epoch": 0.6, - "learning_rate": 0.00021065286520864426, - "loss": 0.057, + "epoch": 0.36, + "learning_rate": 0.0002466847815563745, + "loss": 0.0576, "step": 55070 }, { - "epoch": 0.6, - "learning_rate": 0.00021063664092413524, - "loss": 0.0548, + "epoch": 0.36, + "learning_rate": 0.00024667510020201755, + "loss": 0.0564, "step": 55080 }, { - "epoch": 0.6, - "learning_rate": 0.00021062041663962616, - "loss": 0.0498, + "epoch": 0.36, + "learning_rate": 0.0002466654188476606, + "loss": 0.0541, "step": 55090 }, { - "epoch": 0.6, - "learning_rate": 0.00021060419235511714, - "loss": 0.0501, + "epoch": 0.36, + "learning_rate": 0.0002466557374933037, + "loss": 0.0569, "step": 55100 }, { - "epoch": 0.6, - "learning_rate": 0.00021058796807060806, - "loss": 0.0503, + "epoch": 0.36, + "learning_rate": 0.0002466460561389468, + "loss": 0.0665, "step": 55110 }, { - "epoch": 0.6, - "learning_rate": 0.00021057174378609904, - "loss": 0.0556, + "epoch": 0.36, + "learning_rate": 0.0002466363747845898, + "loss": 0.0551, "step": 55120 }, { - "epoch": 0.6, - "learning_rate": 0.00021055551950158996, - "loss": 0.0505, + "epoch": 0.36, + "learning_rate": 0.0002466266934302329, + "loss": 0.0624, "step": 55130 }, { - "epoch": 0.6, - "learning_rate": 0.0002105392952170809, - "loss": 0.0543, + "epoch": 0.36, + "learning_rate": 0.00024661701207587597, + "loss": 0.056, "step": 55140 }, { - "epoch": 0.6, - "learning_rate": 0.00021052307093257186, - "loss": 0.056, + "epoch": 0.36, + "learning_rate": 0.00024660733072151905, + "loss": 0.0649, "step": 55150 }, { - "epoch": 0.6, - "learning_rate": 0.0002105068466480628, - "loss": 0.0575, + "epoch": 0.36, + "learning_rate": 0.00024659764936716213, + "loss": 0.0611, "step": 55160 }, { - "epoch": 0.6, - "learning_rate": 0.00021049062236355373, - "loss": 0.0546, + "epoch": 0.36, + "learning_rate": 0.0002465879680128052, + "loss": 0.0609, "step": 55170 }, { - "epoch": 0.6, - "learning_rate": 0.0002104743980790447, - "loss": 0.0585, + "epoch": 0.36, + "learning_rate": 0.0002465782866584483, + "loss": 0.0618, "step": 55180 }, { - "epoch": 0.6, - "learning_rate": 0.00021045817379453563, - "loss": 0.0473, + "epoch": 0.36, + "learning_rate": 0.0002465686053040913, + "loss": 0.062, "step": 55190 }, { - "epoch": 0.6, - "learning_rate": 0.0002104419495100266, - "loss": 0.0546, + "epoch": 0.36, + "learning_rate": 0.0002465589239497344, + "loss": 0.0612, "step": 55200 }, { - "epoch": 0.6, - "learning_rate": 0.00021042572522551753, - "loss": 0.0541, + "epoch": 0.36, + "learning_rate": 0.0002465492425953775, + "loss": 0.0614, "step": 55210 }, { - "epoch": 0.6, - "learning_rate": 0.00021040950094100848, - "loss": 0.0544, + "epoch": 0.36, + "learning_rate": 0.0002465395612410205, + "loss": 0.0572, "step": 55220 }, { - "epoch": 0.6, - "learning_rate": 0.00021039327665649943, - "loss": 0.0486, + "epoch": 0.36, + "learning_rate": 0.0002465298798866636, + "loss": 0.061, "step": 55230 }, { - "epoch": 0.6, - "learning_rate": 0.00021037705237199038, - "loss": 0.0611, + "epoch": 0.36, + "learning_rate": 0.00024652019853230666, + "loss": 0.0557, "step": 55240 }, { - "epoch": 0.6, - "learning_rate": 0.0002103608280874813, - "loss": 0.0514, + "epoch": 0.36, + "learning_rate": 0.00024651051717794974, + "loss": 0.0617, "step": 55250 }, { - "epoch": 0.6, - "learning_rate": 0.00021034460380297228, - "loss": 0.0599, + "epoch": 0.36, + "learning_rate": 0.00024650083582359277, + "loss": 0.0535, "step": 55260 }, { - "epoch": 0.6, - "learning_rate": 0.0002103283795184632, - "loss": 0.0508, + "epoch": 0.36, + "learning_rate": 0.00024649115446923585, + "loss": 0.0566, "step": 55270 }, { - "epoch": 0.6, - "learning_rate": 0.00021031215523395418, - "loss": 0.0581, + "epoch": 0.36, + "learning_rate": 0.0002464814731148789, + "loss": 0.0578, "step": 55280 }, { - "epoch": 0.6, - "learning_rate": 0.0002102959309494451, - "loss": 0.052, + "epoch": 0.36, + "learning_rate": 0.000246471791760522, + "loss": 0.0608, "step": 55290 }, { - "epoch": 0.6, - "learning_rate": 0.00021027970666493608, - "loss": 0.0578, + "epoch": 0.36, + "learning_rate": 0.0002464621104061651, + "loss": 0.0581, "step": 55300 }, { - "epoch": 0.6, - "learning_rate": 0.000210263482380427, - "loss": 0.0516, + "epoch": 0.36, + "learning_rate": 0.00024645242905180817, + "loss": 0.0638, "step": 55310 }, { - "epoch": 0.6, - "learning_rate": 0.00021024725809591795, - "loss": 0.0625, + "epoch": 0.36, + "learning_rate": 0.0002464427476974512, + "loss": 0.063, "step": 55320 }, { - "epoch": 0.6, - "learning_rate": 0.0002102310338114089, - "loss": 0.0558, + "epoch": 0.36, + "learning_rate": 0.00024643306634309427, + "loss": 0.0617, "step": 55330 }, { - "epoch": 0.6, - "learning_rate": 0.00021021480952689985, - "loss": 0.0589, + "epoch": 0.36, + "learning_rate": 0.00024642338498873735, + "loss": 0.0558, "step": 55340 }, { - "epoch": 0.6, - "learning_rate": 0.00021019858524239077, - "loss": 0.055, + "epoch": 0.36, + "learning_rate": 0.0002464137036343804, + "loss": 0.053, "step": 55350 }, { - "epoch": 0.6, - "learning_rate": 0.00021018236095788175, - "loss": 0.0586, + "epoch": 0.36, + "learning_rate": 0.00024640402228002346, + "loss": 0.0623, "step": 55360 }, { - "epoch": 0.6, - "learning_rate": 0.00021016613667337267, - "loss": 0.0578, - "step": 55370 + "epoch": 0.36, + "learning_rate": 0.00024639434092566654, + "loss": 0.0614, + "step": 55370 }, { - "epoch": 0.6, - "learning_rate": 0.00021014991238886365, - "loss": 0.0595, + "epoch": 0.36, + "learning_rate": 0.0002463846595713096, + "loss": 0.0627, "step": 55380 }, { - "epoch": 0.6, - "learning_rate": 0.00021013368810435457, - "loss": 0.0514, + "epoch": 0.36, + "learning_rate": 0.0002463749782169527, + "loss": 0.0561, "step": 55390 }, { - "epoch": 0.6, - "learning_rate": 0.00021011746381984552, - "loss": 0.0556, + "epoch": 0.36, + "learning_rate": 0.0002463652968625957, + "loss": 0.0695, "step": 55400 }, { - "epoch": 0.6, - "learning_rate": 0.00021010123953533647, - "loss": 0.0525, + "epoch": 0.36, + "learning_rate": 0.0002463556155082388, + "loss": 0.0623, "step": 55410 }, { - "epoch": 0.6, - "learning_rate": 0.00021008501525082742, - "loss": 0.0598, + "epoch": 0.36, + "learning_rate": 0.0002463459341538819, + "loss": 0.0612, "step": 55420 }, { - "epoch": 0.6, - "learning_rate": 0.00021006879096631834, - "loss": 0.0538, + "epoch": 0.36, + "learning_rate": 0.00024633625279952496, + "loss": 0.0579, "step": 55430 }, { - "epoch": 0.6, - "learning_rate": 0.00021005256668180932, - "loss": 0.0575, + "epoch": 0.36, + "learning_rate": 0.00024632657144516804, + "loss": 0.062, "step": 55440 }, { - "epoch": 0.6, - "learning_rate": 0.00021003634239730024, - "loss": 0.0535, + "epoch": 0.36, + "learning_rate": 0.00024631689009081107, + "loss": 0.056, "step": 55450 }, { - "epoch": 0.6, - "learning_rate": 0.00021002011811279122, - "loss": 0.0517, + "epoch": 0.36, + "learning_rate": 0.00024630720873645415, + "loss": 0.061, "step": 55460 }, { - "epoch": 0.6, - "learning_rate": 0.00021000389382828214, - "loss": 0.0543, + "epoch": 0.36, + "learning_rate": 0.0002462975273820972, + "loss": 0.0611, "step": 55470 }, { - "epoch": 0.6, - "learning_rate": 0.00020998766954377312, - "loss": 0.0508, + "epoch": 0.36, + "learning_rate": 0.00024628784602774025, + "loss": 0.0583, "step": 55480 }, { - "epoch": 0.6, - "learning_rate": 0.00020997144525926404, - "loss": 0.0506, + "epoch": 0.36, + "learning_rate": 0.00024627816467338333, + "loss": 0.0562, "step": 55490 }, { - "epoch": 0.6, - "learning_rate": 0.000209955220974755, - "loss": 0.0604, + "epoch": 0.36, + "learning_rate": 0.0002462684833190264, + "loss": 0.0654, "step": 55500 }, { - "epoch": 0.6, - "learning_rate": 0.00020993899669024594, - "loss": 0.0508, + "epoch": 0.36, + "learning_rate": 0.0002462588019646695, + "loss": 0.0609, "step": 55510 }, { - "epoch": 0.6, - "learning_rate": 0.0002099227724057369, - "loss": 0.0484, + "epoch": 0.36, + "learning_rate": 0.00024624912061031257, + "loss": 0.0607, "step": 55520 }, { - "epoch": 0.6, - "learning_rate": 0.00020990654812122781, - "loss": 0.0702, + "epoch": 0.36, + "learning_rate": 0.00024623943925595565, + "loss": 0.0626, "step": 55530 }, { - "epoch": 0.6, - "learning_rate": 0.0002098903238367188, - "loss": 0.0536, + "epoch": 0.36, + "learning_rate": 0.0002462297579015987, + "loss": 0.0572, "step": 55540 }, { - "epoch": 0.6, - "learning_rate": 0.00020987409955220971, - "loss": 0.0558, + "epoch": 0.36, + "learning_rate": 0.00024622007654724175, + "loss": 0.0611, "step": 55550 }, { - "epoch": 0.6, - "learning_rate": 0.0002098578752677007, - "loss": 0.0499, + "epoch": 0.36, + "learning_rate": 0.00024621039519288483, + "loss": 0.0651, "step": 55560 }, { - "epoch": 0.6, - "learning_rate": 0.0002098416509831916, - "loss": 0.0488, + "epoch": 0.36, + "learning_rate": 0.0002462007138385279, + "loss": 0.064, "step": 55570 }, { - "epoch": 0.6, - "learning_rate": 0.00020982542669868256, - "loss": 0.0506, + "epoch": 0.36, + "learning_rate": 0.000246191032484171, + "loss": 0.0685, "step": 55580 }, { - "epoch": 0.6, - "learning_rate": 0.0002098092024141735, - "loss": 0.0504, + "epoch": 0.36, + "learning_rate": 0.000246181351129814, + "loss": 0.0578, "step": 55590 }, { - "epoch": 0.6, - "learning_rate": 0.00020979297812966446, - "loss": 0.0534, + "epoch": 0.36, + "learning_rate": 0.0002461716697754571, + "loss": 0.0635, "step": 55600 }, { - "epoch": 0.6, - "learning_rate": 0.00020977675384515539, - "loss": 0.0443, + "epoch": 0.36, + "learning_rate": 0.0002461619884211002, + "loss": 0.0615, "step": 55610 }, { - "epoch": 0.6, - "learning_rate": 0.00020976052956064636, - "loss": 0.05, + "epoch": 0.36, + "learning_rate": 0.0002461523070667432, + "loss": 0.0663, "step": 55620 }, { - "epoch": 0.6, - "learning_rate": 0.00020974430527613728, - "loss": 0.0547, + "epoch": 0.36, + "learning_rate": 0.0002461426257123863, + "loss": 0.0648, "step": 55630 }, { - "epoch": 0.6, - "learning_rate": 0.00020972808099162826, - "loss": 0.0544, + "epoch": 0.36, + "learning_rate": 0.00024613294435802936, + "loss": 0.0555, "step": 55640 }, { - "epoch": 0.6, - "learning_rate": 0.00020971185670711918, - "loss": 0.058, + "epoch": 0.36, + "learning_rate": 0.00024612326300367244, + "loss": 0.0649, "step": 55650 }, { - "epoch": 0.6, - "learning_rate": 0.00020969563242261016, - "loss": 0.0522, + "epoch": 0.36, + "learning_rate": 0.0002461135816493155, + "loss": 0.0665, "step": 55660 }, { - "epoch": 0.6, - "learning_rate": 0.00020967940813810108, - "loss": 0.06, + "epoch": 0.36, + "learning_rate": 0.0002461039002949586, + "loss": 0.0627, "step": 55670 }, { - "epoch": 0.6, - "learning_rate": 0.00020966318385359203, - "loss": 0.0491, + "epoch": 0.36, + "learning_rate": 0.00024609421894060163, + "loss": 0.0583, "step": 55680 }, { - "epoch": 0.6, - "learning_rate": 0.00020964695956908298, - "loss": 0.0572, + "epoch": 0.36, + "learning_rate": 0.0002460845375862447, + "loss": 0.0582, "step": 55690 }, { - "epoch": 0.6, - "learning_rate": 0.00020963073528457393, - "loss": 0.0581, + "epoch": 0.36, + "learning_rate": 0.0002460748562318878, + "loss": 0.0618, "step": 55700 }, { - "epoch": 0.6, - "learning_rate": 0.00020961451100006486, - "loss": 0.0496, + "epoch": 0.36, + "learning_rate": 0.00024606517487753087, + "loss": 0.0547, "step": 55710 }, { - "epoch": 0.6, - "learning_rate": 0.00020959828671555583, - "loss": 0.0523, + "epoch": 0.36, + "learning_rate": 0.0002460554935231739, + "loss": 0.0595, "step": 55720 }, { - "epoch": 0.6, - "learning_rate": 0.00020958206243104676, - "loss": 0.0553, + "epoch": 0.36, + "learning_rate": 0.000246045812168817, + "loss": 0.061, "step": 55730 }, { - "epoch": 0.6, - "learning_rate": 0.00020956583814653773, - "loss": 0.0586, + "epoch": 0.36, + "learning_rate": 0.00024603613081446005, + "loss": 0.0624, "step": 55740 }, { - "epoch": 0.6, - "learning_rate": 0.00020954961386202866, - "loss": 0.0557, + "epoch": 0.36, + "learning_rate": 0.0002460264494601031, + "loss": 0.0549, "step": 55750 }, { - "epoch": 0.6, - "learning_rate": 0.0002095333895775196, - "loss": 0.062, + "epoch": 0.36, + "learning_rate": 0.00024601676810574616, + "loss": 0.0599, "step": 55760 }, { - "epoch": 0.6, - "learning_rate": 0.00020951716529301055, - "loss": 0.0526, + "epoch": 0.36, + "learning_rate": 0.00024600708675138924, + "loss": 0.0581, "step": 55770 }, { - "epoch": 0.6, - "learning_rate": 0.0002095009410085015, - "loss": 0.0645, + "epoch": 0.36, + "learning_rate": 0.0002459974053970323, + "loss": 0.0651, "step": 55780 }, { - "epoch": 0.6, - "learning_rate": 0.00020948471672399245, - "loss": 0.0584, + "epoch": 0.36, + "learning_rate": 0.0002459877240426754, + "loss": 0.0595, "step": 55790 }, { - "epoch": 0.6, - "learning_rate": 0.0002094684924394834, - "loss": 0.0557, + "epoch": 0.36, + "learning_rate": 0.0002459780426883185, + "loss": 0.067, "step": 55800 }, { - "epoch": 0.6, - "learning_rate": 0.00020945226815497433, - "loss": 0.0509, + "epoch": 0.36, + "learning_rate": 0.00024596836133396156, + "loss": 0.0689, "step": 55810 }, { - "epoch": 0.6, - "learning_rate": 0.0002094360438704653, - "loss": 0.0553, + "epoch": 0.36, + "learning_rate": 0.0002459586799796046, + "loss": 0.0625, "step": 55820 }, { - "epoch": 0.6, - "learning_rate": 0.00020941981958595623, - "loss": 0.0528, + "epoch": 0.36, + "learning_rate": 0.00024594899862524766, + "loss": 0.073, "step": 55830 }, { - "epoch": 0.6, - "learning_rate": 0.0002094035953014472, - "loss": 0.055, + "epoch": 0.36, + "learning_rate": 0.00024593931727089074, + "loss": 0.0612, "step": 55840 }, { - "epoch": 0.6, - "learning_rate": 0.00020938737101693813, - "loss": 0.0534, + "epoch": 0.36, + "learning_rate": 0.00024592963591653377, + "loss": 0.0548, "step": 55850 }, { - "epoch": 0.6, - "learning_rate": 0.00020937114673242908, - "loss": 0.0523, + "epoch": 0.36, + "learning_rate": 0.00024591995456217685, + "loss": 0.0715, "step": 55860 }, { - "epoch": 0.6, - "learning_rate": 0.00020935492244792003, - "loss": 0.0478, + "epoch": 0.36, + "learning_rate": 0.00024591027320781993, + "loss": 0.0546, "step": 55870 }, { - "epoch": 0.6, - "learning_rate": 0.00020933869816341097, - "loss": 0.0534, + "epoch": 0.36, + "learning_rate": 0.000245900591853463, + "loss": 0.062, "step": 55880 }, { - "epoch": 0.6, - "learning_rate": 0.0002093224738789019, - "loss": 0.0478, + "epoch": 0.36, + "learning_rate": 0.00024589091049910603, + "loss": 0.0678, "step": 55890 }, { - "epoch": 0.6, - "learning_rate": 0.00020930624959439287, - "loss": 0.0504, + "epoch": 0.36, + "learning_rate": 0.0002458812291447491, + "loss": 0.0645, "step": 55900 }, { - "epoch": 0.6, - "learning_rate": 0.0002092900253098838, - "loss": 0.0545, + "epoch": 0.36, + "learning_rate": 0.0002458715477903922, + "loss": 0.0651, "step": 55910 }, { - "epoch": 0.6, - "learning_rate": 0.00020927380102537477, - "loss": 0.0578, + "epoch": 0.36, + "learning_rate": 0.0002458618664360353, + "loss": 0.0541, "step": 55920 }, { - "epoch": 0.6, - "learning_rate": 0.0002092575767408657, - "loss": 0.0558, + "epoch": 0.36, + "learning_rate": 0.00024585218508167835, + "loss": 0.0722, "step": 55930 }, { - "epoch": 0.61, - "learning_rate": 0.00020924135245635665, - "loss": 0.0481, + "epoch": 0.36, + "learning_rate": 0.00024584250372732143, + "loss": 0.0566, "step": 55940 }, { - "epoch": 0.61, - "learning_rate": 0.0002092251281718476, - "loss": 0.0563, + "epoch": 0.36, + "learning_rate": 0.0002458328223729645, + "loss": 0.0593, "step": 55950 }, { - "epoch": 0.61, - "learning_rate": 0.00020920890388733855, - "loss": 0.0579, + "epoch": 0.36, + "learning_rate": 0.00024582314101860754, + "loss": 0.0616, "step": 55960 }, { - "epoch": 0.61, - "learning_rate": 0.0002091926796028295, - "loss": 0.055, + "epoch": 0.36, + "learning_rate": 0.0002458134596642506, + "loss": 0.0624, "step": 55970 }, { - "epoch": 0.61, - "learning_rate": 0.00020917645531832045, - "loss": 0.0507, + "epoch": 0.36, + "learning_rate": 0.0002458037783098937, + "loss": 0.0584, "step": 55980 }, { - "epoch": 0.61, - "learning_rate": 0.00020916023103381137, - "loss": 0.0524, + "epoch": 0.36, + "learning_rate": 0.0002457940969555367, + "loss": 0.0569, "step": 55990 }, { - "epoch": 0.61, - "learning_rate": 0.00020914400674930235, - "loss": 0.058, + "epoch": 0.36, + "learning_rate": 0.0002457844156011798, + "loss": 0.0583, "step": 56000 }, { - "epoch": 0.61, - "eval_cer": 0.9212029169118335, - "eval_loss": 0.037965867668390274, - "eval_runtime": 119.2009, - "eval_samples_per_second": 16.778, - "eval_steps_per_second": 4.195, + "epoch": 0.36, + "eval_cer": 0.9199855383572477, + "eval_loss": 0.03988322243094444, + "eval_runtime": 119.9115, + "eval_samples_per_second": 16.679, + "eval_steps_per_second": 4.17, "step": 56000 }, { - "epoch": 0.61, - "learning_rate": 0.00020912778246479327, - "loss": 0.0493, + "epoch": 0.36, + "learning_rate": 0.0002457747342468229, + "loss": 0.0637, "step": 56010 }, { - "epoch": 0.61, - "learning_rate": 0.00020911155818028424, - "loss": 0.0526, + "epoch": 0.36, + "learning_rate": 0.00024576505289246596, + "loss": 0.0654, "step": 56020 }, { - "epoch": 0.61, - "learning_rate": 0.00020909533389577517, - "loss": 0.0648, + "epoch": 0.36, + "learning_rate": 0.000245755371538109, + "loss": 0.0611, "step": 56030 }, { - "epoch": 0.61, - "learning_rate": 0.00020907910961126612, - "loss": 0.0479, + "epoch": 0.36, + "learning_rate": 0.00024574569018375207, + "loss": 0.0631, "step": 56040 }, { - "epoch": 0.61, - "learning_rate": 0.00020906288532675707, - "loss": 0.0514, + "epoch": 0.36, + "learning_rate": 0.00024573600882939515, + "loss": 0.069, "step": 56050 }, { - "epoch": 0.61, - "learning_rate": 0.00020904666104224802, - "loss": 0.0481, + "epoch": 0.36, + "learning_rate": 0.00024572632747503823, + "loss": 0.0659, "step": 56060 }, { - "epoch": 0.61, - "learning_rate": 0.00020903043675773894, - "loss": 0.0544, + "epoch": 0.36, + "learning_rate": 0.0002457166461206813, + "loss": 0.0756, "step": 56070 }, { - "epoch": 0.61, - "learning_rate": 0.00020901421247322992, - "loss": 0.0559, + "epoch": 0.36, + "learning_rate": 0.0002457069647663244, + "loss": 0.0597, "step": 56080 }, { - "epoch": 0.61, - "learning_rate": 0.00020899798818872084, - "loss": 0.0532, + "epoch": 0.36, + "learning_rate": 0.0002456972834119674, + "loss": 0.057, "step": 56090 }, { - "epoch": 0.61, - "learning_rate": 0.00020898176390421182, - "loss": 0.0578, + "epoch": 0.36, + "learning_rate": 0.0002456876020576105, + "loss": 0.0696, "step": 56100 }, { - "epoch": 0.61, - "learning_rate": 0.00020896553961970274, - "loss": 0.0537, + "epoch": 0.36, + "learning_rate": 0.00024567792070325357, + "loss": 0.0725, "step": 56110 }, { - "epoch": 0.61, - "learning_rate": 0.0002089493153351937, - "loss": 0.0557, + "epoch": 0.36, + "learning_rate": 0.0002456682393488966, + "loss": 0.0612, "step": 56120 }, { - "epoch": 0.61, - "learning_rate": 0.00020893309105068464, - "loss": 0.0515, + "epoch": 0.36, + "learning_rate": 0.0002456585579945397, + "loss": 0.0608, "step": 56130 }, { - "epoch": 0.61, - "learning_rate": 0.0002089168667661756, - "loss": 0.0534, + "epoch": 0.36, + "learning_rate": 0.00024564887664018276, + "loss": 0.0599, "step": 56140 }, { - "epoch": 0.61, - "learning_rate": 0.00020890064248166654, - "loss": 0.0558, + "epoch": 0.36, + "learning_rate": 0.00024563919528582584, + "loss": 0.0589, "step": 56150 }, { - "epoch": 0.61, - "learning_rate": 0.0002088844181971575, - "loss": 0.071, + "epoch": 0.36, + "learning_rate": 0.0002456295139314689, + "loss": 0.0668, "step": 56160 }, { - "epoch": 0.61, - "learning_rate": 0.0002088681939126484, - "loss": 0.055, + "epoch": 0.36, + "learning_rate": 0.00024561983257711194, + "loss": 0.0629, "step": 56170 }, { - "epoch": 0.61, - "learning_rate": 0.0002088519696281394, - "loss": 0.0499, + "epoch": 0.36, + "learning_rate": 0.000245610151222755, + "loss": 0.0547, "step": 56180 }, { - "epoch": 0.61, - "learning_rate": 0.0002088357453436303, - "loss": 0.0521, + "epoch": 0.36, + "learning_rate": 0.0002456004698683981, + "loss": 0.0626, "step": 56190 }, { - "epoch": 0.61, - "learning_rate": 0.00020881952105912129, - "loss": 0.0484, + "epoch": 0.36, + "learning_rate": 0.0002455907885140412, + "loss": 0.0548, "step": 56200 }, { - "epoch": 0.61, - "learning_rate": 0.0002088032967746122, - "loss": 0.0462, + "epoch": 0.36, + "learning_rate": 0.00024558110715968426, + "loss": 0.0622, "step": 56210 }, { - "epoch": 0.61, - "learning_rate": 0.00020878707249010316, - "loss": 0.0525, + "epoch": 0.36, + "learning_rate": 0.00024557142580532734, + "loss": 0.0621, "step": 56220 }, { - "epoch": 0.61, - "learning_rate": 0.0002087708482055941, - "loss": 0.0481, + "epoch": 0.36, + "learning_rate": 0.00024556174445097037, + "loss": 0.0653, "step": 56230 }, { - "epoch": 0.61, - "learning_rate": 0.00020875462392108506, - "loss": 0.0481, + "epoch": 0.36, + "learning_rate": 0.00024555206309661345, + "loss": 0.0607, "step": 56240 }, { - "epoch": 0.61, - "learning_rate": 0.00020873839963657598, - "loss": 0.0568, + "epoch": 0.36, + "learning_rate": 0.0002455423817422565, + "loss": 0.0529, "step": 56250 }, { - "epoch": 0.61, - "learning_rate": 0.00020872217535206696, - "loss": 0.0491, + "epoch": 0.36, + "learning_rate": 0.00024553270038789955, + "loss": 0.0514, "step": 56260 }, { - "epoch": 0.61, - "learning_rate": 0.00020870595106755788, - "loss": 0.0629, + "epoch": 0.36, + "learning_rate": 0.00024552301903354263, + "loss": 0.0626, "step": 56270 }, { - "epoch": 0.61, - "learning_rate": 0.00020868972678304886, - "loss": 0.0531, + "epoch": 0.36, + "learning_rate": 0.0002455133376791857, + "loss": 0.0619, "step": 56280 }, { - "epoch": 0.61, - "learning_rate": 0.00020867350249853978, - "loss": 0.0568, + "epoch": 0.36, + "learning_rate": 0.0002455036563248288, + "loss": 0.0527, "step": 56290 }, { - "epoch": 0.61, - "learning_rate": 0.00020865727821403073, - "loss": 0.0562, + "epoch": 0.36, + "learning_rate": 0.00024549397497047187, + "loss": 0.06, "step": 56300 }, { - "epoch": 0.61, - "learning_rate": 0.00020864105392952168, - "loss": 0.0572, + "epoch": 0.36, + "learning_rate": 0.0002454842936161149, + "loss": 0.057, "step": 56310 }, { - "epoch": 0.61, - "learning_rate": 0.00020862482964501263, - "loss": 0.0563, + "epoch": 0.36, + "learning_rate": 0.000245474612261758, + "loss": 0.0621, "step": 56320 }, { - "epoch": 0.61, - "learning_rate": 0.0002086086053605036, - "loss": 0.0531, + "epoch": 0.36, + "learning_rate": 0.00024546493090740106, + "loss": 0.0558, "step": 56330 }, { - "epoch": 0.61, - "learning_rate": 0.00020859238107599453, - "loss": 0.056, + "epoch": 0.36, + "learning_rate": 0.00024545524955304414, + "loss": 0.0588, "step": 56340 }, { - "epoch": 0.61, - "learning_rate": 0.0002085761567914855, - "loss": 0.0471, + "epoch": 0.36, + "learning_rate": 0.0002454455681986872, + "loss": 0.0569, "step": 56350 }, { - "epoch": 0.61, - "learning_rate": 0.00020855993250697643, - "loss": 0.0474, + "epoch": 0.36, + "learning_rate": 0.00024543588684433024, + "loss": 0.0529, "step": 56360 }, { - "epoch": 0.61, - "learning_rate": 0.00020854370822246738, - "loss": 0.0539, + "epoch": 0.36, + "learning_rate": 0.0002454262054899733, + "loss": 0.0615, "step": 56370 }, { - "epoch": 0.61, - "learning_rate": 0.00020852748393795833, - "loss": 0.0564, + "epoch": 0.36, + "learning_rate": 0.0002454165241356164, + "loss": 0.0686, "step": 56380 }, { - "epoch": 0.61, - "learning_rate": 0.00020851125965344928, - "loss": 0.0456, + "epoch": 0.36, + "learning_rate": 0.00024540684278125943, + "loss": 0.0568, "step": 56390 }, { - "epoch": 0.61, - "learning_rate": 0.0002084950353689402, - "loss": 0.0566, + "epoch": 0.36, + "learning_rate": 0.0002453971614269025, + "loss": 0.06, "step": 56400 }, { - "epoch": 0.61, - "learning_rate": 0.00020847881108443118, - "loss": 0.0565, + "epoch": 0.36, + "learning_rate": 0.0002453874800725456, + "loss": 0.0643, "step": 56410 }, { - "epoch": 0.61, - "learning_rate": 0.0002084625867999221, - "loss": 0.057, + "epoch": 0.36, + "learning_rate": 0.00024537779871818867, + "loss": 0.0619, "step": 56420 }, { - "epoch": 0.61, - "learning_rate": 0.00020844636251541308, - "loss": 0.0578, + "epoch": 0.36, + "learning_rate": 0.00024536811736383175, + "loss": 0.0638, "step": 56430 }, { - "epoch": 0.61, - "learning_rate": 0.000208430138230904, - "loss": 0.0579, + "epoch": 0.36, + "learning_rate": 0.0002453584360094748, + "loss": 0.0614, "step": 56440 }, { - "epoch": 0.61, - "learning_rate": 0.00020841391394639495, - "loss": 0.0507, + "epoch": 0.36, + "learning_rate": 0.00024534875465511785, + "loss": 0.0599, "step": 56450 }, { - "epoch": 0.61, - "learning_rate": 0.0002083976896618859, - "loss": 0.0567, + "epoch": 0.36, + "learning_rate": 0.00024533907330076093, + "loss": 0.0585, "step": 56460 }, { - "epoch": 0.61, - "learning_rate": 0.00020838146537737685, - "loss": 0.0536, + "epoch": 0.36, + "learning_rate": 0.000245329391946404, + "loss": 0.0612, "step": 56470 }, { - "epoch": 0.61, - "learning_rate": 0.0002083652410928678, - "loss": 0.0537, + "epoch": 0.36, + "learning_rate": 0.0002453197105920471, + "loss": 0.0631, "step": 56480 }, { - "epoch": 0.61, - "learning_rate": 0.00020834901680835875, - "loss": 0.0537, + "epoch": 0.36, + "learning_rate": 0.0002453100292376901, + "loss": 0.0605, "step": 56490 }, { - "epoch": 0.61, - "learning_rate": 0.00020833279252384967, - "loss": 0.0518, + "epoch": 0.36, + "learning_rate": 0.0002453003478833332, + "loss": 0.0557, "step": 56500 }, { - "epoch": 0.61, - "learning_rate": 0.00020831656823934065, - "loss": 0.0464, + "epoch": 0.36, + "learning_rate": 0.0002452906665289763, + "loss": 0.0622, "step": 56510 }, { - "epoch": 0.61, - "learning_rate": 0.00020830034395483157, - "loss": 0.0637, + "epoch": 0.36, + "learning_rate": 0.0002452809851746193, + "loss": 0.0671, "step": 56520 }, { - "epoch": 0.61, - "learning_rate": 0.00020828411967032255, - "loss": 0.0505, + "epoch": 0.36, + "learning_rate": 0.0002452713038202624, + "loss": 0.0633, "step": 56530 }, { - "epoch": 0.61, - "learning_rate": 0.00020826789538581347, - "loss": 0.0573, + "epoch": 0.36, + "learning_rate": 0.00024526162246590546, + "loss": 0.058, "step": 56540 }, { - "epoch": 0.61, - "learning_rate": 0.00020825167110130442, - "loss": 0.0528, + "epoch": 0.36, + "learning_rate": 0.00024525194111154854, + "loss": 0.0534, "step": 56550 }, { - "epoch": 0.61, - "learning_rate": 0.00020823544681679537, - "loss": 0.0504, + "epoch": 0.37, + "learning_rate": 0.0002452422597571916, + "loss": 0.0614, "step": 56560 }, { - "epoch": 0.61, - "learning_rate": 0.00020821922253228632, - "loss": 0.0542, + "epoch": 0.37, + "learning_rate": 0.0002452325784028347, + "loss": 0.0544, "step": 56570 }, { - "epoch": 0.61, - "learning_rate": 0.00020820299824777724, - "loss": 0.0459, + "epoch": 0.37, + "learning_rate": 0.0002452228970484778, + "loss": 0.0534, "step": 56580 }, { - "epoch": 0.61, - "learning_rate": 0.00020818677396326822, - "loss": 0.0501, + "epoch": 0.37, + "learning_rate": 0.0002452132156941208, + "loss": 0.0628, "step": 56590 }, { - "epoch": 0.61, - "learning_rate": 0.00020817054967875914, - "loss": 0.0573, + "epoch": 0.37, + "learning_rate": 0.0002452035343397639, + "loss": 0.0588, "step": 56600 }, { - "epoch": 0.61, - "learning_rate": 0.00020815432539425012, - "loss": 0.0531, + "epoch": 0.37, + "learning_rate": 0.00024519385298540697, + "loss": 0.0626, "step": 56610 }, { - "epoch": 0.61, - "learning_rate": 0.00020813810110974104, - "loss": 0.05, + "epoch": 0.37, + "learning_rate": 0.00024518417163105005, + "loss": 0.0773, "step": 56620 }, { - "epoch": 0.61, - "learning_rate": 0.000208121876825232, - "loss": 0.0506, + "epoch": 0.37, + "learning_rate": 0.00024517449027669307, + "loss": 0.059, "step": 56630 }, { - "epoch": 0.61, - "learning_rate": 0.00020810565254072294, - "loss": 0.049, - "step": 56640 + "epoch": 0.37, + "learning_rate": 0.00024516480892233615, + "loss": 0.0577, + "step": 56640 }, { - "epoch": 0.61, - "learning_rate": 0.0002080894282562139, - "loss": 0.0505, + "epoch": 0.37, + "learning_rate": 0.00024515512756797923, + "loss": 0.0667, "step": 56650 }, { - "epoch": 0.61, - "learning_rate": 0.00020807320397170484, - "loss": 0.0399, + "epoch": 0.37, + "learning_rate": 0.00024514544621362226, + "loss": 0.0684, "step": 56660 }, { - "epoch": 0.61, - "learning_rate": 0.0002080569796871958, - "loss": 0.0497, + "epoch": 0.37, + "learning_rate": 0.00024513576485926534, + "loss": 0.0576, "step": 56670 }, { - "epoch": 0.61, - "learning_rate": 0.0002080407554026867, - "loss": 0.0505, + "epoch": 0.37, + "learning_rate": 0.0002451260835049084, + "loss": 0.0606, "step": 56680 }, { - "epoch": 0.61, - "learning_rate": 0.0002080245311181777, - "loss": 0.054, + "epoch": 0.37, + "learning_rate": 0.0002451164021505515, + "loss": 0.0621, "step": 56690 }, { - "epoch": 0.61, - "learning_rate": 0.0002080083068336686, - "loss": 0.0519, + "epoch": 0.37, + "learning_rate": 0.0002451067207961946, + "loss": 0.058, "step": 56700 }, { - "epoch": 0.61, - "learning_rate": 0.0002079920825491596, - "loss": 0.0473, + "epoch": 0.37, + "learning_rate": 0.00024509703944183766, + "loss": 0.0642, "step": 56710 }, { - "epoch": 0.61, - "learning_rate": 0.0002079758582646505, - "loss": 0.0637, + "epoch": 0.37, + "learning_rate": 0.00024508735808748074, + "loss": 0.0621, "step": 56720 }, { - "epoch": 0.61, - "learning_rate": 0.00020795963398014146, - "loss": 0.053, + "epoch": 0.37, + "learning_rate": 0.00024507767673312376, + "loss": 0.0601, "step": 56730 }, { - "epoch": 0.61, - "learning_rate": 0.0002079434096956324, - "loss": 0.0571, + "epoch": 0.37, + "learning_rate": 0.00024506799537876684, + "loss": 0.0625, "step": 56740 }, { - "epoch": 0.61, - "learning_rate": 0.00020792718541112336, - "loss": 0.053, + "epoch": 0.37, + "learning_rate": 0.0002450583140244099, + "loss": 0.0592, "step": 56750 }, { - "epoch": 0.61, - "learning_rate": 0.00020791096112661428, - "loss": 0.047, + "epoch": 0.37, + "learning_rate": 0.00024504863267005295, + "loss": 0.0589, "step": 56760 }, { - "epoch": 0.61, - "learning_rate": 0.00020789473684210526, - "loss": 0.0473, + "epoch": 0.37, + "learning_rate": 0.000245038951315696, + "loss": 0.0514, "step": 56770 }, { - "epoch": 0.61, - "learning_rate": 0.00020787851255759618, - "loss": 0.0572, + "epoch": 0.37, + "learning_rate": 0.0002450292699613391, + "loss": 0.0626, "step": 56780 }, { - "epoch": 0.61, - "learning_rate": 0.00020786228827308716, - "loss": 0.0517, + "epoch": 0.37, + "learning_rate": 0.0002450195886069822, + "loss": 0.0577, "step": 56790 }, { - "epoch": 0.61, - "learning_rate": 0.00020784606398857808, - "loss": 0.0564, + "epoch": 0.37, + "learning_rate": 0.0002450099072526252, + "loss": 0.0614, "step": 56800 }, { - "epoch": 0.61, - "learning_rate": 0.00020782983970406903, - "loss": 0.0536, + "epoch": 0.37, + "learning_rate": 0.0002450002258982683, + "loss": 0.0604, "step": 56810 }, { - "epoch": 0.61, - "learning_rate": 0.00020781361541955998, - "loss": 0.0465, + "epoch": 0.37, + "learning_rate": 0.00024499054454391137, + "loss": 0.062, "step": 56820 }, { - "epoch": 0.61, - "learning_rate": 0.00020779739113505093, - "loss": 0.0597, + "epoch": 0.37, + "learning_rate": 0.00024498086318955445, + "loss": 0.0593, "step": 56830 }, { - "epoch": 0.61, - "learning_rate": 0.00020778116685054188, - "loss": 0.0475, + "epoch": 0.37, + "learning_rate": 0.00024497118183519753, + "loss": 0.063, "step": 56840 }, { - "epoch": 0.61, - "learning_rate": 0.00020776494256603283, - "loss": 0.0509, + "epoch": 0.37, + "learning_rate": 0.0002449615004808406, + "loss": 0.0589, "step": 56850 }, { - "epoch": 0.62, - "learning_rate": 0.00020774871828152375, - "loss": 0.0479, + "epoch": 0.37, + "learning_rate": 0.00024495181912648364, + "loss": 0.0617, "step": 56860 }, { - "epoch": 0.62, - "learning_rate": 0.00020773249399701473, - "loss": 0.0543, + "epoch": 0.37, + "learning_rate": 0.0002449421377721267, + "loss": 0.0608, "step": 56870 }, { - "epoch": 0.62, - "learning_rate": 0.00020771626971250565, - "loss": 0.0502, + "epoch": 0.37, + "learning_rate": 0.0002449324564177698, + "loss": 0.0583, "step": 56880 }, { - "epoch": 0.62, - "learning_rate": 0.00020770004542799663, - "loss": 0.0493, + "epoch": 0.37, + "learning_rate": 0.0002449227750634128, + "loss": 0.0567, "step": 56890 }, { - "epoch": 0.62, - "learning_rate": 0.00020768382114348755, - "loss": 0.0556, + "epoch": 0.37, + "learning_rate": 0.0002449130937090559, + "loss": 0.0626, "step": 56900 }, { - "epoch": 0.62, - "learning_rate": 0.0002076675968589785, - "loss": 0.0528, + "epoch": 0.37, + "learning_rate": 0.000244903412354699, + "loss": 0.056, "step": 56910 }, { - "epoch": 0.62, - "learning_rate": 0.00020765137257446945, - "loss": 0.0592, + "epoch": 0.37, + "learning_rate": 0.00024489373100034206, + "loss": 0.0546, "step": 56920 }, { - "epoch": 0.62, - "learning_rate": 0.0002076351482899604, - "loss": 0.0524, + "epoch": 0.37, + "learning_rate": 0.00024488404964598514, + "loss": 0.0562, "step": 56930 }, { - "epoch": 0.62, - "learning_rate": 0.00020761892400545133, - "loss": 0.0499, + "epoch": 0.37, + "learning_rate": 0.00024487436829162817, + "loss": 0.0504, "step": 56940 }, { - "epoch": 0.62, - "learning_rate": 0.0002076026997209423, - "loss": 0.0575, + "epoch": 0.37, + "learning_rate": 0.00024486468693727125, + "loss": 0.0507, "step": 56950 }, { - "epoch": 0.62, - "learning_rate": 0.00020758647543643322, - "loss": 0.0528, + "epoch": 0.37, + "learning_rate": 0.0002448550055829143, + "loss": 0.0567, "step": 56960 }, { - "epoch": 0.62, - "learning_rate": 0.0002075702511519242, - "loss": 0.0536, + "epoch": 0.37, + "learning_rate": 0.0002448453242285574, + "loss": 0.0596, "step": 56970 }, { - "epoch": 0.62, - "learning_rate": 0.00020755402686741512, - "loss": 0.0521, + "epoch": 0.37, + "learning_rate": 0.0002448356428742005, + "loss": 0.0588, "step": 56980 }, { - "epoch": 0.62, - "learning_rate": 0.00020753780258290607, - "loss": 0.053, + "epoch": 0.37, + "learning_rate": 0.00024482596151984356, + "loss": 0.0612, "step": 56990 }, { - "epoch": 0.62, - "learning_rate": 0.00020752157829839702, - "loss": 0.0481, + "epoch": 0.37, + "learning_rate": 0.0002448162801654866, + "loss": 0.0602, "step": 57000 }, { - "epoch": 0.62, - "eval_cer": 0.9213177698735381, - "eval_loss": 0.03662886098027229, - "eval_runtime": 118.8577, - "eval_samples_per_second": 16.827, - "eval_steps_per_second": 4.207, + "epoch": 0.37, + "eval_cer": 0.9200777313297932, + "eval_loss": 0.04003721475601196, + "eval_runtime": 120.0958, + "eval_samples_per_second": 16.653, + "eval_steps_per_second": 4.163, "step": 57000 }, { - "epoch": 0.62, - "learning_rate": 0.00020750535401388797, - "loss": 0.0543, + "epoch": 0.37, + "learning_rate": 0.00024480659881112967, + "loss": 0.067, "step": 57010 }, { - "epoch": 0.62, - "learning_rate": 0.00020748912972937892, - "loss": 0.0506, + "epoch": 0.37, + "learning_rate": 0.00024479691745677275, + "loss": 0.0599, "step": 57020 }, { - "epoch": 0.62, - "learning_rate": 0.00020747290544486987, - "loss": 0.066, + "epoch": 0.37, + "learning_rate": 0.0002447872361024158, + "loss": 0.0546, "step": 57030 }, { - "epoch": 0.62, - "learning_rate": 0.0002074566811603608, - "loss": 0.0477, + "epoch": 0.37, + "learning_rate": 0.00024477755474805885, + "loss": 0.0567, "step": 57040 }, { - "epoch": 0.62, - "learning_rate": 0.00020744045687585177, - "loss": 0.057, + "epoch": 0.37, + "learning_rate": 0.00024476787339370193, + "loss": 0.0594, "step": 57050 }, { - "epoch": 0.62, - "learning_rate": 0.0002074242325913427, - "loss": 0.0578, + "epoch": 0.37, + "learning_rate": 0.000244758192039345, + "loss": 0.0585, "step": 57060 }, { - "epoch": 0.62, - "learning_rate": 0.00020740800830683367, - "loss": 0.0584, + "epoch": 0.37, + "learning_rate": 0.0002447485106849881, + "loss": 0.0665, "step": 57070 }, { - "epoch": 0.62, - "learning_rate": 0.0002073917840223246, - "loss": 0.0518, + "epoch": 0.37, + "learning_rate": 0.0002447388293306311, + "loss": 0.0604, "step": 57080 }, { - "epoch": 0.62, - "learning_rate": 0.00020737555973781554, - "loss": 0.0495, + "epoch": 0.37, + "learning_rate": 0.0002447291479762742, + "loss": 0.0536, "step": 57090 }, { - "epoch": 0.62, - "learning_rate": 0.0002073593354533065, - "loss": 0.0545, + "epoch": 0.37, + "learning_rate": 0.0002447194666219173, + "loss": 0.0561, "step": 57100 }, { - "epoch": 0.62, - "learning_rate": 0.00020734311116879744, - "loss": 0.0513, + "epoch": 0.37, + "learning_rate": 0.00024470978526756036, + "loss": 0.0694, "step": 57110 }, { - "epoch": 0.62, - "learning_rate": 0.00020732688688428837, - "loss": 0.0567, + "epoch": 0.37, + "learning_rate": 0.00024470010391320344, + "loss": 0.0653, "step": 57120 }, { - "epoch": 0.62, - "learning_rate": 0.00020731066259977934, - "loss": 0.0564, + "epoch": 0.37, + "learning_rate": 0.00024469042255884646, + "loss": 0.0602, "step": 57130 }, { - "epoch": 0.62, - "learning_rate": 0.00020729443831527027, - "loss": 0.0641, + "epoch": 0.37, + "learning_rate": 0.00024468074120448954, + "loss": 0.0581, "step": 57140 }, { - "epoch": 0.62, - "learning_rate": 0.00020727821403076124, - "loss": 0.0428, + "epoch": 0.37, + "learning_rate": 0.0002446710598501326, + "loss": 0.0664, "step": 57150 }, { - "epoch": 0.62, - "learning_rate": 0.00020726198974625217, - "loss": 0.0547, + "epoch": 0.37, + "learning_rate": 0.00024466137849577565, + "loss": 0.0661, "step": 57160 }, { - "epoch": 0.62, - "learning_rate": 0.00020724576546174314, - "loss": 0.0586, + "epoch": 0.37, + "learning_rate": 0.00024465169714141873, + "loss": 0.0637, "step": 57170 }, { - "epoch": 0.62, - "learning_rate": 0.00020722954117723407, - "loss": 0.0596, + "epoch": 0.37, + "learning_rate": 0.0002446420157870618, + "loss": 0.0643, "step": 57180 }, { - "epoch": 0.62, - "learning_rate": 0.00020721331689272502, - "loss": 0.0513, + "epoch": 0.37, + "learning_rate": 0.0002446323344327049, + "loss": 0.0629, "step": 57190 }, { - "epoch": 0.62, - "learning_rate": 0.00020719709260821597, - "loss": 0.0459, + "epoch": 0.37, + "learning_rate": 0.00024462265307834797, + "loss": 0.0567, "step": 57200 }, { - "epoch": 0.62, - "learning_rate": 0.00020718086832370692, - "loss": 0.0566, + "epoch": 0.37, + "learning_rate": 0.00024461297172399105, + "loss": 0.0586, "step": 57210 }, { - "epoch": 0.62, - "learning_rate": 0.00020716464403919784, - "loss": 0.0505, + "epoch": 0.37, + "learning_rate": 0.0002446032903696341, + "loss": 0.0562, "step": 57220 }, { - "epoch": 0.62, - "learning_rate": 0.00020714841975468881, - "loss": 0.0455, + "epoch": 0.37, + "learning_rate": 0.00024459360901527715, + "loss": 0.0598, "step": 57230 }, { - "epoch": 0.62, - "learning_rate": 0.00020713219547017974, - "loss": 0.0533, + "epoch": 0.37, + "learning_rate": 0.00024458392766092023, + "loss": 0.0574, "step": 57240 }, { - "epoch": 0.62, - "learning_rate": 0.00020711597118567071, - "loss": 0.0497, + "epoch": 0.37, + "learning_rate": 0.0002445742463065633, + "loss": 0.0642, "step": 57250 }, { - "epoch": 0.62, - "learning_rate": 0.00020709974690116164, - "loss": 0.0501, + "epoch": 0.37, + "learning_rate": 0.00024456456495220634, + "loss": 0.0589, "step": 57260 }, { - "epoch": 0.62, - "learning_rate": 0.0002070835226166526, - "loss": 0.0499, + "epoch": 0.37, + "learning_rate": 0.0002445548835978494, + "loss": 0.0549, "step": 57270 }, { - "epoch": 0.62, - "learning_rate": 0.00020706729833214354, - "loss": 0.0603, + "epoch": 0.37, + "learning_rate": 0.0002445452022434925, + "loss": 0.0693, "step": 57280 }, { - "epoch": 0.62, - "learning_rate": 0.00020705107404763449, - "loss": 0.0516, + "epoch": 0.37, + "learning_rate": 0.0002445355208891355, + "loss": 0.0637, "step": 57290 }, { - "epoch": 0.62, - "learning_rate": 0.0002070348497631254, - "loss": 0.0606, + "epoch": 0.37, + "learning_rate": 0.0002445258395347786, + "loss": 0.0545, "step": 57300 }, { - "epoch": 0.62, - "learning_rate": 0.00020701862547861639, - "loss": 0.0541, + "epoch": 0.37, + "learning_rate": 0.0002445161581804217, + "loss": 0.0526, "step": 57310 }, { - "epoch": 0.62, - "learning_rate": 0.0002070024011941073, - "loss": 0.0543, + "epoch": 0.37, + "learning_rate": 0.00024450647682606476, + "loss": 0.0638, "step": 57320 }, { - "epoch": 0.62, - "learning_rate": 0.00020698617690959829, - "loss": 0.0519, + "epoch": 0.37, + "learning_rate": 0.00024449679547170784, + "loss": 0.0517, "step": 57330 }, { - "epoch": 0.62, - "learning_rate": 0.0002069699526250892, - "loss": 0.0578, + "epoch": 0.37, + "learning_rate": 0.0002444871141173509, + "loss": 0.0654, "step": 57340 }, { - "epoch": 0.62, - "learning_rate": 0.00020695372834058018, - "loss": 0.0495, + "epoch": 0.37, + "learning_rate": 0.000244477432762994, + "loss": 0.0577, "step": 57350 }, { - "epoch": 0.62, - "learning_rate": 0.0002069375040560711, - "loss": 0.0511, + "epoch": 0.37, + "learning_rate": 0.00024446775140863703, + "loss": 0.0579, "step": 57360 }, { - "epoch": 0.62, - "learning_rate": 0.00020692127977156206, - "loss": 0.0561, + "epoch": 0.37, + "learning_rate": 0.0002444580700542801, + "loss": 0.0748, "step": 57370 }, { - "epoch": 0.62, - "learning_rate": 0.000206905055487053, - "loss": 0.0505, + "epoch": 0.37, + "learning_rate": 0.0002444483886999232, + "loss": 0.0589, "step": 57380 }, { - "epoch": 0.62, - "learning_rate": 0.00020688883120254396, - "loss": 0.0634, + "epoch": 0.37, + "learning_rate": 0.00024443870734556627, + "loss": 0.0572, "step": 57390 }, { - "epoch": 0.62, - "learning_rate": 0.00020687260691803488, - "loss": 0.0565, + "epoch": 0.37, + "learning_rate": 0.0002444290259912093, + "loss": 0.0628, "step": 57400 }, { - "epoch": 0.62, - "learning_rate": 0.00020685638263352586, - "loss": 0.0534, + "epoch": 0.37, + "learning_rate": 0.0002444193446368524, + "loss": 0.0634, "step": 57410 }, { - "epoch": 0.62, - "learning_rate": 0.00020684015834901678, - "loss": 0.0532, + "epoch": 0.37, + "learning_rate": 0.00024440966328249545, + "loss": 0.078, "step": 57420 }, { - "epoch": 0.62, - "learning_rate": 0.00020682393406450776, - "loss": 0.0675, + "epoch": 0.37, + "learning_rate": 0.0002443999819281385, + "loss": 0.0672, "step": 57430 }, { - "epoch": 0.62, - "learning_rate": 0.00020680770977999868, - "loss": 0.0562, + "epoch": 0.37, + "learning_rate": 0.00024439030057378156, + "loss": 0.0632, "step": 57440 }, { - "epoch": 0.62, - "learning_rate": 0.00020679148549548963, - "loss": 0.0498, + "epoch": 0.37, + "learning_rate": 0.00024438061921942464, + "loss": 0.0533, "step": 57450 }, { - "epoch": 0.62, - "learning_rate": 0.00020677526121098058, - "loss": 0.0552, + "epoch": 0.37, + "learning_rate": 0.0002443709378650677, + "loss": 0.0567, "step": 57460 }, { - "epoch": 0.62, - "learning_rate": 0.00020675903692647153, - "loss": 0.0554, + "epoch": 0.37, + "learning_rate": 0.0002443612565107108, + "loss": 0.0706, "step": 57470 }, { - "epoch": 0.62, - "learning_rate": 0.00020674281264196245, - "loss": 0.0619, + "epoch": 0.37, + "learning_rate": 0.0002443515751563539, + "loss": 0.0631, "step": 57480 }, { - "epoch": 0.62, - "learning_rate": 0.00020672658835745343, - "loss": 0.0534, + "epoch": 0.37, + "learning_rate": 0.00024434189380199696, + "loss": 0.0604, "step": 57490 }, { - "epoch": 0.62, - "learning_rate": 0.00020671036407294435, - "loss": 0.0557, + "epoch": 0.37, + "learning_rate": 0.00024433221244764, + "loss": 0.0618, "step": 57500 }, { - "epoch": 0.62, - "learning_rate": 0.00020669413978843533, - "loss": 0.0536, + "epoch": 0.37, + "learning_rate": 0.00024432253109328306, + "loss": 0.056, "step": 57510 }, { - "epoch": 0.62, - "learning_rate": 0.00020667791550392625, - "loss": 0.0458, + "epoch": 0.37, + "learning_rate": 0.00024431284973892614, + "loss": 0.0641, "step": 57520 }, { - "epoch": 0.62, - "learning_rate": 0.00020666169121941723, - "loss": 0.0549, + "epoch": 0.37, + "learning_rate": 0.00024430316838456917, + "loss": 0.0649, "step": 57530 }, { - "epoch": 0.62, - "learning_rate": 0.00020664546693490815, - "loss": 0.0652, + "epoch": 0.37, + "learning_rate": 0.00024429348703021225, + "loss": 0.0651, "step": 57540 }, { - "epoch": 0.62, - "learning_rate": 0.0002066292426503991, - "loss": 0.0521, + "epoch": 0.37, + "learning_rate": 0.00024428380567585533, + "loss": 0.0656, "step": 57550 }, { - "epoch": 0.62, - "learning_rate": 0.00020661301836589005, - "loss": 0.0453, + "epoch": 0.37, + "learning_rate": 0.0002442741243214984, + "loss": 0.0667, "step": 57560 }, { - "epoch": 0.62, - "learning_rate": 0.000206596794081381, - "loss": 0.0555, + "epoch": 0.37, + "learning_rate": 0.00024426444296714143, + "loss": 0.0593, "step": 57570 }, { - "epoch": 0.62, - "learning_rate": 0.00020658056979687192, - "loss": 0.052, + "epoch": 0.37, + "learning_rate": 0.0002442547616127845, + "loss": 0.0585, "step": 57580 }, { - "epoch": 0.62, - "learning_rate": 0.0002065643455123629, - "loss": 0.0539, + "epoch": 0.37, + "learning_rate": 0.0002442450802584276, + "loss": 0.0609, "step": 57590 }, { - "epoch": 0.62, - "learning_rate": 0.00020654812122785382, - "loss": 0.0579, + "epoch": 0.37, + "learning_rate": 0.00024423539890407067, + "loss": 0.0558, "step": 57600 }, { - "epoch": 0.62, - "learning_rate": 0.0002065318969433448, - "loss": 0.051, + "epoch": 0.37, + "learning_rate": 0.00024422571754971375, + "loss": 0.0668, "step": 57610 }, { - "epoch": 0.62, - "learning_rate": 0.00020651567265883572, - "loss": 0.053, + "epoch": 0.37, + "learning_rate": 0.00024421603619535683, + "loss": 0.0618, "step": 57620 }, { - "epoch": 0.62, - "learning_rate": 0.00020649944837432667, - "loss": 0.056, + "epoch": 0.37, + "learning_rate": 0.00024420635484099986, + "loss": 0.0709, "step": 57630 }, { - "epoch": 0.62, - "learning_rate": 0.00020648322408981762, - "loss": 0.053, + "epoch": 0.37, + "learning_rate": 0.00024419667348664294, + "loss": 0.0569, "step": 57640 }, { - "epoch": 0.62, - "learning_rate": 0.00020646699980530857, - "loss": 0.0534, + "epoch": 0.37, + "learning_rate": 0.000244186992132286, + "loss": 0.0627, "step": 57650 }, { - "epoch": 0.62, - "learning_rate": 0.0002064507755207995, - "loss": 0.0515, + "epoch": 0.37, + "learning_rate": 0.00024417731077792904, + "loss": 0.0575, "step": 57660 }, { - "epoch": 0.62, - "learning_rate": 0.00020643455123629047, - "loss": 0.0502, + "epoch": 0.37, + "learning_rate": 0.0002441676294235721, + "loss": 0.0518, "step": 57670 }, { - "epoch": 0.62, - "learning_rate": 0.0002064183269517814, - "loss": 0.0506, + "epoch": 0.37, + "learning_rate": 0.0002441579480692152, + "loss": 0.061, "step": 57680 }, { - "epoch": 0.62, - "learning_rate": 0.00020640210266727237, - "loss": 0.0425, + "epoch": 0.37, + "learning_rate": 0.0002441482667148583, + "loss": 0.0669, "step": 57690 }, { - "epoch": 0.62, - "learning_rate": 0.0002063858783827633, - "loss": 0.0539, + "epoch": 0.37, + "learning_rate": 0.00024413858536050136, + "loss": 0.0571, "step": 57700 }, { - "epoch": 0.62, - "learning_rate": 0.00020636965409825427, - "loss": 0.0545, + "epoch": 0.37, + "learning_rate": 0.0002441289040061444, + "loss": 0.062, "step": 57710 }, { - "epoch": 0.62, - "learning_rate": 0.0002063534298137452, - "loss": 0.0508, + "epoch": 0.37, + "learning_rate": 0.00024411922265178747, + "loss": 0.0673, "step": 57720 }, { - "epoch": 0.62, - "learning_rate": 0.00020633720552923614, - "loss": 0.0465, + "epoch": 0.37, + "learning_rate": 0.00024410954129743055, + "loss": 0.0594, "step": 57730 }, { - "epoch": 0.62, - "learning_rate": 0.0002063209812447271, - "loss": 0.0525, + "epoch": 0.37, + "learning_rate": 0.00024409985994307363, + "loss": 0.0543, "step": 57740 }, { - "epoch": 0.62, - "learning_rate": 0.00020630475696021804, - "loss": 0.0487, + "epoch": 0.37, + "learning_rate": 0.00024409017858871668, + "loss": 0.0597, "step": 57750 }, { - "epoch": 0.62, - "learning_rate": 0.00020628853267570896, - "loss": 0.0518, + "epoch": 0.37, + "learning_rate": 0.00024408049723435976, + "loss": 0.0634, "step": 57760 }, { - "epoch": 0.62, - "learning_rate": 0.00020627230839119994, - "loss": 0.0452, + "epoch": 0.37, + "learning_rate": 0.00024407081588000284, + "loss": 0.0595, "step": 57770 }, { - "epoch": 0.62, - "learning_rate": 0.00020625608410669086, - "loss": 0.0513, + "epoch": 0.37, + "learning_rate": 0.00024406113452564587, + "loss": 0.0607, "step": 57780 }, { - "epoch": 0.63, - "learning_rate": 0.00020623985982218184, - "loss": 0.0538, + "epoch": 0.37, + "learning_rate": 0.00024405145317128894, + "loss": 0.0588, "step": 57790 }, { - "epoch": 0.63, - "learning_rate": 0.00020622363553767276, - "loss": 0.0493, + "epoch": 0.37, + "learning_rate": 0.00024404177181693202, + "loss": 0.0649, "step": 57800 }, { - "epoch": 0.63, - "learning_rate": 0.0002062074112531637, - "loss": 0.0541, + "epoch": 0.37, + "learning_rate": 0.0002440320904625751, + "loss": 0.0719, "step": 57810 }, { - "epoch": 0.63, - "learning_rate": 0.00020619118696865466, - "loss": 0.0532, + "epoch": 0.37, + "learning_rate": 0.00024402240910821816, + "loss": 0.0612, "step": 57820 }, { - "epoch": 0.63, - "learning_rate": 0.0002061749626841456, - "loss": 0.048, + "epoch": 0.37, + "learning_rate": 0.00024401272775386124, + "loss": 0.0499, "step": 57830 }, { - "epoch": 0.63, - "learning_rate": 0.00020615873839963653, - "loss": 0.0535, + "epoch": 0.37, + "learning_rate": 0.00024400304639950432, + "loss": 0.0552, "step": 57840 }, { - "epoch": 0.63, - "learning_rate": 0.0002061425141151275, - "loss": 0.0517, + "epoch": 0.37, + "learning_rate": 0.00024399336504514734, + "loss": 0.0534, "step": 57850 }, { - "epoch": 0.63, - "learning_rate": 0.00020612628983061843, - "loss": 0.053, + "epoch": 0.37, + "learning_rate": 0.00024398368369079042, + "loss": 0.0544, "step": 57860 }, { - "epoch": 0.63, - "learning_rate": 0.0002061100655461094, - "loss": 0.0454, + "epoch": 0.37, + "learning_rate": 0.0002439740023364335, + "loss": 0.0556, "step": 57870 }, { - "epoch": 0.63, - "learning_rate": 0.00020609384126160033, - "loss": 0.0603, + "epoch": 0.37, + "learning_rate": 0.00024396432098207655, + "loss": 0.0612, "step": 57880 }, { - "epoch": 0.63, - "learning_rate": 0.0002060776169770913, - "loss": 0.0518, + "epoch": 0.37, + "learning_rate": 0.00024395463962771963, + "loss": 0.0611, "step": 57890 }, { - "epoch": 0.63, - "learning_rate": 0.00020606139269258223, - "loss": 0.0482, + "epoch": 0.37, + "learning_rate": 0.00024394495827336271, + "loss": 0.0531, "step": 57900 }, { - "epoch": 0.63, - "learning_rate": 0.00020604516840807318, - "loss": 0.0476, - "step": 57910 + "epoch": 0.37, + "learning_rate": 0.0002439352769190058, + "loss": 0.0552, + "step": 57910 }, { - "epoch": 0.63, - "learning_rate": 0.00020602894412356413, - "loss": 0.0577, + "epoch": 0.37, + "learning_rate": 0.00024392559556464882, + "loss": 0.0553, "step": 57920 }, { - "epoch": 0.63, - "learning_rate": 0.00020601271983905508, - "loss": 0.0506, + "epoch": 0.37, + "learning_rate": 0.0002439159142102919, + "loss": 0.056, "step": 57930 }, { - "epoch": 0.63, - "learning_rate": 0.000205996495554546, - "loss": 0.0499, + "epoch": 0.37, + "learning_rate": 0.00024390623285593498, + "loss": 0.0637, "step": 57940 }, { - "epoch": 0.63, - "learning_rate": 0.00020598027127003698, - "loss": 0.0509, + "epoch": 0.37, + "learning_rate": 0.00024389655150157803, + "loss": 0.0628, "step": 57950 }, { - "epoch": 0.63, - "learning_rate": 0.0002059640469855279, - "loss": 0.0521, + "epoch": 0.37, + "learning_rate": 0.0002438868701472211, + "loss": 0.0542, "step": 57960 }, { - "epoch": 0.63, - "learning_rate": 0.00020594782270101888, - "loss": 0.0479, + "epoch": 0.37, + "learning_rate": 0.0002438771887928642, + "loss": 0.0644, "step": 57970 }, { - "epoch": 0.63, - "learning_rate": 0.0002059315984165098, - "loss": 0.0561, + "epoch": 0.37, + "learning_rate": 0.00024386750743850727, + "loss": 0.073, "step": 57980 }, { - "epoch": 0.63, - "learning_rate": 0.00020591537413200075, - "loss": 0.0548, + "epoch": 0.37, + "learning_rate": 0.0002438578260841503, + "loss": 0.0717, "step": 57990 }, { - "epoch": 0.63, - "learning_rate": 0.0002058991498474917, - "loss": 0.0581, + "epoch": 0.37, + "learning_rate": 0.00024384814472979338, + "loss": 0.0707, "step": 58000 }, { - "epoch": 0.63, - "eval_cer": 0.921205567364796, - "eval_loss": 0.03674168139696121, - "eval_runtime": 118.9546, - "eval_samples_per_second": 16.813, - "eval_steps_per_second": 4.203, + "epoch": 0.37, + "eval_cer": 0.9200162693480962, + "eval_loss": 0.03994331881403923, + "eval_runtime": 120.3621, + "eval_samples_per_second": 16.617, + "eval_steps_per_second": 4.154, "step": 58000 }, { - "epoch": 0.63, - "learning_rate": 0.00020588292556298265, - "loss": 0.0461, + "epoch": 0.37, + "learning_rate": 0.00024383846337543646, + "loss": 0.0753, "step": 58010 }, { - "epoch": 0.63, - "learning_rate": 0.0002058667012784736, - "loss": 0.055, + "epoch": 0.37, + "learning_rate": 0.0002438287820210795, + "loss": 0.0633, "step": 58020 }, { - "epoch": 0.63, - "learning_rate": 0.00020585047699396455, - "loss": 0.0559, + "epoch": 0.37, + "learning_rate": 0.0002438191006667226, + "loss": 0.0555, "step": 58030 }, { - "epoch": 0.63, - "learning_rate": 0.00020583425270945547, - "loss": 0.0463, + "epoch": 0.37, + "learning_rate": 0.00024380941931236567, + "loss": 0.0604, "step": 58040 }, { - "epoch": 0.63, - "learning_rate": 0.00020581802842494645, - "loss": 0.0478, + "epoch": 0.37, + "learning_rate": 0.00024379973795800872, + "loss": 0.0606, "step": 58050 }, { - "epoch": 0.63, - "learning_rate": 0.00020580180414043737, - "loss": 0.0561, + "epoch": 0.37, + "learning_rate": 0.00024379005660365177, + "loss": 0.0616, "step": 58060 }, { - "epoch": 0.63, - "learning_rate": 0.00020578557985592835, - "loss": 0.0418, + "epoch": 0.37, + "learning_rate": 0.00024378037524929485, + "loss": 0.1009, "step": 58070 }, { - "epoch": 0.63, - "learning_rate": 0.00020576935557141927, - "loss": 0.0557, + "epoch": 0.37, + "learning_rate": 0.0002437706938949379, + "loss": 0.0569, "step": 58080 }, { - "epoch": 0.63, - "learning_rate": 0.00020575313128691022, - "loss": 0.0458, + "epoch": 0.37, + "learning_rate": 0.00024376101254058099, + "loss": 0.0587, "step": 58090 }, { - "epoch": 0.63, - "learning_rate": 0.00020573690700240117, - "loss": 0.0577, + "epoch": 0.37, + "learning_rate": 0.00024375133118622407, + "loss": 0.0677, "step": 58100 }, { - "epoch": 0.63, - "learning_rate": 0.00020572068271789212, - "loss": 0.0534, + "epoch": 0.38, + "learning_rate": 0.00024374164983186715, + "loss": 0.0568, "step": 58110 }, { - "epoch": 0.63, - "learning_rate": 0.00020570445843338305, - "loss": 0.0508, + "epoch": 0.38, + "learning_rate": 0.0002437319684775102, + "loss": 0.058, "step": 58120 }, { - "epoch": 0.63, - "learning_rate": 0.00020568823414887402, - "loss": 0.0556, + "epoch": 0.38, + "learning_rate": 0.00024372228712315325, + "loss": 0.0567, "step": 58130 }, { - "epoch": 0.63, - "learning_rate": 0.00020567200986436495, - "loss": 0.0558, + "epoch": 0.38, + "learning_rate": 0.00024371260576879633, + "loss": 0.0575, "step": 58140 }, { - "epoch": 0.63, - "learning_rate": 0.00020565578557985592, - "loss": 0.0491, + "epoch": 0.38, + "learning_rate": 0.00024370292441443938, + "loss": 0.0636, "step": 58150 }, { - "epoch": 0.63, - "learning_rate": 0.00020563956129534685, - "loss": 0.0528, + "epoch": 0.38, + "learning_rate": 0.00024369324306008246, + "loss": 0.061, "step": 58160 }, { - "epoch": 0.63, - "learning_rate": 0.0002056233370108378, - "loss": 0.0537, + "epoch": 0.38, + "learning_rate": 0.00024368356170572554, + "loss": 0.0598, "step": 58170 }, { - "epoch": 0.63, - "learning_rate": 0.00020560711272632874, - "loss": 0.0484, + "epoch": 0.38, + "learning_rate": 0.00024367388035136862, + "loss": 0.0589, "step": 58180 }, { - "epoch": 0.63, - "learning_rate": 0.0002055908884418197, - "loss": 0.0506, + "epoch": 0.38, + "learning_rate": 0.00024366419899701168, + "loss": 0.0613, "step": 58190 }, { - "epoch": 0.63, - "learning_rate": 0.00020557466415731064, - "loss": 0.0489, + "epoch": 0.38, + "learning_rate": 0.00024365451764265473, + "loss": 0.0575, "step": 58200 }, { - "epoch": 0.63, - "learning_rate": 0.0002055584398728016, - "loss": 0.0524, + "epoch": 0.38, + "learning_rate": 0.0002436448362882978, + "loss": 0.0642, "step": 58210 }, { - "epoch": 0.63, - "learning_rate": 0.00020554221558829252, - "loss": 0.0486, + "epoch": 0.38, + "learning_rate": 0.00024363515493394086, + "loss": 0.0595, "step": 58220 }, { - "epoch": 0.63, - "learning_rate": 0.0002055259913037835, - "loss": 0.056, + "epoch": 0.38, + "learning_rate": 0.00024362547357958394, + "loss": 0.0671, "step": 58230 }, { - "epoch": 0.63, - "learning_rate": 0.00020550976701927442, - "loss": 0.045, + "epoch": 0.38, + "learning_rate": 0.00024361579222522702, + "loss": 0.0629, "step": 58240 }, { - "epoch": 0.63, - "learning_rate": 0.0002054935427347654, - "loss": 0.0477, + "epoch": 0.38, + "learning_rate": 0.00024360611087087007, + "loss": 0.0625, "step": 58250 }, { - "epoch": 0.63, - "learning_rate": 0.00020547731845025632, - "loss": 0.0547, + "epoch": 0.38, + "learning_rate": 0.00024359642951651315, + "loss": 0.0604, "step": 58260 }, { - "epoch": 0.63, - "learning_rate": 0.00020546109416574727, - "loss": 0.0552, + "epoch": 0.38, + "learning_rate": 0.0002435867481621562, + "loss": 0.0595, "step": 58270 }, { - "epoch": 0.63, - "learning_rate": 0.00020544486988123822, - "loss": 0.051, + "epoch": 0.38, + "learning_rate": 0.00024357706680779926, + "loss": 0.0586, "step": 58280 }, { - "epoch": 0.63, - "learning_rate": 0.00020542864559672916, - "loss": 0.0539, + "epoch": 0.38, + "learning_rate": 0.00024356738545344234, + "loss": 0.0593, "step": 58290 }, { - "epoch": 0.63, - "learning_rate": 0.0002054124213122201, - "loss": 0.0483, + "epoch": 0.38, + "learning_rate": 0.00024355770409908542, + "loss": 0.0594, "step": 58300 }, { - "epoch": 0.63, - "learning_rate": 0.00020539619702771106, - "loss": 0.0515, + "epoch": 0.38, + "learning_rate": 0.0002435480227447285, + "loss": 0.0622, "step": 58310 }, { - "epoch": 0.63, - "learning_rate": 0.000205379972743202, - "loss": 0.0469, + "epoch": 0.38, + "learning_rate": 0.00024353834139037155, + "loss": 0.0658, "step": 58320 }, { - "epoch": 0.63, - "learning_rate": 0.00020536374845869296, - "loss": 0.0541, + "epoch": 0.38, + "learning_rate": 0.00024352866003601463, + "loss": 0.0674, "step": 58330 }, { - "epoch": 0.63, - "learning_rate": 0.0002053475241741839, - "loss": 0.0503, + "epoch": 0.38, + "learning_rate": 0.00024351897868165768, + "loss": 0.0639, "step": 58340 }, { - "epoch": 0.63, - "learning_rate": 0.00020533129988967484, - "loss": 0.0479, + "epoch": 0.38, + "learning_rate": 0.00024350929732730074, + "loss": 0.0715, "step": 58350 }, { - "epoch": 0.63, - "learning_rate": 0.00020531507560516579, - "loss": 0.0584, + "epoch": 0.38, + "learning_rate": 0.00024349961597294382, + "loss": 0.0642, "step": 58360 }, { - "epoch": 0.63, - "learning_rate": 0.00020529885132065674, - "loss": 0.0508, + "epoch": 0.38, + "learning_rate": 0.0002434899346185869, + "loss": 0.0567, "step": 58370 }, { - "epoch": 0.63, - "learning_rate": 0.00020528262703614769, - "loss": 0.0585, + "epoch": 0.38, + "learning_rate": 0.00024348025326422997, + "loss": 0.0582, "step": 58380 }, { - "epoch": 0.63, - "learning_rate": 0.00020526640275163864, - "loss": 0.0504, + "epoch": 0.38, + "learning_rate": 0.00024347057190987303, + "loss": 0.0615, "step": 58390 }, { - "epoch": 0.63, - "learning_rate": 0.00020525017846712956, - "loss": 0.0422, + "epoch": 0.38, + "learning_rate": 0.0002434608905555161, + "loss": 0.0578, "step": 58400 }, { - "epoch": 0.63, - "learning_rate": 0.00020523395418262054, - "loss": 0.0487, + "epoch": 0.38, + "learning_rate": 0.00024345120920115916, + "loss": 0.0655, "step": 58410 }, { - "epoch": 0.63, - "learning_rate": 0.00020521772989811146, - "loss": 0.0534, + "epoch": 0.38, + "learning_rate": 0.0002434415278468022, + "loss": 0.0636, "step": 58420 }, { - "epoch": 0.63, - "learning_rate": 0.00020520150561360243, - "loss": 0.048, + "epoch": 0.38, + "learning_rate": 0.0002434318464924453, + "loss": 0.0593, "step": 58430 }, { - "epoch": 0.63, - "learning_rate": 0.00020518528132909336, - "loss": 0.0556, + "epoch": 0.38, + "learning_rate": 0.00024342216513808837, + "loss": 0.0599, "step": 58440 }, { - "epoch": 0.63, - "learning_rate": 0.0002051690570445843, - "loss": 0.0511, + "epoch": 0.38, + "learning_rate": 0.00024341248378373143, + "loss": 0.0664, "step": 58450 }, { - "epoch": 0.63, - "learning_rate": 0.00020515283276007526, - "loss": 0.057, + "epoch": 0.38, + "learning_rate": 0.0002434028024293745, + "loss": 0.061, "step": 58460 }, { - "epoch": 0.63, - "learning_rate": 0.0002051366084755662, - "loss": 0.0508, + "epoch": 0.38, + "learning_rate": 0.00024339312107501758, + "loss": 0.0655, "step": 58470 }, { - "epoch": 0.63, - "learning_rate": 0.00020512038419105713, - "loss": 0.0525, + "epoch": 0.38, + "learning_rate": 0.0002433834397206606, + "loss": 0.0548, "step": 58480 }, { - "epoch": 0.63, - "learning_rate": 0.0002051041599065481, - "loss": 0.0615, + "epoch": 0.38, + "learning_rate": 0.0002433737583663037, + "loss": 0.0562, "step": 58490 }, { - "epoch": 0.63, - "learning_rate": 0.00020508793562203903, - "loss": 0.0501, + "epoch": 0.38, + "learning_rate": 0.00024336407701194677, + "loss": 0.0614, "step": 58500 }, { - "epoch": 0.63, - "learning_rate": 0.00020507171133753, - "loss": 0.0533, + "epoch": 0.38, + "learning_rate": 0.00024335439565758985, + "loss": 0.0532, "step": 58510 }, { - "epoch": 0.63, - "learning_rate": 0.00020505548705302093, - "loss": 0.0495, + "epoch": 0.38, + "learning_rate": 0.0002433447143032329, + "loss": 0.0575, "step": 58520 }, { - "epoch": 0.63, - "learning_rate": 0.00020503926276851188, - "loss": 0.0509, + "epoch": 0.38, + "learning_rate": 0.00024333503294887598, + "loss": 0.0609, "step": 58530 }, { - "epoch": 0.63, - "learning_rate": 0.00020502303848400283, - "loss": 0.0509, + "epoch": 0.38, + "learning_rate": 0.00024332535159451903, + "loss": 0.0589, "step": 58540 }, { - "epoch": 0.63, - "learning_rate": 0.00020500681419949378, - "loss": 0.0511, + "epoch": 0.38, + "learning_rate": 0.0002433156702401621, + "loss": 0.0548, "step": 58550 }, { - "epoch": 0.63, - "learning_rate": 0.00020499058991498473, - "loss": 0.0567, + "epoch": 0.38, + "learning_rate": 0.00024330598888580517, + "loss": 0.0595, "step": 58560 }, { - "epoch": 0.63, - "learning_rate": 0.00020497436563047568, - "loss": 0.0511, + "epoch": 0.38, + "learning_rate": 0.00024329630753144825, + "loss": 0.0558, "step": 58570 }, { - "epoch": 0.63, - "learning_rate": 0.0002049581413459666, - "loss": 0.0584, + "epoch": 0.38, + "learning_rate": 0.00024328662617709133, + "loss": 0.0575, "step": 58580 }, { - "epoch": 0.63, - "learning_rate": 0.00020494191706145758, - "loss": 0.0521, + "epoch": 0.38, + "learning_rate": 0.00024327694482273438, + "loss": 0.0591, "step": 58590 }, { - "epoch": 0.63, - "learning_rate": 0.0002049256927769485, - "loss": 0.051, + "epoch": 0.38, + "learning_rate": 0.00024326726346837746, + "loss": 0.0615, "step": 58600 }, { - "epoch": 0.63, - "learning_rate": 0.00020490946849243948, - "loss": 0.0475, + "epoch": 0.38, + "learning_rate": 0.0002432575821140205, + "loss": 0.0579, "step": 58610 }, { - "epoch": 0.63, - "learning_rate": 0.0002048932442079304, - "loss": 0.0627, + "epoch": 0.38, + "learning_rate": 0.00024324790075966356, + "loss": 0.0632, "step": 58620 }, { - "epoch": 0.63, - "learning_rate": 0.00020487701992342135, - "loss": 0.0519, + "epoch": 0.38, + "learning_rate": 0.00024323821940530664, + "loss": 0.0678, "step": 58630 }, { - "epoch": 0.63, - "learning_rate": 0.0002048607956389123, - "loss": 0.0514, + "epoch": 0.38, + "learning_rate": 0.00024322853805094972, + "loss": 0.0508, "step": 58640 }, { - "epoch": 0.63, - "learning_rate": 0.00020484457135440325, - "loss": 0.0539, + "epoch": 0.38, + "learning_rate": 0.00024321885669659278, + "loss": 0.0626, "step": 58650 }, { - "epoch": 0.63, - "learning_rate": 0.00020482834706989417, - "loss": 0.0545, + "epoch": 0.38, + "learning_rate": 0.00024320917534223586, + "loss": 0.0605, "step": 58660 }, { - "epoch": 0.63, - "learning_rate": 0.00020481212278538515, - "loss": 0.0578, + "epoch": 0.38, + "learning_rate": 0.00024319949398787894, + "loss": 0.0625, "step": 58670 }, { - "epoch": 0.63, - "learning_rate": 0.0002047958985008761, - "loss": 0.0506, + "epoch": 0.38, + "learning_rate": 0.00024318981263352196, + "loss": 0.0578, "step": 58680 }, { - "epoch": 0.63, - "learning_rate": 0.00020477967421636705, - "loss": 0.0582, + "epoch": 0.38, + "learning_rate": 0.00024318013127916504, + "loss": 0.0596, "step": 58690 }, { - "epoch": 0.63, - "learning_rate": 0.000204763449931858, - "loss": 0.0546, + "epoch": 0.38, + "learning_rate": 0.00024317044992480812, + "loss": 0.0596, "step": 58700 }, { - "epoch": 0.64, - "learning_rate": 0.00020474722564734895, - "loss": 0.0457, + "epoch": 0.38, + "learning_rate": 0.0002431607685704512, + "loss": 0.062, "step": 58710 }, { - "epoch": 0.64, - "learning_rate": 0.0002047310013628399, - "loss": 0.0563, + "epoch": 0.38, + "learning_rate": 0.00024315108721609425, + "loss": 0.0626, "step": 58720 }, { - "epoch": 0.64, - "learning_rate": 0.00020471477707833082, - "loss": 0.0541, + "epoch": 0.38, + "learning_rate": 0.00024314140586173733, + "loss": 0.0563, "step": 58730 }, { - "epoch": 0.64, - "learning_rate": 0.0002046985527938218, - "loss": 0.0554, + "epoch": 0.38, + "learning_rate": 0.00024313172450738041, + "loss": 0.0637, "step": 58740 }, { - "epoch": 0.64, - "learning_rate": 0.00020468232850931272, - "loss": 0.0529, + "epoch": 0.38, + "learning_rate": 0.00024312204315302344, + "loss": 0.0693, "step": 58750 }, { - "epoch": 0.64, - "learning_rate": 0.0002046661042248037, - "loss": 0.0497, + "epoch": 0.38, + "learning_rate": 0.00024311236179866652, + "loss": 0.0618, "step": 58760 }, { - "epoch": 0.64, - "learning_rate": 0.00020464987994029462, - "loss": 0.0565, + "epoch": 0.38, + "learning_rate": 0.0002431026804443096, + "loss": 0.0599, "step": 58770 }, { - "epoch": 0.64, - "learning_rate": 0.00020463365565578557, - "loss": 0.0476, + "epoch": 0.38, + "learning_rate": 0.00024309299908995268, + "loss": 0.0575, "step": 58780 }, { - "epoch": 0.64, - "learning_rate": 0.00020461743137127652, - "loss": 0.0579, + "epoch": 0.38, + "learning_rate": 0.00024308331773559573, + "loss": 0.0516, "step": 58790 }, { - "epoch": 0.64, - "learning_rate": 0.00020460120708676747, - "loss": 0.0523, + "epoch": 0.38, + "learning_rate": 0.0002430736363812388, + "loss": 0.0634, "step": 58800 }, { - "epoch": 0.64, - "learning_rate": 0.0002045849828022584, - "loss": 0.0489, + "epoch": 0.38, + "learning_rate": 0.0002430639550268819, + "loss": 0.0554, "step": 58810 }, { - "epoch": 0.64, - "learning_rate": 0.00020456875851774937, - "loss": 0.0529, + "epoch": 0.38, + "learning_rate": 0.00024305427367252492, + "loss": 0.0603, "step": 58820 }, { - "epoch": 0.64, - "learning_rate": 0.0002045525342332403, - "loss": 0.0463, + "epoch": 0.38, + "learning_rate": 0.000243044592318168, + "loss": 0.0613, "step": 58830 }, { - "epoch": 0.64, - "learning_rate": 0.00020453630994873127, - "loss": 0.0569, + "epoch": 0.38, + "learning_rate": 0.00024303491096381108, + "loss": 0.062, "step": 58840 }, { - "epoch": 0.64, - "learning_rate": 0.0002045200856642222, - "loss": 0.0484, + "epoch": 0.38, + "learning_rate": 0.00024302522960945413, + "loss": 0.0578, "step": 58850 }, { - "epoch": 0.64, - "learning_rate": 0.00020450386137971314, - "loss": 0.0447, + "epoch": 0.38, + "learning_rate": 0.0002430155482550972, + "loss": 0.0655, "step": 58860 }, { - "epoch": 0.64, - "learning_rate": 0.0002044876370952041, - "loss": 0.057, + "epoch": 0.38, + "learning_rate": 0.0002430058669007403, + "loss": 0.0651, "step": 58870 }, { - "epoch": 0.64, - "learning_rate": 0.00020447141281069504, - "loss": 0.0448, + "epoch": 0.38, + "learning_rate": 0.00024299618554638337, + "loss": 0.064, "step": 58880 }, { - "epoch": 0.64, - "learning_rate": 0.000204455188526186, - "loss": 0.051, + "epoch": 0.38, + "learning_rate": 0.0002429865041920264, + "loss": 0.0584, "step": 58890 }, { - "epoch": 0.64, - "learning_rate": 0.00020443896424167694, - "loss": 0.0492, + "epoch": 0.38, + "learning_rate": 0.00024297682283766947, + "loss": 0.0593, "step": 58900 }, { - "epoch": 0.64, - "learning_rate": 0.00020442273995716786, - "loss": 0.0519, + "epoch": 0.38, + "learning_rate": 0.00024296714148331255, + "loss": 0.0522, "step": 58910 }, { - "epoch": 0.64, - "learning_rate": 0.00020440651567265884, - "loss": 0.0481, + "epoch": 0.38, + "learning_rate": 0.0002429574601289556, + "loss": 0.0588, "step": 58920 }, { - "epoch": 0.64, - "learning_rate": 0.00020439029138814976, - "loss": 0.046, + "epoch": 0.38, + "learning_rate": 0.00024294777877459869, + "loss": 0.0638, "step": 58930 }, { - "epoch": 0.64, - "learning_rate": 0.00020437406710364074, - "loss": 0.0778, + "epoch": 0.38, + "learning_rate": 0.00024293809742024177, + "loss": 0.0602, "step": 58940 }, { - "epoch": 0.64, - "learning_rate": 0.00020435784281913166, - "loss": 0.0556, + "epoch": 0.38, + "learning_rate": 0.00024292841606588485, + "loss": 0.0558, "step": 58950 }, { - "epoch": 0.64, - "learning_rate": 0.0002043416185346226, - "loss": 0.0515, + "epoch": 0.38, + "learning_rate": 0.00024291873471152787, + "loss": 0.0597, "step": 58960 }, { - "epoch": 0.64, - "learning_rate": 0.00020432539425011356, - "loss": 0.0565, + "epoch": 0.38, + "learning_rate": 0.00024290905335717095, + "loss": 0.0538, "step": 58970 }, { - "epoch": 0.64, - "learning_rate": 0.0002043091699656045, - "loss": 0.0462, + "epoch": 0.38, + "learning_rate": 0.00024289937200281403, + "loss": 0.0572, "step": 58980 }, { - "epoch": 0.64, - "learning_rate": 0.00020429294568109543, - "loss": 0.0557, + "epoch": 0.38, + "learning_rate": 0.00024288969064845708, + "loss": 0.0677, "step": 58990 }, { - "epoch": 0.64, - "learning_rate": 0.0002042767213965864, - "loss": 0.0521, + "epoch": 0.38, + "learning_rate": 0.00024288000929410016, + "loss": 0.0628, "step": 59000 }, { - "epoch": 0.64, - "eval_cer": 0.9212638773299691, - "eval_loss": 0.03626423701643944, - "eval_runtime": 118.9983, - "eval_samples_per_second": 16.807, - "eval_steps_per_second": 4.202, + "epoch": 0.38, + "eval_cer": 0.9200515196023048, + "eval_loss": 0.04011645168066025, + "eval_runtime": 120.0848, + "eval_samples_per_second": 16.655, + "eval_steps_per_second": 4.164, "step": 59000 }, { - "epoch": 0.64, - "learning_rate": 0.00020426049711207733, - "loss": 0.0566, + "epoch": 0.38, + "learning_rate": 0.00024287032793974324, + "loss": 0.0547, "step": 59010 }, { - "epoch": 0.64, - "learning_rate": 0.0002042442728275683, - "loss": 0.0529, + "epoch": 0.38, + "learning_rate": 0.00024286064658538632, + "loss": 0.0595, "step": 59020 }, { - "epoch": 0.64, - "learning_rate": 0.00020422804854305923, - "loss": 0.0427, + "epoch": 0.38, + "learning_rate": 0.00024285096523102935, + "loss": 0.0618, "step": 59030 }, { - "epoch": 0.64, - "learning_rate": 0.00020421182425855018, - "loss": 0.0531, + "epoch": 0.38, + "learning_rate": 0.00024284128387667243, + "loss": 0.0574, "step": 59040 }, { - "epoch": 0.64, - "learning_rate": 0.00020419559997404113, - "loss": 0.0565, + "epoch": 0.38, + "learning_rate": 0.00024283160252231548, + "loss": 0.0639, "step": 59050 }, { - "epoch": 0.64, - "learning_rate": 0.00020417937568953208, - "loss": 0.0545, + "epoch": 0.38, + "learning_rate": 0.00024282192116795856, + "loss": 0.0611, "step": 59060 }, { - "epoch": 0.64, - "learning_rate": 0.00020416315140502303, - "loss": 0.0515, + "epoch": 0.38, + "learning_rate": 0.00024281223981360164, + "loss": 0.056, "step": 59070 }, { - "epoch": 0.64, - "learning_rate": 0.00020414692712051398, - "loss": 0.0561, + "epoch": 0.38, + "learning_rate": 0.00024280255845924472, + "loss": 0.0568, "step": 59080 }, { - "epoch": 0.64, - "learning_rate": 0.0002041307028360049, - "loss": 0.0561, + "epoch": 0.38, + "learning_rate": 0.00024279287710488777, + "loss": 0.0539, "step": 59090 }, { - "epoch": 0.64, - "learning_rate": 0.00020411447855149588, - "loss": 0.0558, + "epoch": 0.38, + "learning_rate": 0.00024278319575053083, + "loss": 0.0547, "step": 59100 }, { - "epoch": 0.64, - "learning_rate": 0.0002040982542669868, - "loss": 0.0474, + "epoch": 0.38, + "learning_rate": 0.0002427735143961739, + "loss": 0.0584, "step": 59110 }, { - "epoch": 0.64, - "learning_rate": 0.00020408202998247778, - "loss": 0.0511, + "epoch": 0.38, + "learning_rate": 0.00024276383304181696, + "loss": 0.0609, "step": 59120 }, { - "epoch": 0.64, - "learning_rate": 0.0002040658056979687, - "loss": 0.0413, + "epoch": 0.38, + "learning_rate": 0.00024275415168746004, + "loss": 0.0546, "step": 59130 }, { - "epoch": 0.64, - "learning_rate": 0.00020404958141345965, - "loss": 0.0497, + "epoch": 0.38, + "learning_rate": 0.00024274447033310312, + "loss": 0.0596, "step": 59140 }, { - "epoch": 0.64, - "learning_rate": 0.0002040333571289506, - "loss": 0.0509, + "epoch": 0.38, + "learning_rate": 0.0002427347889787462, + "loss": 0.0644, "step": 59150 }, { - "epoch": 0.64, - "learning_rate": 0.00020401713284444155, - "loss": 0.0576, + "epoch": 0.38, + "learning_rate": 0.00024272510762438925, + "loss": 0.0606, "step": 59160 }, { - "epoch": 0.64, - "learning_rate": 0.00020400090855993247, - "loss": 0.0489, + "epoch": 0.38, + "learning_rate": 0.0002427154262700323, + "loss": 0.0571, "step": 59170 }, { - "epoch": 0.64, - "learning_rate": 0.00020398468427542345, - "loss": 0.0475, + "epoch": 0.38, + "learning_rate": 0.00024270574491567538, + "loss": 0.0617, "step": 59180 }, { - "epoch": 0.64, - "learning_rate": 0.00020396845999091437, - "loss": 0.0478, + "epoch": 0.38, + "learning_rate": 0.00024269606356131844, + "loss": 0.0602, "step": 59190 }, { - "epoch": 0.64, - "learning_rate": 0.00020395223570640535, - "loss": 0.0457, + "epoch": 0.38, + "learning_rate": 0.00024268638220696151, + "loss": 0.0628, "step": 59200 }, { - "epoch": 0.64, - "learning_rate": 0.00020393601142189627, - "loss": 0.0555, + "epoch": 0.38, + "learning_rate": 0.0002426767008526046, + "loss": 0.0521, "step": 59210 }, { - "epoch": 0.64, - "learning_rate": 0.00020391978713738722, - "loss": 0.0475, + "epoch": 0.38, + "learning_rate": 0.00024266701949824767, + "loss": 0.0593, "step": 59220 }, { - "epoch": 0.64, - "learning_rate": 0.00020390356285287817, - "loss": 0.0566, + "epoch": 0.38, + "learning_rate": 0.00024265733814389073, + "loss": 0.0647, "step": 59230 }, { - "epoch": 0.64, - "learning_rate": 0.00020388733856836912, - "loss": 0.0456, + "epoch": 0.38, + "learning_rate": 0.00024264765678953378, + "loss": 0.0756, "step": 59240 }, { - "epoch": 0.64, - "learning_rate": 0.00020387111428386007, - "loss": 0.0496, + "epoch": 0.38, + "learning_rate": 0.00024263797543517683, + "loss": 0.0608, "step": 59250 }, { - "epoch": 0.64, - "learning_rate": 0.00020385488999935102, - "loss": 0.0525, + "epoch": 0.38, + "learning_rate": 0.0002426282940808199, + "loss": 0.0545, "step": 59260 }, { - "epoch": 0.64, - "learning_rate": 0.00020383866571484194, - "loss": 0.0461, + "epoch": 0.38, + "learning_rate": 0.000242618612726463, + "loss": 0.0574, "step": 59270 }, { - "epoch": 0.64, - "learning_rate": 0.00020382244143033292, - "loss": 0.0541, + "epoch": 0.38, + "learning_rate": 0.00024260893137210607, + "loss": 0.0571, "step": 59280 }, { - "epoch": 0.64, - "learning_rate": 0.00020380621714582384, - "loss": 0.0586, + "epoch": 0.38, + "learning_rate": 0.00024259925001774912, + "loss": 0.0587, "step": 59290 }, { - "epoch": 0.64, - "learning_rate": 0.00020378999286131482, - "loss": 0.0447, + "epoch": 0.38, + "learning_rate": 0.0002425895686633922, + "loss": 0.0512, "step": 59300 }, { - "epoch": 0.64, - "learning_rate": 0.00020377376857680574, - "loss": 0.0515, + "epoch": 0.38, + "learning_rate": 0.00024257988730903526, + "loss": 0.0593, "step": 59310 }, { - "epoch": 0.64, - "learning_rate": 0.0002037575442922967, - "loss": 0.0509, + "epoch": 0.38, + "learning_rate": 0.0002425702059546783, + "loss": 0.0621, "step": 59320 }, { - "epoch": 0.64, - "learning_rate": 0.00020374132000778764, - "loss": 0.0422, + "epoch": 0.38, + "learning_rate": 0.0002425605246003214, + "loss": 0.0572, "step": 59330 }, { - "epoch": 0.64, - "learning_rate": 0.0002037250957232786, - "loss": 0.049, + "epoch": 0.38, + "learning_rate": 0.00024255084324596447, + "loss": 0.0654, "step": 59340 }, { - "epoch": 0.64, - "learning_rate": 0.00020370887143876952, - "loss": 0.0499, + "epoch": 0.38, + "learning_rate": 0.00024254116189160755, + "loss": 0.0541, "step": 59350 }, { - "epoch": 0.64, - "learning_rate": 0.0002036926471542605, - "loss": 0.0598, + "epoch": 0.38, + "learning_rate": 0.0002425314805372506, + "loss": 0.0627, "step": 59360 }, { - "epoch": 0.64, - "learning_rate": 0.00020367642286975141, - "loss": 0.0546, + "epoch": 0.38, + "learning_rate": 0.00024252179918289368, + "loss": 0.0572, "step": 59370 }, { - "epoch": 0.64, - "learning_rate": 0.0002036601985852424, - "loss": 0.0487, + "epoch": 0.38, + "learning_rate": 0.00024251211782853673, + "loss": 0.0545, "step": 59380 }, { - "epoch": 0.64, - "learning_rate": 0.00020364397430073331, - "loss": 0.0517, + "epoch": 0.38, + "learning_rate": 0.0002425024364741798, + "loss": 0.0626, "step": 59390 }, { - "epoch": 0.64, - "learning_rate": 0.0002036277500162243, - "loss": 0.0492, + "epoch": 0.38, + "learning_rate": 0.00024249275511982287, + "loss": 0.0613, "step": 59400 }, { - "epoch": 0.64, - "learning_rate": 0.00020361152573171521, - "loss": 0.0525, + "epoch": 0.38, + "learning_rate": 0.00024248307376546595, + "loss": 0.054, "step": 59410 }, { - "epoch": 0.64, - "learning_rate": 0.00020359530144720616, - "loss": 0.0463, + "epoch": 0.38, + "learning_rate": 0.00024247339241110903, + "loss": 0.0632, "step": 59420 }, { - "epoch": 0.64, - "learning_rate": 0.00020357907716269711, - "loss": 0.0518, + "epoch": 0.38, + "learning_rate": 0.00024246371105675208, + "loss": 0.0639, "step": 59430 }, { - "epoch": 0.64, - "learning_rate": 0.00020356285287818806, - "loss": 0.0525, + "epoch": 0.38, + "learning_rate": 0.00024245402970239516, + "loss": 0.0654, "step": 59440 }, { - "epoch": 0.64, - "learning_rate": 0.00020354662859367899, - "loss": 0.055, + "epoch": 0.38, + "learning_rate": 0.00024244434834803818, + "loss": 0.0637, "step": 59450 }, { - "epoch": 0.64, - "learning_rate": 0.00020353040430916996, - "loss": 0.0486, + "epoch": 0.38, + "learning_rate": 0.00024243466699368126, + "loss": 0.0624, "step": 59460 }, { - "epoch": 0.64, - "learning_rate": 0.00020351418002466089, - "loss": 0.0515, + "epoch": 0.38, + "learning_rate": 0.00024242498563932434, + "loss": 0.0615, "step": 59470 }, { - "epoch": 0.64, - "learning_rate": 0.00020349795574015186, - "loss": 0.0552, + "epoch": 0.38, + "learning_rate": 0.00024241530428496742, + "loss": 0.0537, "step": 59480 }, { - "epoch": 0.64, - "learning_rate": 0.00020348173145564279, - "loss": 0.0543, + "epoch": 0.38, + "learning_rate": 0.00024240562293061048, + "loss": 0.0662, "step": 59490 }, { - "epoch": 0.64, - "learning_rate": 0.00020346550717113373, - "loss": 0.0522, + "epoch": 0.38, + "learning_rate": 0.00024239594157625356, + "loss": 0.0689, "step": 59500 }, { - "epoch": 0.64, - "learning_rate": 0.00020344928288662468, - "loss": 0.0556, + "epoch": 0.38, + "learning_rate": 0.00024238626022189664, + "loss": 0.0605, "step": 59510 }, { - "epoch": 0.64, - "learning_rate": 0.00020343305860211563, - "loss": 0.0627, + "epoch": 0.38, + "learning_rate": 0.00024237657886753966, + "loss": 0.0552, "step": 59520 }, { - "epoch": 0.64, - "learning_rate": 0.00020341683431760656, - "loss": 0.056, + "epoch": 0.38, + "learning_rate": 0.00024236689751318274, + "loss": 0.0607, "step": 59530 }, { - "epoch": 0.64, - "learning_rate": 0.00020340061003309753, - "loss": 0.0507, + "epoch": 0.38, + "learning_rate": 0.00024235721615882582, + "loss": 0.0588, "step": 59540 }, { - "epoch": 0.64, - "learning_rate": 0.00020338438574858846, - "loss": 0.0515, + "epoch": 0.38, + "learning_rate": 0.0002423475348044689, + "loss": 0.0583, "step": 59550 }, { - "epoch": 0.64, - "learning_rate": 0.00020336816146407943, - "loss": 0.0485, + "epoch": 0.38, + "learning_rate": 0.00024233785345011195, + "loss": 0.0572, "step": 59560 }, { - "epoch": 0.64, - "learning_rate": 0.00020335193717957036, - "loss": 0.052, + "epoch": 0.38, + "learning_rate": 0.00024232817209575503, + "loss": 0.0547, "step": 59570 }, { - "epoch": 0.64, - "learning_rate": 0.00020333571289506133, - "loss": 0.0473, + "epoch": 0.38, + "learning_rate": 0.0002423184907413981, + "loss": 0.06, "step": 59580 }, { - "epoch": 0.64, - "learning_rate": 0.00020331948861055226, - "loss": 0.0527, + "epoch": 0.38, + "learning_rate": 0.00024230880938704114, + "loss": 0.0599, "step": 59590 }, { - "epoch": 0.64, - "learning_rate": 0.0002033032643260432, - "loss": 0.0491, + "epoch": 0.38, + "learning_rate": 0.00024229912803268422, + "loss": 0.0667, "step": 59600 }, { - "epoch": 0.64, - "learning_rate": 0.00020328704004153416, - "loss": 0.0536, + "epoch": 0.38, + "learning_rate": 0.0002422894466783273, + "loss": 0.0615, "step": 59610 }, { - "epoch": 0.64, - "learning_rate": 0.0002032708157570251, - "loss": 0.0551, + "epoch": 0.38, + "learning_rate": 0.00024227976532397038, + "loss": 0.0682, "step": 59620 }, { - "epoch": 0.64, - "learning_rate": 0.00020325459147251603, - "loss": 0.0521, + "epoch": 0.38, + "learning_rate": 0.00024227008396961343, + "loss": 0.059, "step": 59630 }, { - "epoch": 0.65, - "learning_rate": 0.000203238367188007, - "loss": 0.0535, + "epoch": 0.38, + "learning_rate": 0.0002422604026152565, + "loss": 0.0648, "step": 59640 }, { - "epoch": 0.65, - "learning_rate": 0.00020322214290349793, - "loss": 0.0507, + "epoch": 0.38, + "learning_rate": 0.0002422507212608996, + "loss": 0.0607, "step": 59650 }, { - "epoch": 0.65, - "learning_rate": 0.0002032059186189889, - "loss": 0.0495, + "epoch": 0.39, + "learning_rate": 0.00024224103990654262, + "loss": 0.0555, "step": 59660 }, { - "epoch": 0.65, - "learning_rate": 0.00020318969433447983, - "loss": 0.0535, + "epoch": 0.39, + "learning_rate": 0.0002422313585521857, + "loss": 0.0624, "step": 59670 }, { - "epoch": 0.65, - "learning_rate": 0.00020317347004997078, - "loss": 0.0558, + "epoch": 0.39, + "learning_rate": 0.00024222167719782878, + "loss": 0.0641, "step": 59680 }, { - "epoch": 0.65, - "learning_rate": 0.00020315724576546173, - "loss": 0.0547, + "epoch": 0.39, + "learning_rate": 0.00024221199584347183, + "loss": 0.06, "step": 59690 }, { - "epoch": 0.65, - "learning_rate": 0.00020314102148095268, - "loss": 0.0564, + "epoch": 0.39, + "learning_rate": 0.0002422023144891149, + "loss": 0.0601, "step": 59700 }, { - "epoch": 0.65, - "learning_rate": 0.0002031247971964436, - "loss": 0.0508, + "epoch": 0.39, + "learning_rate": 0.000242192633134758, + "loss": 0.0696, "step": 59710 }, { - "epoch": 0.65, - "learning_rate": 0.00020310857291193458, - "loss": 0.0554, + "epoch": 0.39, + "learning_rate": 0.00024218295178040107, + "loss": 0.0556, "step": 59720 }, { - "epoch": 0.65, - "learning_rate": 0.0002030923486274255, - "loss": 0.0477, + "epoch": 0.39, + "learning_rate": 0.0002421732704260441, + "loss": 0.0567, "step": 59730 }, { - "epoch": 0.65, - "learning_rate": 0.00020307612434291648, - "loss": 0.0454, + "epoch": 0.39, + "learning_rate": 0.00024216358907168717, + "loss": 0.0634, "step": 59740 }, { - "epoch": 0.65, - "learning_rate": 0.0002030599000584074, - "loss": 0.0563, + "epoch": 0.39, + "learning_rate": 0.00024215390771733025, + "loss": 0.0606, "step": 59750 }, { - "epoch": 0.65, - "learning_rate": 0.00020304367577389837, - "loss": 0.0488, + "epoch": 0.39, + "learning_rate": 0.0002421442263629733, + "loss": 0.0603, "step": 59760 }, { - "epoch": 0.65, - "learning_rate": 0.0002030274514893893, - "loss": 0.0541, + "epoch": 0.39, + "learning_rate": 0.00024213454500861639, + "loss": 0.0604, "step": 59770 }, { - "epoch": 0.65, - "learning_rate": 0.00020301122720488025, - "loss": 0.0528, + "epoch": 0.39, + "learning_rate": 0.00024212486365425947, + "loss": 0.0545, "step": 59780 }, { - "epoch": 0.65, - "learning_rate": 0.0002029950029203712, - "loss": 0.0565, + "epoch": 0.39, + "learning_rate": 0.00024211518229990255, + "loss": 0.0556, "step": 59790 }, { - "epoch": 0.65, - "learning_rate": 0.00020297877863586215, - "loss": 0.0591, + "epoch": 0.39, + "learning_rate": 0.00024210550094554557, + "loss": 0.0618, "step": 59800 }, { - "epoch": 0.65, - "learning_rate": 0.00020296255435135307, - "loss": 0.0547, + "epoch": 0.39, + "learning_rate": 0.00024209581959118865, + "loss": 0.0553, "step": 59810 }, { - "epoch": 0.65, - "learning_rate": 0.00020294633006684405, - "loss": 0.0575, + "epoch": 0.39, + "learning_rate": 0.00024208613823683173, + "loss": 0.0602, "step": 59820 }, { - "epoch": 0.65, - "learning_rate": 0.00020293010578233497, - "loss": 0.0526, + "epoch": 0.39, + "learning_rate": 0.00024207645688247478, + "loss": 0.0591, "step": 59830 }, { - "epoch": 0.65, - "learning_rate": 0.00020291388149782595, - "loss": 0.0551, + "epoch": 0.39, + "learning_rate": 0.00024206677552811786, + "loss": 0.0573, "step": 59840 }, { - "epoch": 0.65, - "learning_rate": 0.00020289765721331687, - "loss": 0.051, + "epoch": 0.39, + "learning_rate": 0.00024205709417376094, + "loss": 0.0502, "step": 59850 }, { - "epoch": 0.65, - "learning_rate": 0.00020288143292880782, - "loss": 0.0569, + "epoch": 0.39, + "learning_rate": 0.000242047412819404, + "loss": 0.061, "step": 59860 }, { - "epoch": 0.65, - "learning_rate": 0.00020286520864429877, - "loss": 0.0573, + "epoch": 0.39, + "learning_rate": 0.00024203773146504705, + "loss": 0.0576, "step": 59870 }, { - "epoch": 0.65, - "learning_rate": 0.00020284898435978972, - "loss": 0.0471, + "epoch": 0.39, + "learning_rate": 0.00024202805011069013, + "loss": 0.0584, "step": 59880 }, { - "epoch": 0.65, - "learning_rate": 0.00020283276007528064, - "loss": 0.0515, + "epoch": 0.39, + "learning_rate": 0.00024201836875633318, + "loss": 0.0589, "step": 59890 }, { - "epoch": 0.65, - "learning_rate": 0.00020281653579077162, - "loss": 0.0566, + "epoch": 0.39, + "learning_rate": 0.00024200868740197626, + "loss": 0.0568, "step": 59900 }, { - "epoch": 0.65, - "learning_rate": 0.00020280031150626254, - "loss": 0.0577, + "epoch": 0.39, + "learning_rate": 0.00024199900604761934, + "loss": 0.0539, "step": 59910 }, { - "epoch": 0.65, - "learning_rate": 0.00020278408722175352, - "loss": 0.0514, + "epoch": 0.39, + "learning_rate": 0.00024198932469326242, + "loss": 0.0652, "step": 59920 }, { - "epoch": 0.65, - "learning_rate": 0.00020276786293724444, - "loss": 0.0579, + "epoch": 0.39, + "learning_rate": 0.00024197964333890547, + "loss": 0.0606, "step": 59930 }, { - "epoch": 0.65, - "learning_rate": 0.00020275163865273542, - "loss": 0.0482, + "epoch": 0.39, + "learning_rate": 0.00024196996198454853, + "loss": 0.0568, "step": 59940 }, { - "epoch": 0.65, - "learning_rate": 0.00020273541436822634, - "loss": 0.0509, + "epoch": 0.39, + "learning_rate": 0.0002419602806301916, + "loss": 0.0626, "step": 59950 }, { - "epoch": 0.65, - "learning_rate": 0.0002027191900837173, - "loss": 0.0513, + "epoch": 0.39, + "learning_rate": 0.00024195059927583466, + "loss": 0.0606, "step": 59960 }, { - "epoch": 0.65, - "learning_rate": 0.00020270296579920824, - "loss": 0.0479, + "epoch": 0.39, + "learning_rate": 0.00024194091792147774, + "loss": 0.0511, "step": 59970 }, { - "epoch": 0.65, - "learning_rate": 0.0002026867415146992, - "loss": 0.0475, + "epoch": 0.39, + "learning_rate": 0.00024193123656712082, + "loss": 0.07, "step": 59980 }, { - "epoch": 0.65, - "learning_rate": 0.0002026705172301901, - "loss": 0.0571, + "epoch": 0.39, + "learning_rate": 0.0002419215552127639, + "loss": 0.0555, "step": 59990 }, { - "epoch": 0.65, - "learning_rate": 0.0002026542929456811, - "loss": 0.0543, + "epoch": 0.39, + "learning_rate": 0.00024191187385840695, + "loss": 0.0586, "step": 60000 }, { - "epoch": 0.65, - "eval_cer": 0.9212373728003449, - "eval_loss": 0.035806700587272644, - "eval_runtime": 119.412, - "eval_samples_per_second": 16.749, - "eval_steps_per_second": 4.187, + "epoch": 0.39, + "eval_cer": 0.9201012314992656, + "eval_loss": 0.03904225304722786, + "eval_runtime": 119.7689, + "eval_samples_per_second": 16.699, + "eval_steps_per_second": 4.175, "step": 60000 }, { - "epoch": 0.65, - "learning_rate": 0.000202638068661172, - "loss": 0.0544, + "epoch": 0.39, + "learning_rate": 0.00024190219250405, + "loss": 0.0602, "step": 60010 }, { - "epoch": 0.65, - "learning_rate": 0.000202621844376663, - "loss": 0.0462, + "epoch": 0.39, + "learning_rate": 0.00024189251114969308, + "loss": 0.0578, "step": 60020 }, { - "epoch": 0.65, - "learning_rate": 0.0002026056200921539, - "loss": 0.0489, + "epoch": 0.39, + "learning_rate": 0.00024188282979533613, + "loss": 0.0669, "step": 60030 }, { - "epoch": 0.65, - "learning_rate": 0.00020258939580764486, - "loss": 0.0468, + "epoch": 0.39, + "learning_rate": 0.00024187314844097921, + "loss": 0.0637, "step": 60040 }, { - "epoch": 0.65, - "learning_rate": 0.0002025731715231358, - "loss": 0.051, + "epoch": 0.39, + "learning_rate": 0.0002418634670866223, + "loss": 0.0608, "step": 60050 }, { - "epoch": 0.65, - "learning_rate": 0.00020255694723862676, - "loss": 0.0495, + "epoch": 0.39, + "learning_rate": 0.00024185378573226535, + "loss": 0.0574, "step": 60060 }, { - "epoch": 0.65, - "learning_rate": 0.0002025407229541177, - "loss": 0.0535, + "epoch": 0.39, + "learning_rate": 0.00024184410437790843, + "loss": 0.057, "step": 60070 }, { - "epoch": 0.65, - "learning_rate": 0.00020252449866960866, - "loss": 0.0448, + "epoch": 0.39, + "learning_rate": 0.00024183442302355148, + "loss": 0.055, "step": 60080 }, { - "epoch": 0.65, - "learning_rate": 0.00020250827438509958, - "loss": 0.0534, + "epoch": 0.39, + "learning_rate": 0.00024182474166919453, + "loss": 0.0623, "step": 60090 }, { - "epoch": 0.65, - "learning_rate": 0.00020249205010059056, - "loss": 0.063, + "epoch": 0.39, + "learning_rate": 0.0002418150603148376, + "loss": 0.062, "step": 60100 }, { - "epoch": 0.65, - "learning_rate": 0.00020247582581608148, - "loss": 0.0536, + "epoch": 0.39, + "learning_rate": 0.0002418053789604807, + "loss": 0.0582, "step": 60110 }, { - "epoch": 0.65, - "learning_rate": 0.00020245960153157246, - "loss": 0.0492, + "epoch": 0.39, + "learning_rate": 0.00024179569760612377, + "loss": 0.0612, "step": 60120 }, { - "epoch": 0.65, - "learning_rate": 0.00020244337724706338, - "loss": 0.0511, + "epoch": 0.39, + "learning_rate": 0.00024178601625176682, + "loss": 0.06, "step": 60130 }, { - "epoch": 0.65, - "learning_rate": 0.00020242715296255433, - "loss": 0.0449, + "epoch": 0.39, + "learning_rate": 0.0002417763348974099, + "loss": 0.0606, "step": 60140 }, { - "epoch": 0.65, - "learning_rate": 0.00020241092867804528, - "loss": 0.0568, + "epoch": 0.39, + "learning_rate": 0.00024176665354305296, + "loss": 0.0652, "step": 60150 }, { - "epoch": 0.65, - "learning_rate": 0.00020239470439353623, - "loss": 0.0508, + "epoch": 0.39, + "learning_rate": 0.000241756972188696, + "loss": 0.0615, "step": 60160 }, { - "epoch": 0.65, - "learning_rate": 0.00020237848010902715, - "loss": 0.0524, + "epoch": 0.39, + "learning_rate": 0.0002417472908343391, + "loss": 0.0696, "step": 60170 }, { - "epoch": 0.65, - "learning_rate": 0.00020236225582451813, - "loss": 0.0525, + "epoch": 0.39, + "learning_rate": 0.00024173760947998217, + "loss": 0.0643, "step": 60180 }, { - "epoch": 0.65, - "learning_rate": 0.00020234603154000905, - "loss": 0.0495, + "epoch": 0.39, + "learning_rate": 0.00024172792812562525, + "loss": 0.0618, "step": 60190 }, { - "epoch": 0.65, - "learning_rate": 0.00020232980725550003, - "loss": 0.053, + "epoch": 0.39, + "learning_rate": 0.0002417182467712683, + "loss": 0.058, "step": 60200 }, { - "epoch": 0.65, - "learning_rate": 0.00020231358297099095, - "loss": 0.0477, + "epoch": 0.39, + "learning_rate": 0.00024170856541691138, + "loss": 0.056, "step": 60210 }, { - "epoch": 0.65, - "learning_rate": 0.0002022973586864819, - "loss": 0.0561, + "epoch": 0.39, + "learning_rate": 0.00024169888406255443, + "loss": 0.0645, "step": 60220 }, { - "epoch": 0.65, - "learning_rate": 0.00020228113440197285, - "loss": 0.0515, + "epoch": 0.39, + "learning_rate": 0.0002416892027081975, + "loss": 0.057, "step": 60230 }, { - "epoch": 0.65, - "learning_rate": 0.0002022649101174638, - "loss": 0.0444, + "epoch": 0.39, + "learning_rate": 0.00024167952135384057, + "loss": 0.0576, "step": 60240 }, { - "epoch": 0.65, - "learning_rate": 0.00020224868583295475, - "loss": 0.0501, + "epoch": 0.39, + "learning_rate": 0.00024166983999948365, + "loss": 0.0641, "step": 60250 }, { - "epoch": 0.65, - "learning_rate": 0.0002022324615484457, - "loss": 0.0494, + "epoch": 0.39, + "learning_rate": 0.0002416601586451267, + "loss": 0.0621, "step": 60260 }, { - "epoch": 0.65, - "learning_rate": 0.00020221623726393662, - "loss": 0.0551, + "epoch": 0.39, + "learning_rate": 0.00024165047729076978, + "loss": 0.0567, "step": 60270 }, { - "epoch": 0.65, - "learning_rate": 0.0002022000129794276, - "loss": 0.0502, + "epoch": 0.39, + "learning_rate": 0.00024164079593641286, + "loss": 0.0608, "step": 60280 }, { - "epoch": 0.65, - "learning_rate": 0.00020218378869491852, - "loss": 0.0503, + "epoch": 0.39, + "learning_rate": 0.00024163111458205588, + "loss": 0.0528, "step": 60290 }, { - "epoch": 0.65, - "learning_rate": 0.0002021675644104095, - "loss": 0.0502, + "epoch": 0.39, + "learning_rate": 0.00024162143322769896, + "loss": 0.0605, "step": 60300 }, { - "epoch": 0.65, - "learning_rate": 0.00020215134012590042, - "loss": 0.0515, + "epoch": 0.39, + "learning_rate": 0.00024161175187334204, + "loss": 0.0495, "step": 60310 }, { - "epoch": 0.65, - "learning_rate": 0.00020213511584139137, - "loss": 0.0547, + "epoch": 0.39, + "learning_rate": 0.00024160207051898512, + "loss": 0.0671, "step": 60320 }, { - "epoch": 0.65, - "learning_rate": 0.00020211889155688232, - "loss": 0.0444, + "epoch": 0.39, + "learning_rate": 0.00024159238916462818, + "loss": 0.0568, "step": 60330 }, { - "epoch": 0.65, - "learning_rate": 0.00020210266727237327, - "loss": 0.0511, + "epoch": 0.39, + "learning_rate": 0.00024158270781027126, + "loss": 0.0628, "step": 60340 }, { - "epoch": 0.65, - "learning_rate": 0.0002020864429878642, - "loss": 0.0506, + "epoch": 0.39, + "learning_rate": 0.00024157302645591434, + "loss": 0.061, "step": 60350 }, { - "epoch": 0.65, - "learning_rate": 0.00020207021870335517, - "loss": 0.0523, + "epoch": 0.39, + "learning_rate": 0.00024156334510155736, + "loss": 0.0555, "step": 60360 }, { - "epoch": 0.65, - "learning_rate": 0.0002020539944188461, - "loss": 0.0507, + "epoch": 0.39, + "learning_rate": 0.00024155366374720044, + "loss": 0.0602, "step": 60370 }, { - "epoch": 0.65, - "learning_rate": 0.00020203777013433707, - "loss": 0.0527, + "epoch": 0.39, + "learning_rate": 0.00024154398239284352, + "loss": 0.0611, "step": 60380 }, { - "epoch": 0.65, - "learning_rate": 0.000202021545849828, - "loss": 0.0478, + "epoch": 0.39, + "learning_rate": 0.0002415343010384866, + "loss": 0.0561, "step": 60390 }, { - "epoch": 0.65, - "learning_rate": 0.00020200532156531894, - "loss": 0.0491, + "epoch": 0.39, + "learning_rate": 0.00024152461968412965, + "loss": 0.0536, "step": 60400 }, { - "epoch": 0.65, - "learning_rate": 0.0002019890972808099, - "loss": 0.0503, + "epoch": 0.39, + "learning_rate": 0.00024151493832977273, + "loss": 0.0591, "step": 60410 }, { - "epoch": 0.65, - "learning_rate": 0.00020197287299630084, - "loss": 0.0513, + "epoch": 0.39, + "learning_rate": 0.0002415052569754158, + "loss": 0.0562, "step": 60420 }, { - "epoch": 0.65, - "learning_rate": 0.0002019566487117918, - "loss": 0.0523, + "epoch": 0.39, + "learning_rate": 0.00024149557562105884, + "loss": 0.0567, "step": 60430 }, { - "epoch": 0.65, - "learning_rate": 0.00020194042442728274, - "loss": 0.0552, + "epoch": 0.39, + "learning_rate": 0.00024148589426670192, + "loss": 0.0568, "step": 60440 }, { - "epoch": 0.65, - "learning_rate": 0.00020192420014277366, - "loss": 0.0437, + "epoch": 0.39, + "learning_rate": 0.000241476212912345, + "loss": 0.0622, "step": 60450 }, { - "epoch": 0.65, - "learning_rate": 0.00020190797585826464, - "loss": 0.0473, + "epoch": 0.39, + "learning_rate": 0.00024146653155798805, + "loss": 0.0552, "step": 60460 }, { - "epoch": 0.65, - "learning_rate": 0.00020189175157375556, - "loss": 0.0591, + "epoch": 0.39, + "learning_rate": 0.00024145685020363113, + "loss": 0.0593, "step": 60470 }, { - "epoch": 0.65, - "learning_rate": 0.00020187552728924654, - "loss": 0.047, + "epoch": 0.39, + "learning_rate": 0.0002414471688492742, + "loss": 0.0582, "step": 60480 }, { - "epoch": 0.65, - "learning_rate": 0.00020185930300473746, - "loss": 0.0479, + "epoch": 0.39, + "learning_rate": 0.0002414374874949173, + "loss": 0.0759, "step": 60490 }, { - "epoch": 0.65, - "learning_rate": 0.00020184307872022841, - "loss": 0.0488, + "epoch": 0.39, + "learning_rate": 0.00024142780614056032, + "loss": 0.0568, "step": 60500 }, { - "epoch": 0.65, - "learning_rate": 0.00020182685443571936, - "loss": 0.0456, + "epoch": 0.39, + "learning_rate": 0.0002414181247862034, + "loss": 0.0502, "step": 60510 }, { - "epoch": 0.65, - "learning_rate": 0.0002018106301512103, - "loss": 0.0512, + "epoch": 0.39, + "learning_rate": 0.00024140844343184648, + "loss": 0.0672, "step": 60520 }, { - "epoch": 0.65, - "learning_rate": 0.00020179440586670124, - "loss": 0.0531, + "epoch": 0.39, + "learning_rate": 0.00024139876207748953, + "loss": 0.0583, "step": 60530 }, { - "epoch": 0.65, - "learning_rate": 0.0002017781815821922, - "loss": 0.0497, + "epoch": 0.39, + "learning_rate": 0.0002413890807231326, + "loss": 0.061, "step": 60540 }, { - "epoch": 0.65, - "learning_rate": 0.00020176195729768314, - "loss": 0.0533, + "epoch": 0.39, + "learning_rate": 0.0002413793993687757, + "loss": 0.0552, "step": 60550 }, { - "epoch": 0.66, - "learning_rate": 0.0002017457330131741, - "loss": 0.0492, + "epoch": 0.39, + "learning_rate": 0.00024136971801441877, + "loss": 0.0533, "step": 60560 }, { - "epoch": 0.66, - "learning_rate": 0.00020172950872866504, - "loss": 0.0489, + "epoch": 0.39, + "learning_rate": 0.0002413600366600618, + "loss": 0.0574, "step": 60570 }, { - "epoch": 0.66, - "learning_rate": 0.00020171328444415598, - "loss": 0.06, + "epoch": 0.39, + "learning_rate": 0.00024135035530570487, + "loss": 0.0675, "step": 60580 }, { - "epoch": 0.66, - "learning_rate": 0.00020169706015964693, - "loss": 0.0582, + "epoch": 0.39, + "learning_rate": 0.00024134067395134795, + "loss": 0.0604, "step": 60590 }, { - "epoch": 0.66, - "learning_rate": 0.00020168083587513788, - "loss": 0.0515, + "epoch": 0.39, + "learning_rate": 0.000241330992596991, + "loss": 0.0695, "step": 60600 }, { - "epoch": 0.66, - "learning_rate": 0.00020166461159062883, - "loss": 0.0564, + "epoch": 0.39, + "learning_rate": 0.00024132131124263409, + "loss": 0.058, "step": 60610 }, { - "epoch": 0.66, - "learning_rate": 0.00020164838730611978, - "loss": 0.0513, + "epoch": 0.39, + "learning_rate": 0.00024131162988827716, + "loss": 0.0591, "step": 60620 }, { - "epoch": 0.66, - "learning_rate": 0.0002016321630216107, - "loss": 0.0507, + "epoch": 0.39, + "learning_rate": 0.00024130194853392022, + "loss": 0.0608, "step": 60630 }, { - "epoch": 0.66, - "learning_rate": 0.00020161593873710168, - "loss": 0.0451, + "epoch": 0.39, + "learning_rate": 0.00024129226717956327, + "loss": 0.0683, "step": 60640 }, { - "epoch": 0.66, - "learning_rate": 0.0002015997144525926, - "loss": 0.0446, + "epoch": 0.39, + "learning_rate": 0.00024128258582520635, + "loss": 0.0597, "step": 60650 }, { - "epoch": 0.66, - "learning_rate": 0.00020158349016808358, - "loss": 0.0547, + "epoch": 0.39, + "learning_rate": 0.0002412729044708494, + "loss": 0.0578, "step": 60660 }, { - "epoch": 0.66, - "learning_rate": 0.0002015672658835745, - "loss": 0.0471, + "epoch": 0.39, + "learning_rate": 0.00024126322311649248, + "loss": 0.0652, "step": 60670 }, { - "epoch": 0.66, - "learning_rate": 0.00020155104159906546, - "loss": 0.0495, + "epoch": 0.39, + "learning_rate": 0.00024125354176213556, + "loss": 0.0619, "step": 60680 }, { - "epoch": 0.66, - "learning_rate": 0.0002015348173145564, - "loss": 0.0489, + "epoch": 0.39, + "learning_rate": 0.00024124386040777864, + "loss": 0.0606, "step": 60690 }, { - "epoch": 0.66, - "learning_rate": 0.00020151859303004735, - "loss": 0.0586, + "epoch": 0.39, + "learning_rate": 0.0002412341790534217, + "loss": 0.0578, "step": 60700 }, { - "epoch": 0.66, - "learning_rate": 0.00020150236874553828, - "loss": 0.0525, + "epoch": 0.39, + "learning_rate": 0.00024122449769906475, + "loss": 0.0555, "step": 60710 }, { - "epoch": 0.66, - "learning_rate": 0.00020148614446102925, - "loss": 0.051, + "epoch": 0.39, + "learning_rate": 0.00024121481634470783, + "loss": 0.0653, "step": 60720 }, { - "epoch": 0.66, - "learning_rate": 0.00020146992017652018, - "loss": 0.0495, + "epoch": 0.39, + "learning_rate": 0.00024120513499035088, + "loss": 0.0637, "step": 60730 }, { - "epoch": 0.66, - "learning_rate": 0.00020145369589201115, - "loss": 0.054, + "epoch": 0.39, + "learning_rate": 0.00024119545363599396, + "loss": 0.0625, "step": 60740 }, { - "epoch": 0.66, - "learning_rate": 0.00020143747160750208, - "loss": 0.0486, + "epoch": 0.39, + "learning_rate": 0.00024118577228163704, + "loss": 0.0577, "step": 60750 }, { - "epoch": 0.66, - "learning_rate": 0.00020142124732299305, - "loss": 0.0516, + "epoch": 0.39, + "learning_rate": 0.00024117609092728012, + "loss": 0.0727, "step": 60760 }, { - "epoch": 0.66, - "learning_rate": 0.00020140502303848398, - "loss": 0.0506, + "epoch": 0.39, + "learning_rate": 0.00024116640957292317, + "loss": 0.0565, "step": 60770 }, { - "epoch": 0.66, - "learning_rate": 0.00020138879875397493, - "loss": 0.0502, + "epoch": 0.39, + "learning_rate": 0.00024115672821856622, + "loss": 0.0632, "step": 60780 }, { - "epoch": 0.66, - "learning_rate": 0.00020137257446946588, - "loss": 0.0475, + "epoch": 0.39, + "learning_rate": 0.0002411470468642093, + "loss": 0.0582, "step": 60790 }, { - "epoch": 0.66, - "learning_rate": 0.00020135635018495683, - "loss": 0.0462, + "epoch": 0.39, + "learning_rate": 0.00024113736550985236, + "loss": 0.0575, "step": 60800 }, { - "epoch": 0.66, - "learning_rate": 0.00020134012590044775, - "loss": 0.0562, + "epoch": 0.39, + "learning_rate": 0.00024112768415549544, + "loss": 0.0568, "step": 60810 }, { - "epoch": 0.66, - "learning_rate": 0.00020132390161593873, - "loss": 0.047, + "epoch": 0.39, + "learning_rate": 0.00024111800280113852, + "loss": 0.0592, "step": 60820 }, { - "epoch": 0.66, - "learning_rate": 0.00020130767733142965, - "loss": 0.0511, + "epoch": 0.39, + "learning_rate": 0.00024110832144678157, + "loss": 0.0622, "step": 60830 }, { - "epoch": 0.66, - "learning_rate": 0.00020129145304692062, - "loss": 0.0511, + "epoch": 0.39, + "learning_rate": 0.00024109864009242465, + "loss": 0.063, "step": 60840 }, { - "epoch": 0.66, - "learning_rate": 0.00020127522876241155, - "loss": 0.0462, + "epoch": 0.39, + "learning_rate": 0.0002410889587380677, + "loss": 0.0631, "step": 60850 }, { - "epoch": 0.66, - "learning_rate": 0.0002012590044779025, - "loss": 0.0521, + "epoch": 0.39, + "learning_rate": 0.00024107927738371075, + "loss": 0.0696, "step": 60860 }, { - "epoch": 0.66, - "learning_rate": 0.00020124278019339345, - "loss": 0.0495, + "epoch": 0.39, + "learning_rate": 0.00024106959602935383, + "loss": 0.0633, "step": 60870 }, { - "epoch": 0.66, - "learning_rate": 0.0002012265559088844, - "loss": 0.0508, + "epoch": 0.39, + "learning_rate": 0.00024105991467499691, + "loss": 0.0572, "step": 60880 }, { - "epoch": 0.66, - "learning_rate": 0.00020121033162437532, - "loss": 0.0625, + "epoch": 0.39, + "learning_rate": 0.00024105023332064, + "loss": 0.055, "step": 60890 }, { - "epoch": 0.66, - "learning_rate": 0.0002011941073398663, - "loss": 0.0618, + "epoch": 0.39, + "learning_rate": 0.00024104055196628305, + "loss": 0.0616, "step": 60900 }, { - "epoch": 0.66, - "learning_rate": 0.00020117788305535722, - "loss": 0.0494, + "epoch": 0.39, + "learning_rate": 0.00024103087061192613, + "loss": 0.0654, "step": 60910 }, { - "epoch": 0.66, - "learning_rate": 0.0002011616587708482, - "loss": 0.0575, + "epoch": 0.39, + "learning_rate": 0.00024102118925756918, + "loss": 0.0536, "step": 60920 }, { - "epoch": 0.66, - "learning_rate": 0.00020114543448633912, - "loss": 0.0489, + "epoch": 0.39, + "learning_rate": 0.00024101150790321223, + "loss": 0.0623, "step": 60930 }, { - "epoch": 0.66, - "learning_rate": 0.0002011292102018301, - "loss": 0.047, + "epoch": 0.39, + "learning_rate": 0.0002410018265488553, + "loss": 0.0638, "step": 60940 }, { - "epoch": 0.66, - "learning_rate": 0.00020111298591732102, - "loss": 0.0519, + "epoch": 0.39, + "learning_rate": 0.0002409921451944984, + "loss": 0.0702, "step": 60950 }, { - "epoch": 0.66, - "learning_rate": 0.00020109676163281197, - "loss": 0.0543, + "epoch": 0.39, + "learning_rate": 0.00024098246384014147, + "loss": 0.0557, "step": 60960 }, { - "epoch": 0.66, - "learning_rate": 0.00020108053734830292, - "loss": 0.059, + "epoch": 0.39, + "learning_rate": 0.00024097278248578452, + "loss": 0.0611, "step": 60970 }, { - "epoch": 0.66, - "learning_rate": 0.00020106431306379387, - "loss": 0.0501, + "epoch": 0.39, + "learning_rate": 0.0002409631011314276, + "loss": 0.054, "step": 60980 }, { - "epoch": 0.66, - "learning_rate": 0.0002010480887792848, - "loss": 0.0539, + "epoch": 0.39, + "learning_rate": 0.00024095341977707066, + "loss": 0.0588, "step": 60990 }, { - "epoch": 0.66, - "learning_rate": 0.00020103186449477577, - "loss": 0.0594, + "epoch": 0.39, + "learning_rate": 0.0002409437384227137, + "loss": 0.061, "step": 61000 }, { - "epoch": 0.66, - "eval_cer": 0.9213654780268614, - "eval_loss": 0.035946305841207504, - "eval_runtime": 119.0598, - "eval_samples_per_second": 16.798, - "eval_steps_per_second": 4.2, + "epoch": 0.39, + "eval_cer": 0.9199050954694384, + "eval_loss": 0.04031915217638016, + "eval_runtime": 120.1875, + "eval_samples_per_second": 16.641, + "eval_steps_per_second": 4.16, "step": 61000 }, { - "epoch": 0.66, - "learning_rate": 0.0002010156402102667, - "loss": 0.0501, + "epoch": 0.39, + "learning_rate": 0.0002409340570683568, + "loss": 0.0605, "step": 61010 }, { - "epoch": 0.66, - "learning_rate": 0.00020099941592575767, - "loss": 0.0477, + "epoch": 0.39, + "learning_rate": 0.00024092437571399987, + "loss": 0.0618, "step": 61020 }, { - "epoch": 0.66, - "learning_rate": 0.00020098319164124862, - "loss": 0.0553, + "epoch": 0.39, + "learning_rate": 0.00024091469435964292, + "loss": 0.0597, "step": 61030 }, { - "epoch": 0.66, - "learning_rate": 0.00020096696735673954, - "loss": 0.0533, + "epoch": 0.39, + "learning_rate": 0.000240905013005286, + "loss": 0.0598, "step": 61040 }, { - "epoch": 0.66, - "learning_rate": 0.00020095074307223052, - "loss": 0.0515, + "epoch": 0.39, + "learning_rate": 0.00024089533165092908, + "loss": 0.0537, "step": 61050 }, { - "epoch": 0.66, - "learning_rate": 0.00020093451878772144, - "loss": 0.0596, + "epoch": 0.39, + "learning_rate": 0.0002408856502965721, + "loss": 0.0683, "step": 61060 }, { - "epoch": 0.66, - "learning_rate": 0.00020091829450321242, - "loss": 0.0512, + "epoch": 0.39, + "learning_rate": 0.00024087596894221519, + "loss": 0.0549, "step": 61070 }, { - "epoch": 0.66, - "learning_rate": 0.00020090207021870334, - "loss": 0.0505, + "epoch": 0.39, + "learning_rate": 0.00024086628758785827, + "loss": 0.0547, "step": 61080 }, { - "epoch": 0.66, - "learning_rate": 0.0002008858459341943, - "loss": 0.0576, + "epoch": 0.39, + "learning_rate": 0.00024085660623350135, + "loss": 0.0639, "step": 61090 }, { - "epoch": 0.66, - "learning_rate": 0.00020086962164968524, - "loss": 0.0457, + "epoch": 0.39, + "learning_rate": 0.0002408469248791444, + "loss": 0.0611, "step": 61100 }, { - "epoch": 0.66, - "learning_rate": 0.0002008533973651762, - "loss": 0.0584, + "epoch": 0.39, + "learning_rate": 0.00024083724352478748, + "loss": 0.0512, "step": 61110 }, { - "epoch": 0.66, - "learning_rate": 0.00020083717308066714, - "loss": 0.0565, + "epoch": 0.39, + "learning_rate": 0.00024082756217043056, + "loss": 0.0644, "step": 61120 }, { - "epoch": 0.66, - "learning_rate": 0.0002008209487961581, - "loss": 0.0492, + "epoch": 0.39, + "learning_rate": 0.00024081788081607358, + "loss": 0.0568, "step": 61130 }, { - "epoch": 0.66, - "learning_rate": 0.000200804724511649, - "loss": 0.0586, + "epoch": 0.39, + "learning_rate": 0.00024080819946171666, + "loss": 0.0684, "step": 61140 }, { - "epoch": 0.66, - "learning_rate": 0.00020078850022713999, - "loss": 0.0565, + "epoch": 0.39, + "learning_rate": 0.00024079851810735974, + "loss": 0.0577, "step": 61150 }, { - "epoch": 0.66, - "learning_rate": 0.0002007722759426309, - "loss": 0.0486, + "epoch": 0.39, + "learning_rate": 0.00024078883675300282, + "loss": 0.056, "step": 61160 }, { - "epoch": 0.66, - "learning_rate": 0.00020075605165812189, - "loss": 0.0491, + "epoch": 0.39, + "learning_rate": 0.00024077915539864588, + "loss": 0.0706, "step": 61170 }, { - "epoch": 0.66, - "learning_rate": 0.0002007398273736128, - "loss": 0.0456, + "epoch": 0.39, + "learning_rate": 0.00024076947404428896, + "loss": 0.0624, "step": 61180 }, { - "epoch": 0.66, - "learning_rate": 0.00020072360308910376, - "loss": 0.0494, + "epoch": 0.39, + "learning_rate": 0.00024075979268993204, + "loss": 0.0563, "step": 61190 }, { - "epoch": 0.66, - "learning_rate": 0.0002007073788045947, - "loss": 0.0492, + "epoch": 0.39, + "learning_rate": 0.00024075011133557506, + "loss": 0.0518, "step": 61200 }, { - "epoch": 0.66, - "learning_rate": 0.00020069115452008566, - "loss": 0.3359, + "epoch": 0.4, + "learning_rate": 0.00024074042998121814, + "loss": 0.0594, "step": 61210 }, { - "epoch": 0.66, - "learning_rate": 0.00020067493023557658, - "loss": 0.0919, + "epoch": 0.4, + "learning_rate": 0.00024073074862686122, + "loss": 0.0552, "step": 61220 }, { - "epoch": 0.66, - "learning_rate": 0.00020065870595106756, - "loss": 0.0588, + "epoch": 0.4, + "learning_rate": 0.00024072106727250427, + "loss": 0.0621, "step": 61230 }, { - "epoch": 0.66, - "learning_rate": 0.00020064248166655848, - "loss": 0.0603, + "epoch": 0.4, + "learning_rate": 0.00024071138591814735, + "loss": 0.06, "step": 61240 }, { - "epoch": 0.66, - "learning_rate": 0.00020062625738204946, - "loss": 0.0544, + "epoch": 0.4, + "learning_rate": 0.00024070170456379043, + "loss": 0.0638, "step": 61250 }, { - "epoch": 0.66, - "learning_rate": 0.00020061003309754038, - "loss": 0.0619, + "epoch": 0.4, + "learning_rate": 0.0002406920232094335, + "loss": 0.0628, "step": 61260 }, { - "epoch": 0.66, - "learning_rate": 0.00020059380881303133, - "loss": 0.0551, + "epoch": 0.4, + "learning_rate": 0.00024068234185507654, + "loss": 0.0559, "step": 61270 }, { - "epoch": 0.66, - "learning_rate": 0.00020057758452852228, - "loss": 0.0562, + "epoch": 0.4, + "learning_rate": 0.00024067266050071962, + "loss": 0.0561, "step": 61280 }, { - "epoch": 0.66, - "learning_rate": 0.00020056136024401323, - "loss": 0.0497, + "epoch": 0.4, + "learning_rate": 0.0002406629791463627, + "loss": 0.056, "step": 61290 }, { - "epoch": 0.66, - "learning_rate": 0.00020054513595950418, - "loss": 0.0558, + "epoch": 0.4, + "learning_rate": 0.00024065329779200575, + "loss": 0.0626, "step": 61300 }, { - "epoch": 0.66, - "learning_rate": 0.00020052891167499513, - "loss": 0.0572, + "epoch": 0.4, + "learning_rate": 0.00024064361643764883, + "loss": 0.0543, "step": 61310 }, { - "epoch": 0.66, - "learning_rate": 0.00020051268739048605, - "loss": 0.0549, + "epoch": 0.4, + "learning_rate": 0.0002406339350832919, + "loss": 0.0605, "step": 61320 }, { - "epoch": 0.66, - "learning_rate": 0.00020049646310597703, - "loss": 0.051, + "epoch": 0.4, + "learning_rate": 0.000240624253728935, + "loss": 0.0576, "step": 61330 }, { - "epoch": 0.66, - "learning_rate": 0.00020048023882146795, - "loss": 0.0531, + "epoch": 0.4, + "learning_rate": 0.00024061457237457802, + "loss": 0.0565, "step": 61340 }, { - "epoch": 0.66, - "learning_rate": 0.00020046401453695893, - "loss": 0.0425, + "epoch": 0.4, + "learning_rate": 0.0002406048910202211, + "loss": 0.0588, "step": 61350 }, { - "epoch": 0.66, - "learning_rate": 0.00020044779025244985, - "loss": 0.0496, + "epoch": 0.4, + "learning_rate": 0.00024059520966586417, + "loss": 0.0626, "step": 61360 }, { - "epoch": 0.66, - "learning_rate": 0.0002004315659679408, - "loss": 0.0528, + "epoch": 0.4, + "learning_rate": 0.00024058552831150723, + "loss": 0.0559, "step": 61370 }, { - "epoch": 0.66, - "learning_rate": 0.00020041534168343175, - "loss": 0.0529, + "epoch": 0.4, + "learning_rate": 0.0002405758469571503, + "loss": 0.0582, "step": 61380 }, { - "epoch": 0.66, - "learning_rate": 0.0002003991173989227, - "loss": 0.0553, + "epoch": 0.4, + "learning_rate": 0.0002405661656027934, + "loss": 0.0562, "step": 61390 }, { - "epoch": 0.66, - "learning_rate": 0.00020038289311441362, - "loss": 0.0478, + "epoch": 0.4, + "learning_rate": 0.00024055648424843647, + "loss": 0.0564, "step": 61400 }, { - "epoch": 0.66, - "learning_rate": 0.0002003666688299046, - "loss": 0.0445, + "epoch": 0.4, + "learning_rate": 0.0002405468028940795, + "loss": 0.0624, "step": 61410 }, { - "epoch": 0.66, - "learning_rate": 0.00020035044454539552, - "loss": 0.0487, + "epoch": 0.4, + "learning_rate": 0.00024053712153972257, + "loss": 0.0638, "step": 61420 }, { - "epoch": 0.66, - "learning_rate": 0.0002003342202608865, - "loss": 0.0476, + "epoch": 0.4, + "learning_rate": 0.00024052744018536563, + "loss": 0.0533, "step": 61430 }, { - "epoch": 0.66, - "learning_rate": 0.00020031799597637742, - "loss": 0.0532, + "epoch": 0.4, + "learning_rate": 0.0002405177588310087, + "loss": 0.0535, "step": 61440 }, { - "epoch": 0.66, - "learning_rate": 0.0002003017716918684, - "loss": 0.0471, + "epoch": 0.4, + "learning_rate": 0.00024050807747665178, + "loss": 0.0554, "step": 61450 }, { - "epoch": 0.66, - "learning_rate": 0.00020028554740735932, - "loss": 0.0451, + "epoch": 0.4, + "learning_rate": 0.00024049839612229486, + "loss": 0.0582, "step": 61460 }, { - "epoch": 0.66, - "learning_rate": 0.00020026932312285027, - "loss": 0.0524, + "epoch": 0.4, + "learning_rate": 0.00024048871476793792, + "loss": 0.0579, "step": 61470 }, { - "epoch": 0.66, - "learning_rate": 0.00020025309883834122, - "loss": 0.0505, + "epoch": 0.4, + "learning_rate": 0.00024047903341358097, + "loss": 0.0584, "step": 61480 }, { - "epoch": 0.67, - "learning_rate": 0.00020023687455383217, - "loss": 0.0509, + "epoch": 0.4, + "learning_rate": 0.00024046935205922405, + "loss": 0.0603, "step": 61490 }, { - "epoch": 0.67, - "learning_rate": 0.0002002206502693231, - "loss": 0.0476, + "epoch": 0.4, + "learning_rate": 0.0002404596707048671, + "loss": 0.0674, "step": 61500 }, { - "epoch": 0.67, - "learning_rate": 0.00020020442598481407, - "loss": 0.0503, + "epoch": 0.4, + "learning_rate": 0.00024044998935051018, + "loss": 0.0553, "step": 61510 }, { - "epoch": 0.67, - "learning_rate": 0.000200188201700305, - "loss": 0.0506, + "epoch": 0.4, + "learning_rate": 0.00024044030799615326, + "loss": 0.0551, "step": 61520 }, { - "epoch": 0.67, - "learning_rate": 0.00020017197741579597, - "loss": 0.0433, + "epoch": 0.4, + "learning_rate": 0.00024043062664179634, + "loss": 0.0523, "step": 61530 }, { - "epoch": 0.67, - "learning_rate": 0.0002001557531312869, - "loss": 0.0537, + "epoch": 0.4, + "learning_rate": 0.0002404209452874394, + "loss": 0.0559, "step": 61540 }, { - "epoch": 0.67, - "learning_rate": 0.00020013952884677784, - "loss": 0.0486, + "epoch": 0.4, + "learning_rate": 0.00024041126393308245, + "loss": 0.0612, "step": 61550 }, { - "epoch": 0.67, - "learning_rate": 0.0002001233045622688, - "loss": 0.0481, + "epoch": 0.4, + "learning_rate": 0.00024040158257872553, + "loss": 0.0535, "step": 61560 }, { - "epoch": 0.67, - "learning_rate": 0.00020010708027775974, - "loss": 0.0523, + "epoch": 0.4, + "learning_rate": 0.00024039190122436858, + "loss": 0.0541, "step": 61570 }, { - "epoch": 0.67, - "learning_rate": 0.00020009085599325066, - "loss": 0.0463, + "epoch": 0.4, + "learning_rate": 0.00024038221987001166, + "loss": 0.0669, "step": 61580 }, { - "epoch": 0.67, - "learning_rate": 0.00020007463170874164, - "loss": 0.055, + "epoch": 0.4, + "learning_rate": 0.00024037253851565474, + "loss": 0.0569, "step": 61590 }, { - "epoch": 0.67, - "learning_rate": 0.00020005840742423256, - "loss": 0.0596, + "epoch": 0.4, + "learning_rate": 0.00024036285716129782, + "loss": 0.0591, "step": 61600 }, { - "epoch": 0.67, - "learning_rate": 0.00020004218313972354, - "loss": 0.0591, + "epoch": 0.4, + "learning_rate": 0.00024035317580694087, + "loss": 0.0619, "step": 61610 }, { - "epoch": 0.67, - "learning_rate": 0.00020002595885521446, - "loss": 0.0542, + "epoch": 0.4, + "learning_rate": 0.00024034349445258392, + "loss": 0.0677, "step": 61620 }, { - "epoch": 0.67, - "learning_rate": 0.00020000973457070544, - "loss": 0.0621, + "epoch": 0.4, + "learning_rate": 0.00024033381309822698, + "loss": 0.078, "step": 61630 }, { - "epoch": 0.67, - "learning_rate": 0.00019999351028619636, - "loss": 0.0494, + "epoch": 0.4, + "learning_rate": 0.00024032413174387006, + "loss": 0.0625, "step": 61640 }, { - "epoch": 0.67, - "learning_rate": 0.0001999772860016873, - "loss": 0.0527, + "epoch": 0.4, + "learning_rate": 0.00024031445038951314, + "loss": 0.0574, "step": 61650 }, { - "epoch": 0.67, - "learning_rate": 0.00019996106171717826, - "loss": 0.0427, + "epoch": 0.4, + "learning_rate": 0.00024030476903515622, + "loss": 0.0625, "step": 61660 }, { - "epoch": 0.67, - "learning_rate": 0.0001999448374326692, - "loss": 0.0529, + "epoch": 0.4, + "learning_rate": 0.00024029508768079927, + "loss": 0.0654, "step": 61670 }, { - "epoch": 0.67, - "learning_rate": 0.00019992861314816013, - "loss": 0.0529, + "epoch": 0.4, + "learning_rate": 0.00024028540632644235, + "loss": 0.0532, "step": 61680 }, { - "epoch": 0.67, - "learning_rate": 0.0001999123888636511, - "loss": 0.0493, + "epoch": 0.4, + "learning_rate": 0.0002402757249720854, + "loss": 0.067, "step": 61690 }, { - "epoch": 0.67, - "learning_rate": 0.00019989616457914203, - "loss": 0.0534, + "epoch": 0.4, + "learning_rate": 0.00024026604361772845, + "loss": 0.0661, "step": 61700 }, { - "epoch": 0.67, - "learning_rate": 0.000199879940294633, - "loss": 0.0475, + "epoch": 0.4, + "learning_rate": 0.00024025636226337153, + "loss": 0.0584, "step": 61710 }, { - "epoch": 0.67, - "learning_rate": 0.00019986371601012393, - "loss": 0.0528, + "epoch": 0.4, + "learning_rate": 0.00024024668090901461, + "loss": 0.0538, "step": 61720 }, { - "epoch": 0.67, - "learning_rate": 0.00019984749172561488, - "loss": 0.0519, + "epoch": 0.4, + "learning_rate": 0.0002402369995546577, + "loss": 0.06, "step": 61730 }, { - "epoch": 0.67, - "learning_rate": 0.00019983126744110583, - "loss": 0.0511, + "epoch": 0.4, + "learning_rate": 0.00024022731820030075, + "loss": 0.0648, "step": 61740 }, { - "epoch": 0.67, - "learning_rate": 0.00019981504315659678, - "loss": 0.0464, + "epoch": 0.4, + "learning_rate": 0.00024021763684594383, + "loss": 0.0566, "step": 61750 }, { - "epoch": 0.67, - "learning_rate": 0.0001997988188720877, - "loss": 0.0514, + "epoch": 0.4, + "learning_rate": 0.00024020795549158688, + "loss": 0.0593, "step": 61760 }, { - "epoch": 0.67, - "learning_rate": 0.00019978259458757868, - "loss": 0.0488, + "epoch": 0.4, + "learning_rate": 0.00024019827413722993, + "loss": 0.0583, "step": 61770 }, { - "epoch": 0.67, - "learning_rate": 0.0001997663703030696, - "loss": 0.0538, + "epoch": 0.4, + "learning_rate": 0.000240188592782873, + "loss": 0.0584, "step": 61780 }, { - "epoch": 0.67, - "learning_rate": 0.00019975014601856058, - "loss": 0.0521, + "epoch": 0.4, + "learning_rate": 0.0002401789114285161, + "loss": 0.0558, "step": 61790 }, { - "epoch": 0.67, - "learning_rate": 0.0001997339217340515, - "loss": 0.0544, + "epoch": 0.4, + "learning_rate": 0.00024016923007415917, + "loss": 0.059, "step": 61800 }, { - "epoch": 0.67, - "learning_rate": 0.00019971769744954248, - "loss": 0.0516, + "epoch": 0.4, + "learning_rate": 0.00024015954871980222, + "loss": 0.0654, "step": 61810 }, { - "epoch": 0.67, - "learning_rate": 0.0001997014731650334, - "loss": 0.0483, + "epoch": 0.4, + "learning_rate": 0.0002401498673654453, + "loss": 0.0615, "step": 61820 }, { - "epoch": 0.67, - "learning_rate": 0.00019968524888052435, - "loss": 0.051, + "epoch": 0.4, + "learning_rate": 0.00024014018601108836, + "loss": 0.066, "step": 61830 }, { - "epoch": 0.67, - "learning_rate": 0.0001996690245960153, - "loss": 0.0451, + "epoch": 0.4, + "learning_rate": 0.0002401305046567314, + "loss": 0.0557, "step": 61840 }, { - "epoch": 0.67, - "learning_rate": 0.00019965280031150625, - "loss": 0.0505, + "epoch": 0.4, + "learning_rate": 0.0002401208233023745, + "loss": 0.0554, "step": 61850 }, { - "epoch": 0.67, - "learning_rate": 0.00019963657602699718, - "loss": 0.0611, + "epoch": 0.4, + "learning_rate": 0.00024011114194801757, + "loss": 0.0631, "step": 61860 }, { - "epoch": 0.67, - "learning_rate": 0.00019962035174248815, - "loss": 0.0503, + "epoch": 0.4, + "learning_rate": 0.00024010146059366062, + "loss": 0.0586, "step": 61870 }, { - "epoch": 0.67, - "learning_rate": 0.00019960412745797908, - "loss": 0.0541, + "epoch": 0.4, + "learning_rate": 0.0002400917792393037, + "loss": 0.0587, "step": 61880 }, { - "epoch": 0.67, - "learning_rate": 0.00019958790317347005, - "loss": 0.0561, + "epoch": 0.4, + "learning_rate": 0.00024008209788494678, + "loss": 0.0642, "step": 61890 }, { - "epoch": 0.67, - "learning_rate": 0.00019957167888896098, - "loss": 0.0503, + "epoch": 0.4, + "learning_rate": 0.0002400724165305898, + "loss": 0.0592, "step": 61900 }, { - "epoch": 0.67, - "learning_rate": 0.00019955545460445192, - "loss": 0.0479, + "epoch": 0.4, + "learning_rate": 0.00024006273517623289, + "loss": 0.0583, "step": 61910 }, { - "epoch": 0.67, - "learning_rate": 0.00019953923031994287, - "loss": 0.0514, + "epoch": 0.4, + "learning_rate": 0.00024005305382187597, + "loss": 0.0622, "step": 61920 }, { - "epoch": 0.67, - "learning_rate": 0.00019952300603543382, - "loss": 0.0489, + "epoch": 0.4, + "learning_rate": 0.00024004337246751905, + "loss": 0.0634, "step": 61930 }, { - "epoch": 0.67, - "learning_rate": 0.00019950678175092475, - "loss": 0.0578, + "epoch": 0.4, + "learning_rate": 0.0002400336911131621, + "loss": 0.0665, "step": 61940 }, { - "epoch": 0.67, - "learning_rate": 0.00019949055746641572, - "loss": 0.0524, + "epoch": 0.4, + "learning_rate": 0.00024002400975880518, + "loss": 0.053, "step": 61950 }, { - "epoch": 0.67, - "learning_rate": 0.00019947433318190665, - "loss": 0.0586, + "epoch": 0.4, + "learning_rate": 0.00024001432840444826, + "loss": 0.0561, "step": 61960 }, { - "epoch": 0.67, - "learning_rate": 0.00019945810889739762, - "loss": 0.048, + "epoch": 0.4, + "learning_rate": 0.00024000464705009128, + "loss": 0.0647, "step": 61970 }, { - "epoch": 0.67, - "learning_rate": 0.00019944188461288855, - "loss": 0.0516, + "epoch": 0.4, + "learning_rate": 0.00023999496569573436, + "loss": 0.0626, "step": 61980 }, { - "epoch": 0.67, - "learning_rate": 0.00019942566032837952, - "loss": 0.0533, + "epoch": 0.4, + "learning_rate": 0.00023998528434137744, + "loss": 0.0602, "step": 61990 }, { - "epoch": 0.67, - "learning_rate": 0.00019940943604387045, - "loss": 0.0479, + "epoch": 0.4, + "learning_rate": 0.00023997560298702052, + "loss": 0.0611, "step": 62000 }, { - "epoch": 0.67, - "eval_cer": 0.9212311884100993, - "eval_loss": 0.03535841032862663, - "eval_runtime": 119.0917, - "eval_samples_per_second": 16.794, - "eval_steps_per_second": 4.198, + "epoch": 0.4, + "eval_cer": 0.9200768274771213, + "eval_loss": 0.03882079944014549, + "eval_runtime": 119.9884, + "eval_samples_per_second": 16.668, + "eval_steps_per_second": 4.167, "step": 62000 }, { - "epoch": 0.67, - "learning_rate": 0.0001993932117593614, - "loss": 0.0565, + "epoch": 0.4, + "learning_rate": 0.00023996592163266358, + "loss": 0.0549, "step": 62010 }, { - "epoch": 0.67, - "learning_rate": 0.00019937698747485235, - "loss": 0.0472, + "epoch": 0.4, + "learning_rate": 0.00023995624027830666, + "loss": 0.053, "step": 62020 }, { - "epoch": 0.67, - "learning_rate": 0.0001993607631903433, - "loss": 0.0534, + "epoch": 0.4, + "learning_rate": 0.00023994655892394973, + "loss": 0.0706, "step": 62030 }, { - "epoch": 0.67, - "learning_rate": 0.00019934453890583422, - "loss": 0.0566, + "epoch": 0.4, + "learning_rate": 0.00023993687756959276, + "loss": 0.0513, "step": 62040 }, { - "epoch": 0.67, - "learning_rate": 0.0001993283146213252, - "loss": 0.0598, + "epoch": 0.4, + "learning_rate": 0.00023992719621523584, + "loss": 0.0621, "step": 62050 }, { - "epoch": 0.67, - "learning_rate": 0.00019931209033681612, - "loss": 0.0512, + "epoch": 0.4, + "learning_rate": 0.00023991751486087892, + "loss": 0.0552, "step": 62060 }, { - "epoch": 0.67, - "learning_rate": 0.0001992958660523071, - "loss": 0.0522, + "epoch": 0.4, + "learning_rate": 0.00023990783350652197, + "loss": 0.0653, "step": 62070 }, { - "epoch": 0.67, - "learning_rate": 0.00019927964176779802, - "loss": 0.0592, + "epoch": 0.4, + "learning_rate": 0.00023989815215216505, + "loss": 0.0568, "step": 62080 }, { - "epoch": 0.67, - "learning_rate": 0.00019926341748328897, - "loss": 0.0512, + "epoch": 0.4, + "learning_rate": 0.00023988847079780813, + "loss": 0.0515, "step": 62090 }, { - "epoch": 0.67, - "learning_rate": 0.00019924719319877992, - "loss": 0.0463, + "epoch": 0.4, + "learning_rate": 0.0002398787894434512, + "loss": 0.0508, "step": 62100 }, { - "epoch": 0.67, - "learning_rate": 0.00019923096891427087, - "loss": 0.0531, + "epoch": 0.4, + "learning_rate": 0.00023986910808909424, + "loss": 0.0611, "step": 62110 }, { - "epoch": 0.67, - "learning_rate": 0.0001992147446297618, - "loss": 0.0562, + "epoch": 0.4, + "learning_rate": 0.00023985942673473732, + "loss": 0.0546, "step": 62120 }, { - "epoch": 0.67, - "learning_rate": 0.00019919852034525277, - "loss": 0.0448, + "epoch": 0.4, + "learning_rate": 0.0002398497453803804, + "loss": 0.0519, "step": 62130 }, { - "epoch": 0.67, - "learning_rate": 0.0001991822960607437, - "loss": 0.0526, + "epoch": 0.4, + "learning_rate": 0.00023984006402602345, + "loss": 0.0592, "step": 62140 }, { - "epoch": 0.67, - "learning_rate": 0.00019916607177623467, - "loss": 0.0449, + "epoch": 0.4, + "learning_rate": 0.00023983038267166653, + "loss": 0.0578, "step": 62150 }, { - "epoch": 0.67, - "learning_rate": 0.0001991498474917256, - "loss": 0.0495, + "epoch": 0.4, + "learning_rate": 0.0002398207013173096, + "loss": 0.0523, "step": 62160 }, { - "epoch": 0.67, - "learning_rate": 0.00019913362320721656, - "loss": 0.0477, + "epoch": 0.4, + "learning_rate": 0.0002398110199629527, + "loss": 0.0565, "step": 62170 }, { - "epoch": 0.67, - "learning_rate": 0.0001991173989227075, - "loss": 0.052, + "epoch": 0.4, + "learning_rate": 0.00023980133860859572, + "loss": 0.056, "step": 62180 }, { - "epoch": 0.67, - "learning_rate": 0.00019910117463819844, - "loss": 0.0485, + "epoch": 0.4, + "learning_rate": 0.0002397916572542388, + "loss": 0.0623, "step": 62190 }, { - "epoch": 0.67, - "learning_rate": 0.0001990849503536894, - "loss": 0.0533, + "epoch": 0.4, + "learning_rate": 0.00023978197589988187, + "loss": 0.0543, "step": 62200 }, { - "epoch": 0.67, - "learning_rate": 0.00019906872606918034, - "loss": 0.052, + "epoch": 0.4, + "learning_rate": 0.00023977229454552493, + "loss": 0.0569, "step": 62210 }, { - "epoch": 0.67, - "learning_rate": 0.00019905250178467126, - "loss": 0.0473, + "epoch": 0.4, + "learning_rate": 0.000239762613191168, + "loss": 0.0618, "step": 62220 }, { - "epoch": 0.67, - "learning_rate": 0.00019903627750016224, - "loss": 0.0498, + "epoch": 0.4, + "learning_rate": 0.0002397529318368111, + "loss": 0.0572, "step": 62230 }, { - "epoch": 0.67, - "learning_rate": 0.00019902005321565316, - "loss": 0.0432, + "epoch": 0.4, + "learning_rate": 0.00023974325048245414, + "loss": 0.0637, "step": 62240 }, { - "epoch": 0.67, - "learning_rate": 0.00019900382893114414, - "loss": 0.0647, + "epoch": 0.4, + "learning_rate": 0.0002397335691280972, + "loss": 0.0726, "step": 62250 }, { - "epoch": 0.67, - "learning_rate": 0.00019898760464663506, - "loss": 0.0525, + "epoch": 0.4, + "learning_rate": 0.00023972388777374027, + "loss": 0.0609, "step": 62260 }, { - "epoch": 0.67, - "learning_rate": 0.000198971380362126, - "loss": 0.0472, + "epoch": 0.4, + "learning_rate": 0.00023971420641938332, + "loss": 0.0609, "step": 62270 }, { - "epoch": 0.67, - "learning_rate": 0.00019895515607761696, - "loss": 0.0438, + "epoch": 0.4, + "learning_rate": 0.0002397045250650264, + "loss": 0.0555, "step": 62280 }, { - "epoch": 0.67, - "learning_rate": 0.0001989389317931079, - "loss": 0.0462, + "epoch": 0.4, + "learning_rate": 0.00023969484371066948, + "loss": 0.0513, "step": 62290 }, { - "epoch": 0.67, - "learning_rate": 0.00019892270750859886, - "loss": 0.054, + "epoch": 0.4, + "learning_rate": 0.00023968516235631256, + "loss": 0.0614, "step": 62300 }, { - "epoch": 0.67, - "learning_rate": 0.0001989064832240898, - "loss": 0.0444, + "epoch": 0.4, + "learning_rate": 0.00023967548100195562, + "loss": 0.056, "step": 62310 }, { - "epoch": 0.67, - "learning_rate": 0.00019889025893958073, - "loss": 0.0544, + "epoch": 0.4, + "learning_rate": 0.00023966579964759867, + "loss": 0.0602, "step": 62320 }, { - "epoch": 0.67, - "learning_rate": 0.0001988740346550717, - "loss": 0.0453, + "epoch": 0.4, + "learning_rate": 0.00023965611829324175, + "loss": 0.0681, "step": 62330 }, { - "epoch": 0.67, - "learning_rate": 0.00019885781037056263, - "loss": 0.0504, + "epoch": 0.4, + "learning_rate": 0.0002396464369388848, + "loss": 0.0616, "step": 62340 }, { - "epoch": 0.67, - "learning_rate": 0.0001988415860860536, - "loss": 0.0502, + "epoch": 0.4, + "learning_rate": 0.00023963675558452788, + "loss": 0.0622, "step": 62350 }, { - "epoch": 0.67, - "learning_rate": 0.00019882536180154453, - "loss": 0.0523, + "epoch": 0.4, + "learning_rate": 0.00023962707423017096, + "loss": 0.0529, "step": 62360 }, { - "epoch": 0.67, - "learning_rate": 0.00019880913751703548, - "loss": 0.0475, + "epoch": 0.4, + "learning_rate": 0.00023961739287581404, + "loss": 0.0525, "step": 62370 }, { - "epoch": 0.67, - "learning_rate": 0.00019879291323252643, - "loss": 0.0559, + "epoch": 0.4, + "learning_rate": 0.0002396077115214571, + "loss": 0.0556, "step": 62380 }, { - "epoch": 0.67, - "learning_rate": 0.00019877668894801738, - "loss": 0.0519, + "epoch": 0.4, + "learning_rate": 0.00023959803016710015, + "loss": 0.0629, "step": 62390 }, { - "epoch": 0.67, - "learning_rate": 0.0001987604646635083, - "loss": 0.0499, + "epoch": 0.4, + "learning_rate": 0.00023958834881274323, + "loss": 0.0511, "step": 62400 }, { - "epoch": 0.68, - "learning_rate": 0.00019874424037899928, - "loss": 0.0468, + "epoch": 0.4, + "learning_rate": 0.00023957866745838628, + "loss": 0.0553, "step": 62410 }, { - "epoch": 0.68, - "learning_rate": 0.0001987280160944902, - "loss": 0.0511, + "epoch": 0.4, + "learning_rate": 0.00023956898610402936, + "loss": 0.0521, "step": 62420 }, { - "epoch": 0.68, - "learning_rate": 0.00019871179180998118, - "loss": 0.0572, + "epoch": 0.4, + "learning_rate": 0.00023955930474967244, + "loss": 0.0621, "step": 62430 }, { - "epoch": 0.68, - "learning_rate": 0.0001986955675254721, - "loss": 0.055, + "epoch": 0.4, + "learning_rate": 0.0002395496233953155, + "loss": 0.0609, "step": 62440 }, { - "epoch": 0.68, - "learning_rate": 0.00019867934324096305, - "loss": 0.0484, + "epoch": 0.4, + "learning_rate": 0.00023953994204095857, + "loss": 0.0586, "step": 62450 }, { - "epoch": 0.68, - "learning_rate": 0.000198663118956454, - "loss": 0.0535, + "epoch": 0.4, + "learning_rate": 0.00023953026068660162, + "loss": 0.0539, "step": 62460 }, { - "epoch": 0.68, - "learning_rate": 0.00019864689467194495, - "loss": 0.0481, + "epoch": 0.4, + "learning_rate": 0.00023952057933224468, + "loss": 0.0602, "step": 62470 }, { - "epoch": 0.68, - "learning_rate": 0.0001986306703874359, - "loss": 0.0568, + "epoch": 0.4, + "learning_rate": 0.00023951089797788776, + "loss": 0.0545, "step": 62480 }, { - "epoch": 0.68, - "learning_rate": 0.00019861444610292685, - "loss": 0.05, + "epoch": 0.4, + "learning_rate": 0.00023950121662353084, + "loss": 0.0581, "step": 62490 }, { - "epoch": 0.68, - "learning_rate": 0.00019859822181841777, - "loss": 0.0491, + "epoch": 0.4, + "learning_rate": 0.00023949153526917392, + "loss": 0.0683, "step": 62500 }, { - "epoch": 0.68, - "learning_rate": 0.00019858199753390875, - "loss": 0.0507, + "epoch": 0.4, + "learning_rate": 0.00023948185391481697, + "loss": 0.064, "step": 62510 }, { - "epoch": 0.68, - "learning_rate": 0.00019856577324939967, - "loss": 0.0485, + "epoch": 0.4, + "learning_rate": 0.00023947217256046005, + "loss": 0.0574, "step": 62520 }, { - "epoch": 0.68, - "learning_rate": 0.00019854954896489065, - "loss": 0.0469, + "epoch": 0.4, + "learning_rate": 0.0002394624912061031, + "loss": 0.0659, "step": 62530 }, { - "epoch": 0.68, - "learning_rate": 0.00019853332468038157, - "loss": 0.0504, + "epoch": 0.4, + "learning_rate": 0.00023945280985174615, + "loss": 0.062, "step": 62540 }, { - "epoch": 0.68, - "learning_rate": 0.00019851710039587252, - "loss": 0.053, + "epoch": 0.4, + "learning_rate": 0.00023944312849738923, + "loss": 0.0597, "step": 62550 }, { - "epoch": 0.68, - "learning_rate": 0.00019850087611136347, - "loss": 0.0562, + "epoch": 0.4, + "learning_rate": 0.0002394334471430323, + "loss": 0.0551, "step": 62560 }, { - "epoch": 0.68, - "learning_rate": 0.00019848465182685442, - "loss": 0.0541, + "epoch": 0.4, + "learning_rate": 0.0002394237657886754, + "loss": 0.0569, "step": 62570 }, { - "epoch": 0.68, - "learning_rate": 0.00019846842754234534, - "loss": 0.0483, + "epoch": 0.4, + "learning_rate": 0.00023941408443431845, + "loss": 0.0639, "step": 62580 }, { - "epoch": 0.68, - "learning_rate": 0.00019845220325783632, - "loss": 0.0485, + "epoch": 0.4, + "learning_rate": 0.00023940440307996153, + "loss": 0.0545, "step": 62590 }, { - "epoch": 0.68, - "learning_rate": 0.00019843597897332724, - "loss": 0.0489, + "epoch": 0.4, + "learning_rate": 0.00023939472172560458, + "loss": 0.0561, "step": 62600 }, { - "epoch": 0.68, - "learning_rate": 0.00019841975468881822, - "loss": 0.0508, + "epoch": 0.4, + "learning_rate": 0.00023938504037124763, + "loss": 0.0544, "step": 62610 }, { - "epoch": 0.68, - "learning_rate": 0.00019840353040430914, - "loss": 0.0524, + "epoch": 0.4, + "learning_rate": 0.0002393753590168907, + "loss": 0.056, "step": 62620 }, { - "epoch": 0.68, - "learning_rate": 0.0001983873061198001, - "loss": 0.0488, + "epoch": 0.4, + "learning_rate": 0.0002393656776625338, + "loss": 0.0676, "step": 62630 }, { - "epoch": 0.68, - "learning_rate": 0.00019837108183529104, - "loss": 0.0497, + "epoch": 0.4, + "learning_rate": 0.00023935599630817684, + "loss": 0.0628, "step": 62640 }, { - "epoch": 0.68, - "learning_rate": 0.000198354857550782, - "loss": 0.049, + "epoch": 0.4, + "learning_rate": 0.00023934631495381992, + "loss": 0.0588, "step": 62650 }, { - "epoch": 0.68, - "learning_rate": 0.00019833863326627294, - "loss": 0.0477, + "epoch": 0.4, + "learning_rate": 0.000239336633599463, + "loss": 0.0562, "step": 62660 }, { - "epoch": 0.68, - "learning_rate": 0.0001983224089817639, - "loss": 0.0467, + "epoch": 0.4, + "learning_rate": 0.00023932695224510603, + "loss": 0.0593, "step": 62670 }, { - "epoch": 0.68, - "learning_rate": 0.0001983061846972548, - "loss": 0.0469, + "epoch": 0.4, + "learning_rate": 0.0002393172708907491, + "loss": 0.0594, "step": 62680 }, { - "epoch": 0.68, - "learning_rate": 0.0001982899604127458, - "loss": 0.054, + "epoch": 0.4, + "learning_rate": 0.0002393075895363922, + "loss": 0.0605, "step": 62690 }, { - "epoch": 0.68, - "learning_rate": 0.0001982737361282367, - "loss": 0.0498, + "epoch": 0.4, + "learning_rate": 0.00023929790818203527, + "loss": 0.0566, "step": 62700 }, { - "epoch": 0.68, - "learning_rate": 0.0001982575118437277, - "loss": 0.0606, + "epoch": 0.4, + "learning_rate": 0.00023928822682767832, + "loss": 0.0534, "step": 62710 }, { - "epoch": 0.68, - "learning_rate": 0.0001982412875592186, - "loss": 0.0512, + "epoch": 0.4, + "learning_rate": 0.0002392785454733214, + "loss": 0.0567, "step": 62720 }, { - "epoch": 0.68, - "learning_rate": 0.00019822506327470956, - "loss": 0.0503, + "epoch": 0.4, + "learning_rate": 0.00023926886411896448, + "loss": 0.0666, "step": 62730 }, { - "epoch": 0.68, - "learning_rate": 0.0001982088389902005, - "loss": 0.0448, + "epoch": 0.4, + "learning_rate": 0.0002392591827646075, + "loss": 0.0555, "step": 62740 }, { - "epoch": 0.68, - "learning_rate": 0.00019819261470569146, - "loss": 0.0426, + "epoch": 0.41, + "learning_rate": 0.00023924950141025059, + "loss": 0.0567, "step": 62750 }, { - "epoch": 0.68, - "learning_rate": 0.00019817639042118238, - "loss": 0.05, + "epoch": 0.41, + "learning_rate": 0.00023923982005589367, + "loss": 0.0542, "step": 62760 }, { - "epoch": 0.68, - "learning_rate": 0.00019816016613667336, - "loss": 0.044, + "epoch": 0.41, + "learning_rate": 0.00023923013870153675, + "loss": 0.053, "step": 62770 }, { - "epoch": 0.68, - "learning_rate": 0.00019814394185216428, - "loss": 0.0522, + "epoch": 0.41, + "learning_rate": 0.0002392204573471798, + "loss": 0.0578, "step": 62780 }, { - "epoch": 0.68, - "learning_rate": 0.00019812771756765526, - "loss": 0.0426, + "epoch": 0.41, + "learning_rate": 0.00023921077599282288, + "loss": 0.0495, "step": 62790 }, { - "epoch": 0.68, - "learning_rate": 0.00019811149328314618, - "loss": 0.0426, + "epoch": 0.41, + "learning_rate": 0.00023920109463846596, + "loss": 0.0637, "step": 62800 }, { - "epoch": 0.68, - "learning_rate": 0.00019809526899863713, - "loss": 0.0498, + "epoch": 0.41, + "learning_rate": 0.00023919141328410898, + "loss": 0.0548, "step": 62810 }, { - "epoch": 0.68, - "learning_rate": 0.00019807904471412808, - "loss": 0.0451, + "epoch": 0.41, + "learning_rate": 0.00023918173192975206, + "loss": 0.0529, "step": 62820 }, { - "epoch": 0.68, - "learning_rate": 0.00019806282042961903, - "loss": 0.048, + "epoch": 0.41, + "learning_rate": 0.00023917205057539514, + "loss": 0.0561, "step": 62830 }, { - "epoch": 0.68, - "learning_rate": 0.00019804659614510998, - "loss": 0.0507, + "epoch": 0.41, + "learning_rate": 0.0002391623692210382, + "loss": 0.0643, "step": 62840 }, { - "epoch": 0.68, - "learning_rate": 0.00019803037186060093, - "loss": 0.0472, + "epoch": 0.41, + "learning_rate": 0.00023915268786668128, + "loss": 0.059, "step": 62850 }, { - "epoch": 0.68, - "learning_rate": 0.00019801414757609185, - "loss": 0.0427, + "epoch": 0.41, + "learning_rate": 0.00023914300651232435, + "loss": 0.0574, "step": 62860 }, { - "epoch": 0.68, - "learning_rate": 0.00019799792329158283, - "loss": 0.0462, + "epoch": 0.41, + "learning_rate": 0.00023913332515796743, + "loss": 0.0582, "step": 62870 }, { - "epoch": 0.68, - "learning_rate": 0.00019798169900707375, - "loss": 0.0509, + "epoch": 0.41, + "learning_rate": 0.00023912364380361046, + "loss": 0.0508, "step": 62880 }, { - "epoch": 0.68, - "learning_rate": 0.00019796547472256473, - "loss": 0.0564, + "epoch": 0.41, + "learning_rate": 0.00023911396244925354, + "loss": 0.062, "step": 62890 }, { - "epoch": 0.68, - "learning_rate": 0.00019794925043805565, - "loss": 0.0606, + "epoch": 0.41, + "learning_rate": 0.00023910428109489662, + "loss": 0.0613, "step": 62900 }, { - "epoch": 0.68, - "learning_rate": 0.0001979330261535466, - "loss": 0.0534, + "epoch": 0.41, + "learning_rate": 0.00023909459974053967, + "loss": 0.0531, "step": 62910 }, { - "epoch": 0.68, - "learning_rate": 0.00019791680186903755, - "loss": 0.0453, + "epoch": 0.41, + "learning_rate": 0.00023908491838618275, + "loss": 0.0593, "step": 62920 }, { - "epoch": 0.68, - "learning_rate": 0.0001979005775845285, - "loss": 0.0516, + "epoch": 0.41, + "learning_rate": 0.00023907523703182583, + "loss": 0.0669, "step": 62930 }, { - "epoch": 0.68, - "learning_rate": 0.00019788435330001943, - "loss": 0.0545, + "epoch": 0.41, + "learning_rate": 0.0002390655556774689, + "loss": 0.0592, "step": 62940 }, { - "epoch": 0.68, - "learning_rate": 0.0001978681290155104, - "loss": 0.0435, + "epoch": 0.41, + "learning_rate": 0.00023905587432311194, + "loss": 0.0583, "step": 62950 }, { - "epoch": 0.68, - "learning_rate": 0.00019785190473100133, - "loss": 0.0559, + "epoch": 0.41, + "learning_rate": 0.00023904619296875502, + "loss": 0.0558, "step": 62960 }, { - "epoch": 0.68, - "learning_rate": 0.0001978356804464923, - "loss": 0.0463, + "epoch": 0.41, + "learning_rate": 0.0002390365116143981, + "loss": 0.0628, "step": 62970 }, { - "epoch": 0.68, - "learning_rate": 0.00019781945616198323, - "loss": 0.0602, + "epoch": 0.41, + "learning_rate": 0.00023902683026004115, + "loss": 0.0495, "step": 62980 }, { - "epoch": 0.68, - "learning_rate": 0.0001978032318774742, - "loss": 0.0511, + "epoch": 0.41, + "learning_rate": 0.00023901714890568423, + "loss": 0.0553, "step": 62990 }, { - "epoch": 0.68, - "learning_rate": 0.00019778700759296512, - "loss": 0.0512, - "step": 63000 + "epoch": 0.41, + "learning_rate": 0.0002390074675513273, + "loss": 0.0569, + "step": 63000 }, { - "epoch": 0.68, - "eval_cer": 0.9211366555877732, - "eval_loss": 0.035725947469472885, - "eval_runtime": 119.032, - "eval_samples_per_second": 16.802, - "eval_steps_per_second": 4.201, + "epoch": 0.41, + "eval_cer": 0.919996384589312, + "eval_loss": 0.037891894578933716, + "eval_runtime": 119.8457, + "eval_samples_per_second": 16.688, + "eval_steps_per_second": 4.172, "step": 63000 }, { - "epoch": 0.68, - "learning_rate": 0.00019777078330845607, - "loss": 0.0533, + "epoch": 0.41, + "learning_rate": 0.0002389977861969704, + "loss": 0.0617, "step": 63010 }, { - "epoch": 0.68, - "learning_rate": 0.00019775455902394702, - "loss": 0.0552, + "epoch": 0.41, + "learning_rate": 0.00023898810484261341, + "loss": 0.061, "step": 63020 }, { - "epoch": 0.68, - "learning_rate": 0.00019773833473943797, - "loss": 0.0462, + "epoch": 0.41, + "learning_rate": 0.0002389784234882565, + "loss": 0.0576, "step": 63030 }, { - "epoch": 0.68, - "learning_rate": 0.0001977221104549289, - "loss": 0.0496, + "epoch": 0.41, + "learning_rate": 0.00023896874213389955, + "loss": 0.0585, "step": 63040 }, { - "epoch": 0.68, - "learning_rate": 0.00019770588617041987, - "loss": 0.0483, + "epoch": 0.41, + "learning_rate": 0.00023895906077954263, + "loss": 0.0544, "step": 63050 }, { - "epoch": 0.68, - "learning_rate": 0.0001976896618859108, - "loss": 0.0483, + "epoch": 0.41, + "learning_rate": 0.0002389493794251857, + "loss": 0.06, "step": 63060 }, { - "epoch": 0.68, - "learning_rate": 0.00019767343760140177, - "loss": 0.051, + "epoch": 0.41, + "learning_rate": 0.0002389396980708288, + "loss": 0.0631, "step": 63070 }, { - "epoch": 0.68, - "learning_rate": 0.0001976572133168927, - "loss": 0.0511, + "epoch": 0.41, + "learning_rate": 0.00023893001671647184, + "loss": 0.0571, "step": 63080 }, { - "epoch": 0.68, - "learning_rate": 0.00019764098903238365, - "loss": 0.0507, + "epoch": 0.41, + "learning_rate": 0.0002389203353621149, + "loss": 0.0687, "step": 63090 }, { - "epoch": 0.68, - "learning_rate": 0.0001976247647478746, - "loss": 0.0516, + "epoch": 0.41, + "learning_rate": 0.00023891065400775797, + "loss": 0.0582, "step": 63100 }, { - "epoch": 0.68, - "learning_rate": 0.00019760854046336554, - "loss": 0.056, + "epoch": 0.41, + "learning_rate": 0.00023890097265340102, + "loss": 0.0582, "step": 63110 }, { - "epoch": 0.68, - "learning_rate": 0.00019759231617885647, - "loss": 0.0551, + "epoch": 0.41, + "learning_rate": 0.0002388912912990441, + "loss": 0.0621, "step": 63120 }, { - "epoch": 0.68, - "learning_rate": 0.00019757609189434744, - "loss": 0.0513, + "epoch": 0.41, + "learning_rate": 0.00023888160994468718, + "loss": 0.0508, "step": 63130 }, { - "epoch": 0.68, - "learning_rate": 0.00019755986760983837, - "loss": 0.057, + "epoch": 0.41, + "learning_rate": 0.00023887192859033026, + "loss": 0.058, "step": 63140 }, { - "epoch": 0.68, - "learning_rate": 0.00019754364332532934, - "loss": 0.0459, + "epoch": 0.41, + "learning_rate": 0.00023886224723597332, + "loss": 0.0718, "step": 63150 }, { - "epoch": 0.68, - "learning_rate": 0.00019752741904082027, - "loss": 0.0618, + "epoch": 0.41, + "learning_rate": 0.00023885256588161637, + "loss": 0.0587, "step": 63160 }, { - "epoch": 0.68, - "learning_rate": 0.00019751119475631124, - "loss": 0.0488, + "epoch": 0.41, + "learning_rate": 0.00023884288452725945, + "loss": 0.056, "step": 63170 }, { - "epoch": 0.68, - "learning_rate": 0.00019749497047180217, - "loss": 0.0461, + "epoch": 0.41, + "learning_rate": 0.0002388332031729025, + "loss": 0.0503, "step": 63180 }, { - "epoch": 0.68, - "learning_rate": 0.00019747874618729312, - "loss": 0.0492, + "epoch": 0.41, + "learning_rate": 0.00023882352181854558, + "loss": 0.0592, "step": 63190 }, { - "epoch": 0.68, - "learning_rate": 0.00019746252190278407, - "loss": 0.0535, + "epoch": 0.41, + "learning_rate": 0.00023881384046418866, + "loss": 0.0532, "step": 63200 }, { - "epoch": 0.68, - "learning_rate": 0.00019744629761827502, - "loss": 0.0531, + "epoch": 0.41, + "learning_rate": 0.00023880415910983174, + "loss": 0.0574, "step": 63210 }, { - "epoch": 0.68, - "learning_rate": 0.00019743007333376594, - "loss": 0.0458, + "epoch": 0.41, + "learning_rate": 0.0002387944777554748, + "loss": 0.0617, "step": 63220 }, { - "epoch": 0.68, - "learning_rate": 0.00019741384904925692, - "loss": 0.0492, + "epoch": 0.41, + "learning_rate": 0.00023878479640111785, + "loss": 0.0608, "step": 63230 }, { - "epoch": 0.68, - "learning_rate": 0.00019739762476474784, - "loss": 0.0407, + "epoch": 0.41, + "learning_rate": 0.0002387751150467609, + "loss": 0.0676, "step": 63240 }, { - "epoch": 0.68, - "learning_rate": 0.00019738140048023881, - "loss": 0.0496, + "epoch": 0.41, + "learning_rate": 0.00023876543369240398, + "loss": 0.0566, "step": 63250 }, { - "epoch": 0.68, - "learning_rate": 0.00019736517619572974, - "loss": 0.0535, + "epoch": 0.41, + "learning_rate": 0.00023875575233804706, + "loss": 0.0643, "step": 63260 }, { - "epoch": 0.68, - "learning_rate": 0.0001973489519112207, - "loss": 0.0477, + "epoch": 0.41, + "learning_rate": 0.00023874607098369014, + "loss": 0.0611, "step": 63270 }, { - "epoch": 0.68, - "learning_rate": 0.00019733272762671164, - "loss": 0.0506, + "epoch": 0.41, + "learning_rate": 0.0002387363896293332, + "loss": 0.0572, "step": 63280 }, { - "epoch": 0.68, - "learning_rate": 0.0001973165033422026, - "loss": 0.0486, + "epoch": 0.41, + "learning_rate": 0.00023872670827497627, + "loss": 0.0585, "step": 63290 }, { - "epoch": 0.68, - "learning_rate": 0.0001973002790576935, - "loss": 0.0437, + "epoch": 0.41, + "learning_rate": 0.00023871702692061932, + "loss": 0.0579, "step": 63300 }, { - "epoch": 0.68, - "learning_rate": 0.00019728405477318449, - "loss": 0.0558, + "epoch": 0.41, + "learning_rate": 0.00023870734556626238, + "loss": 0.0557, "step": 63310 }, { - "epoch": 0.68, - "learning_rate": 0.0001972678304886754, - "loss": 0.05, + "epoch": 0.41, + "learning_rate": 0.00023869766421190546, + "loss": 0.0567, "step": 63320 }, { - "epoch": 0.68, - "learning_rate": 0.00019725160620416639, - "loss": 0.0601, + "epoch": 0.41, + "learning_rate": 0.00023868798285754854, + "loss": 0.0634, "step": 63330 }, { - "epoch": 0.69, - "learning_rate": 0.0001972353819196573, - "loss": 0.0521, + "epoch": 0.41, + "learning_rate": 0.00023867830150319162, + "loss": 0.0607, "step": 63340 }, { - "epoch": 0.69, - "learning_rate": 0.00019721915763514829, - "loss": 0.0538, + "epoch": 0.41, + "learning_rate": 0.00023866862014883467, + "loss": 0.0588, "step": 63350 }, { - "epoch": 0.69, - "learning_rate": 0.00019720293335063924, - "loss": 0.0477, + "epoch": 0.41, + "learning_rate": 0.00023865893879447775, + "loss": 0.0625, "step": 63360 }, { - "epoch": 0.69, - "learning_rate": 0.00019718670906613016, - "loss": 0.061, + "epoch": 0.41, + "learning_rate": 0.0002386492574401208, + "loss": 0.0587, "step": 63370 }, { - "epoch": 0.69, - "learning_rate": 0.00019717048478162113, - "loss": 0.0529, + "epoch": 0.41, + "learning_rate": 0.00023863957608576385, + "loss": 0.0581, "step": 63380 }, { - "epoch": 0.69, - "learning_rate": 0.00019715426049711206, - "loss": 0.0538, + "epoch": 0.41, + "learning_rate": 0.00023862989473140693, + "loss": 0.0589, "step": 63390 }, { - "epoch": 0.69, - "learning_rate": 0.00019713803621260303, - "loss": 0.0565, + "epoch": 0.41, + "learning_rate": 0.00023862021337705, + "loss": 0.0719, "step": 63400 }, { - "epoch": 0.69, - "learning_rate": 0.00019712181192809396, - "loss": 0.0504, + "epoch": 0.41, + "learning_rate": 0.0002386105320226931, + "loss": 0.0705, "step": 63410 }, { - "epoch": 0.69, - "learning_rate": 0.0001971055876435849, - "loss": 0.0459, + "epoch": 0.41, + "learning_rate": 0.00023860085066833615, + "loss": 0.0661, "step": 63420 }, { - "epoch": 0.69, - "learning_rate": 0.00019708936335907586, - "loss": 0.0508, + "epoch": 0.41, + "learning_rate": 0.00023859116931397923, + "loss": 0.0597, "step": 63430 }, { - "epoch": 0.69, - "learning_rate": 0.0001970731390745668, - "loss": 0.0499, + "epoch": 0.41, + "learning_rate": 0.00023858148795962225, + "loss": 0.0578, "step": 63440 }, { - "epoch": 0.69, - "learning_rate": 0.00019705691479005773, - "loss": 0.0492, + "epoch": 0.41, + "learning_rate": 0.00023857180660526533, + "loss": 0.0604, "step": 63450 }, { - "epoch": 0.69, - "learning_rate": 0.0001970406905055487, - "loss": 0.0542, + "epoch": 0.41, + "learning_rate": 0.0002385621252509084, + "loss": 0.0555, "step": 63460 }, { - "epoch": 0.69, - "learning_rate": 0.00019702446622103963, - "loss": 0.0556, + "epoch": 0.41, + "learning_rate": 0.0002385524438965515, + "loss": 0.0546, "step": 63470 }, { - "epoch": 0.69, - "learning_rate": 0.0001970082419365306, - "loss": 0.0535, + "epoch": 0.41, + "learning_rate": 0.00023854276254219454, + "loss": 0.0551, "step": 63480 }, { - "epoch": 0.69, - "learning_rate": 0.00019699201765202153, - "loss": 0.0499, + "epoch": 0.41, + "learning_rate": 0.00023853308118783762, + "loss": 0.0528, "step": 63490 }, { - "epoch": 0.69, - "learning_rate": 0.00019697579336751248, - "loss": 0.0491, + "epoch": 0.41, + "learning_rate": 0.0002385233998334807, + "loss": 0.0522, "step": 63500 }, { - "epoch": 0.69, - "learning_rate": 0.00019695956908300343, - "loss": 0.0505, + "epoch": 0.41, + "learning_rate": 0.00023851371847912373, + "loss": 0.0597, "step": 63510 }, { - "epoch": 0.69, - "learning_rate": 0.00019694334479849438, - "loss": 0.0462, + "epoch": 0.41, + "learning_rate": 0.0002385040371247668, + "loss": 0.0549, "step": 63520 }, { - "epoch": 0.69, - "learning_rate": 0.00019692712051398533, - "loss": 0.0436, + "epoch": 0.41, + "learning_rate": 0.0002384943557704099, + "loss": 0.0681, "step": 63530 }, { - "epoch": 0.69, - "learning_rate": 0.00019691089622947628, - "loss": 0.0456, + "epoch": 0.41, + "learning_rate": 0.00023848467441605297, + "loss": 0.057, "step": 63540 }, { - "epoch": 0.69, - "learning_rate": 0.0001968946719449672, - "loss": 0.0556, + "epoch": 0.41, + "learning_rate": 0.00023847499306169602, + "loss": 0.0587, "step": 63550 }, { - "epoch": 0.69, - "learning_rate": 0.00019687844766045818, - "loss": 0.0606, + "epoch": 0.41, + "learning_rate": 0.0002384653117073391, + "loss": 0.0564, "step": 63560 }, { - "epoch": 0.69, - "learning_rate": 0.0001968622233759491, - "loss": 0.0489, + "epoch": 0.41, + "learning_rate": 0.00023845563035298218, + "loss": 0.0543, "step": 63570 }, { - "epoch": 0.69, - "learning_rate": 0.00019684599909144008, - "loss": 0.048, + "epoch": 0.41, + "learning_rate": 0.0002384459489986252, + "loss": 0.0556, "step": 63580 }, { - "epoch": 0.69, - "learning_rate": 0.000196829774806931, - "loss": 0.0456, + "epoch": 0.41, + "learning_rate": 0.00023843626764426829, + "loss": 0.0517, "step": 63590 }, { - "epoch": 0.69, - "learning_rate": 0.00019681355052242195, - "loss": 0.0496, + "epoch": 0.41, + "learning_rate": 0.00023842658628991136, + "loss": 0.0587, "step": 63600 }, { - "epoch": 0.69, - "learning_rate": 0.0001967973262379129, - "loss": 0.0423, + "epoch": 0.41, + "learning_rate": 0.00023841690493555444, + "loss": 0.0536, "step": 63610 }, { - "epoch": 0.69, - "learning_rate": 0.00019678110195340385, - "loss": 0.0501, + "epoch": 0.41, + "learning_rate": 0.0002384072235811975, + "loss": 0.0635, "step": 63620 }, { - "epoch": 0.69, - "learning_rate": 0.00019676487766889477, - "loss": 0.0482, + "epoch": 0.41, + "learning_rate": 0.00023839754222684058, + "loss": 0.0611, "step": 63630 }, { - "epoch": 0.69, - "learning_rate": 0.00019674865338438575, - "loss": 0.0436, + "epoch": 0.41, + "learning_rate": 0.00023838786087248366, + "loss": 0.054, "step": 63640 }, { - "epoch": 0.69, - "learning_rate": 0.00019673242909987667, - "loss": 0.0477, + "epoch": 0.41, + "learning_rate": 0.00023837817951812668, + "loss": 0.0665, "step": 63650 }, { - "epoch": 0.69, - "learning_rate": 0.00019671620481536765, - "loss": 0.0493, + "epoch": 0.41, + "learning_rate": 0.00023836849816376976, + "loss": 0.0588, "step": 63660 }, { - "epoch": 0.69, - "learning_rate": 0.00019669998053085857, - "loss": 0.0468, + "epoch": 0.41, + "learning_rate": 0.00023835881680941284, + "loss": 0.0506, "step": 63670 }, { - "epoch": 0.69, - "learning_rate": 0.00019668375624634955, - "loss": 0.0489, + "epoch": 0.41, + "learning_rate": 0.0002383491354550559, + "loss": 0.0543, "step": 63680 }, { - "epoch": 0.69, - "learning_rate": 0.00019666753196184047, - "loss": 0.0528, + "epoch": 0.41, + "learning_rate": 0.00023833945410069897, + "loss": 0.0577, "step": 63690 }, { - "epoch": 0.69, - "learning_rate": 0.00019665130767733142, - "loss": 0.0484, + "epoch": 0.41, + "learning_rate": 0.00023832977274634205, + "loss": 0.0677, "step": 63700 }, { - "epoch": 0.69, - "learning_rate": 0.00019663508339282237, - "loss": 0.0485, + "epoch": 0.41, + "learning_rate": 0.00023832009139198513, + "loss": 0.0576, "step": 63710 }, { - "epoch": 0.69, - "learning_rate": 0.00019661885910831332, - "loss": 0.0632, + "epoch": 0.41, + "learning_rate": 0.00023831041003762816, + "loss": 0.0664, "step": 63720 }, { - "epoch": 0.69, - "learning_rate": 0.00019660263482380424, - "loss": 0.0448, + "epoch": 0.41, + "learning_rate": 0.00023830072868327124, + "loss": 0.0627, "step": 63730 }, { - "epoch": 0.69, - "learning_rate": 0.00019658641053929522, - "loss": 0.0479, + "epoch": 0.41, + "learning_rate": 0.00023829104732891432, + "loss": 0.0565, "step": 63740 }, { - "epoch": 0.69, - "learning_rate": 0.00019657018625478614, - "loss": 0.0442, + "epoch": 0.41, + "learning_rate": 0.00023828136597455737, + "loss": 0.0582, "step": 63750 }, { - "epoch": 0.69, - "learning_rate": 0.00019655396197027712, - "loss": 0.0536, + "epoch": 0.41, + "learning_rate": 0.00023827168462020045, + "loss": 0.0586, "step": 63760 }, { - "epoch": 0.69, - "learning_rate": 0.00019653773768576804, - "loss": 0.0468, + "epoch": 0.41, + "learning_rate": 0.00023826200326584353, + "loss": 0.0556, "step": 63770 }, { - "epoch": 0.69, - "learning_rate": 0.000196521513401259, - "loss": 0.0476, + "epoch": 0.41, + "learning_rate": 0.0002382523219114866, + "loss": 0.0582, "step": 63780 }, { - "epoch": 0.69, - "learning_rate": 0.00019650528911674994, - "loss": 0.0526, + "epoch": 0.41, + "learning_rate": 0.00023824264055712964, + "loss": 0.0593, "step": 63790 }, { - "epoch": 0.69, - "learning_rate": 0.0001964890648322409, - "loss": 0.0467, + "epoch": 0.41, + "learning_rate": 0.00023823295920277272, + "loss": 0.0671, "step": 63800 }, { - "epoch": 0.69, - "learning_rate": 0.0001964728405477318, - "loss": 0.0505, + "epoch": 0.41, + "learning_rate": 0.0002382232778484158, + "loss": 0.0596, "step": 63810 }, { - "epoch": 0.69, - "learning_rate": 0.0001964566162632228, - "loss": 0.0438, + "epoch": 0.41, + "learning_rate": 0.00023821359649405885, + "loss": 0.0509, "step": 63820 }, { - "epoch": 0.69, - "learning_rate": 0.0001964403919787137, - "loss": 0.0537, + "epoch": 0.41, + "learning_rate": 0.00023820391513970193, + "loss": 0.0552, "step": 63830 }, { - "epoch": 0.69, - "learning_rate": 0.0001964241676942047, - "loss": 0.0478, + "epoch": 0.41, + "learning_rate": 0.000238194233785345, + "loss": 0.0547, "step": 63840 }, { - "epoch": 0.69, - "learning_rate": 0.0001964079434096956, - "loss": 0.0479, + "epoch": 0.41, + "learning_rate": 0.00023818455243098806, + "loss": 0.0643, "step": 63850 }, { - "epoch": 0.69, - "learning_rate": 0.0001963917191251866, - "loss": 0.053, + "epoch": 0.41, + "learning_rate": 0.00023817487107663111, + "loss": 0.0615, "step": 63860 }, { - "epoch": 0.69, - "learning_rate": 0.0001963754948406775, - "loss": 0.0586, + "epoch": 0.41, + "learning_rate": 0.0002381651897222742, + "loss": 0.0632, "step": 63870 }, { - "epoch": 0.69, - "learning_rate": 0.00019635927055616846, - "loss": 0.0476, + "epoch": 0.41, + "learning_rate": 0.00023815550836791725, + "loss": 0.0574, "step": 63880 }, { - "epoch": 0.69, - "learning_rate": 0.0001963430462716594, - "loss": 0.0541, + "epoch": 0.41, + "learning_rate": 0.00023814582701356033, + "loss": 0.0616, "step": 63890 }, { - "epoch": 0.69, - "learning_rate": 0.00019632682198715036, - "loss": 0.0531, + "epoch": 0.41, + "learning_rate": 0.0002381361456592034, + "loss": 0.0549, "step": 63900 }, { - "epoch": 0.69, - "learning_rate": 0.00019631059770264128, - "loss": 0.0532, + "epoch": 0.41, + "learning_rate": 0.00023812646430484649, + "loss": 0.056, "step": 63910 }, { - "epoch": 0.69, - "learning_rate": 0.00019629437341813226, - "loss": 0.0515, + "epoch": 0.41, + "learning_rate": 0.00023811678295048954, + "loss": 0.0584, "step": 63920 }, { - "epoch": 0.69, - "learning_rate": 0.00019627814913362318, - "loss": 0.0468, + "epoch": 0.41, + "learning_rate": 0.0002381071015961326, + "loss": 0.0559, "step": 63930 }, { - "epoch": 0.69, - "learning_rate": 0.00019626192484911416, - "loss": 0.043, + "epoch": 0.41, + "learning_rate": 0.00023809742024177567, + "loss": 0.0602, "step": 63940 }, { - "epoch": 0.69, - "learning_rate": 0.00019624570056460508, - "loss": 0.0454, + "epoch": 0.41, + "learning_rate": 0.00023808773888741872, + "loss": 0.0536, "step": 63950 }, { - "epoch": 0.69, - "learning_rate": 0.00019622947628009603, - "loss": 0.0474, + "epoch": 0.41, + "learning_rate": 0.0002380780575330618, + "loss": 0.054, "step": 63960 }, { - "epoch": 0.69, - "learning_rate": 0.00019621325199558698, - "loss": 0.051, + "epoch": 0.41, + "learning_rate": 0.00023806837617870488, + "loss": 0.063, "step": 63970 }, { - "epoch": 0.69, - "learning_rate": 0.00019619702771107793, - "loss": 0.0501, + "epoch": 0.41, + "learning_rate": 0.00023805869482434796, + "loss": 0.0587, "step": 63980 }, { - "epoch": 0.69, - "learning_rate": 0.00019618080342656885, - "loss": 0.0463, + "epoch": 0.41, + "learning_rate": 0.00023804901346999102, + "loss": 0.0547, "step": 63990 }, { - "epoch": 0.69, - "learning_rate": 0.00019616457914205983, - "loss": 0.0488, + "epoch": 0.41, + "learning_rate": 0.00023803933211563407, + "loss": 0.0577, "step": 64000 }, { - "epoch": 0.69, - "eval_cer": 0.9213204203265004, - "eval_loss": 0.03410179913043976, - "eval_runtime": 119.0431, - "eval_samples_per_second": 16.801, - "eval_steps_per_second": 4.2, + "epoch": 0.41, + "eval_cer": 0.920002711558016, + "eval_loss": 0.03821108117699623, + "eval_runtime": 119.9562, + "eval_samples_per_second": 16.673, + "eval_steps_per_second": 4.168, "step": 64000 }, { - "epoch": 0.69, - "learning_rate": 0.00019614835485755075, - "loss": 0.046, + "epoch": 0.41, + "learning_rate": 0.00023802965076127715, + "loss": 0.0529, "step": 64010 }, { - "epoch": 0.69, - "learning_rate": 0.00019613213057304173, - "loss": 0.0452, + "epoch": 0.41, + "learning_rate": 0.0002380199694069202, + "loss": 0.0499, "step": 64020 }, { - "epoch": 0.69, - "learning_rate": 0.00019611590628853265, - "loss": 0.0458, + "epoch": 0.41, + "learning_rate": 0.00023801028805256328, + "loss": 0.053, "step": 64030 }, { - "epoch": 0.69, - "learning_rate": 0.00019609968200402363, - "loss": 0.0608, + "epoch": 0.41, + "learning_rate": 0.00023800060669820636, + "loss": 0.0655, "step": 64040 }, { - "epoch": 0.69, - "learning_rate": 0.00019608345771951455, - "loss": 0.0571, + "epoch": 0.41, + "learning_rate": 0.0002379909253438494, + "loss": 0.0569, "step": 64050 }, { - "epoch": 0.69, - "learning_rate": 0.0001960672334350055, - "loss": 0.0468, + "epoch": 0.41, + "learning_rate": 0.0002379812439894925, + "loss": 0.0592, "step": 64060 }, { - "epoch": 0.69, - "learning_rate": 0.00019605100915049645, - "loss": 0.0491, + "epoch": 0.41, + "learning_rate": 0.00023797156263513555, + "loss": 0.0568, "step": 64070 }, { - "epoch": 0.69, - "learning_rate": 0.0001960347848659874, - "loss": 0.0515, + "epoch": 0.41, + "learning_rate": 0.0002379618812807786, + "loss": 0.0567, "step": 64080 }, { - "epoch": 0.69, - "learning_rate": 0.00019601856058147832, - "loss": 0.051, + "epoch": 0.41, + "learning_rate": 0.00023795219992642168, + "loss": 0.0518, "step": 64090 }, { - "epoch": 0.69, - "learning_rate": 0.0001960023362969693, - "loss": 0.0495, + "epoch": 0.41, + "learning_rate": 0.00023794251857206476, + "loss": 0.0571, "step": 64100 }, { - "epoch": 0.69, - "learning_rate": 0.00019598611201246022, - "loss": 0.0611, + "epoch": 0.41, + "learning_rate": 0.00023793283721770784, + "loss": 0.0604, "step": 64110 }, { - "epoch": 0.69, - "learning_rate": 0.0001959698877279512, - "loss": 0.0545, + "epoch": 0.41, + "learning_rate": 0.0002379231558633509, + "loss": 0.0547, "step": 64120 }, { - "epoch": 0.69, - "learning_rate": 0.00019595366344344212, - "loss": 0.0549, + "epoch": 0.41, + "learning_rate": 0.00023791347450899397, + "loss": 0.0631, "step": 64130 }, { - "epoch": 0.69, - "learning_rate": 0.00019593743915893307, - "loss": 0.0487, + "epoch": 0.41, + "learning_rate": 0.00023790379315463702, + "loss": 0.0597, "step": 64140 }, { - "epoch": 0.69, - "learning_rate": 0.00019592121487442402, - "loss": 0.049, + "epoch": 0.41, + "learning_rate": 0.00023789411180028008, + "loss": 0.0573, "step": 64150 }, { - "epoch": 0.69, - "learning_rate": 0.00019590499058991497, - "loss": 0.05, + "epoch": 0.41, + "learning_rate": 0.00023788443044592316, + "loss": 0.0579, "step": 64160 }, { - "epoch": 0.69, - "learning_rate": 0.0001958887663054059, - "loss": 0.0484, + "epoch": 0.41, + "learning_rate": 0.00023787474909156624, + "loss": 0.0544, "step": 64170 }, { - "epoch": 0.69, - "learning_rate": 0.00019587254202089687, - "loss": 0.0505, + "epoch": 0.41, + "learning_rate": 0.00023786506773720932, + "loss": 0.0528, "step": 64180 }, { - "epoch": 0.69, - "learning_rate": 0.0001958563177363878, - "loss": 0.0457, + "epoch": 0.41, + "learning_rate": 0.00023785538638285237, + "loss": 0.0537, "step": 64190 }, { - "epoch": 0.69, - "learning_rate": 0.00019584009345187877, - "loss": 0.0488, + "epoch": 0.41, + "learning_rate": 0.00023784570502849545, + "loss": 0.0518, "step": 64200 }, { - "epoch": 0.69, - "learning_rate": 0.0001958238691673697, - "loss": 0.0545, + "epoch": 0.41, + "learning_rate": 0.0002378360236741385, + "loss": 0.0536, "step": 64210 }, { - "epoch": 0.69, - "learning_rate": 0.00019580764488286067, - "loss": 0.0475, + "epoch": 0.41, + "learning_rate": 0.00023782634231978155, + "loss": 0.0588, "step": 64220 }, { - "epoch": 0.69, - "learning_rate": 0.0001957914205983516, - "loss": 0.0496, + "epoch": 0.41, + "learning_rate": 0.00023781666096542463, + "loss": 0.0666, "step": 64230 }, { - "epoch": 0.69, - "learning_rate": 0.00019577519631384254, - "loss": 0.0479, + "epoch": 0.41, + "learning_rate": 0.0002378069796110677, + "loss": 0.0594, "step": 64240 }, { - "epoch": 0.69, - "learning_rate": 0.0001957589720293335, - "loss": 0.0505, + "epoch": 0.41, + "learning_rate": 0.00023779729825671077, + "loss": 0.0594, "step": 64250 }, { - "epoch": 0.7, - "learning_rate": 0.00019574274774482444, - "loss": 0.0425, - "step": 64260 + "epoch": 0.41, + "learning_rate": 0.00023778761690235385, + "loss": 0.0581, + "step": 64260 }, { - "epoch": 0.7, - "learning_rate": 0.00019572652346031537, - "loss": 0.0458, + "epoch": 0.41, + "learning_rate": 0.00023777793554799692, + "loss": 0.0556, "step": 64270 }, { - "epoch": 0.7, - "learning_rate": 0.00019571029917580634, - "loss": 0.0483, + "epoch": 0.41, + "learning_rate": 0.00023776825419363995, + "loss": 0.054, "step": 64280 }, { - "epoch": 0.7, - "learning_rate": 0.00019569407489129727, - "loss": 0.0513, + "epoch": 0.41, + "learning_rate": 0.00023775857283928303, + "loss": 0.0639, "step": 64290 }, { - "epoch": 0.7, - "learning_rate": 0.00019567785060678824, - "loss": 0.0468, + "epoch": 0.42, + "learning_rate": 0.0002377488914849261, + "loss": 0.0545, "step": 64300 }, { - "epoch": 0.7, - "learning_rate": 0.00019566162632227917, - "loss": 0.047, + "epoch": 0.42, + "learning_rate": 0.0002377392101305692, + "loss": 0.0555, "step": 64310 }, { - "epoch": 0.7, - "learning_rate": 0.00019564540203777011, - "loss": 0.0501, + "epoch": 0.42, + "learning_rate": 0.00023772952877621224, + "loss": 0.054, "step": 64320 }, { - "epoch": 0.7, - "learning_rate": 0.00019562917775326106, - "loss": 0.0521, + "epoch": 0.42, + "learning_rate": 0.00023771984742185532, + "loss": 0.0616, "step": 64330 }, { - "epoch": 0.7, - "learning_rate": 0.00019561295346875201, - "loss": 0.0533, + "epoch": 0.42, + "learning_rate": 0.0002377101660674984, + "loss": 0.0524, "step": 64340 }, { - "epoch": 0.7, - "learning_rate": 0.00019559672918424296, - "loss": 0.0537, + "epoch": 0.42, + "learning_rate": 0.00023770048471314143, + "loss": 0.057, "step": 64350 }, { - "epoch": 0.7, - "learning_rate": 0.00019558050489973391, - "loss": 0.05, + "epoch": 0.42, + "learning_rate": 0.0002376908033587845, + "loss": 0.0602, "step": 64360 }, { - "epoch": 0.7, - "learning_rate": 0.00019556428061522484, - "loss": 0.0511, + "epoch": 0.42, + "learning_rate": 0.0002376811220044276, + "loss": 0.0573, "step": 64370 }, { - "epoch": 0.7, - "learning_rate": 0.0001955480563307158, - "loss": 0.0465, + "epoch": 0.42, + "learning_rate": 0.00023767144065007067, + "loss": 0.0614, "step": 64380 }, { - "epoch": 0.7, - "learning_rate": 0.00019553183204620674, - "loss": 0.0514, + "epoch": 0.42, + "learning_rate": 0.00023766175929571372, + "loss": 0.0588, "step": 64390 }, { - "epoch": 0.7, - "learning_rate": 0.0001955156077616977, - "loss": 0.0477, + "epoch": 0.42, + "learning_rate": 0.0002376520779413568, + "loss": 0.0554, "step": 64400 }, { - "epoch": 0.7, - "learning_rate": 0.00019549938347718864, - "loss": 0.0455, + "epoch": 0.42, + "learning_rate": 0.00023764239658699988, + "loss": 0.0573, "step": 64410 }, { - "epoch": 0.7, - "learning_rate": 0.00019548315919267959, - "loss": 0.0616, + "epoch": 0.42, + "learning_rate": 0.0002376327152326429, + "loss": 0.0581, "step": 64420 }, { - "epoch": 0.7, - "learning_rate": 0.00019546693490817054, - "loss": 0.0449, + "epoch": 0.42, + "learning_rate": 0.00023762303387828598, + "loss": 0.0621, "step": 64430 }, { - "epoch": 0.7, - "learning_rate": 0.00019545071062366149, - "loss": 0.0546, + "epoch": 0.42, + "learning_rate": 0.00023761335252392906, + "loss": 0.0511, "step": 64440 }, { - "epoch": 0.7, - "learning_rate": 0.0001954344863391524, - "loss": 0.0477, + "epoch": 0.42, + "learning_rate": 0.00023760367116957212, + "loss": 0.0551, "step": 64450 }, { - "epoch": 0.7, - "learning_rate": 0.00019541826205464338, - "loss": 0.0438, + "epoch": 0.42, + "learning_rate": 0.0002375939898152152, + "loss": 0.0606, "step": 64460 }, { - "epoch": 0.7, - "learning_rate": 0.0001954020377701343, - "loss": 0.0484, + "epoch": 0.42, + "learning_rate": 0.00023758430846085828, + "loss": 0.062, "step": 64470 }, { - "epoch": 0.7, - "learning_rate": 0.00019538581348562528, - "loss": 0.055, + "epoch": 0.42, + "learning_rate": 0.00023757462710650136, + "loss": 0.0573, "step": 64480 }, { - "epoch": 0.7, - "learning_rate": 0.0001953695892011162, - "loss": 0.0507, + "epoch": 0.42, + "learning_rate": 0.00023756494575214438, + "loss": 0.0609, "step": 64490 }, { - "epoch": 0.7, - "learning_rate": 0.00019535336491660716, - "loss": 0.046, + "epoch": 0.42, + "learning_rate": 0.00023755526439778746, + "loss": 0.0653, "step": 64500 }, { - "epoch": 0.7, - "learning_rate": 0.0001953371406320981, - "loss": 0.0462, + "epoch": 0.42, + "learning_rate": 0.00023754558304343054, + "loss": 0.0599, "step": 64510 }, { - "epoch": 0.7, - "learning_rate": 0.00019532091634758906, - "loss": 0.0523, + "epoch": 0.42, + "learning_rate": 0.0002375359016890736, + "loss": 0.0555, "step": 64520 }, { - "epoch": 0.7, - "learning_rate": 0.00019530469206308, - "loss": 0.0533, + "epoch": 0.42, + "learning_rate": 0.00023752622033471667, + "loss": 0.0534, "step": 64530 }, { - "epoch": 0.7, - "learning_rate": 0.00019528846777857096, - "loss": 0.0485, + "epoch": 0.42, + "learning_rate": 0.00023751653898035975, + "loss": 0.0512, "step": 64540 }, { - "epoch": 0.7, - "learning_rate": 0.00019527224349406188, - "loss": 0.0533, + "epoch": 0.42, + "learning_rate": 0.00023750685762600283, + "loss": 0.05, "step": 64550 }, { - "epoch": 0.7, - "learning_rate": 0.00019525601920955286, - "loss": 0.0522, + "epoch": 0.42, + "learning_rate": 0.00023749717627164586, + "loss": 0.0529, "step": 64560 }, { - "epoch": 0.7, - "learning_rate": 0.00019523979492504378, - "loss": 0.0474, + "epoch": 0.42, + "learning_rate": 0.00023748749491728894, + "loss": 0.0543, "step": 64570 }, { - "epoch": 0.7, - "learning_rate": 0.00019522357064053475, - "loss": 0.0499, + "epoch": 0.42, + "learning_rate": 0.00023747781356293202, + "loss": 0.063, "step": 64580 }, { - "epoch": 0.7, - "learning_rate": 0.00019520734635602568, - "loss": 0.0528, + "epoch": 0.42, + "learning_rate": 0.00023746813220857507, + "loss": 0.062, "step": 64590 }, { - "epoch": 0.7, - "learning_rate": 0.00019519112207151663, - "loss": 0.0541, + "epoch": 0.42, + "learning_rate": 0.00023745845085421815, + "loss": 0.0624, "step": 64600 }, { - "epoch": 0.7, - "learning_rate": 0.00019517489778700758, - "loss": 0.0582, + "epoch": 0.42, + "learning_rate": 0.00023744876949986123, + "loss": 0.0689, "step": 64610 }, { - "epoch": 0.7, - "learning_rate": 0.00019515867350249853, - "loss": 0.046, + "epoch": 0.42, + "learning_rate": 0.00023743908814550428, + "loss": 0.0552, "step": 64620 }, { - "epoch": 0.7, - "learning_rate": 0.00019514244921798945, - "loss": 0.0494, + "epoch": 0.42, + "learning_rate": 0.00023742940679114734, + "loss": 0.0581, "step": 64630 }, { - "epoch": 0.7, - "learning_rate": 0.00019512622493348043, - "loss": 0.0488, + "epoch": 0.42, + "learning_rate": 0.00023741972543679042, + "loss": 0.0553, "step": 64640 }, { - "epoch": 0.7, - "learning_rate": 0.00019511000064897135, - "loss": 0.0445, + "epoch": 0.42, + "learning_rate": 0.00023741004408243347, + "loss": 0.0599, "step": 64650 }, { - "epoch": 0.7, - "learning_rate": 0.00019509377636446233, - "loss": 0.0509, + "epoch": 0.42, + "learning_rate": 0.00023740036272807655, + "loss": 0.0591, "step": 64660 }, { - "epoch": 0.7, - "learning_rate": 0.00019507755207995325, - "loss": 0.0541, + "epoch": 0.42, + "learning_rate": 0.00023739068137371963, + "loss": 0.0536, "step": 64670 }, { - "epoch": 0.7, - "learning_rate": 0.0001950613277954442, - "loss": 0.0473, + "epoch": 0.42, + "learning_rate": 0.0002373810000193627, + "loss": 0.0525, "step": 64680 }, { - "epoch": 0.7, - "learning_rate": 0.00019504510351093515, - "loss": 0.0565, + "epoch": 0.42, + "learning_rate": 0.00023737131866500576, + "loss": 0.0571, "step": 64690 }, { - "epoch": 0.7, - "learning_rate": 0.0001950288792264261, - "loss": 0.0456, + "epoch": 0.42, + "learning_rate": 0.00023736163731064881, + "loss": 0.0622, "step": 64700 }, { - "epoch": 0.7, - "learning_rate": 0.00019501265494191705, - "loss": 0.0545, + "epoch": 0.42, + "learning_rate": 0.0002373519559562919, + "loss": 0.0529, "step": 64710 }, { - "epoch": 0.7, - "learning_rate": 0.000194996430657408, - "loss": 0.0515, + "epoch": 0.42, + "learning_rate": 0.00023734227460193495, + "loss": 0.0591, "step": 64720 }, { - "epoch": 0.7, - "learning_rate": 0.00019498020637289892, - "loss": 0.0449, + "epoch": 0.42, + "learning_rate": 0.00023733259324757803, + "loss": 0.0582, "step": 64730 }, { - "epoch": 0.7, - "learning_rate": 0.0001949639820883899, - "loss": 0.0453, + "epoch": 0.42, + "learning_rate": 0.0002373229118932211, + "loss": 0.0659, "step": 64740 }, { - "epoch": 0.7, - "learning_rate": 0.00019494775780388082, - "loss": 0.0485, + "epoch": 0.42, + "learning_rate": 0.00023731323053886419, + "loss": 0.0553, "step": 64750 }, { - "epoch": 0.7, - "learning_rate": 0.0001949315335193718, - "loss": 0.0516, + "epoch": 0.42, + "learning_rate": 0.00023730354918450724, + "loss": 0.0647, "step": 64760 }, { - "epoch": 0.7, - "learning_rate": 0.00019491530923486272, - "loss": 0.0545, + "epoch": 0.42, + "learning_rate": 0.0002372938678301503, + "loss": 0.0614, "step": 64770 }, { - "epoch": 0.7, - "learning_rate": 0.00019489908495035367, - "loss": 0.0554, + "epoch": 0.42, + "learning_rate": 0.00023728418647579337, + "loss": 0.0549, "step": 64780 }, { - "epoch": 0.7, - "learning_rate": 0.00019488286066584462, - "loss": 0.0452, + "epoch": 0.42, + "learning_rate": 0.00023727450512143642, + "loss": 0.0621, "step": 64790 }, { - "epoch": 0.7, - "learning_rate": 0.00019486663638133557, - "loss": 0.0471, + "epoch": 0.42, + "learning_rate": 0.0002372648237670795, + "loss": 0.0616, "step": 64800 }, { - "epoch": 0.7, - "learning_rate": 0.0001948504120968265, - "loss": 0.0521, + "epoch": 0.42, + "learning_rate": 0.00023725514241272258, + "loss": 0.0568, "step": 64810 }, { - "epoch": 0.7, - "learning_rate": 0.00019483418781231747, - "loss": 0.0496, + "epoch": 0.42, + "learning_rate": 0.00023724546105836564, + "loss": 0.0575, "step": 64820 }, { - "epoch": 0.7, - "learning_rate": 0.0001948179635278084, - "loss": 0.0504, + "epoch": 0.42, + "learning_rate": 0.00023723577970400872, + "loss": 0.0625, "step": 64830 }, { - "epoch": 0.7, - "learning_rate": 0.00019480173924329937, - "loss": 0.0477, + "epoch": 0.42, + "learning_rate": 0.00023722609834965177, + "loss": 0.0571, "step": 64840 }, { - "epoch": 0.7, - "learning_rate": 0.0001947855149587903, - "loss": 0.0496, + "epoch": 0.42, + "learning_rate": 0.00023721641699529482, + "loss": 0.0554, "step": 64850 }, { - "epoch": 0.7, - "learning_rate": 0.00019476929067428124, - "loss": 0.0548, + "epoch": 0.42, + "learning_rate": 0.0002372067356409379, + "loss": 0.0562, "step": 64860 }, { - "epoch": 0.7, - "learning_rate": 0.0001947530663897722, - "loss": 0.0478, + "epoch": 0.42, + "learning_rate": 0.00023719705428658098, + "loss": 0.062, "step": 64870 }, { - "epoch": 0.7, - "learning_rate": 0.00019473684210526314, - "loss": 0.0433, + "epoch": 0.42, + "learning_rate": 0.00023718737293222406, + "loss": 0.0596, "step": 64880 }, { - "epoch": 0.7, - "learning_rate": 0.0001947206178207541, - "loss": 0.0455, + "epoch": 0.42, + "learning_rate": 0.0002371776915778671, + "loss": 0.0533, "step": 64890 }, { - "epoch": 0.7, - "learning_rate": 0.00019470439353624504, - "loss": 0.0517, + "epoch": 0.42, + "learning_rate": 0.0002371680102235102, + "loss": 0.0611, "step": 64900 }, { - "epoch": 0.7, - "learning_rate": 0.00019468816925173596, - "loss": 0.0498, + "epoch": 0.42, + "learning_rate": 0.00023715832886915325, + "loss": 0.0564, "step": 64910 }, { - "epoch": 0.7, - "learning_rate": 0.00019467194496722694, - "loss": 0.0508, + "epoch": 0.42, + "learning_rate": 0.0002371486475147963, + "loss": 0.0563, "step": 64920 }, { - "epoch": 0.7, - "learning_rate": 0.00019465572068271786, - "loss": 0.0536, + "epoch": 0.42, + "learning_rate": 0.00023713896616043938, + "loss": 0.0641, "step": 64930 }, { - "epoch": 0.7, - "learning_rate": 0.00019463949639820884, - "loss": 0.0558, + "epoch": 0.42, + "learning_rate": 0.00023712928480608246, + "loss": 0.0607, "step": 64940 }, { - "epoch": 0.7, - "learning_rate": 0.00019462327211369976, - "loss": 0.0489, + "epoch": 0.42, + "learning_rate": 0.00023711960345172554, + "loss": 0.0586, "step": 64950 }, { - "epoch": 0.7, - "learning_rate": 0.0001946070478291907, - "loss": 0.051, + "epoch": 0.42, + "learning_rate": 0.0002371099220973686, + "loss": 0.0549, "step": 64960 }, { - "epoch": 0.7, - "learning_rate": 0.00019459082354468166, - "loss": 0.0591, + "epoch": 0.42, + "learning_rate": 0.00023710024074301167, + "loss": 0.0647, "step": 64970 }, { - "epoch": 0.7, - "learning_rate": 0.0001945745992601726, - "loss": 0.0526, + "epoch": 0.42, + "learning_rate": 0.00023709055938865472, + "loss": 0.0527, "step": 64980 }, { - "epoch": 0.7, - "learning_rate": 0.00019455837497566353, - "loss": 0.0617, + "epoch": 0.42, + "learning_rate": 0.00023708087803429778, + "loss": 0.0547, "step": 64990 }, { - "epoch": 0.7, - "learning_rate": 0.0001945421506911545, - "loss": 0.0485, + "epoch": 0.42, + "learning_rate": 0.00023707119667994086, + "loss": 0.061, "step": 65000 }, { - "epoch": 0.7, - "eval_cer": 0.9213098185146508, - "eval_loss": 0.034628286957740784, - "eval_runtime": 118.9146, - "eval_samples_per_second": 16.819, - "eval_steps_per_second": 4.205, + "epoch": 0.42, + "eval_cer": 0.9201581742176025, + "eval_loss": 0.03896106779575348, + "eval_runtime": 120.0403, + "eval_samples_per_second": 16.661, + "eval_steps_per_second": 4.165, "step": 65000 }, { - "epoch": 0.7, - "learning_rate": 0.00019452592640664543, - "loss": 0.0519, + "epoch": 0.42, + "learning_rate": 0.00023706151532558394, + "loss": 0.0566, "step": 65010 }, { - "epoch": 0.7, - "learning_rate": 0.0001945097021221364, - "loss": 0.0408, + "epoch": 0.42, + "learning_rate": 0.000237051833971227, + "loss": 0.0514, "step": 65020 }, { - "epoch": 0.7, - "learning_rate": 0.00019449347783762733, - "loss": 0.05, + "epoch": 0.42, + "learning_rate": 0.00023704215261687007, + "loss": 0.0557, "step": 65030 }, { - "epoch": 0.7, - "learning_rate": 0.0001944772535531183, - "loss": 0.0468, + "epoch": 0.42, + "learning_rate": 0.00023703247126251315, + "loss": 0.0579, "step": 65040 }, { - "epoch": 0.7, - "learning_rate": 0.00019446102926860923, - "loss": 0.055, + "epoch": 0.42, + "learning_rate": 0.00023702278990815617, + "loss": 0.0516, "step": 65050 }, { - "epoch": 0.7, - "learning_rate": 0.00019444480498410018, - "loss": 0.0497, + "epoch": 0.42, + "learning_rate": 0.00023701310855379925, + "loss": 0.0538, "step": 65060 }, { - "epoch": 0.7, - "learning_rate": 0.00019442858069959113, - "loss": 0.0456, + "epoch": 0.42, + "learning_rate": 0.00023700342719944233, + "loss": 0.0654, "step": 65070 }, { - "epoch": 0.7, - "learning_rate": 0.00019441235641508208, - "loss": 0.0477, + "epoch": 0.42, + "learning_rate": 0.0002369937458450854, + "loss": 0.0578, "step": 65080 }, { - "epoch": 0.7, - "learning_rate": 0.000194396132130573, - "loss": 0.0509, + "epoch": 0.42, + "learning_rate": 0.00023698406449072846, + "loss": 0.069, "step": 65090 }, { - "epoch": 0.7, - "learning_rate": 0.00019437990784606398, - "loss": 0.0484, + "epoch": 0.42, + "learning_rate": 0.00023697438313637154, + "loss": 0.0604, "step": 65100 }, { - "epoch": 0.7, - "learning_rate": 0.0001943636835615549, - "loss": 0.0586, + "epoch": 0.42, + "learning_rate": 0.00023696470178201462, + "loss": 0.0567, "step": 65110 }, { - "epoch": 0.7, - "learning_rate": 0.00019434745927704588, - "loss": 0.0533, + "epoch": 0.42, + "learning_rate": 0.00023695502042765765, + "loss": 0.0551, "step": 65120 }, { - "epoch": 0.7, - "learning_rate": 0.0001943312349925368, - "loss": 0.0476, + "epoch": 0.42, + "learning_rate": 0.00023694533907330073, + "loss": 0.0539, "step": 65130 }, { - "epoch": 0.7, - "learning_rate": 0.00019431501070802775, - "loss": 0.0551, + "epoch": 0.42, + "learning_rate": 0.0002369356577189438, + "loss": 0.0572, "step": 65140 }, { - "epoch": 0.7, - "learning_rate": 0.0001942987864235187, + "epoch": 0.42, + "learning_rate": 0.0002369259763645869, "loss": 0.0525, "step": 65150 }, { - "epoch": 0.7, - "learning_rate": 0.00019428256213900965, - "loss": 0.0578, + "epoch": 0.42, + "learning_rate": 0.00023691629501022994, + "loss": 0.0507, "step": 65160 }, { - "epoch": 0.7, - "learning_rate": 0.00019426633785450057, - "loss": 0.0484, + "epoch": 0.42, + "learning_rate": 0.00023690661365587302, + "loss": 0.0624, "step": 65170 }, { - "epoch": 0.7, - "learning_rate": 0.00019425011356999155, - "loss": 0.0624, + "epoch": 0.42, + "learning_rate": 0.0002368969323015161, + "loss": 0.055, "step": 65180 }, { - "epoch": 0.71, - "learning_rate": 0.00019423388928548247, - "loss": 0.0486, + "epoch": 0.42, + "learning_rate": 0.00023688725094715913, + "loss": 0.061, "step": 65190 }, { - "epoch": 0.71, - "learning_rate": 0.00019421766500097345, - "loss": 0.0505, + "epoch": 0.42, + "learning_rate": 0.0002368775695928022, + "loss": 0.0535, "step": 65200 }, { - "epoch": 0.71, - "learning_rate": 0.00019420144071646437, - "loss": 0.0473, + "epoch": 0.42, + "learning_rate": 0.0002368678882384453, + "loss": 0.0548, "step": 65210 }, { - "epoch": 0.71, - "learning_rate": 0.00019418521643195535, - "loss": 0.0461, + "epoch": 0.42, + "learning_rate": 0.00023685820688408834, + "loss": 0.0557, "step": 65220 }, { - "epoch": 0.71, - "learning_rate": 0.00019416899214744627, - "loss": 0.0549, + "epoch": 0.42, + "learning_rate": 0.00023684852552973142, + "loss": 0.0596, "step": 65230 }, { - "epoch": 0.71, - "learning_rate": 0.00019415276786293722, - "loss": 0.0472, + "epoch": 0.42, + "learning_rate": 0.0002368388441753745, + "loss": 0.0566, "step": 65240 }, { - "epoch": 0.71, - "learning_rate": 0.00019413654357842817, - "loss": 0.0453, + "epoch": 0.42, + "learning_rate": 0.00023682916282101758, + "loss": 0.0624, "step": 65250 }, { - "epoch": 0.71, - "learning_rate": 0.00019412031929391912, - "loss": 0.0474, + "epoch": 0.42, + "learning_rate": 0.0002368194814666606, + "loss": 0.0572, "step": 65260 }, { - "epoch": 0.71, - "learning_rate": 0.00019410409500941004, - "loss": 0.0514, + "epoch": 0.42, + "learning_rate": 0.00023680980011230368, + "loss": 0.0503, "step": 65270 }, { - "epoch": 0.71, - "learning_rate": 0.00019408787072490102, - "loss": 0.0521, + "epoch": 0.42, + "learning_rate": 0.00023680011875794676, + "loss": 0.0536, "step": 65280 }, { - "epoch": 0.71, - "learning_rate": 0.00019407164644039194, - "loss": 0.0486, + "epoch": 0.42, + "learning_rate": 0.00023679043740358982, + "loss": 0.0559, "step": 65290 }, { - "epoch": 0.71, - "learning_rate": 0.00019405542215588292, - "loss": 0.0504, + "epoch": 0.42, + "learning_rate": 0.0002367807560492329, + "loss": 0.0587, "step": 65300 }, { - "epoch": 0.71, - "learning_rate": 0.00019403919787137384, - "loss": 0.0497, + "epoch": 0.42, + "learning_rate": 0.00023677107469487598, + "loss": 0.0582, "step": 65310 }, { - "epoch": 0.71, - "learning_rate": 0.0001940229735868648, - "loss": 0.0535, + "epoch": 0.42, + "learning_rate": 0.00023676139334051906, + "loss": 0.0524, "step": 65320 }, { - "epoch": 0.71, - "learning_rate": 0.00019400674930235574, - "loss": 0.054, + "epoch": 0.42, + "learning_rate": 0.00023675171198616208, + "loss": 0.0521, "step": 65330 }, { - "epoch": 0.71, - "learning_rate": 0.0001939905250178467, - "loss": 0.0585, + "epoch": 0.42, + "learning_rate": 0.00023674203063180516, + "loss": 0.0493, "step": 65340 }, { - "epoch": 0.71, - "learning_rate": 0.00019397430073333762, - "loss": 0.0499, + "epoch": 0.42, + "learning_rate": 0.00023673234927744824, + "loss": 0.0579, "step": 65350 }, { - "epoch": 0.71, - "learning_rate": 0.0001939580764488286, - "loss": 0.0463, + "epoch": 0.42, + "learning_rate": 0.0002367226679230913, + "loss": 0.059, "step": 65360 }, { - "epoch": 0.71, - "learning_rate": 0.00019394185216431952, - "loss": 0.0432, + "epoch": 0.42, + "learning_rate": 0.00023671298656873437, + "loss": 0.0566, "step": 65370 }, { - "epoch": 0.71, - "learning_rate": 0.0001939256278798105, - "loss": 0.0473, + "epoch": 0.42, + "learning_rate": 0.00023670330521437745, + "loss": 0.0522, "step": 65380 }, { - "epoch": 0.71, - "learning_rate": 0.00019390940359530142, - "loss": 0.0588, + "epoch": 0.42, + "learning_rate": 0.00023669362386002053, + "loss": 0.0559, "step": 65390 }, { - "epoch": 0.71, - "learning_rate": 0.0001938931793107924, - "loss": 0.0531, + "epoch": 0.42, + "learning_rate": 0.00023668394250566356, + "loss": 0.0592, "step": 65400 }, { - "epoch": 0.71, - "learning_rate": 0.00019387695502628331, - "loss": 0.0472, + "epoch": 0.42, + "learning_rate": 0.00023667426115130664, + "loss": 0.0543, "step": 65410 }, { - "epoch": 0.71, - "learning_rate": 0.00019386073074177426, - "loss": 0.0492, + "epoch": 0.42, + "learning_rate": 0.0002366645797969497, + "loss": 0.0576, "step": 65420 }, { - "epoch": 0.71, - "learning_rate": 0.00019384450645726521, - "loss": 0.0483, + "epoch": 0.42, + "learning_rate": 0.00023665489844259277, + "loss": 0.0588, "step": 65430 }, { - "epoch": 0.71, - "learning_rate": 0.00019382828217275616, - "loss": 0.0432, + "epoch": 0.42, + "learning_rate": 0.00023664521708823585, + "loss": 0.0579, "step": 65440 }, { - "epoch": 0.71, - "learning_rate": 0.0001938120578882471, - "loss": 0.0449, + "epoch": 0.42, + "learning_rate": 0.00023663553573387893, + "loss": 0.0636, "step": 65450 }, { - "epoch": 0.71, - "learning_rate": 0.00019379583360373806, - "loss": 0.0468, + "epoch": 0.42, + "learning_rate": 0.00023662585437952196, + "loss": 0.0508, "step": 65460 }, { - "epoch": 0.71, - "learning_rate": 0.00019377960931922899, - "loss": 0.0496, + "epoch": 0.42, + "learning_rate": 0.00023661617302516504, + "loss": 0.0707, "step": 65470 }, { - "epoch": 0.71, - "learning_rate": 0.00019376338503471996, - "loss": 0.0399, + "epoch": 0.42, + "learning_rate": 0.00023660649167080812, + "loss": 0.0563, "step": 65480 }, { - "epoch": 0.71, - "learning_rate": 0.00019374716075021089, - "loss": 0.0491, + "epoch": 0.42, + "learning_rate": 0.00023659681031645117, + "loss": 0.0556, "step": 65490 }, { - "epoch": 0.71, - "learning_rate": 0.00019373093646570184, - "loss": 0.0452, + "epoch": 0.42, + "learning_rate": 0.00023658712896209425, + "loss": 0.0619, "step": 65500 }, { - "epoch": 0.71, - "learning_rate": 0.00019371471218119279, - "loss": 0.0492, + "epoch": 0.42, + "learning_rate": 0.00023657744760773733, + "loss": 0.0719, "step": 65510 }, { - "epoch": 0.71, - "learning_rate": 0.00019369848789668373, - "loss": 0.0499, + "epoch": 0.42, + "learning_rate": 0.0002365677662533804, + "loss": 0.0653, "step": 65520 }, { - "epoch": 0.71, - "learning_rate": 0.00019368226361217466, - "loss": 0.0505, + "epoch": 0.42, + "learning_rate": 0.00023655808489902343, + "loss": 0.0626, "step": 65530 }, { - "epoch": 0.71, - "learning_rate": 0.00019366603932766563, - "loss": 0.0455, + "epoch": 0.42, + "learning_rate": 0.0002365484035446665, + "loss": 0.061, "step": 65540 }, { - "epoch": 0.71, - "learning_rate": 0.00019364981504315656, - "loss": 0.0489, + "epoch": 0.42, + "learning_rate": 0.0002365387221903096, + "loss": 0.0562, "step": 65550 }, { - "epoch": 0.71, - "learning_rate": 0.00019363359075864753, - "loss": 0.0555, + "epoch": 0.42, + "learning_rate": 0.00023652904083595265, + "loss": 0.055, "step": 65560 }, { - "epoch": 0.71, - "learning_rate": 0.00019361736647413846, - "loss": 0.0505, + "epoch": 0.42, + "learning_rate": 0.00023651935948159573, + "loss": 0.0558, "step": 65570 }, { - "epoch": 0.71, - "learning_rate": 0.00019360114218962943, - "loss": 0.05, + "epoch": 0.42, + "learning_rate": 0.0002365096781272388, + "loss": 0.0593, "step": 65580 }, { - "epoch": 0.71, - "learning_rate": 0.00019358491790512036, - "loss": 0.057, + "epoch": 0.42, + "learning_rate": 0.00023649999677288189, + "loss": 0.0544, "step": 65590 }, { - "epoch": 0.71, - "learning_rate": 0.0001935686936206113, - "loss": 0.0495, + "epoch": 0.42, + "learning_rate": 0.0002364903154185249, + "loss": 0.0591, "step": 65600 }, { - "epoch": 0.71, - "learning_rate": 0.00019355246933610226, - "loss": 0.0466, + "epoch": 0.42, + "learning_rate": 0.000236480634064168, + "loss": 0.0515, "step": 65610 }, { - "epoch": 0.71, - "learning_rate": 0.0001935362450515932, - "loss": 0.0504, + "epoch": 0.42, + "learning_rate": 0.00023647095270981104, + "loss": 0.0554, "step": 65620 }, { - "epoch": 0.71, - "learning_rate": 0.00019352002076708413, - "loss": 0.0466, + "epoch": 0.42, + "learning_rate": 0.00023646127135545412, + "loss": 0.0703, "step": 65630 }, { - "epoch": 0.71, - "learning_rate": 0.0001935037964825751, - "loss": 0.0477, + "epoch": 0.42, + "learning_rate": 0.0002364515900010972, + "loss": 0.0597, "step": 65640 }, { - "epoch": 0.71, - "learning_rate": 0.00019348757219806603, - "loss": 0.0566, + "epoch": 0.42, + "learning_rate": 0.00023644190864674028, + "loss": 0.0589, "step": 65650 }, { - "epoch": 0.71, - "learning_rate": 0.000193471347913557, - "loss": 0.0478, + "epoch": 0.42, + "learning_rate": 0.00023643222729238334, + "loss": 0.0532, "step": 65660 }, { - "epoch": 0.71, - "learning_rate": 0.00019345512362904793, + "epoch": 0.42, + "learning_rate": 0.0002364225459380264, "loss": 0.059, "step": 65670 }, { - "epoch": 0.71, - "learning_rate": 0.00019343889934453888, - "loss": 0.0495, + "epoch": 0.42, + "learning_rate": 0.00023641286458366947, + "loss": 0.0543, "step": 65680 }, { - "epoch": 0.71, - "learning_rate": 0.00019342267506002983, - "loss": 0.0525, + "epoch": 0.42, + "learning_rate": 0.00023640318322931252, + "loss": 0.0653, "step": 65690 }, { - "epoch": 0.71, - "learning_rate": 0.00019340645077552078, - "loss": 0.0474, + "epoch": 0.42, + "learning_rate": 0.0002363935018749556, + "loss": 0.065, "step": 65700 }, { - "epoch": 0.71, - "learning_rate": 0.00019339022649101175, - "loss": 0.0454, + "epoch": 0.42, + "learning_rate": 0.00023638382052059868, + "loss": 0.0605, "step": 65710 }, { - "epoch": 0.71, - "learning_rate": 0.00019337400220650268, - "loss": 0.0494, + "epoch": 0.42, + "learning_rate": 0.00023637413916624176, + "loss": 0.0681, "step": 65720 }, { - "epoch": 0.71, - "learning_rate": 0.00019335777792199365, - "loss": 0.0452, + "epoch": 0.42, + "learning_rate": 0.0002363644578118848, + "loss": 0.0527, "step": 65730 }, { - "epoch": 0.71, - "learning_rate": 0.00019334155363748458, - "loss": 0.0488, + "epoch": 0.42, + "learning_rate": 0.00023635477645752787, + "loss": 0.0558, "step": 65740 }, { - "epoch": 0.71, - "learning_rate": 0.00019332532935297553, - "loss": 0.0411, + "epoch": 0.42, + "learning_rate": 0.00023634509510317095, + "loss": 0.0633, "step": 65750 }, { - "epoch": 0.71, - "learning_rate": 0.00019330910506846648, - "loss": 0.0428, + "epoch": 0.42, + "learning_rate": 0.000236335413748814, + "loss": 0.0612, "step": 65760 }, { - "epoch": 0.71, - "learning_rate": 0.00019329288078395743, - "loss": 0.0501, + "epoch": 0.42, + "learning_rate": 0.00023632573239445708, + "loss": 0.0596, "step": 65770 }, { - "epoch": 0.71, - "learning_rate": 0.00019327665649944835, - "loss": 0.05, + "epoch": 0.42, + "learning_rate": 0.00023631605104010016, + "loss": 0.056, "step": 65780 }, { - "epoch": 0.71, - "learning_rate": 0.00019326043221493932, - "loss": 0.0511, + "epoch": 0.42, + "learning_rate": 0.00023630636968574324, + "loss": 0.0594, "step": 65790 }, { - "epoch": 0.71, - "learning_rate": 0.00019324420793043025, - "loss": 0.0468, + "epoch": 0.42, + "learning_rate": 0.0002362966883313863, + "loss": 0.0562, "step": 65800 }, { - "epoch": 0.71, - "learning_rate": 0.00019322798364592122, - "loss": 0.0446, + "epoch": 0.42, + "learning_rate": 0.00023628700697702934, + "loss": 0.0596, "step": 65810 }, { - "epoch": 0.71, - "learning_rate": 0.00019321175936141215, - "loss": 0.0536, + "epoch": 0.42, + "learning_rate": 0.0002362773256226724, + "loss": 0.0556, "step": 65820 }, { - "epoch": 0.71, - "learning_rate": 0.0001931955350769031, - "loss": 0.0518, + "epoch": 0.42, + "learning_rate": 0.00023626764426831548, + "loss": 0.0635, "step": 65830 }, { - "epoch": 0.71, - "learning_rate": 0.00019317931079239405, - "loss": 0.0503, + "epoch": 0.42, + "learning_rate": 0.00023625796291395855, + "loss": 0.0564, "step": 65840 }, { - "epoch": 0.71, - "learning_rate": 0.000193163086507885, - "loss": 0.0519, + "epoch": 0.43, + "learning_rate": 0.00023624828155960163, + "loss": 0.0509, "step": 65850 }, { - "epoch": 0.71, - "learning_rate": 0.00019314686222337592, - "loss": 0.0611, + "epoch": 0.43, + "learning_rate": 0.0002362386002052447, + "loss": 0.0597, "step": 65860 }, { - "epoch": 0.71, - "learning_rate": 0.0001931306379388669, - "loss": 0.0492, + "epoch": 0.43, + "learning_rate": 0.00023622891885088777, + "loss": 0.0474, "step": 65870 }, { - "epoch": 0.71, - "learning_rate": 0.00019311441365435782, - "loss": 0.0506, + "epoch": 0.43, + "learning_rate": 0.00023621923749653082, + "loss": 0.0571, "step": 65880 }, { - "epoch": 0.71, - "learning_rate": 0.0001930981893698488, - "loss": 0.0461, + "epoch": 0.43, + "learning_rate": 0.00023620955614217387, + "loss": 0.0465, "step": 65890 }, { - "epoch": 0.71, - "learning_rate": 0.00019308196508533972, - "loss": 0.0451, + "epoch": 0.43, + "learning_rate": 0.00023619987478781695, + "loss": 0.067, "step": 65900 }, { - "epoch": 0.71, - "learning_rate": 0.0001930657408008307, - "loss": 0.0497, + "epoch": 0.43, + "learning_rate": 0.00023619019343346003, + "loss": 0.0525, "step": 65910 }, { - "epoch": 0.71, - "learning_rate": 0.00019304951651632162, - "loss": 0.0551, + "epoch": 0.43, + "learning_rate": 0.0002361805120791031, + "loss": 0.0606, "step": 65920 }, { - "epoch": 0.71, - "learning_rate": 0.00019303329223181257, - "loss": 0.0566, + "epoch": 0.43, + "learning_rate": 0.00023617083072474616, + "loss": 0.0511, "step": 65930 }, { - "epoch": 0.71, - "learning_rate": 0.00019301706794730352, - "loss": 0.0486, + "epoch": 0.43, + "learning_rate": 0.00023616114937038924, + "loss": 0.0572, "step": 65940 }, { - "epoch": 0.71, - "learning_rate": 0.00019300084366279447, - "loss": 0.0504, + "epoch": 0.43, + "learning_rate": 0.0002361514680160323, + "loss": 0.0679, "step": 65950 }, { - "epoch": 0.71, - "learning_rate": 0.0001929846193782854, - "loss": 0.0465, + "epoch": 0.43, + "learning_rate": 0.00023614178666167535, + "loss": 0.0601, "step": 65960 }, { - "epoch": 0.71, - "learning_rate": 0.00019296839509377637, - "loss": 0.0529, + "epoch": 0.43, + "learning_rate": 0.00023613210530731843, + "loss": 0.0612, "step": 65970 }, { - "epoch": 0.71, - "learning_rate": 0.0001929521708092673, - "loss": 0.0537, + "epoch": 0.43, + "learning_rate": 0.0002361224239529615, + "loss": 0.0509, "step": 65980 }, { - "epoch": 0.71, - "learning_rate": 0.00019293594652475827, - "loss": 0.0514, + "epoch": 0.43, + "learning_rate": 0.0002361127425986046, + "loss": 0.0626, "step": 65990 }, { - "epoch": 0.71, - "learning_rate": 0.0001929197222402492, - "loss": 0.052, + "epoch": 0.43, + "learning_rate": 0.00023610306124424764, + "loss": 0.0605, "step": 66000 }, { - "epoch": 0.71, - "eval_cer": 0.9212992167028011, - "eval_loss": 0.034340739250183105, - "eval_runtime": 118.9294, - "eval_samples_per_second": 16.817, - "eval_steps_per_second": 4.204, + "epoch": 0.43, + "eval_cer": 0.9198996723534064, + "eval_loss": 0.03807980939745903, + "eval_runtime": 120.0579, + "eval_samples_per_second": 16.659, + "eval_steps_per_second": 4.165, "step": 66000 }, { - "epoch": 0.71, - "learning_rate": 0.00019290349795574014, - "loss": 0.0516, + "epoch": 0.43, + "learning_rate": 0.00023609337988989072, + "loss": 0.0626, "step": 66010 }, { - "epoch": 0.71, - "learning_rate": 0.0001928872736712311, - "loss": 0.0482, + "epoch": 0.43, + "learning_rate": 0.00023608369853553375, + "loss": 0.0565, "step": 66020 }, { - "epoch": 0.71, - "learning_rate": 0.00019287104938672204, - "loss": 0.0479, + "epoch": 0.43, + "learning_rate": 0.00023607401718117683, + "loss": 0.0591, "step": 66030 }, { - "epoch": 0.71, - "learning_rate": 0.00019285482510221296, - "loss": 0.0467, + "epoch": 0.43, + "learning_rate": 0.0002360643358268199, + "loss": 0.055, "step": 66040 }, { - "epoch": 0.71, - "learning_rate": 0.00019283860081770394, - "loss": 0.05, + "epoch": 0.43, + "learning_rate": 0.000236054654472463, + "loss": 0.0614, "step": 66050 }, { - "epoch": 0.71, - "learning_rate": 0.00019282237653319486, - "loss": 0.0529, + "epoch": 0.43, + "learning_rate": 0.00023604497311810604, + "loss": 0.0514, "step": 66060 }, { - "epoch": 0.71, - "learning_rate": 0.00019280615224868584, - "loss": 0.0464, + "epoch": 0.43, + "learning_rate": 0.00023603529176374912, + "loss": 0.059, "step": 66070 }, { - "epoch": 0.71, - "learning_rate": 0.00019278992796417676, - "loss": 0.0497, + "epoch": 0.43, + "learning_rate": 0.0002360256104093922, + "loss": 0.063, "step": 66080 }, { - "epoch": 0.71, - "learning_rate": 0.00019277370367966774, - "loss": 0.0509, + "epoch": 0.43, + "learning_rate": 0.00023601592905503522, + "loss": 0.0571, "step": 66090 }, { - "epoch": 0.71, - "learning_rate": 0.00019275747939515866, - "loss": 0.0505, + "epoch": 0.43, + "learning_rate": 0.0002360062477006783, + "loss": 0.0615, "step": 66100 }, { - "epoch": 0.72, - "learning_rate": 0.0001927412551106496, - "loss": 0.0543, + "epoch": 0.43, + "learning_rate": 0.00023599656634632138, + "loss": 0.0552, "step": 66110 }, { - "epoch": 0.72, - "learning_rate": 0.00019272503082614056, - "loss": 0.0519, + "epoch": 0.43, + "learning_rate": 0.00023598688499196446, + "loss": 0.0538, "step": 66120 }, { - "epoch": 0.72, - "learning_rate": 0.0001927088065416315, - "loss": 0.0498, + "epoch": 0.43, + "learning_rate": 0.00023597720363760752, + "loss": 0.0547, "step": 66130 }, { - "epoch": 0.72, - "learning_rate": 0.00019269258225712243, - "loss": 0.065, + "epoch": 0.43, + "learning_rate": 0.0002359675222832506, + "loss": 0.0556, "step": 66140 }, { - "epoch": 0.72, - "learning_rate": 0.0001926763579726134, - "loss": 0.0541, + "epoch": 0.43, + "learning_rate": 0.00023595784092889368, + "loss": 0.0596, "step": 66150 }, { - "epoch": 0.72, - "learning_rate": 0.00019266013368810433, - "loss": 0.0579, + "epoch": 0.43, + "learning_rate": 0.0002359481595745367, + "loss": 0.0476, "step": 66160 }, { - "epoch": 0.72, - "learning_rate": 0.0001926439094035953, - "loss": 0.045, + "epoch": 0.43, + "learning_rate": 0.00023593847822017978, + "loss": 0.0613, "step": 66170 }, { - "epoch": 0.72, - "learning_rate": 0.00019262768511908623, - "loss": 0.05, + "epoch": 0.43, + "learning_rate": 0.00023592879686582286, + "loss": 0.0551, "step": 66180 }, { - "epoch": 0.72, - "learning_rate": 0.00019261146083457718, - "loss": 0.0541, + "epoch": 0.43, + "learning_rate": 0.00023591911551146594, + "loss": 0.0558, "step": 66190 }, { - "epoch": 0.72, - "learning_rate": 0.00019259523655006813, - "loss": 0.0537, + "epoch": 0.43, + "learning_rate": 0.000235909434157109, + "loss": 0.0576, "step": 66200 }, { - "epoch": 0.72, - "learning_rate": 0.00019257901226555908, - "loss": 0.0489, + "epoch": 0.43, + "learning_rate": 0.00023589975280275207, + "loss": 0.0547, "step": 66210 }, { - "epoch": 0.72, - "learning_rate": 0.00019256278798105, - "loss": 0.0487, + "epoch": 0.43, + "learning_rate": 0.00023589007144839515, + "loss": 0.0589, "step": 66220 }, { - "epoch": 0.72, - "learning_rate": 0.00019254656369654098, - "loss": 0.0487, + "epoch": 0.43, + "learning_rate": 0.00023588039009403818, + "loss": 0.0587, "step": 66230 }, { - "epoch": 0.72, - "learning_rate": 0.0001925303394120319, - "loss": 0.0436, + "epoch": 0.43, + "learning_rate": 0.00023587070873968126, + "loss": 0.0619, "step": 66240 }, { - "epoch": 0.72, - "learning_rate": 0.00019251411512752288, - "loss": 0.0513, + "epoch": 0.43, + "learning_rate": 0.00023586102738532434, + "loss": 0.0695, "step": 66250 }, { - "epoch": 0.72, - "learning_rate": 0.0001924978908430138, - "loss": 0.0533, + "epoch": 0.43, + "learning_rate": 0.0002358513460309674, + "loss": 0.0587, "step": 66260 }, { - "epoch": 0.72, - "learning_rate": 0.00019248166655850478, - "loss": 0.0449, + "epoch": 0.43, + "learning_rate": 0.00023584166467661047, + "loss": 0.0608, "step": 66270 }, { - "epoch": 0.72, - "learning_rate": 0.0001924654422739957, - "loss": 0.0491, + "epoch": 0.43, + "learning_rate": 0.00023583198332225355, + "loss": 0.0639, "step": 66280 }, { - "epoch": 0.72, - "learning_rate": 0.00019244921798948665, - "loss": 0.0474, + "epoch": 0.43, + "learning_rate": 0.00023582230196789663, + "loss": 0.0585, "step": 66290 }, { - "epoch": 0.72, - "learning_rate": 0.0001924329937049776, - "loss": 0.0515, + "epoch": 0.43, + "learning_rate": 0.00023581262061353966, + "loss": 0.0587, "step": 66300 }, { - "epoch": 0.72, - "learning_rate": 0.00019241676942046855, - "loss": 0.0454, + "epoch": 0.43, + "learning_rate": 0.00023580293925918274, + "loss": 0.0509, "step": 66310 }, { - "epoch": 0.72, - "learning_rate": 0.00019240054513595947, - "loss": 0.048, + "epoch": 0.43, + "learning_rate": 0.00023579325790482582, + "loss": 0.0502, "step": 66320 }, { - "epoch": 0.72, - "learning_rate": 0.00019238432085145045, - "loss": 0.0608, + "epoch": 0.43, + "learning_rate": 0.00023578357655046887, + "loss": 0.0529, "step": 66330 }, { - "epoch": 0.72, - "learning_rate": 0.00019236809656694137, - "loss": 0.0464, + "epoch": 0.43, + "learning_rate": 0.00023577389519611195, + "loss": 0.0548, "step": 66340 }, { - "epoch": 0.72, - "learning_rate": 0.00019235187228243235, - "loss": 0.0487, + "epoch": 0.43, + "learning_rate": 0.00023576421384175503, + "loss": 0.0536, "step": 66350 }, { - "epoch": 0.72, - "learning_rate": 0.00019233564799792327, - "loss": 0.0485, + "epoch": 0.43, + "learning_rate": 0.0002357545324873981, + "loss": 0.063, "step": 66360 }, { - "epoch": 0.72, - "learning_rate": 0.00019231942371341422, - "loss": 0.0569, + "epoch": 0.43, + "learning_rate": 0.00023574485113304113, + "loss": 0.062, "step": 66370 }, { - "epoch": 0.72, - "learning_rate": 0.00019230319942890517, - "loss": 0.0451, + "epoch": 0.43, + "learning_rate": 0.0002357351697786842, + "loss": 0.061, "step": 66380 }, { - "epoch": 0.72, - "learning_rate": 0.00019228697514439612, - "loss": 0.043, + "epoch": 0.43, + "learning_rate": 0.0002357254884243273, + "loss": 0.0604, "step": 66390 }, { - "epoch": 0.72, - "learning_rate": 0.00019227075085988704, - "loss": 0.0488, + "epoch": 0.43, + "learning_rate": 0.00023571580706997035, + "loss": 0.055, "step": 66400 }, { - "epoch": 0.72, - "learning_rate": 0.00019225452657537802, - "loss": 0.0416, + "epoch": 0.43, + "learning_rate": 0.00023570612571561343, + "loss": 0.0544, "step": 66410 }, { - "epoch": 0.72, - "learning_rate": 0.00019223830229086894, - "loss": 0.0519, + "epoch": 0.43, + "learning_rate": 0.0002356964443612565, + "loss": 0.0597, "step": 66420 }, { - "epoch": 0.72, - "learning_rate": 0.00019222207800635992, - "loss": 0.0538, + "epoch": 0.43, + "learning_rate": 0.00023568676300689956, + "loss": 0.0497, "step": 66430 }, { - "epoch": 0.72, - "learning_rate": 0.00019220585372185084, - "loss": 0.0461, + "epoch": 0.43, + "learning_rate": 0.0002356770816525426, + "loss": 0.06, "step": 66440 }, { - "epoch": 0.72, - "learning_rate": 0.00019218962943734182, - "loss": 0.0477, + "epoch": 0.43, + "learning_rate": 0.0002356674002981857, + "loss": 0.0605, "step": 66450 }, { - "epoch": 0.72, - "learning_rate": 0.00019217340515283274, - "loss": 0.0478, + "epoch": 0.43, + "learning_rate": 0.00023565771894382874, + "loss": 0.0542, "step": 66460 }, { - "epoch": 0.72, - "learning_rate": 0.0001921571808683237, - "loss": 0.0418, + "epoch": 0.43, + "learning_rate": 0.00023564803758947182, + "loss": 0.0633, "step": 66470 }, { - "epoch": 0.72, - "learning_rate": 0.00019214095658381464, - "loss": 0.0492, + "epoch": 0.43, + "learning_rate": 0.0002356383562351149, + "loss": 0.0689, "step": 66480 }, { - "epoch": 0.72, - "learning_rate": 0.0001921247322993056, - "loss": 0.0457, + "epoch": 0.43, + "learning_rate": 0.00023562867488075798, + "loss": 0.0541, "step": 66490 }, { - "epoch": 0.72, - "learning_rate": 0.00019210850801479651, - "loss": 0.046, + "epoch": 0.43, + "learning_rate": 0.00023561899352640104, + "loss": 0.0609, "step": 66500 }, { - "epoch": 0.72, - "learning_rate": 0.0001920922837302875, - "loss": 0.0424, + "epoch": 0.43, + "learning_rate": 0.0002356093121720441, + "loss": 0.0628, "step": 66510 }, { - "epoch": 0.72, - "learning_rate": 0.00019207605944577841, - "loss": 0.0409, + "epoch": 0.43, + "learning_rate": 0.00023559963081768717, + "loss": 0.0521, "step": 66520 }, { - "epoch": 0.72, - "learning_rate": 0.0001920598351612694, - "loss": 0.0428, + "epoch": 0.43, + "learning_rate": 0.00023558994946333022, + "loss": 0.0538, "step": 66530 }, { - "epoch": 0.72, - "learning_rate": 0.0001920436108767603, - "loss": 0.0534, + "epoch": 0.43, + "learning_rate": 0.0002355802681089733, + "loss": 0.0585, "step": 66540 }, { - "epoch": 0.72, - "learning_rate": 0.00019202738659225126, - "loss": 0.0475, + "epoch": 0.43, + "learning_rate": 0.00023557058675461638, + "loss": 0.0564, "step": 66550 }, { - "epoch": 0.72, - "learning_rate": 0.0001920111623077422, - "loss": 0.0531, + "epoch": 0.43, + "learning_rate": 0.00023556090540025946, + "loss": 0.0552, "step": 66560 }, { - "epoch": 0.72, - "learning_rate": 0.00019199493802323316, - "loss": 0.0484, + "epoch": 0.43, + "learning_rate": 0.0002355512240459025, + "loss": 0.0522, "step": 66570 }, { - "epoch": 0.72, - "learning_rate": 0.0001919787137387241, - "loss": 0.0481, + "epoch": 0.43, + "learning_rate": 0.00023554154269154556, + "loss": 0.0513, "step": 66580 }, { - "epoch": 0.72, - "learning_rate": 0.00019196248945421506, - "loss": 0.057, + "epoch": 0.43, + "learning_rate": 0.00023553186133718864, + "loss": 0.0622, "step": 66590 }, { - "epoch": 0.72, - "learning_rate": 0.00019194626516970598, - "loss": 0.043, + "epoch": 0.43, + "learning_rate": 0.0002355221799828317, + "loss": 0.0533, "step": 66600 }, { - "epoch": 0.72, - "learning_rate": 0.00019193004088519696, - "loss": 0.0441, + "epoch": 0.43, + "learning_rate": 0.00023551249862847478, + "loss": 0.0561, "step": 66610 }, { - "epoch": 0.72, - "learning_rate": 0.00019191381660068788, - "loss": 0.0471, + "epoch": 0.43, + "learning_rate": 0.00023550281727411786, + "loss": 0.0515, "step": 66620 }, { - "epoch": 0.72, - "learning_rate": 0.00019189759231617886, - "loss": 0.0426, + "epoch": 0.43, + "learning_rate": 0.0002354931359197609, + "loss": 0.0523, "step": 66630 }, { - "epoch": 0.72, - "learning_rate": 0.00019188136803166978, - "loss": 0.0508, + "epoch": 0.43, + "learning_rate": 0.000235483454565404, + "loss": 0.0557, "step": 66640 }, { - "epoch": 0.72, - "learning_rate": 0.00019186514374716073, - "loss": 0.0557, + "epoch": 0.43, + "learning_rate": 0.00023547377321104704, + "loss": 0.0566, "step": 66650 }, { - "epoch": 0.72, - "learning_rate": 0.00019184891946265168, - "loss": 0.0546, + "epoch": 0.43, + "learning_rate": 0.0002354640918566901, + "loss": 0.0558, "step": 66660 }, { - "epoch": 0.72, - "learning_rate": 0.00019183269517814263, - "loss": 0.0462, + "epoch": 0.43, + "learning_rate": 0.00023545441050233317, + "loss": 0.0539, "step": 66670 }, { - "epoch": 0.72, - "learning_rate": 0.00019181647089363356, - "loss": 0.0526, + "epoch": 0.43, + "learning_rate": 0.00023544472914797625, + "loss": 0.0523, "step": 66680 }, { - "epoch": 0.72, - "learning_rate": 0.00019180024660912453, - "loss": 0.0463, + "epoch": 0.43, + "learning_rate": 0.00023543504779361933, + "loss": 0.0569, "step": 66690 }, { - "epoch": 0.72, - "learning_rate": 0.00019178402232461546, - "loss": 0.0562, + "epoch": 0.43, + "learning_rate": 0.0002354253664392624, + "loss": 0.0587, "step": 66700 }, { - "epoch": 0.72, - "learning_rate": 0.00019176779804010643, - "loss": 0.0465, + "epoch": 0.43, + "learning_rate": 0.00023541568508490547, + "loss": 0.0476, "step": 66710 }, { - "epoch": 0.72, - "learning_rate": 0.00019175157375559736, - "loss": 0.0547, + "epoch": 0.43, + "learning_rate": 0.00023540600373054852, + "loss": 0.0497, "step": 66720 }, { - "epoch": 0.72, - "learning_rate": 0.0001917353494710883, - "loss": 0.0508, + "epoch": 0.43, + "learning_rate": 0.00023539632237619157, + "loss": 0.0526, "step": 66730 }, { - "epoch": 0.72, - "learning_rate": 0.00019171912518657925, - "loss": 0.0456, + "epoch": 0.43, + "learning_rate": 0.00023538664102183465, + "loss": 0.0614, "step": 66740 }, { - "epoch": 0.72, - "learning_rate": 0.0001917029009020702, - "loss": 0.06, + "epoch": 0.43, + "learning_rate": 0.00023537695966747773, + "loss": 0.0529, "step": 66750 }, { - "epoch": 0.72, - "learning_rate": 0.00019168667661756115, - "loss": 0.0478, + "epoch": 0.43, + "learning_rate": 0.0002353672783131208, + "loss": 0.0526, "step": 66760 }, { - "epoch": 0.72, - "learning_rate": 0.0001916704523330521, - "loss": 0.0465, + "epoch": 0.43, + "learning_rate": 0.00023535759695876386, + "loss": 0.0583, "step": 66770 }, { - "epoch": 0.72, - "learning_rate": 0.00019165422804854303, - "loss": 0.049, + "epoch": 0.43, + "learning_rate": 0.00023534791560440694, + "loss": 0.0525, "step": 66780 }, { - "epoch": 0.72, - "learning_rate": 0.000191638003764034, - "loss": 0.0533, + "epoch": 0.43, + "learning_rate": 0.00023533823425005, + "loss": 0.0607, "step": 66790 }, { - "epoch": 0.72, - "learning_rate": 0.00019162177947952493, - "loss": 0.0471, + "epoch": 0.43, + "learning_rate": 0.00023532855289569305, + "loss": 0.0539, "step": 66800 }, { - "epoch": 0.72, - "learning_rate": 0.0001916055551950159, - "loss": 0.0514, + "epoch": 0.43, + "learning_rate": 0.00023531887154133613, + "loss": 0.0546, "step": 66810 }, { - "epoch": 0.72, - "learning_rate": 0.00019158933091050683, - "loss": 0.0439, + "epoch": 0.43, + "learning_rate": 0.0002353091901869792, + "loss": 0.0552, "step": 66820 }, { - "epoch": 0.72, - "learning_rate": 0.00019157310662599778, - "loss": 0.0532, + "epoch": 0.43, + "learning_rate": 0.00023529950883262226, + "loss": 0.0546, "step": 66830 }, { - "epoch": 0.72, - "learning_rate": 0.00019155688234148873, - "loss": 0.0499, + "epoch": 0.43, + "learning_rate": 0.00023528982747826534, + "loss": 0.0606, "step": 66840 }, { - "epoch": 0.72, - "learning_rate": 0.00019154065805697968, - "loss": 0.047, + "epoch": 0.43, + "learning_rate": 0.00023528014612390842, + "loss": 0.0606, "step": 66850 }, { - "epoch": 0.72, - "learning_rate": 0.0001915244337724706, - "loss": 0.0458, + "epoch": 0.43, + "learning_rate": 0.00023527046476955145, + "loss": 0.063, "step": 66860 }, { - "epoch": 0.72, - "learning_rate": 0.00019150820948796157, - "loss": 0.0547, + "epoch": 0.43, + "learning_rate": 0.00023526078341519453, + "loss": 0.0622, "step": 66870 }, { - "epoch": 0.72, - "learning_rate": 0.0001914919852034525, - "loss": 0.0541, + "epoch": 0.43, + "learning_rate": 0.0002352511020608376, + "loss": 0.0598, "step": 66880 }, { - "epoch": 0.72, - "learning_rate": 0.00019147576091894347, - "loss": 0.0518, + "epoch": 0.43, + "learning_rate": 0.00023524142070648069, + "loss": 0.058, "step": 66890 }, { - "epoch": 0.72, - "learning_rate": 0.0001914595366344344, - "loss": 0.0447, + "epoch": 0.43, + "learning_rate": 0.00023523173935212374, + "loss": 0.0589, "step": 66900 }, { - "epoch": 0.72, - "learning_rate": 0.00019144331234992535, - "loss": 0.0484, + "epoch": 0.43, + "learning_rate": 0.00023522205799776682, + "loss": 0.0546, "step": 66910 }, { - "epoch": 0.72, - "learning_rate": 0.0001914270880654163, - "loss": 0.0592, + "epoch": 0.43, + "learning_rate": 0.0002352123766434099, + "loss": 0.058, "step": 66920 }, { - "epoch": 0.72, - "learning_rate": 0.00019141086378090725, - "loss": 0.0492, + "epoch": 0.43, + "learning_rate": 0.00023520269528905292, + "loss": 0.0549, "step": 66930 }, { - "epoch": 0.72, - "learning_rate": 0.0001913946394963982, - "loss": 0.0488, + "epoch": 0.43, + "learning_rate": 0.000235193013934696, + "loss": 0.056, "step": 66940 }, { - "epoch": 0.72, - "learning_rate": 0.00019137841521188915, - "loss": 0.0405, + "epoch": 0.43, + "learning_rate": 0.00023518333258033908, + "loss": 0.0592, "step": 66950 }, { - "epoch": 0.72, - "learning_rate": 0.00019136219092738007, - "loss": 0.0438, + "epoch": 0.43, + "learning_rate": 0.00023517365122598216, + "loss": 0.0549, "step": 66960 }, { - "epoch": 0.72, - "learning_rate": 0.00019134596664287105, - "loss": 0.0469, + "epoch": 0.43, + "learning_rate": 0.00023516396987162522, + "loss": 0.0613, "step": 66970 }, { - "epoch": 0.72, - "learning_rate": 0.00019132974235836197, - "loss": 0.0511, + "epoch": 0.43, + "learning_rate": 0.0002351542885172683, + "loss": 0.0532, "step": 66980 }, { - "epoch": 0.72, - "learning_rate": 0.00019131351807385294, - "loss": 0.0525, + "epoch": 0.43, + "learning_rate": 0.00023514460716291138, + "loss": 0.055, "step": 66990 }, { - "epoch": 0.72, - "learning_rate": 0.00019129729378934387, - "loss": 0.0427, + "epoch": 0.43, + "learning_rate": 0.0002351349258085544, + "loss": 0.0566, "step": 67000 }, { - "epoch": 0.72, - "eval_cer": 0.9212011499431919, - "eval_loss": 0.034092072397470474, - "eval_runtime": 118.846, - "eval_samples_per_second": 16.829, - "eval_steps_per_second": 4.207, + "epoch": 0.43, + "eval_cer": 0.9199828267992317, + "eval_loss": 0.03815074265003204, + "eval_runtime": 120.3509, + "eval_samples_per_second": 16.618, + "eval_steps_per_second": 4.155, "step": 67000 }, { - "epoch": 0.72, - "learning_rate": 0.00019128106950483482, - "loss": 0.0556, + "epoch": 0.43, + "learning_rate": 0.00023512524445419748, + "loss": 0.0598, "step": 67010 }, { - "epoch": 0.72, - "learning_rate": 0.00019126484522032577, - "loss": 0.0535, + "epoch": 0.43, + "learning_rate": 0.00023511556309984056, + "loss": 0.0573, "step": 67020 }, { - "epoch": 0.73, - "learning_rate": 0.00019124862093581672, - "loss": 0.0482, + "epoch": 0.43, + "learning_rate": 0.0002351058817454836, + "loss": 0.0583, "step": 67030 }, { - "epoch": 0.73, - "learning_rate": 0.00019123239665130764, - "loss": 0.043, + "epoch": 0.43, + "learning_rate": 0.0002350962003911267, + "loss": 0.0672, "step": 67040 }, { - "epoch": 0.73, - "learning_rate": 0.00019121617236679862, - "loss": 0.0438, + "epoch": 0.43, + "learning_rate": 0.00023508651903676977, + "loss": 0.049, "step": 67050 }, { - "epoch": 0.73, - "learning_rate": 0.00019119994808228954, - "loss": 0.053, + "epoch": 0.43, + "learning_rate": 0.00023507683768241285, + "loss": 0.0637, "step": 67060 }, { - "epoch": 0.73, - "learning_rate": 0.00019118372379778052, - "loss": 0.0629, + "epoch": 0.43, + "learning_rate": 0.00023506715632805588, + "loss": 0.0563, "step": 67070 }, { - "epoch": 0.73, - "learning_rate": 0.00019116749951327144, - "loss": 0.0498, + "epoch": 0.43, + "learning_rate": 0.00023505747497369896, + "loss": 0.0584, "step": 67080 }, { - "epoch": 0.73, - "learning_rate": 0.0001911512752287624, - "loss": 0.0423, + "epoch": 0.43, + "learning_rate": 0.00023504779361934204, + "loss": 0.0561, "step": 67090 }, { - "epoch": 0.73, - "learning_rate": 0.00019113505094425334, - "loss": 0.0566, + "epoch": 0.43, + "learning_rate": 0.0002350381122649851, + "loss": 0.0594, "step": 67100 }, { - "epoch": 0.73, - "learning_rate": 0.0001911188266597443, - "loss": 0.0494, + "epoch": 0.43, + "learning_rate": 0.00023502843091062817, + "loss": 0.0604, "step": 67110 }, { - "epoch": 0.73, - "learning_rate": 0.00019110260237523524, - "loss": 0.0543, + "epoch": 0.43, + "learning_rate": 0.00023501874955627125, + "loss": 0.0545, "step": 67120 }, { - "epoch": 0.73, - "learning_rate": 0.0001910863780907262, - "loss": 0.0455, + "epoch": 0.43, + "learning_rate": 0.00023500906820191433, + "loss": 0.0666, "step": 67130 }, { - "epoch": 0.73, - "learning_rate": 0.0001910701538062171, - "loss": 0.0519, + "epoch": 0.43, + "learning_rate": 0.00023499938684755736, + "loss": 0.0609, "step": 67140 }, { - "epoch": 0.73, - "learning_rate": 0.0001910539295217081, - "loss": 0.0487, + "epoch": 0.43, + "learning_rate": 0.00023498970549320044, + "loss": 0.0576, "step": 67150 }, { - "epoch": 0.73, - "learning_rate": 0.000191037705237199, - "loss": 0.0435, + "epoch": 0.43, + "learning_rate": 0.00023498002413884352, + "loss": 0.0568, "step": 67160 }, { - "epoch": 0.73, - "learning_rate": 0.00019102148095268999, - "loss": 0.0481, + "epoch": 0.43, + "learning_rate": 0.00023497034278448657, + "loss": 0.0498, "step": 67170 }, { - "epoch": 0.73, - "learning_rate": 0.0001910052566681809, - "loss": 0.0485, + "epoch": 0.43, + "learning_rate": 0.00023496066143012965, + "loss": 0.055, "step": 67180 }, { - "epoch": 0.73, - "learning_rate": 0.00019098903238367186, - "loss": 0.0613, + "epoch": 0.43, + "learning_rate": 0.00023495098007577273, + "loss": 0.0568, "step": 67190 }, { - "epoch": 0.73, - "learning_rate": 0.0001909728080991628, - "loss": 0.0437, + "epoch": 0.43, + "learning_rate": 0.0002349412987214158, + "loss": 0.0519, "step": 67200 }, { - "epoch": 0.73, - "learning_rate": 0.00019095658381465376, - "loss": 0.0502, + "epoch": 0.43, + "learning_rate": 0.00023493161736705883, + "loss": 0.0541, "step": 67210 }, { - "epoch": 0.73, - "learning_rate": 0.00019094035953014468, - "loss": 0.0483, + "epoch": 0.43, + "learning_rate": 0.0002349219360127019, + "loss": 0.0535, "step": 67220 }, { - "epoch": 0.73, - "learning_rate": 0.00019092413524563566, - "loss": 0.0419, + "epoch": 0.43, + "learning_rate": 0.00023491225465834497, + "loss": 0.0559, "step": 67230 }, { - "epoch": 0.73, - "learning_rate": 0.00019090791096112658, - "loss": 0.0466, + "epoch": 0.43, + "learning_rate": 0.00023490257330398805, + "loss": 0.0535, "step": 67240 }, { - "epoch": 0.73, - "learning_rate": 0.00019089168667661756, - "loss": 0.0502, + "epoch": 0.43, + "learning_rate": 0.00023489289194963112, + "loss": 0.0535, "step": 67250 }, { - "epoch": 0.73, - "learning_rate": 0.00019087546239210848, - "loss": 0.0531, + "epoch": 0.43, + "learning_rate": 0.0002348832105952742, + "loss": 0.0533, "step": 67260 }, { - "epoch": 0.73, - "learning_rate": 0.00019085923810759946, - "loss": 0.0468, + "epoch": 0.43, + "learning_rate": 0.00023487352924091726, + "loss": 0.0622, "step": 67270 }, { - "epoch": 0.73, - "learning_rate": 0.00019084301382309038, - "loss": 0.0481, + "epoch": 0.43, + "learning_rate": 0.0002348638478865603, + "loss": 0.0537, "step": 67280 }, { - "epoch": 0.73, - "learning_rate": 0.00019082678953858133, - "loss": 0.0501, + "epoch": 0.43, + "learning_rate": 0.0002348541665322034, + "loss": 0.0621, "step": 67290 }, { - "epoch": 0.73, - "learning_rate": 0.00019081056525407228, - "loss": 0.0543, + "epoch": 0.43, + "learning_rate": 0.00023484448517784644, + "loss": 0.0557, "step": 67300 }, { - "epoch": 0.73, - "learning_rate": 0.00019079434096956323, - "loss": 0.0522, + "epoch": 0.43, + "learning_rate": 0.00023483480382348952, + "loss": 0.0601, "step": 67310 }, { - "epoch": 0.73, - "learning_rate": 0.00019077811668505415, - "loss": 0.0587, + "epoch": 0.43, + "learning_rate": 0.0002348251224691326, + "loss": 0.0525, "step": 67320 }, { - "epoch": 0.73, - "learning_rate": 0.00019076189240054513, - "loss": 0.0484, + "epoch": 0.43, + "learning_rate": 0.00023481544111477568, + "loss": 0.0629, "step": 67330 }, { - "epoch": 0.73, - "learning_rate": 0.00019074566811603605, - "loss": 0.0522, + "epoch": 0.43, + "learning_rate": 0.00023480575976041873, + "loss": 0.0596, "step": 67340 }, { - "epoch": 0.73, - "learning_rate": 0.00019072944383152703, - "loss": 0.0359, + "epoch": 0.43, + "learning_rate": 0.0002347960784060618, + "loss": 0.0608, "step": 67350 }, { - "epoch": 0.73, - "learning_rate": 0.00019071321954701795, - "loss": 0.0503, + "epoch": 0.43, + "learning_rate": 0.00023478639705170487, + "loss": 0.0551, "step": 67360 }, { - "epoch": 0.73, - "learning_rate": 0.0001906969952625089, - "loss": 0.0451, + "epoch": 0.43, + "learning_rate": 0.00023477671569734792, + "loss": 0.0576, "step": 67370 }, { - "epoch": 0.73, - "learning_rate": 0.00019068077097799985, - "loss": 0.0463, + "epoch": 0.43, + "learning_rate": 0.000234767034342991, + "loss": 0.0582, "step": 67380 }, { - "epoch": 0.73, - "learning_rate": 0.0001906645466934908, - "loss": 0.0466, + "epoch": 0.43, + "learning_rate": 0.00023475735298863408, + "loss": 0.058, "step": 67390 }, { - "epoch": 0.73, - "learning_rate": 0.00019064832240898172, - "loss": 0.0487, + "epoch": 0.44, + "learning_rate": 0.00023474767163427716, + "loss": 0.0663, "step": 67400 }, { - "epoch": 0.73, - "learning_rate": 0.0001906320981244727, - "loss": 0.0496, + "epoch": 0.44, + "learning_rate": 0.0002347379902799202, + "loss": 0.0524, "step": 67410 }, { - "epoch": 0.73, - "learning_rate": 0.00019061587383996362, - "loss": 0.0539, + "epoch": 0.44, + "learning_rate": 0.00023472830892556326, + "loss": 0.0529, "step": 67420 }, { - "epoch": 0.73, - "learning_rate": 0.0001905996495554546, - "loss": 0.0448, + "epoch": 0.44, + "learning_rate": 0.00023471862757120632, + "loss": 0.0584, "step": 67430 }, { - "epoch": 0.73, - "learning_rate": 0.00019058342527094552, - "loss": 0.0534, + "epoch": 0.44, + "learning_rate": 0.0002347089462168494, + "loss": 0.0548, "step": 67440 }, { - "epoch": 0.73, - "learning_rate": 0.0001905672009864365, - "loss": 0.049, + "epoch": 0.44, + "learning_rate": 0.00023469926486249248, + "loss": 0.0566, "step": 67450 }, { - "epoch": 0.73, - "learning_rate": 0.00019055097670192742, - "loss": 0.0489, + "epoch": 0.44, + "learning_rate": 0.00023468958350813556, + "loss": 0.0536, "step": 67460 }, { - "epoch": 0.73, - "learning_rate": 0.00019053475241741837, - "loss": 0.0518, + "epoch": 0.44, + "learning_rate": 0.0002346799021537786, + "loss": 0.0559, "step": 67470 }, { - "epoch": 0.73, - "learning_rate": 0.00019051852813290932, - "loss": 0.0532, + "epoch": 0.44, + "learning_rate": 0.0002346702207994217, + "loss": 0.0556, "step": 67480 }, { - "epoch": 0.73, - "learning_rate": 0.00019050230384840027, - "loss": 0.0483, + "epoch": 0.44, + "learning_rate": 0.00023466053944506474, + "loss": 0.0602, "step": 67490 }, { - "epoch": 0.73, - "learning_rate": 0.0001904860795638912, - "loss": 0.0455, + "epoch": 0.44, + "learning_rate": 0.0002346508580907078, + "loss": 0.0533, "step": 67500 }, { - "epoch": 0.73, - "learning_rate": 0.00019046985527938217, - "loss": 0.0522, + "epoch": 0.44, + "learning_rate": 0.00023464117673635087, + "loss": 0.0514, "step": 67510 }, { - "epoch": 0.73, - "learning_rate": 0.0001904536309948731, - "loss": 0.05, + "epoch": 0.44, + "learning_rate": 0.00023463149538199395, + "loss": 0.0533, "step": 67520 }, { - "epoch": 0.73, - "learning_rate": 0.00019043740671036407, - "loss": 0.0437, + "epoch": 0.44, + "learning_rate": 0.00023462181402763703, + "loss": 0.052, "step": 67530 }, { - "epoch": 0.73, - "learning_rate": 0.000190421182425855, - "loss": 0.0469, + "epoch": 0.44, + "learning_rate": 0.0002346121326732801, + "loss": 0.053, "step": 67540 }, { - "epoch": 0.73, - "learning_rate": 0.00019040495814134594, - "loss": 0.0468, + "epoch": 0.44, + "learning_rate": 0.00023460245131892317, + "loss": 0.0568, "step": 67550 }, { - "epoch": 0.73, - "learning_rate": 0.0001903887338568369, - "loss": 0.0428, + "epoch": 0.44, + "learning_rate": 0.00023459276996456622, + "loss": 0.0509, "step": 67560 }, { - "epoch": 0.73, - "learning_rate": 0.00019037250957232784, - "loss": 0.0516, + "epoch": 0.44, + "learning_rate": 0.00023458308861020927, + "loss": 0.0537, "step": 67570 }, { - "epoch": 0.73, - "learning_rate": 0.00019035628528781876, - "loss": 0.0447, + "epoch": 0.44, + "learning_rate": 0.00023457340725585235, + "loss": 0.0551, "step": 67580 }, { - "epoch": 0.73, - "learning_rate": 0.00019034006100330974, - "loss": 0.0524, + "epoch": 0.44, + "learning_rate": 0.00023456372590149543, + "loss": 0.0572, "step": 67590 }, { - "epoch": 0.73, - "learning_rate": 0.00019032383671880066, - "loss": 0.0474, + "epoch": 0.44, + "learning_rate": 0.0002345540445471385, + "loss": 0.0614, "step": 67600 }, { - "epoch": 0.73, - "learning_rate": 0.00019030761243429164, - "loss": 0.0471, + "epoch": 0.44, + "learning_rate": 0.00023454436319278156, + "loss": 0.0599, "step": 67610 }, { - "epoch": 0.73, - "learning_rate": 0.00019029138814978256, - "loss": 0.0449, + "epoch": 0.44, + "learning_rate": 0.00023453468183842464, + "loss": 0.0543, "step": 67620 }, { - "epoch": 0.73, - "learning_rate": 0.00019027516386527354, - "loss": 0.0476, + "epoch": 0.44, + "learning_rate": 0.00023452500048406767, + "loss": 0.0543, "step": 67630 }, { - "epoch": 0.73, - "learning_rate": 0.00019025893958076446, - "loss": 0.044, + "epoch": 0.44, + "learning_rate": 0.00023451531912971075, + "loss": 0.0632, "step": 67640 }, { - "epoch": 0.73, - "learning_rate": 0.0001902427152962554, - "loss": 0.0429, + "epoch": 0.44, + "learning_rate": 0.00023450563777535383, + "loss": 0.0636, "step": 67650 }, { - "epoch": 0.73, - "learning_rate": 0.00019022649101174636, - "loss": 0.0467, + "epoch": 0.44, + "learning_rate": 0.0002344959564209969, + "loss": 0.0528, "step": 67660 }, { - "epoch": 0.73, - "learning_rate": 0.0001902102667272373, - "loss": 0.0445, + "epoch": 0.44, + "learning_rate": 0.00023448627506663996, + "loss": 0.0623, "step": 67670 }, { - "epoch": 0.73, - "learning_rate": 0.00019019404244272823, - "loss": 0.0447, + "epoch": 0.44, + "learning_rate": 0.00023447659371228304, + "loss": 0.0648, "step": 67680 }, { - "epoch": 0.73, - "learning_rate": 0.0001901778181582192, - "loss": 0.045, + "epoch": 0.44, + "learning_rate": 0.00023446691235792612, + "loss": 0.0548, "step": 67690 }, { - "epoch": 0.73, - "learning_rate": 0.00019016159387371013, - "loss": 0.0478, + "epoch": 0.44, + "learning_rate": 0.00023445723100356915, + "loss": 0.0534, "step": 67700 }, { - "epoch": 0.73, - "learning_rate": 0.0001901453695892011, - "loss": 0.0463, + "epoch": 0.44, + "learning_rate": 0.00023444754964921223, + "loss": 0.0528, "step": 67710 }, { - "epoch": 0.73, - "learning_rate": 0.00019012914530469203, - "loss": 0.0468, + "epoch": 0.44, + "learning_rate": 0.0002344378682948553, + "loss": 0.0655, "step": 67720 }, { - "epoch": 0.73, - "learning_rate": 0.00019011292102018298, - "loss": 0.0496, + "epoch": 0.44, + "learning_rate": 0.00023442818694049839, + "loss": 0.0704, "step": 67730 }, { - "epoch": 0.73, - "learning_rate": 0.00019009669673567393, - "loss": 0.0618, + "epoch": 0.44, + "learning_rate": 0.00023441850558614144, + "loss": 0.0585, "step": 67740 }, { - "epoch": 0.73, - "learning_rate": 0.00019008047245116488, - "loss": 0.045, + "epoch": 0.44, + "learning_rate": 0.00023440882423178452, + "loss": 0.0551, "step": 67750 }, { - "epoch": 0.73, - "learning_rate": 0.0001900642481666558, - "loss": 0.0433, + "epoch": 0.44, + "learning_rate": 0.0002343991428774276, + "loss": 0.0629, "step": 67760 }, { - "epoch": 0.73, - "learning_rate": 0.00019004802388214678, - "loss": 0.0477, + "epoch": 0.44, + "learning_rate": 0.00023438946152307062, + "loss": 0.0563, "step": 67770 }, { - "epoch": 0.73, - "learning_rate": 0.0001900317995976377, - "loss": 0.0456, + "epoch": 0.44, + "learning_rate": 0.0002343797801687137, + "loss": 0.0551, "step": 67780 }, { - "epoch": 0.73, - "learning_rate": 0.00019001557531312868, - "loss": 0.0514, + "epoch": 0.44, + "learning_rate": 0.00023437009881435678, + "loss": 0.0529, "step": 67790 }, { - "epoch": 0.73, - "learning_rate": 0.0001899993510286196, - "loss": 0.049, + "epoch": 0.44, + "learning_rate": 0.00023436041745999986, + "loss": 0.0505, "step": 67800 }, { - "epoch": 0.73, - "learning_rate": 0.00018998312674411058, - "loss": 0.0533, + "epoch": 0.44, + "learning_rate": 0.00023435073610564292, + "loss": 0.0555, "step": 67810 }, { - "epoch": 0.73, - "learning_rate": 0.0001899669024596015, - "loss": 0.0513, + "epoch": 0.44, + "learning_rate": 0.000234341054751286, + "loss": 0.0563, "step": 67820 }, { - "epoch": 0.73, - "learning_rate": 0.00018995067817509245, - "loss": 0.0436, + "epoch": 0.44, + "learning_rate": 0.00023433137339692908, + "loss": 0.0563, "step": 67830 }, { - "epoch": 0.73, - "learning_rate": 0.0001899344538905834, - "loss": 0.0403, + "epoch": 0.44, + "learning_rate": 0.0002343216920425721, + "loss": 0.0685, "step": 67840 }, { - "epoch": 0.73, - "learning_rate": 0.00018991822960607435, - "loss": 0.0506, + "epoch": 0.44, + "learning_rate": 0.00023431201068821518, + "loss": 0.0591, "step": 67850 }, { - "epoch": 0.73, - "learning_rate": 0.00018990200532156528, - "loss": 0.0502, + "epoch": 0.44, + "learning_rate": 0.00023430232933385826, + "loss": 0.0588, "step": 67860 }, { - "epoch": 0.73, - "learning_rate": 0.00018988578103705625, - "loss": 0.0544, + "epoch": 0.44, + "learning_rate": 0.0002342926479795013, + "loss": 0.0577, "step": 67870 }, { - "epoch": 0.73, - "learning_rate": 0.00018986955675254718, - "loss": 0.0564, + "epoch": 0.44, + "learning_rate": 0.0002342829666251444, + "loss": 0.0579, "step": 67880 }, { - "epoch": 0.73, - "learning_rate": 0.00018985333246803815, - "loss": 0.0503, + "epoch": 0.44, + "learning_rate": 0.00023427328527078747, + "loss": 0.0523, "step": 67890 }, { - "epoch": 0.73, - "learning_rate": 0.00018983710818352908, - "loss": 0.0569, + "epoch": 0.44, + "learning_rate": 0.00023426360391643055, + "loss": 0.0682, "step": 67900 }, { - "epoch": 0.73, - "learning_rate": 0.00018982088389902003, - "loss": 0.0489, + "epoch": 0.44, + "learning_rate": 0.00023425392256207358, + "loss": 0.0552, "step": 67910 }, { - "epoch": 0.73, - "learning_rate": 0.00018980465961451098, - "loss": 0.042, + "epoch": 0.44, + "learning_rate": 0.00023424424120771666, + "loss": 0.0577, "step": 67920 }, { - "epoch": 0.73, - "learning_rate": 0.00018978843533000192, - "loss": 0.0449, + "epoch": 0.44, + "learning_rate": 0.00023423455985335974, + "loss": 0.0591, "step": 67930 }, { - "epoch": 0.73, - "learning_rate": 0.00018977221104549287, - "loss": 0.0494, + "epoch": 0.44, + "learning_rate": 0.0002342248784990028, + "loss": 0.0542, "step": 67940 }, { - "epoch": 0.73, - "learning_rate": 0.00018975598676098382, - "loss": 0.0523, + "epoch": 0.44, + "learning_rate": 0.00023421519714464587, + "loss": 0.0642, "step": 67950 }, { - "epoch": 0.74, - "learning_rate": 0.00018973976247647475, - "loss": 0.0475, + "epoch": 0.44, + "learning_rate": 0.00023420551579028895, + "loss": 0.0561, "step": 67960 }, { - "epoch": 0.74, - "learning_rate": 0.00018972353819196572, - "loss": 0.0486, + "epoch": 0.44, + "learning_rate": 0.00023419583443593203, + "loss": 0.0587, "step": 67970 }, { - "epoch": 0.74, - "learning_rate": 0.00018970731390745665, - "loss": 0.0486, + "epoch": 0.44, + "learning_rate": 0.00023418615308157506, + "loss": 0.061, "step": 67980 }, { - "epoch": 0.74, - "learning_rate": 0.00018969108962294762, - "loss": 0.0418, + "epoch": 0.44, + "learning_rate": 0.00023417647172721814, + "loss": 0.0523, "step": 67990 }, { - "epoch": 0.74, - "learning_rate": 0.00018967486533843855, - "loss": 0.0502, + "epoch": 0.44, + "learning_rate": 0.00023416679037286121, + "loss": 0.0616, "step": 68000 }, { - "epoch": 0.74, - "eval_cer": 0.9211401895250565, - "eval_loss": 0.03432660922408104, - "eval_runtime": 118.9272, - "eval_samples_per_second": 16.817, - "eval_steps_per_second": 4.204, + "epoch": 0.44, + "eval_cer": 0.9200415772229127, + "eval_loss": 0.037961166352033615, + "eval_runtime": 120.0353, + "eval_samples_per_second": 16.662, + "eval_steps_per_second": 4.165, "step": 68000 }, { - "epoch": 0.74, - "learning_rate": 0.0001896586410539295, - "loss": 0.0477, + "epoch": 0.44, + "learning_rate": 0.00023415710901850427, + "loss": 0.0578, "step": 68010 }, { - "epoch": 0.74, - "learning_rate": 0.00018964241676942045, - "loss": 0.045, + "epoch": 0.44, + "learning_rate": 0.00023414742766414735, + "loss": 0.0671, "step": 68020 }, { - "epoch": 0.74, - "learning_rate": 0.0001896261924849114, - "loss": 0.0434, + "epoch": 0.44, + "learning_rate": 0.00023413774630979043, + "loss": 0.057, "step": 68030 }, { - "epoch": 0.74, - "learning_rate": 0.00018960996820040232, - "loss": 0.0407, + "epoch": 0.44, + "learning_rate": 0.00023412806495543348, + "loss": 0.0556, "step": 68040 }, { - "epoch": 0.74, - "learning_rate": 0.0001895937439158933, - "loss": 0.0439, + "epoch": 0.44, + "learning_rate": 0.00023411838360107653, + "loss": 0.0527, "step": 68050 }, { - "epoch": 0.74, - "learning_rate": 0.00018957751963138424, - "loss": 0.0474, + "epoch": 0.44, + "learning_rate": 0.0002341087022467196, + "loss": 0.0571, "step": 68060 }, { - "epoch": 0.74, - "learning_rate": 0.0001895612953468752, - "loss": 0.0401, + "epoch": 0.44, + "learning_rate": 0.00023409902089236266, + "loss": 0.0492, "step": 68070 }, { - "epoch": 0.74, - "learning_rate": 0.00018954507106236614, - "loss": 0.05, + "epoch": 0.44, + "learning_rate": 0.00023408933953800574, + "loss": 0.0555, "step": 68080 }, { - "epoch": 0.74, - "learning_rate": 0.00018952884677785707, - "loss": 0.0499, + "epoch": 0.44, + "learning_rate": 0.00023407965818364882, + "loss": 0.0581, "step": 68090 }, { - "epoch": 0.74, - "learning_rate": 0.00018951262249334804, - "loss": 0.0436, + "epoch": 0.44, + "learning_rate": 0.0002340699768292919, + "loss": 0.0528, "step": 68100 }, { - "epoch": 0.74, - "learning_rate": 0.00018949639820883897, - "loss": 0.0474, + "epoch": 0.44, + "learning_rate": 0.00023406029547493496, + "loss": 0.0589, "step": 68110 }, { - "epoch": 0.74, - "learning_rate": 0.00018948017392432994, - "loss": 0.0492, + "epoch": 0.44, + "learning_rate": 0.000234050614120578, + "loss": 0.0609, "step": 68120 }, { - "epoch": 0.74, - "learning_rate": 0.00018946394963982087, - "loss": 0.0557, + "epoch": 0.44, + "learning_rate": 0.0002340409327662211, + "loss": 0.0625, "step": 68130 }, { - "epoch": 0.74, - "learning_rate": 0.00018944772535531184, - "loss": 0.0477, + "epoch": 0.44, + "learning_rate": 0.00023403125141186414, + "loss": 0.0516, "step": 68140 }, { - "epoch": 0.74, - "learning_rate": 0.00018943150107080277, - "loss": 0.0503, + "epoch": 0.44, + "learning_rate": 0.00023402157005750722, + "loss": 0.0582, "step": 68150 }, { - "epoch": 0.74, - "learning_rate": 0.00018941527678629372, - "loss": 0.0452, + "epoch": 0.44, + "learning_rate": 0.0002340118887031503, + "loss": 0.0571, "step": 68160 }, { - "epoch": 0.74, - "learning_rate": 0.00018939905250178467, - "loss": 0.0524, + "epoch": 0.44, + "learning_rate": 0.00023400220734879338, + "loss": 0.0572, "step": 68170 }, { - "epoch": 0.74, - "learning_rate": 0.00018938282821727562, - "loss": 0.0435, + "epoch": 0.44, + "learning_rate": 0.00023399252599443643, + "loss": 0.0534, "step": 68180 }, { - "epoch": 0.74, - "learning_rate": 0.00018936660393276654, - "loss": 0.0458, + "epoch": 0.44, + "learning_rate": 0.0002339828446400795, + "loss": 0.0546, "step": 68190 }, { - "epoch": 0.74, - "learning_rate": 0.00018935037964825751, - "loss": 0.0426, + "epoch": 0.44, + "learning_rate": 0.00023397316328572257, + "loss": 0.0589, "step": 68200 }, { - "epoch": 0.74, - "learning_rate": 0.00018933415536374844, - "loss": 0.0507, + "epoch": 0.44, + "learning_rate": 0.00023396348193136562, + "loss": 0.0536, "step": 68210 }, { - "epoch": 0.74, - "learning_rate": 0.00018931793107923941, - "loss": 0.0474, + "epoch": 0.44, + "learning_rate": 0.0002339538005770087, + "loss": 0.0562, "step": 68220 }, { - "epoch": 0.74, - "learning_rate": 0.00018930170679473034, - "loss": 0.0484, + "epoch": 0.44, + "learning_rate": 0.00023394411922265178, + "loss": 0.0606, "step": 68230 }, { - "epoch": 0.74, - "learning_rate": 0.0001892854825102213, - "loss": 0.051, + "epoch": 0.44, + "learning_rate": 0.00023393443786829483, + "loss": 0.0552, "step": 68240 }, { - "epoch": 0.74, - "learning_rate": 0.00018926925822571224, - "loss": 0.0468, + "epoch": 0.44, + "learning_rate": 0.0002339247565139379, + "loss": 0.0787, "step": 68250 }, { - "epoch": 0.74, - "learning_rate": 0.00018925303394120319, - "loss": 0.0486, + "epoch": 0.44, + "learning_rate": 0.00023391507515958096, + "loss": 0.0532, "step": 68260 }, { - "epoch": 0.74, - "learning_rate": 0.0001892368096566941, - "loss": 0.0534, + "epoch": 0.44, + "learning_rate": 0.00023390539380522402, + "loss": 0.06, "step": 68270 }, { - "epoch": 0.74, - "learning_rate": 0.00018922058537218509, - "loss": 0.0482, + "epoch": 0.44, + "learning_rate": 0.0002338957124508671, + "loss": 0.0576, "step": 68280 }, { - "epoch": 0.74, - "learning_rate": 0.000189204361087676, - "loss": 0.0526, + "epoch": 0.44, + "learning_rate": 0.00023388603109651018, + "loss": 0.0572, "step": 68290 }, { - "epoch": 0.74, - "learning_rate": 0.00018918813680316699, - "loss": 0.052, + "epoch": 0.44, + "learning_rate": 0.00023387634974215326, + "loss": 0.0604, "step": 68300 }, { - "epoch": 0.74, - "learning_rate": 0.0001891719125186579, - "loss": 0.0483, + "epoch": 0.44, + "learning_rate": 0.0002338666683877963, + "loss": 0.0529, "step": 68310 }, { - "epoch": 0.74, - "learning_rate": 0.00018915568823414888, - "loss": 0.0455, + "epoch": 0.44, + "learning_rate": 0.0002338569870334394, + "loss": 0.0519, "step": 68320 }, { - "epoch": 0.74, - "learning_rate": 0.0001891394639496398, - "loss": 0.0454, + "epoch": 0.44, + "learning_rate": 0.00023384730567908244, + "loss": 0.0574, "step": 68330 }, { - "epoch": 0.74, - "learning_rate": 0.00018912323966513076, - "loss": 0.0457, + "epoch": 0.44, + "learning_rate": 0.0002338376243247255, + "loss": 0.0586, "step": 68340 }, { - "epoch": 0.74, - "learning_rate": 0.0001891070153806217, - "loss": 0.0437, + "epoch": 0.44, + "learning_rate": 0.00023382794297036857, + "loss": 0.0618, "step": 68350 }, { - "epoch": 0.74, - "learning_rate": 0.00018909079109611266, - "loss": 0.0459, + "epoch": 0.44, + "learning_rate": 0.00023381826161601165, + "loss": 0.058, "step": 68360 }, { - "epoch": 0.74, - "learning_rate": 0.00018907456681160358, - "loss": 0.0465, + "epoch": 0.44, + "learning_rate": 0.00023380858026165473, + "loss": 0.0589, "step": 68370 }, { - "epoch": 0.74, - "learning_rate": 0.00018905834252709456, + "epoch": 0.44, + "learning_rate": 0.00023379889890729779, "loss": 0.0495, "step": 68380 }, { - "epoch": 0.74, - "learning_rate": 0.00018904211824258548, - "loss": 0.053, + "epoch": 0.44, + "learning_rate": 0.00023378921755294087, + "loss": 0.0566, "step": 68390 }, { - "epoch": 0.74, - "learning_rate": 0.00018902589395807646, - "loss": 0.0506, + "epoch": 0.44, + "learning_rate": 0.00023377953619858392, + "loss": 0.0578, "step": 68400 }, { - "epoch": 0.74, - "learning_rate": 0.00018900966967356738, - "loss": 0.0592, + "epoch": 0.44, + "learning_rate": 0.00023376985484422697, + "loss": 0.0478, "step": 68410 }, { - "epoch": 0.74, - "learning_rate": 0.00018899344538905833, - "loss": 0.0518, + "epoch": 0.44, + "learning_rate": 0.00023376017348987005, + "loss": 0.0541, "step": 68420 }, { - "epoch": 0.74, - "learning_rate": 0.00018897722110454928, - "loss": 0.0518, + "epoch": 0.44, + "learning_rate": 0.00023375049213551313, + "loss": 0.0664, "step": 68430 }, { - "epoch": 0.74, - "learning_rate": 0.00018896099682004023, - "loss": 0.0524, + "epoch": 0.44, + "learning_rate": 0.00023374081078115618, + "loss": 0.058, "step": 68440 }, { - "epoch": 0.74, - "learning_rate": 0.00018894477253553115, - "loss": 0.0465, + "epoch": 0.44, + "learning_rate": 0.00023373112942679926, + "loss": 0.0531, "step": 68450 }, { - "epoch": 0.74, - "learning_rate": 0.00018892854825102213, - "loss": 0.0429, + "epoch": 0.44, + "learning_rate": 0.00023372144807244234, + "loss": 0.0541, "step": 68460 }, { - "epoch": 0.74, - "learning_rate": 0.00018891232396651305, - "loss": 0.0389, + "epoch": 0.44, + "learning_rate": 0.00023371176671808537, + "loss": 0.0587, "step": 68470 }, { - "epoch": 0.74, - "learning_rate": 0.00018889609968200403, - "loss": 0.0462, + "epoch": 0.44, + "learning_rate": 0.00023370208536372845, + "loss": 0.0557, "step": 68480 }, { - "epoch": 0.74, - "learning_rate": 0.00018887987539749495, - "loss": 0.0503, + "epoch": 0.44, + "learning_rate": 0.00023369240400937153, + "loss": 0.0504, "step": 68490 }, { - "epoch": 0.74, - "learning_rate": 0.00018886365111298593, - "loss": 0.0467, + "epoch": 0.44, + "learning_rate": 0.0002336827226550146, + "loss": 0.0594, "step": 68500 }, { - "epoch": 0.74, - "learning_rate": 0.00018884742682847685, - "loss": 0.0511, + "epoch": 0.44, + "learning_rate": 0.00023367304130065766, + "loss": 0.0472, "step": 68510 }, { - "epoch": 0.74, - "learning_rate": 0.0001888312025439678, - "loss": 0.0541, + "epoch": 0.44, + "learning_rate": 0.00023366335994630074, + "loss": 0.0519, "step": 68520 }, { - "epoch": 0.74, - "learning_rate": 0.00018881497825945875, - "loss": 0.0484, + "epoch": 0.44, + "learning_rate": 0.00023365367859194382, + "loss": 0.0583, "step": 68530 }, { - "epoch": 0.74, - "learning_rate": 0.0001887987539749497, - "loss": 0.0498, + "epoch": 0.44, + "learning_rate": 0.00023364399723758685, + "loss": 0.0664, "step": 68540 }, { - "epoch": 0.74, - "learning_rate": 0.00018878252969044062, - "loss": 0.052, + "epoch": 0.44, + "learning_rate": 0.00023363431588322993, + "loss": 0.0581, "step": 68550 }, { - "epoch": 0.74, - "learning_rate": 0.0001887663054059316, - "loss": 0.0419, + "epoch": 0.44, + "learning_rate": 0.000233624634528873, + "loss": 0.0601, "step": 68560 }, { - "epoch": 0.74, - "learning_rate": 0.00018875008112142252, - "loss": 0.0454, + "epoch": 0.44, + "learning_rate": 0.00023361495317451609, + "loss": 0.0547, "step": 68570 }, { - "epoch": 0.74, - "learning_rate": 0.0001887338568369135, - "loss": 0.0488, + "epoch": 0.44, + "learning_rate": 0.00023360527182015914, + "loss": 0.0559, "step": 68580 }, { - "epoch": 0.74, - "learning_rate": 0.00018871763255240442, - "loss": 0.053, + "epoch": 0.44, + "learning_rate": 0.00023359559046580222, + "loss": 0.0549, "step": 68590 }, { - "epoch": 0.74, - "learning_rate": 0.00018870140826789537, - "loss": 0.0446, + "epoch": 0.44, + "learning_rate": 0.0002335859091114453, + "loss": 0.0584, "step": 68600 }, { - "epoch": 0.74, - "learning_rate": 0.00018868518398338632, - "loss": 0.049, + "epoch": 0.44, + "learning_rate": 0.00023357622775708832, + "loss": 0.064, "step": 68610 }, { - "epoch": 0.74, - "learning_rate": 0.00018866895969887727, - "loss": 0.0524, + "epoch": 0.44, + "learning_rate": 0.0002335665464027314, + "loss": 0.0633, "step": 68620 }, { - "epoch": 0.74, - "learning_rate": 0.00018865273541436822, - "loss": 0.0487, + "epoch": 0.44, + "learning_rate": 0.00023355686504837448, + "loss": 0.0556, "step": 68630 }, { - "epoch": 0.74, - "learning_rate": 0.00018863651112985917, - "loss": 0.0495, + "epoch": 0.44, + "learning_rate": 0.00023354718369401754, + "loss": 0.0585, "step": 68640 }, { - "epoch": 0.74, - "learning_rate": 0.0001886202868453501, - "loss": 0.0458, + "epoch": 0.44, + "learning_rate": 0.00023353750233966062, + "loss": 0.0584, "step": 68650 }, { - "epoch": 0.74, - "learning_rate": 0.00018860406256084107, - "loss": 0.0453, + "epoch": 0.44, + "learning_rate": 0.0002335278209853037, + "loss": 0.0558, "step": 68660 }, { - "epoch": 0.74, - "learning_rate": 0.000188587838276332, - "loss": 0.0657, + "epoch": 0.44, + "learning_rate": 0.00023351813963094677, + "loss": 0.0589, "step": 68670 }, { - "epoch": 0.74, - "learning_rate": 0.00018857161399182297, - "loss": 0.0462, + "epoch": 0.44, + "learning_rate": 0.0002335084582765898, + "loss": 0.053, "step": 68680 }, { - "epoch": 0.74, - "learning_rate": 0.0001885553897073139, - "loss": 0.0471, + "epoch": 0.44, + "learning_rate": 0.00023349877692223288, + "loss": 0.0546, "step": 68690 }, { - "epoch": 0.74, - "learning_rate": 0.00018853916542280484, - "loss": 0.0522, + "epoch": 0.44, + "learning_rate": 0.00023348909556787596, + "loss": 0.0588, "step": 68700 }, { - "epoch": 0.74, - "learning_rate": 0.0001885229411382958, - "loss": 0.0456, + "epoch": 0.44, + "learning_rate": 0.000233479414213519, + "loss": 0.0498, "step": 68710 }, { - "epoch": 0.74, - "learning_rate": 0.00018850671685378674, - "loss": 0.0438, + "epoch": 0.44, + "learning_rate": 0.0002334697328591621, + "loss": 0.0538, "step": 68720 }, { - "epoch": 0.74, - "learning_rate": 0.00018849049256927766, - "loss": 0.0446, + "epoch": 0.44, + "learning_rate": 0.00023346005150480517, + "loss": 0.0679, "step": 68730 }, { - "epoch": 0.74, - "learning_rate": 0.00018847426828476864, - "loss": 0.0439, + "epoch": 0.44, + "learning_rate": 0.00023345037015044825, + "loss": 0.0512, "step": 68740 }, { - "epoch": 0.74, - "learning_rate": 0.00018845804400025956, - "loss": 0.0551, + "epoch": 0.44, + "learning_rate": 0.00023344068879609128, + "loss": 0.0504, "step": 68750 }, { - "epoch": 0.74, - "learning_rate": 0.00018844181971575054, - "loss": 0.0437, + "epoch": 0.44, + "learning_rate": 0.00023343100744173436, + "loss": 0.0545, "step": 68760 }, { - "epoch": 0.74, - "learning_rate": 0.00018842559543124146, - "loss": 0.0524, + "epoch": 0.44, + "learning_rate": 0.00023342132608737744, + "loss": 0.0549, "step": 68770 }, { - "epoch": 0.74, - "learning_rate": 0.0001884093711467324, - "loss": 0.0461, + "epoch": 0.44, + "learning_rate": 0.0002334116447330205, + "loss": 0.0555, "step": 68780 }, { - "epoch": 0.74, - "learning_rate": 0.00018839314686222336, - "loss": 0.0448, + "epoch": 0.44, + "learning_rate": 0.00023340196337866357, + "loss": 0.0544, "step": 68790 }, { - "epoch": 0.74, - "learning_rate": 0.0001883769225777143, - "loss": 0.0506, + "epoch": 0.44, + "learning_rate": 0.00023339228202430665, + "loss": 0.0503, "step": 68800 }, { - "epoch": 0.74, - "learning_rate": 0.00018836069829320526, - "loss": 0.0428, + "epoch": 0.44, + "learning_rate": 0.0002333826006699497, + "loss": 0.0496, "step": 68810 }, { - "epoch": 0.74, - "learning_rate": 0.0001883444740086962, - "loss": 0.0435, + "epoch": 0.44, + "learning_rate": 0.00023337291931559275, + "loss": 0.056, "step": 68820 }, { - "epoch": 0.74, - "learning_rate": 0.00018832824972418713, - "loss": 0.043, + "epoch": 0.44, + "learning_rate": 0.00023336323796123583, + "loss": 0.0513, "step": 68830 }, { - "epoch": 0.74, - "learning_rate": 0.0001883120254396781, - "loss": 0.0445, + "epoch": 0.44, + "learning_rate": 0.0002333535566068789, + "loss": 0.0518, "step": 68840 }, { - "epoch": 0.74, - "learning_rate": 0.00018829580115516903, - "loss": 0.0448, + "epoch": 0.44, + "learning_rate": 0.00023334387525252197, + "loss": 0.0498, "step": 68850 }, { - "epoch": 0.74, - "learning_rate": 0.00018827957687066, - "loss": 0.0486, + "epoch": 0.44, + "learning_rate": 0.00023333419389816505, + "loss": 0.057, "step": 68860 }, { - "epoch": 0.74, - "learning_rate": 0.00018826335258615093, - "loss": 0.0464, + "epoch": 0.44, + "learning_rate": 0.00023332451254380813, + "loss": 0.0604, "step": 68870 }, { - "epoch": 0.75, - "learning_rate": 0.00018824712830164188, - "loss": 0.0435, + "epoch": 0.44, + "learning_rate": 0.00023331483118945118, + "loss": 0.0599, "step": 68880 }, { - "epoch": 0.75, - "learning_rate": 0.00018823090401713283, - "loss": 0.0515, + "epoch": 0.44, + "learning_rate": 0.00023330514983509423, + "loss": 0.0609, "step": 68890 }, { - "epoch": 0.75, - "learning_rate": 0.00018821467973262378, - "loss": 0.0451, + "epoch": 0.44, + "learning_rate": 0.0002332954684807373, + "loss": 0.0557, "step": 68900 }, { - "epoch": 0.75, - "learning_rate": 0.0001881984554481147, - "loss": 0.0398, + "epoch": 0.44, + "learning_rate": 0.00023328578712638036, + "loss": 0.0592, "step": 68910 }, { - "epoch": 0.75, - "learning_rate": 0.00018818223116360568, - "loss": 0.0499, + "epoch": 0.44, + "learning_rate": 0.00023327610577202344, + "loss": 0.0638, "step": 68920 }, { - "epoch": 0.75, - "learning_rate": 0.0001881660068790966, - "loss": 0.0484, + "epoch": 0.44, + "learning_rate": 0.00023326642441766652, + "loss": 0.048, "step": 68930 }, { - "epoch": 0.75, - "learning_rate": 0.00018814978259458758, - "loss": 0.0529, + "epoch": 0.44, + "learning_rate": 0.0002332567430633096, + "loss": 0.0504, "step": 68940 }, { - "epoch": 0.75, - "learning_rate": 0.0001881335583100785, - "loss": 0.039, + "epoch": 0.45, + "learning_rate": 0.00023324706170895266, + "loss": 0.0658, "step": 68950 }, { - "epoch": 0.75, - "learning_rate": 0.00018811733402556945, - "loss": 0.0492, + "epoch": 0.45, + "learning_rate": 0.0002332373803545957, + "loss": 0.0555, "step": 68960 }, { - "epoch": 0.75, - "learning_rate": 0.0001881011097410604, - "loss": 0.0559, + "epoch": 0.45, + "learning_rate": 0.0002332276990002388, + "loss": 0.0578, "step": 68970 }, { - "epoch": 0.75, - "learning_rate": 0.00018808488545655135, - "loss": 0.042, + "epoch": 0.45, + "learning_rate": 0.00023321801764588184, + "loss": 0.0612, "step": 68980 }, { - "epoch": 0.75, - "learning_rate": 0.0001880686611720423, - "loss": 0.0579, + "epoch": 0.45, + "learning_rate": 0.00023320833629152492, + "loss": 0.0544, "step": 68990 }, { - "epoch": 0.75, - "learning_rate": 0.00018805243688753325, - "loss": 0.0434, + "epoch": 0.45, + "learning_rate": 0.000233198654937168, + "loss": 0.0666, "step": 69000 }, { - "epoch": 0.75, - "eval_cer": 0.9212638773299691, - "eval_loss": 0.03374125435948372, - "eval_runtime": 118.7625, - "eval_samples_per_second": 16.84, - "eval_steps_per_second": 4.21, + "epoch": 0.45, + "eval_cer": 0.9200650773923851, + "eval_loss": 0.03810597211122513, + "eval_runtime": 120.1331, + "eval_samples_per_second": 16.648, + "eval_steps_per_second": 4.162, "step": 69000 }, { - "epoch": 0.75, - "learning_rate": 0.00018803621260302417, - "loss": 0.05, + "epoch": 0.45, + "learning_rate": 0.00023318897358281105, + "loss": 0.0587, "step": 69010 }, { - "epoch": 0.75, - "learning_rate": 0.00018801998831851515, - "loss": 0.0521, + "epoch": 0.45, + "learning_rate": 0.00023317929222845413, + "loss": 0.0553, "step": 69020 }, { - "epoch": 0.75, - "learning_rate": 0.00018800376403400607, - "loss": 0.0574, + "epoch": 0.45, + "learning_rate": 0.0002331696108740972, + "loss": 0.0561, "step": 69030 }, { - "epoch": 0.75, - "learning_rate": 0.00018798753974949705, - "loss": 0.0475, + "epoch": 0.45, + "learning_rate": 0.00023315992951974024, + "loss": 0.0529, "step": 69040 }, { - "epoch": 0.75, - "learning_rate": 0.00018797131546498797, - "loss": 0.0437, + "epoch": 0.45, + "learning_rate": 0.00023315024816538332, + "loss": 0.0568, "step": 69050 }, { - "epoch": 0.75, - "learning_rate": 0.00018795509118047892, - "loss": 0.0513, + "epoch": 0.45, + "learning_rate": 0.0002331405668110264, + "loss": 0.0571, "step": 69060 }, { - "epoch": 0.75, - "learning_rate": 0.00018793886689596987, - "loss": 0.0499, + "epoch": 0.45, + "learning_rate": 0.00023313088545666948, + "loss": 0.0552, "step": 69070 }, { - "epoch": 0.75, - "learning_rate": 0.00018792264261146082, - "loss": 0.0464, + "epoch": 0.45, + "learning_rate": 0.00023312120410231253, + "loss": 0.0554, "step": 69080 }, { - "epoch": 0.75, - "learning_rate": 0.00018790641832695175, - "loss": 0.0505, + "epoch": 0.45, + "learning_rate": 0.0002331115227479556, + "loss": 0.0476, "step": 69090 }, { - "epoch": 0.75, - "learning_rate": 0.00018789019404244272, - "loss": 0.051, + "epoch": 0.45, + "learning_rate": 0.00023310184139359866, + "loss": 0.0468, "step": 69100 }, { - "epoch": 0.75, - "learning_rate": 0.00018787396975793365, - "loss": 0.0493, + "epoch": 0.45, + "learning_rate": 0.00023309216003924172, + "loss": 0.0556, "step": 69110 }, { - "epoch": 0.75, - "learning_rate": 0.00018785774547342462, - "loss": 0.0504, + "epoch": 0.45, + "learning_rate": 0.0002330824786848848, + "loss": 0.0542, "step": 69120 }, { - "epoch": 0.75, - "learning_rate": 0.00018784152118891555, - "loss": 0.0472, + "epoch": 0.45, + "learning_rate": 0.00023307279733052788, + "loss": 0.0551, "step": 69130 }, { - "epoch": 0.75, - "learning_rate": 0.0001878252969044065, - "loss": 0.0448, + "epoch": 0.45, + "learning_rate": 0.00023306311597617096, + "loss": 0.053, "step": 69140 }, { - "epoch": 0.75, - "learning_rate": 0.00018780907261989744, - "loss": 0.0444, + "epoch": 0.45, + "learning_rate": 0.000233053434621814, + "loss": 0.0623, "step": 69150 }, { - "epoch": 0.75, - "learning_rate": 0.0001877928483353884, - "loss": 0.0477, + "epoch": 0.45, + "learning_rate": 0.0002330437532674571, + "loss": 0.0535, "step": 69160 }, { - "epoch": 0.75, - "learning_rate": 0.00018777662405087934, - "loss": 0.045, + "epoch": 0.45, + "learning_rate": 0.00023303407191310014, + "loss": 0.0609, "step": 69170 }, { - "epoch": 0.75, - "learning_rate": 0.0001877603997663703, - "loss": 0.0505, + "epoch": 0.45, + "learning_rate": 0.0002330243905587432, + "loss": 0.0489, "step": 69180 }, { - "epoch": 0.75, - "learning_rate": 0.00018774417548186122, - "loss": 0.0487, + "epoch": 0.45, + "learning_rate": 0.00023301470920438627, + "loss": 0.0572, "step": 69190 }, { - "epoch": 0.75, - "learning_rate": 0.0001877279511973522, - "loss": 0.048, + "epoch": 0.45, + "learning_rate": 0.00023300502785002935, + "loss": 0.0567, "step": 69200 }, { - "epoch": 0.75, - "learning_rate": 0.00018771172691284312, - "loss": 0.0453, + "epoch": 0.45, + "learning_rate": 0.0002329953464956724, + "loss": 0.0587, "step": 69210 }, { - "epoch": 0.75, - "learning_rate": 0.0001876955026283341, - "loss": 0.0436, + "epoch": 0.45, + "learning_rate": 0.00023298566514131549, + "loss": 0.0486, "step": 69220 }, { - "epoch": 0.75, - "learning_rate": 0.00018767927834382502, - "loss": 0.0538, + "epoch": 0.45, + "learning_rate": 0.00023297598378695857, + "loss": 0.0524, "step": 69230 }, { - "epoch": 0.75, - "learning_rate": 0.00018766305405931597, - "loss": 0.0447, + "epoch": 0.45, + "learning_rate": 0.0002329663024326016, + "loss": 0.0528, "step": 69240 }, { - "epoch": 0.75, - "learning_rate": 0.00018764682977480692, - "loss": 0.0512, + "epoch": 0.45, + "learning_rate": 0.00023295662107824467, + "loss": 0.0525, "step": 69250 }, { - "epoch": 0.75, - "learning_rate": 0.00018763060549029787, - "loss": 0.068, + "epoch": 0.45, + "learning_rate": 0.00023294693972388775, + "loss": 0.0505, "step": 69260 }, { - "epoch": 0.75, - "learning_rate": 0.0001876143812057888, - "loss": 0.0545, + "epoch": 0.45, + "learning_rate": 0.00023293725836953083, + "loss": 0.0529, "step": 69270 }, { - "epoch": 0.75, - "learning_rate": 0.00018759815692127976, - "loss": 0.054, + "epoch": 0.45, + "learning_rate": 0.00023292757701517388, + "loss": 0.0539, "step": 69280 }, { - "epoch": 0.75, - "learning_rate": 0.0001875819326367707, - "loss": 0.0526, + "epoch": 0.45, + "learning_rate": 0.00023291789566081696, + "loss": 0.0517, "step": 69290 }, { - "epoch": 0.75, - "learning_rate": 0.00018756570835226166, - "loss": 0.0431, + "epoch": 0.45, + "learning_rate": 0.00023290821430646004, + "loss": 0.0502, "step": 69300 }, { - "epoch": 0.75, - "learning_rate": 0.0001875494840677526, - "loss": 0.0488, + "epoch": 0.45, + "learning_rate": 0.00023289853295210307, + "loss": 0.0524, "step": 69310 }, { - "epoch": 0.75, - "learning_rate": 0.00018753325978324356, - "loss": 0.0463, + "epoch": 0.45, + "learning_rate": 0.00023288885159774615, + "loss": 0.0645, "step": 69320 }, { - "epoch": 0.75, - "learning_rate": 0.00018751703549873449, - "loss": 0.0476, + "epoch": 0.45, + "learning_rate": 0.00023287917024338923, + "loss": 0.0584, "step": 69330 }, { - "epoch": 0.75, - "learning_rate": 0.00018750081121422544, - "loss": 0.0501, + "epoch": 0.45, + "learning_rate": 0.0002328694888890323, + "loss": 0.057, "step": 69340 }, { - "epoch": 0.75, - "learning_rate": 0.00018748458692971639, - "loss": 0.0455, + "epoch": 0.45, + "learning_rate": 0.00023285980753467536, + "loss": 0.063, "step": 69350 }, { - "epoch": 0.75, - "learning_rate": 0.00018746836264520734, - "loss": 0.0423, + "epoch": 0.45, + "learning_rate": 0.00023285012618031844, + "loss": 0.0464, "step": 69360 }, { - "epoch": 0.75, - "learning_rate": 0.00018745213836069826, - "loss": 0.0521, + "epoch": 0.45, + "learning_rate": 0.00023284044482596152, + "loss": 0.0527, "step": 69370 }, { - "epoch": 0.75, - "learning_rate": 0.00018743591407618924, - "loss": 0.0451, + "epoch": 0.45, + "learning_rate": 0.00023283076347160455, + "loss": 0.0547, "step": 69380 }, { - "epoch": 0.75, - "learning_rate": 0.00018741968979168016, - "loss": 0.048, + "epoch": 0.45, + "learning_rate": 0.00023282108211724763, + "loss": 0.0519, "step": 69390 }, { - "epoch": 0.75, - "learning_rate": 0.00018740346550717113, - "loss": 0.0451, + "epoch": 0.45, + "learning_rate": 0.0002328114007628907, + "loss": 0.0517, "step": 69400 }, { - "epoch": 0.75, - "learning_rate": 0.00018738724122266206, - "loss": 0.051, + "epoch": 0.45, + "learning_rate": 0.00023280171940853376, + "loss": 0.0556, "step": 69410 }, { - "epoch": 0.75, - "learning_rate": 0.000187371016938153, - "loss": 0.049, + "epoch": 0.45, + "learning_rate": 0.00023279203805417684, + "loss": 0.0553, "step": 69420 }, { - "epoch": 0.75, - "learning_rate": 0.00018735479265364396, - "loss": 0.0566, + "epoch": 0.45, + "learning_rate": 0.00023278235669981992, + "loss": 0.0545, "step": 69430 }, { - "epoch": 0.75, - "learning_rate": 0.0001873385683691349, - "loss": 0.0455, + "epoch": 0.45, + "learning_rate": 0.000232772675345463, + "loss": 0.0557, "step": 69440 }, { - "epoch": 0.75, - "learning_rate": 0.00018732234408462583, - "loss": 0.0447, + "epoch": 0.45, + "learning_rate": 0.00023276299399110602, + "loss": 0.0585, "step": 69450 }, { - "epoch": 0.75, - "learning_rate": 0.0001873061198001168, - "loss": 0.0505, + "epoch": 0.45, + "learning_rate": 0.0002327533126367491, + "loss": 0.0521, "step": 69460 }, { - "epoch": 0.75, - "learning_rate": 0.00018728989551560773, - "loss": 0.0471, + "epoch": 0.45, + "learning_rate": 0.00023274363128239218, + "loss": 0.0526, "step": 69470 }, { - "epoch": 0.75, - "learning_rate": 0.0001872736712310987, - "loss": 0.0537, + "epoch": 0.45, + "learning_rate": 0.00023273394992803524, + "loss": 0.0474, "step": 69480 }, { - "epoch": 0.75, - "learning_rate": 0.00018725744694658963, - "loss": 0.0546, + "epoch": 0.45, + "learning_rate": 0.00023272426857367831, + "loss": 0.0556, "step": 69490 }, { - "epoch": 0.75, - "learning_rate": 0.0001872412226620806, - "loss": 0.0472, + "epoch": 0.45, + "learning_rate": 0.0002327145872193214, + "loss": 0.0562, "step": 69500 }, { - "epoch": 0.75, - "learning_rate": 0.00018722499837757153, - "loss": 0.0481, + "epoch": 0.45, + "learning_rate": 0.00023270490586496447, + "loss": 0.0521, "step": 69510 }, { - "epoch": 0.75, - "learning_rate": 0.00018720877409306248, - "loss": 0.0455, + "epoch": 0.45, + "learning_rate": 0.0002326952245106075, + "loss": 0.055, "step": 69520 }, { - "epoch": 0.75, - "learning_rate": 0.00018719254980855343, - "loss": 0.0566, + "epoch": 0.45, + "learning_rate": 0.00023268554315625058, + "loss": 0.0512, "step": 69530 }, { - "epoch": 0.75, - "learning_rate": 0.00018717632552404438, - "loss": 0.0476, + "epoch": 0.45, + "learning_rate": 0.00023267586180189366, + "loss": 0.0538, "step": 69540 }, { - "epoch": 0.75, - "learning_rate": 0.0001871601012395353, - "loss": 0.0599, + "epoch": 0.45, + "learning_rate": 0.0002326661804475367, + "loss": 0.0614, "step": 69550 }, { - "epoch": 0.75, - "learning_rate": 0.00018714387695502628, - "loss": 0.0513, + "epoch": 0.45, + "learning_rate": 0.0002326564990931798, + "loss": 0.0563, "step": 69560 }, { - "epoch": 0.75, - "learning_rate": 0.0001871276526705172, - "loss": 0.0498, + "epoch": 0.45, + "learning_rate": 0.00023264681773882287, + "loss": 0.0509, "step": 69570 }, { - "epoch": 0.75, - "learning_rate": 0.00018711142838600818, - "loss": 0.0426, + "epoch": 0.45, + "learning_rate": 0.00023263713638446595, + "loss": 0.0632, "step": 69580 }, { - "epoch": 0.75, - "learning_rate": 0.0001870952041014991, - "loss": 0.0432, + "epoch": 0.45, + "learning_rate": 0.00023262745503010898, + "loss": 0.0522, "step": 69590 }, { - "epoch": 0.75, - "learning_rate": 0.00018707897981699005, - "loss": 0.0497, + "epoch": 0.45, + "learning_rate": 0.00023261777367575206, + "loss": 0.0613, "step": 69600 }, { - "epoch": 0.75, - "learning_rate": 0.000187062755532481, - "loss": 0.0442, + "epoch": 0.45, + "learning_rate": 0.0002326080923213951, + "loss": 0.0475, "step": 69610 }, { - "epoch": 0.75, - "learning_rate": 0.00018704653124797195, - "loss": 0.0524, + "epoch": 0.45, + "learning_rate": 0.0002325984109670382, + "loss": 0.0511, "step": 69620 }, { - "epoch": 0.75, - "learning_rate": 0.00018703030696346287, - "loss": 0.048, + "epoch": 0.45, + "learning_rate": 0.00023258872961268127, + "loss": 0.0527, "step": 69630 }, { - "epoch": 0.75, - "learning_rate": 0.00018701408267895385, - "loss": 0.0435, + "epoch": 0.45, + "learning_rate": 0.00023257904825832435, + "loss": 0.0522, "step": 69640 }, { - "epoch": 0.75, - "learning_rate": 0.00018699785839444477, - "loss": 0.048, + "epoch": 0.45, + "learning_rate": 0.0002325693669039674, + "loss": 0.0541, "step": 69650 }, { - "epoch": 0.75, - "learning_rate": 0.00018698163410993575, - "loss": 0.052, + "epoch": 0.45, + "learning_rate": 0.00023255968554961045, + "loss": 0.0592, "step": 69660 }, { - "epoch": 0.75, - "learning_rate": 0.00018696540982542667, - "loss": 0.0584, + "epoch": 0.45, + "learning_rate": 0.00023255000419525353, + "loss": 0.0566, "step": 69670 }, { - "epoch": 0.75, - "learning_rate": 0.00018694918554091765, - "loss": 0.058, + "epoch": 0.45, + "learning_rate": 0.0002325403228408966, + "loss": 0.0523, "step": 69680 }, { - "epoch": 0.75, - "learning_rate": 0.00018693296125640857, - "loss": 0.0532, + "epoch": 0.45, + "learning_rate": 0.00023253064148653967, + "loss": 0.0487, "step": 69690 }, { - "epoch": 0.75, - "learning_rate": 0.00018691673697189952, - "loss": 0.0519, + "epoch": 0.45, + "learning_rate": 0.00023252096013218275, + "loss": 0.0548, "step": 69700 }, { - "epoch": 0.75, - "learning_rate": 0.00018690051268739047, - "loss": 0.0396, + "epoch": 0.45, + "learning_rate": 0.00023251127877782583, + "loss": 0.0527, "step": 69710 }, { - "epoch": 0.75, - "learning_rate": 0.00018688428840288142, - "loss": 0.0454, + "epoch": 0.45, + "learning_rate": 0.00023250159742346888, + "loss": 0.0542, "step": 69720 }, { - "epoch": 0.75, - "learning_rate": 0.00018686806411837234, - "loss": 0.044, + "epoch": 0.45, + "learning_rate": 0.00023249191606911193, + "loss": 0.0548, "step": 69730 }, { - "epoch": 0.75, - "learning_rate": 0.00018685183983386332, - "loss": 0.0452, + "epoch": 0.45, + "learning_rate": 0.000232482234714755, + "loss": 0.0534, "step": 69740 }, { - "epoch": 0.75, - "learning_rate": 0.00018683561554935424, - "loss": 0.0437, + "epoch": 0.45, + "learning_rate": 0.00023247255336039806, + "loss": 0.0528, "step": 69750 }, { - "epoch": 0.75, - "learning_rate": 0.00018681939126484522, - "loss": 0.0532, + "epoch": 0.45, + "learning_rate": 0.00023246287200604114, + "loss": 0.059, "step": 69760 }, { - "epoch": 0.75, - "learning_rate": 0.00018680316698033614, - "loss": 0.0448, + "epoch": 0.45, + "learning_rate": 0.00023245319065168422, + "loss": 0.0542, "step": 69770 }, { - "epoch": 0.75, - "learning_rate": 0.0001867869426958271, - "loss": 0.0521, + "epoch": 0.45, + "learning_rate": 0.0002324435092973273, + "loss": 0.055, "step": 69780 }, { - "epoch": 0.75, - "learning_rate": 0.00018677071841131804, - "loss": 0.0468, + "epoch": 0.45, + "learning_rate": 0.00023243382794297036, + "loss": 0.0507, "step": 69790 }, { - "epoch": 0.75, - "learning_rate": 0.000186754494126809, - "loss": 0.0469, + "epoch": 0.45, + "learning_rate": 0.0002324241465886134, + "loss": 0.0558, "step": 69800 }, { - "epoch": 0.76, - "learning_rate": 0.0001867382698422999, - "loss": 0.0484, + "epoch": 0.45, + "learning_rate": 0.00023241446523425646, + "loss": 0.0589, "step": 69810 }, { - "epoch": 0.76, - "learning_rate": 0.0001867220455577909, - "loss": 0.0527, + "epoch": 0.45, + "learning_rate": 0.00023240478387989954, + "loss": 0.0519, "step": 69820 }, { - "epoch": 0.76, - "learning_rate": 0.0001867058212732818, - "loss": 0.0493, + "epoch": 0.45, + "learning_rate": 0.00023239510252554262, + "loss": 0.0562, "step": 69830 }, { - "epoch": 0.76, - "learning_rate": 0.0001866895969887728, - "loss": 0.0478, + "epoch": 0.45, + "learning_rate": 0.0002323854211711857, + "loss": 0.0522, "step": 69840 }, { - "epoch": 0.76, - "learning_rate": 0.0001866733727042637, - "loss": 0.0534, + "epoch": 0.45, + "learning_rate": 0.00023237573981682875, + "loss": 0.0621, "step": 69850 }, { - "epoch": 0.76, - "learning_rate": 0.0001866571484197547, - "loss": 0.0538, + "epoch": 0.45, + "learning_rate": 0.00023236605846247183, + "loss": 0.0582, "step": 69860 }, { - "epoch": 0.76, - "learning_rate": 0.0001866409241352456, - "loss": 0.0436, + "epoch": 0.45, + "learning_rate": 0.00023235637710811489, + "loss": 0.0545, "step": 69870 }, { - "epoch": 0.76, - "learning_rate": 0.00018662469985073656, - "loss": 0.0535, + "epoch": 0.45, + "learning_rate": 0.00023234669575375794, + "loss": 0.0558, "step": 69880 }, { - "epoch": 0.76, - "learning_rate": 0.0001866084755662275, - "loss": 0.0449, + "epoch": 0.45, + "learning_rate": 0.00023233701439940102, + "loss": 0.0557, "step": 69890 }, { - "epoch": 0.76, - "learning_rate": 0.00018659225128171846, - "loss": 0.0453, + "epoch": 0.45, + "learning_rate": 0.0002323273330450441, + "loss": 0.0543, "step": 69900 }, { - "epoch": 0.76, - "learning_rate": 0.00018657602699720938, - "loss": 0.0553, + "epoch": 0.45, + "learning_rate": 0.00023231765169068718, + "loss": 0.0531, "step": 69910 }, { - "epoch": 0.76, - "learning_rate": 0.00018655980271270036, - "loss": 0.0504, + "epoch": 0.45, + "learning_rate": 0.00023230797033633023, + "loss": 0.0497, "step": 69920 }, { - "epoch": 0.76, - "learning_rate": 0.00018654357842819128, - "loss": 0.0534, + "epoch": 0.45, + "learning_rate": 0.0002322982889819733, + "loss": 0.055, "step": 69930 }, { - "epoch": 0.76, - "learning_rate": 0.00018652735414368226, - "loss": 0.0421, + "epoch": 0.45, + "learning_rate": 0.00023228860762761636, + "loss": 0.0605, "step": 69940 }, { - "epoch": 0.76, - "learning_rate": 0.00018651112985917318, - "loss": 0.0481, + "epoch": 0.45, + "learning_rate": 0.00023227892627325942, + "loss": 0.0501, "step": 69950 }, { - "epoch": 0.76, - "learning_rate": 0.00018649490557466413, - "loss": 0.049, + "epoch": 0.45, + "learning_rate": 0.0002322692449189025, + "loss": 0.0527, "step": 69960 }, { - "epoch": 0.76, - "learning_rate": 0.00018647868129015508, - "loss": 0.0509, + "epoch": 0.45, + "learning_rate": 0.00023225956356454558, + "loss": 0.0534, "step": 69970 }, { - "epoch": 0.76, - "learning_rate": 0.00018646245700564603, - "loss": 0.0492, + "epoch": 0.45, + "learning_rate": 0.00023224988221018866, + "loss": 0.0583, "step": 69980 }, { - "epoch": 0.76, - "learning_rate": 0.00018644623272113695, - "loss": 0.0577, + "epoch": 0.45, + "learning_rate": 0.0002322402008558317, + "loss": 0.0585, "step": 69990 }, { - "epoch": 0.76, - "learning_rate": 0.00018643000843662793, - "loss": 0.0579, + "epoch": 0.45, + "learning_rate": 0.0002322305195014748, + "loss": 0.052, "step": 70000 }, { - "epoch": 0.76, - "eval_cer": 0.9213389734972374, - "eval_loss": 0.0336674340069294, - "eval_runtime": 118.719, - "eval_samples_per_second": 16.847, - "eval_steps_per_second": 4.212, + "epoch": 0.45, + "eval_cer": 0.9199529996610553, + "eval_loss": 0.037266287952661514, + "eval_runtime": 120.2383, + "eval_samples_per_second": 16.634, + "eval_steps_per_second": 4.158, "step": 70000 }, { - "epoch": 0.76, - "learning_rate": 0.00018641378415211885, - "loss": 0.0501, + "epoch": 0.45, + "learning_rate": 0.0002322208381471178, + "loss": 0.0492, "step": 70010 }, { - "epoch": 0.76, - "learning_rate": 0.00018639755986760983, - "loss": 0.052, + "epoch": 0.45, + "learning_rate": 0.0002322111567927609, + "loss": 0.0508, "step": 70020 }, { - "epoch": 0.76, - "learning_rate": 0.00018638133558310075, - "loss": 0.0421, + "epoch": 0.45, + "learning_rate": 0.00023220147543840397, + "loss": 0.0482, "step": 70030 }, { - "epoch": 0.76, - "learning_rate": 0.00018636511129859173, - "loss": 0.045, + "epoch": 0.45, + "learning_rate": 0.00023219179408404705, + "loss": 0.0495, "step": 70040 }, { - "epoch": 0.76, - "learning_rate": 0.00018634888701408265, - "loss": 0.0454, + "epoch": 0.45, + "learning_rate": 0.0002321821127296901, + "loss": 0.0539, "step": 70050 }, { - "epoch": 0.76, - "learning_rate": 0.0001863326627295736, - "loss": 0.0442, + "epoch": 0.45, + "learning_rate": 0.00023217243137533319, + "loss": 0.0576, "step": 70060 }, { - "epoch": 0.76, - "learning_rate": 0.00018631643844506455, - "loss": 0.0443, + "epoch": 0.45, + "learning_rate": 0.00023216275002097627, + "loss": 0.0543, "step": 70070 }, { - "epoch": 0.76, - "learning_rate": 0.0001863002141605555, - "loss": 0.0482, + "epoch": 0.45, + "learning_rate": 0.0002321530686666193, + "loss": 0.0547, "step": 70080 }, { - "epoch": 0.76, - "learning_rate": 0.00018628398987604642, - "loss": 0.0483, + "epoch": 0.45, + "learning_rate": 0.00023214338731226237, + "loss": 0.0538, "step": 70090 }, { - "epoch": 0.76, - "learning_rate": 0.0001862677655915374, - "loss": 0.0491, + "epoch": 0.45, + "learning_rate": 0.00023213370595790545, + "loss": 0.0468, "step": 70100 }, { - "epoch": 0.76, - "learning_rate": 0.00018625154130702832, - "loss": 0.0457, + "epoch": 0.45, + "learning_rate": 0.00023212402460354853, + "loss": 0.0541, "step": 70110 }, { - "epoch": 0.76, - "learning_rate": 0.0001862353170225193, - "loss": 0.0394, + "epoch": 0.45, + "learning_rate": 0.00023211434324919158, + "loss": 0.0588, "step": 70120 }, { - "epoch": 0.76, - "learning_rate": 0.00018621909273801022, - "loss": 0.0502, + "epoch": 0.45, + "learning_rate": 0.00023210466189483466, + "loss": 0.0555, "step": 70130 }, { - "epoch": 0.76, - "learning_rate": 0.00018620286845350117, - "loss": 0.0398, + "epoch": 0.45, + "learning_rate": 0.00023209498054047774, + "loss": 0.0523, "step": 70140 }, { - "epoch": 0.76, - "learning_rate": 0.00018618664416899212, - "loss": 0.0505, + "epoch": 0.45, + "learning_rate": 0.00023208529918612077, + "loss": 0.0496, "step": 70150 }, { - "epoch": 0.76, - "learning_rate": 0.00018617041988448307, - "loss": 0.0535, + "epoch": 0.45, + "learning_rate": 0.00023207561783176385, + "loss": 0.0699, "step": 70160 }, { - "epoch": 0.76, - "learning_rate": 0.00018615419559997402, - "loss": 0.0575, + "epoch": 0.45, + "learning_rate": 0.00023206593647740693, + "loss": 0.0536, "step": 70170 }, { - "epoch": 0.76, - "learning_rate": 0.00018613797131546497, - "loss": 0.0508, + "epoch": 0.45, + "learning_rate": 0.00023205625512305, + "loss": 0.0567, "step": 70180 }, { - "epoch": 0.76, - "learning_rate": 0.0001861217470309559, - "loss": 0.0535, + "epoch": 0.45, + "learning_rate": 0.00023204657376869306, + "loss": 0.0514, "step": 70190 }, { - "epoch": 0.76, - "learning_rate": 0.00018610552274644687, - "loss": 0.0457, + "epoch": 0.45, + "learning_rate": 0.00023203689241433614, + "loss": 0.0629, "step": 70200 }, { - "epoch": 0.76, - "learning_rate": 0.0001860892984619378, - "loss": 0.0471, + "epoch": 0.45, + "learning_rate": 0.00023202721105997922, + "loss": 0.0614, "step": 70210 }, { - "epoch": 0.76, - "learning_rate": 0.00018607307417742877, - "loss": 0.0505, + "epoch": 0.45, + "learning_rate": 0.00023201752970562225, + "loss": 0.0562, "step": 70220 }, { - "epoch": 0.76, - "learning_rate": 0.0001860568498929197, - "loss": 0.047, + "epoch": 0.45, + "learning_rate": 0.00023200784835126533, + "loss": 0.0663, "step": 70230 }, { - "epoch": 0.76, - "learning_rate": 0.00018604062560841064, - "loss": 0.0497, + "epoch": 0.45, + "learning_rate": 0.0002319981669969084, + "loss": 0.0492, "step": 70240 }, { - "epoch": 0.76, - "learning_rate": 0.0001860244013239016, - "loss": 0.0497, + "epoch": 0.45, + "learning_rate": 0.00023198848564255146, + "loss": 0.0512, "step": 70250 }, { - "epoch": 0.76, - "learning_rate": 0.00018600817703939254, - "loss": 0.049, + "epoch": 0.45, + "learning_rate": 0.00023197880428819454, + "loss": 0.0486, "step": 70260 }, { - "epoch": 0.76, - "learning_rate": 0.00018599195275488347, - "loss": 0.0473, + "epoch": 0.45, + "learning_rate": 0.00023196912293383762, + "loss": 0.0493, "step": 70270 }, { - "epoch": 0.76, - "learning_rate": 0.00018597572847037444, - "loss": 0.0501, + "epoch": 0.45, + "learning_rate": 0.0002319594415794807, + "loss": 0.0683, "step": 70280 }, { - "epoch": 0.76, - "learning_rate": 0.00018595950418586537, - "loss": 0.0445, + "epoch": 0.45, + "learning_rate": 0.00023194976022512372, + "loss": 0.0629, "step": 70290 }, { - "epoch": 0.76, - "learning_rate": 0.00018594327990135634, - "loss": 0.0498, + "epoch": 0.45, + "learning_rate": 0.0002319400788707668, + "loss": 0.06, "step": 70300 }, { - "epoch": 0.76, - "learning_rate": 0.00018592705561684727, - "loss": 0.0567, + "epoch": 0.45, + "learning_rate": 0.00023193039751640988, + "loss": 0.0525, "step": 70310 }, { - "epoch": 0.76, - "learning_rate": 0.00018591083133233822, - "loss": 0.0501, + "epoch": 0.45, + "learning_rate": 0.00023192071616205293, + "loss": 0.0519, "step": 70320 }, { - "epoch": 0.76, - "learning_rate": 0.00018589460704782917, - "loss": 0.0512, + "epoch": 0.45, + "learning_rate": 0.00023191103480769601, + "loss": 0.0614, "step": 70330 }, { - "epoch": 0.76, - "learning_rate": 0.00018587838276332011, - "loss": 0.0493, + "epoch": 0.45, + "learning_rate": 0.0002319013534533391, + "loss": 0.0594, "step": 70340 }, { - "epoch": 0.76, - "learning_rate": 0.00018586215847881106, - "loss": 0.0483, + "epoch": 0.45, + "learning_rate": 0.00023189167209898217, + "loss": 0.0639, "step": 70350 }, { - "epoch": 0.76, - "learning_rate": 0.00018584593419430201, - "loss": 0.0426, + "epoch": 0.45, + "learning_rate": 0.0002318819907446252, + "loss": 0.0596, "step": 70360 }, { - "epoch": 0.76, - "learning_rate": 0.00018582970990979294, - "loss": 0.0548, + "epoch": 0.45, + "learning_rate": 0.00023187230939026828, + "loss": 0.0493, "step": 70370 }, { - "epoch": 0.76, - "learning_rate": 0.00018581348562528391, - "loss": 0.0434, + "epoch": 0.45, + "learning_rate": 0.00023186262803591136, + "loss": 0.0553, "step": 70380 }, { - "epoch": 0.76, - "learning_rate": 0.00018579726134077484, - "loss": 0.0447, + "epoch": 0.45, + "learning_rate": 0.0002318529466815544, + "loss": 0.0621, "step": 70390 }, { - "epoch": 0.76, - "learning_rate": 0.00018578103705626581, - "loss": 0.0442, + "epoch": 0.45, + "learning_rate": 0.0002318432653271975, + "loss": 0.0534, "step": 70400 }, { - "epoch": 0.76, - "learning_rate": 0.00018576481277175676, - "loss": 0.046, + "epoch": 0.45, + "learning_rate": 0.00023183358397284057, + "loss": 0.0555, "step": 70410 }, { - "epoch": 0.76, - "learning_rate": 0.00018574858848724769, - "loss": 0.0485, + "epoch": 0.45, + "learning_rate": 0.00023182390261848362, + "loss": 0.0483, "step": 70420 }, { - "epoch": 0.76, - "learning_rate": 0.00018573236420273866, - "loss": 0.0465, + "epoch": 0.45, + "learning_rate": 0.00023181422126412668, + "loss": 0.0574, "step": 70430 }, { - "epoch": 0.76, - "learning_rate": 0.00018571613991822959, - "loss": 0.0474, + "epoch": 0.45, + "learning_rate": 0.00023180453990976976, + "loss": 0.0544, "step": 70440 }, { - "epoch": 0.76, - "learning_rate": 0.00018569991563372056, - "loss": 0.0545, + "epoch": 0.45, + "learning_rate": 0.0002317948585554128, + "loss": 0.0555, "step": 70450 }, { - "epoch": 0.76, - "learning_rate": 0.00018568369134921149, - "loss": 0.0481, + "epoch": 0.45, + "learning_rate": 0.0002317851772010559, + "loss": 0.0575, "step": 70460 }, { - "epoch": 0.76, - "learning_rate": 0.00018566746706470243, - "loss": 0.0515, + "epoch": 0.45, + "learning_rate": 0.00023177549584669897, + "loss": 0.0509, "step": 70470 }, { - "epoch": 0.76, - "learning_rate": 0.00018565124278019338, - "loss": 0.0468, + "epoch": 0.45, + "learning_rate": 0.00023176581449234205, + "loss": 0.0494, "step": 70480 }, { - "epoch": 0.76, - "learning_rate": 0.00018563501849568433, - "loss": 0.0446, + "epoch": 0.45, + "learning_rate": 0.0002317561331379851, + "loss": 0.0535, "step": 70490 }, { - "epoch": 0.76, - "learning_rate": 0.00018561879421117526, - "loss": 0.043, + "epoch": 0.46, + "learning_rate": 0.00023174645178362815, + "loss": 0.059, "step": 70500 }, { - "epoch": 0.76, - "learning_rate": 0.00018560256992666623, - "loss": 0.047, + "epoch": 0.46, + "learning_rate": 0.00023173677042927123, + "loss": 0.0531, "step": 70510 }, { - "epoch": 0.76, - "learning_rate": 0.00018558634564215716, - "loss": 0.0503, + "epoch": 0.46, + "learning_rate": 0.0002317270890749143, + "loss": 0.0565, "step": 70520 }, { - "epoch": 0.76, - "learning_rate": 0.00018557012135764813, - "loss": 0.0515, + "epoch": 0.46, + "learning_rate": 0.00023171740772055737, + "loss": 0.0548, "step": 70530 }, { - "epoch": 0.76, - "learning_rate": 0.00018555389707313906, - "loss": 0.0415, + "epoch": 0.46, + "learning_rate": 0.00023170772636620045, + "loss": 0.0536, "step": 70540 }, { - "epoch": 0.76, - "learning_rate": 0.00018553767278863003, - "loss": 0.0429, + "epoch": 0.46, + "learning_rate": 0.00023169804501184353, + "loss": 0.0574, "step": 70550 }, { - "epoch": 0.76, - "learning_rate": 0.00018552144850412096, - "loss": 0.0494, + "epoch": 0.46, + "learning_rate": 0.00023168836365748658, + "loss": 0.062, "step": 70560 }, { - "epoch": 0.76, - "learning_rate": 0.0001855052242196119, - "loss": 0.0553, + "epoch": 0.46, + "learning_rate": 0.00023167868230312963, + "loss": 0.0518, "step": 70570 }, { - "epoch": 0.76, - "learning_rate": 0.00018548899993510286, - "loss": 0.045, + "epoch": 0.46, + "learning_rate": 0.0002316690009487727, + "loss": 0.0581, "step": 70580 }, { - "epoch": 0.76, - "learning_rate": 0.0001854727756505938, - "loss": 0.0469, + "epoch": 0.46, + "learning_rate": 0.00023165931959441576, + "loss": 0.0618, "step": 70590 }, { - "epoch": 0.76, - "learning_rate": 0.00018545655136608473, - "loss": 0.0406, + "epoch": 0.46, + "learning_rate": 0.00023164963824005884, + "loss": 0.0569, "step": 70600 }, { - "epoch": 0.76, - "learning_rate": 0.0001854403270815757, - "loss": 0.0473, + "epoch": 0.46, + "learning_rate": 0.00023163995688570192, + "loss": 0.0578, "step": 70610 }, { - "epoch": 0.76, - "learning_rate": 0.00018542410279706663, - "loss": 0.049, + "epoch": 0.46, + "learning_rate": 0.00023163027553134498, + "loss": 0.0548, "step": 70620 }, { - "epoch": 0.76, - "learning_rate": 0.0001854078785125576, - "loss": 0.0473, + "epoch": 0.46, + "learning_rate": 0.00023162059417698806, + "loss": 0.0598, "step": 70630 }, { - "epoch": 0.76, - "learning_rate": 0.00018539165422804853, - "loss": 0.0441, - "step": 70640 + "epoch": 0.46, + "learning_rate": 0.0002316109128226311, + "loss": 0.0625, + "step": 70640 }, { - "epoch": 0.76, - "learning_rate": 0.00018537542994353948, - "loss": 0.0428, + "epoch": 0.46, + "learning_rate": 0.00023160123146827416, + "loss": 0.0569, "step": 70650 }, { - "epoch": 0.76, - "learning_rate": 0.00018535920565903043, - "loss": 0.0516, + "epoch": 0.46, + "learning_rate": 0.00023159155011391724, + "loss": 0.056, "step": 70660 }, { - "epoch": 0.76, - "learning_rate": 0.00018534298137452138, - "loss": 0.0446, + "epoch": 0.46, + "learning_rate": 0.00023158186875956032, + "loss": 0.0521, "step": 70670 }, { - "epoch": 0.76, - "learning_rate": 0.0001853267570900123, - "loss": 0.0478, + "epoch": 0.46, + "learning_rate": 0.0002315721874052034, + "loss": 0.0539, "step": 70680 }, { - "epoch": 0.76, - "learning_rate": 0.00018531053280550328, - "loss": 0.0455, + "epoch": 0.46, + "learning_rate": 0.00023156250605084645, + "loss": 0.0592, "step": 70690 }, { - "epoch": 0.76, - "learning_rate": 0.0001852943085209942, - "loss": 0.0446, + "epoch": 0.46, + "learning_rate": 0.00023155282469648953, + "loss": 0.0578, "step": 70700 }, { - "epoch": 0.76, - "learning_rate": 0.00018527808423648518, - "loss": 0.0438, + "epoch": 0.46, + "learning_rate": 0.00023154314334213259, + "loss": 0.0508, "step": 70710 }, { - "epoch": 0.76, - "learning_rate": 0.0001852618599519761, - "loss": 0.0585, + "epoch": 0.46, + "learning_rate": 0.00023153346198777564, + "loss": 0.0524, "step": 70720 }, { - "epoch": 0.77, - "learning_rate": 0.00018524563566746707, - "loss": 0.0436, + "epoch": 0.46, + "learning_rate": 0.00023152378063341872, + "loss": 0.0581, "step": 70730 }, { - "epoch": 0.77, - "learning_rate": 0.000185229411382958, - "loss": 0.0513, + "epoch": 0.46, + "learning_rate": 0.0002315140992790618, + "loss": 0.0559, "step": 70740 }, { - "epoch": 0.77, - "learning_rate": 0.00018521318709844895, - "loss": 0.0388, + "epoch": 0.46, + "learning_rate": 0.00023150441792470488, + "loss": 0.0527, "step": 70750 }, { - "epoch": 0.77, - "learning_rate": 0.0001851969628139399, - "loss": 0.0496, + "epoch": 0.46, + "learning_rate": 0.00023149473657034793, + "loss": 0.0537, "step": 70760 }, { - "epoch": 0.77, - "learning_rate": 0.00018518073852943085, - "loss": 0.0476, + "epoch": 0.46, + "learning_rate": 0.000231485055215991, + "loss": 0.0579, "step": 70770 }, { - "epoch": 0.77, - "learning_rate": 0.00018516451424492177, - "loss": 0.0479, + "epoch": 0.46, + "learning_rate": 0.00023147537386163406, + "loss": 0.0567, "step": 70780 }, { - "epoch": 0.77, - "learning_rate": 0.00018514828996041275, - "loss": 0.0538, + "epoch": 0.46, + "learning_rate": 0.00023146569250727712, + "loss": 0.0496, "step": 70790 }, { - "epoch": 0.77, - "learning_rate": 0.00018513206567590367, - "loss": 0.0448, + "epoch": 0.46, + "learning_rate": 0.0002314560111529202, + "loss": 0.0587, "step": 70800 }, { - "epoch": 0.77, - "learning_rate": 0.00018511584139139465, - "loss": 0.0422, + "epoch": 0.46, + "learning_rate": 0.00023144632979856328, + "loss": 0.0591, "step": 70810 }, { - "epoch": 0.77, - "learning_rate": 0.00018509961710688557, - "loss": 0.0539, + "epoch": 0.46, + "learning_rate": 0.00023143664844420633, + "loss": 0.0609, "step": 70820 }, { - "epoch": 0.77, - "learning_rate": 0.00018508339282237652, - "loss": 0.0444, + "epoch": 0.46, + "learning_rate": 0.0002314269670898494, + "loss": 0.0551, "step": 70830 }, { - "epoch": 0.77, - "learning_rate": 0.00018506716853786747, - "loss": 0.0478, + "epoch": 0.46, + "learning_rate": 0.0002314172857354925, + "loss": 0.0588, "step": 70840 }, { - "epoch": 0.77, - "learning_rate": 0.00018505094425335842, - "loss": 0.0427, + "epoch": 0.46, + "learning_rate": 0.0002314076043811355, + "loss": 0.0639, "step": 70850 }, { - "epoch": 0.77, - "learning_rate": 0.00018503471996884937, - "loss": 0.0508, + "epoch": 0.46, + "learning_rate": 0.0002313979230267786, + "loss": 0.0553, "step": 70860 }, { - "epoch": 0.77, - "learning_rate": 0.00018501849568434032, - "loss": 0.0468, + "epoch": 0.46, + "learning_rate": 0.00023138824167242167, + "loss": 0.0557, "step": 70870 }, { - "epoch": 0.77, - "learning_rate": 0.00018500227139983124, - "loss": 0.0409, + "epoch": 0.46, + "learning_rate": 0.00023137856031806475, + "loss": 0.0518, "step": 70880 }, { - "epoch": 0.77, - "learning_rate": 0.00018498604711532222, - "loss": 0.0551, + "epoch": 0.46, + "learning_rate": 0.0002313688789637078, + "loss": 0.0498, "step": 70890 }, { - "epoch": 0.77, - "learning_rate": 0.00018496982283081314, - "loss": 0.0497, + "epoch": 0.46, + "learning_rate": 0.00023135919760935089, + "loss": 0.0614, "step": 70900 }, { - "epoch": 0.77, - "learning_rate": 0.00018495359854630412, - "loss": 0.0514, + "epoch": 0.46, + "learning_rate": 0.00023134951625499396, + "loss": 0.0505, "step": 70910 }, { - "epoch": 0.77, - "learning_rate": 0.00018493737426179504, - "loss": 0.0441, + "epoch": 0.46, + "learning_rate": 0.000231339834900637, + "loss": 0.052, "step": 70920 }, { - "epoch": 0.77, - "learning_rate": 0.000184921149977286, - "loss": 0.0475, + "epoch": 0.46, + "learning_rate": 0.00023133015354628007, + "loss": 0.1046, "step": 70930 }, { - "epoch": 0.77, - "learning_rate": 0.00018490492569277694, - "loss": 0.0418, + "epoch": 0.46, + "learning_rate": 0.00023132047219192315, + "loss": 0.0848, "step": 70940 }, { - "epoch": 0.77, - "learning_rate": 0.0001848887014082679, - "loss": 0.049, + "epoch": 0.46, + "learning_rate": 0.00023131079083756623, + "loss": 0.0537, "step": 70950 }, { - "epoch": 0.77, - "learning_rate": 0.0001848724771237588, - "loss": 0.055, + "epoch": 0.46, + "learning_rate": 0.00023130110948320928, + "loss": 0.05, "step": 70960 }, { - "epoch": 0.77, - "learning_rate": 0.0001848562528392498, - "loss": 0.0494, + "epoch": 0.46, + "learning_rate": 0.00023129142812885236, + "loss": 0.0569, "step": 70970 }, { - "epoch": 0.77, - "learning_rate": 0.0001848400285547407, - "loss": 0.0439, + "epoch": 0.46, + "learning_rate": 0.00023128174677449544, + "loss": 0.0568, "step": 70980 }, { - "epoch": 0.77, - "learning_rate": 0.0001848238042702317, - "loss": 0.0406, + "epoch": 0.46, + "learning_rate": 0.00023127206542013847, + "loss": 0.0576, "step": 70990 }, { - "epoch": 0.77, - "learning_rate": 0.0001848075799857226, - "loss": 0.0534, + "epoch": 0.46, + "learning_rate": 0.00023126238406578155, + "loss": 0.0576, "step": 71000 }, { - "epoch": 0.77, - "eval_cer": 0.9212488580965154, - "eval_loss": 0.03301897272467613, - "eval_runtime": 118.9229, - "eval_samples_per_second": 16.818, - "eval_steps_per_second": 4.204, + "epoch": 0.46, + "eval_cer": 0.9200460964862728, + "eval_loss": 0.03755395486950874, + "eval_runtime": 119.9894, + "eval_samples_per_second": 16.668, + "eval_steps_per_second": 4.167, "step": 71000 }, { - "epoch": 0.77, - "learning_rate": 0.00018479135570121356, - "loss": 0.045, + "epoch": 0.46, + "learning_rate": 0.00023125270271142463, + "loss": 0.0486, "step": 71010 }, { - "epoch": 0.77, - "learning_rate": 0.0001847751314167045, - "loss": 0.0449, + "epoch": 0.46, + "learning_rate": 0.00023124302135706768, + "loss": 0.0564, "step": 71020 }, { - "epoch": 0.77, - "learning_rate": 0.00018475890713219546, - "loss": 0.044, + "epoch": 0.46, + "learning_rate": 0.00023123334000271076, + "loss": 0.0552, "step": 71030 }, { - "epoch": 0.77, - "learning_rate": 0.0001847426828476864, - "loss": 0.043, + "epoch": 0.46, + "learning_rate": 0.00023122365864835384, + "loss": 0.0558, "step": 71040 }, { - "epoch": 0.77, - "learning_rate": 0.00018472645856317736, - "loss": 0.0441, + "epoch": 0.46, + "learning_rate": 0.00023121397729399692, + "loss": 0.057, "step": 71050 }, { - "epoch": 0.77, - "learning_rate": 0.00018471023427866828, - "loss": 0.0419, + "epoch": 0.46, + "learning_rate": 0.00023120429593963994, + "loss": 0.0617, "step": 71060 }, { - "epoch": 0.77, - "learning_rate": 0.00018469400999415926, - "loss": 0.0522, + "epoch": 0.46, + "learning_rate": 0.00023119461458528302, + "loss": 0.0605, "step": 71070 }, { - "epoch": 0.77, - "learning_rate": 0.00018467778570965018, - "loss": 0.0454, + "epoch": 0.46, + "learning_rate": 0.0002311849332309261, + "loss": 0.0556, "step": 71080 }, { - "epoch": 0.77, - "learning_rate": 0.00018466156142514116, - "loss": 0.047, + "epoch": 0.46, + "learning_rate": 0.00023117525187656916, + "loss": 0.056, "step": 71090 }, { - "epoch": 0.77, - "learning_rate": 0.00018464533714063208, - "loss": 0.0443, + "epoch": 0.46, + "learning_rate": 0.00023116557052221224, + "loss": 0.0506, "step": 71100 }, { - "epoch": 0.77, - "learning_rate": 0.00018462911285612303, - "loss": 0.047, + "epoch": 0.46, + "learning_rate": 0.00023115588916785532, + "loss": 0.0555, "step": 71110 }, { - "epoch": 0.77, - "learning_rate": 0.00018461288857161398, - "loss": 0.0409, + "epoch": 0.46, + "learning_rate": 0.0002311462078134984, + "loss": 0.0535, "step": 71120 }, { - "epoch": 0.77, - "learning_rate": 0.00018459666428710493, - "loss": 0.0525, + "epoch": 0.46, + "learning_rate": 0.00023113652645914142, + "loss": 0.0532, "step": 71130 }, { - "epoch": 0.77, - "learning_rate": 0.00018458044000259585, - "loss": 0.041, + "epoch": 0.46, + "learning_rate": 0.0002311268451047845, + "loss": 0.0447, "step": 71140 }, { - "epoch": 0.77, - "learning_rate": 0.00018456421571808683, - "loss": 0.0486, + "epoch": 0.46, + "learning_rate": 0.00023111716375042758, + "loss": 0.0543, "step": 71150 }, { - "epoch": 0.77, - "learning_rate": 0.00018454799143357775, - "loss": 0.0442, + "epoch": 0.46, + "learning_rate": 0.00023110748239607063, + "loss": 0.0534, "step": 71160 }, { - "epoch": 0.77, - "learning_rate": 0.00018453176714906873, - "loss": 0.0504, + "epoch": 0.46, + "learning_rate": 0.00023109780104171371, + "loss": 0.0568, "step": 71170 }, { - "epoch": 0.77, - "learning_rate": 0.00018451554286455965, - "loss": 0.051, + "epoch": 0.46, + "learning_rate": 0.0002310881196873568, + "loss": 0.0564, "step": 71180 }, { - "epoch": 0.77, - "learning_rate": 0.0001844993185800506, - "loss": 0.0556, + "epoch": 0.46, + "learning_rate": 0.00023107843833299985, + "loss": 0.0506, "step": 71190 }, { - "epoch": 0.77, - "learning_rate": 0.00018448309429554155, - "loss": 0.0419, + "epoch": 0.46, + "learning_rate": 0.0002310687569786429, + "loss": 0.0592, "step": 71200 }, { - "epoch": 0.77, - "learning_rate": 0.0001844668700110325, - "loss": 0.0515, + "epoch": 0.46, + "learning_rate": 0.00023105907562428598, + "loss": 0.0532, "step": 71210 }, { - "epoch": 0.77, - "learning_rate": 0.00018445064572652345, - "loss": 0.0459, + "epoch": 0.46, + "learning_rate": 0.00023104939426992903, + "loss": 0.0536, "step": 71220 }, { - "epoch": 0.77, - "learning_rate": 0.0001844344214420144, - "loss": 0.0516, + "epoch": 0.46, + "learning_rate": 0.0002310397129155721, + "loss": 0.0517, "step": 71230 }, { - "epoch": 0.77, - "learning_rate": 0.00018441819715750532, - "loss": 0.0537, + "epoch": 0.46, + "learning_rate": 0.0002310300315612152, + "loss": 0.0599, "step": 71240 }, { - "epoch": 0.77, - "learning_rate": 0.0001844019728729963, - "loss": 0.0586, + "epoch": 0.46, + "learning_rate": 0.00023102035020685827, + "loss": 0.0611, "step": 71250 }, { - "epoch": 0.77, - "learning_rate": 0.00018438574858848722, - "loss": 0.0637, + "epoch": 0.46, + "learning_rate": 0.00023101066885250132, + "loss": 0.0539, "step": 71260 }, { - "epoch": 0.77, - "learning_rate": 0.0001843695243039782, - "loss": 0.0419, + "epoch": 0.46, + "learning_rate": 0.00023100098749814438, + "loss": 0.0524, "step": 71270 }, { - "epoch": 0.77, - "learning_rate": 0.00018435330001946912, - "loss": 0.0549, + "epoch": 0.46, + "learning_rate": 0.00023099130614378746, + "loss": 0.0546, "step": 71280 }, { - "epoch": 0.77, - "learning_rate": 0.00018433707573496007, - "loss": 0.0485, + "epoch": 0.46, + "learning_rate": 0.0002309816247894305, + "loss": 0.0481, "step": 71290 }, { - "epoch": 0.77, - "learning_rate": 0.00018432085145045102, - "loss": 0.0527, + "epoch": 0.46, + "learning_rate": 0.0002309719434350736, + "loss": 0.0477, "step": 71300 }, { - "epoch": 0.77, - "learning_rate": 0.00018430462716594197, - "loss": 0.0523, + "epoch": 0.46, + "learning_rate": 0.00023096226208071667, + "loss": 0.0576, "step": 71310 }, { - "epoch": 0.77, - "learning_rate": 0.0001842884028814329, - "loss": 0.0511, + "epoch": 0.46, + "learning_rate": 0.00023095258072635975, + "loss": 0.0612, "step": 71320 }, { - "epoch": 0.77, - "learning_rate": 0.00018427217859692387, - "loss": 0.0494, + "epoch": 0.46, + "learning_rate": 0.0002309428993720028, + "loss": 0.0506, "step": 71330 }, { - "epoch": 0.77, - "learning_rate": 0.0001842559543124148, - "loss": 0.0427, + "epoch": 0.46, + "learning_rate": 0.00023093321801764585, + "loss": 0.0528, "step": 71340 }, { - "epoch": 0.77, - "learning_rate": 0.00018423973002790577, - "loss": 0.0504, + "epoch": 0.46, + "learning_rate": 0.00023092353666328893, + "loss": 0.0513, "step": 71350 }, { - "epoch": 0.77, - "learning_rate": 0.0001842235057433967, - "loss": 0.043, + "epoch": 0.46, + "learning_rate": 0.00023091385530893199, + "loss": 0.0504, "step": 71360 }, { - "epoch": 0.77, - "learning_rate": 0.00018420728145888764, - "loss": 0.0487, + "epoch": 0.46, + "learning_rate": 0.00023090417395457507, + "loss": 0.0593, "step": 71370 }, { - "epoch": 0.77, - "learning_rate": 0.0001841910571743786, - "loss": 0.0552, + "epoch": 0.46, + "learning_rate": 0.00023089449260021815, + "loss": 0.058, "step": 71380 }, { - "epoch": 0.77, - "learning_rate": 0.00018417483288986954, - "loss": 0.0451, + "epoch": 0.46, + "learning_rate": 0.00023088481124586123, + "loss": 0.0527, "step": 71390 }, { - "epoch": 0.77, - "learning_rate": 0.0001841586086053605, - "loss": 0.0562, + "epoch": 0.46, + "learning_rate": 0.00023087512989150428, + "loss": 0.0545, "step": 71400 }, { - "epoch": 0.77, - "learning_rate": 0.00018414238432085144, - "loss": 0.0473, + "epoch": 0.46, + "learning_rate": 0.00023086544853714733, + "loss": 0.059, "step": 71410 }, { - "epoch": 0.77, - "learning_rate": 0.00018412616003634236, - "loss": 0.0533, + "epoch": 0.46, + "learning_rate": 0.00023085576718279038, + "loss": 0.0553, "step": 71420 }, { - "epoch": 0.77, - "learning_rate": 0.00018410993575183334, - "loss": 0.0528, + "epoch": 0.46, + "learning_rate": 0.00023084608582843346, + "loss": 0.0544, "step": 71430 }, { - "epoch": 0.77, - "learning_rate": 0.00018409371146732426, - "loss": 0.0474, + "epoch": 0.46, + "learning_rate": 0.00023083640447407654, + "loss": 0.0666, "step": 71440 }, { - "epoch": 0.77, - "learning_rate": 0.00018407748718281524, - "loss": 0.0457, + "epoch": 0.46, + "learning_rate": 0.00023082672311971962, + "loss": 0.0628, "step": 71450 }, { - "epoch": 0.77, - "learning_rate": 0.00018406126289830616, - "loss": 0.0473, + "epoch": 0.46, + "learning_rate": 0.00023081704176536268, + "loss": 0.0573, "step": 71460 }, { - "epoch": 0.77, - "learning_rate": 0.00018404503861379711, - "loss": 0.0474, + "epoch": 0.46, + "learning_rate": 0.00023080736041100576, + "loss": 0.0648, "step": 71470 }, { - "epoch": 0.77, - "learning_rate": 0.00018402881432928806, - "loss": 0.0525, + "epoch": 0.46, + "learning_rate": 0.0002307976790566488, + "loss": 0.0683, "step": 71480 }, { - "epoch": 0.77, - "learning_rate": 0.000184012590044779, - "loss": 0.0495, + "epoch": 0.46, + "learning_rate": 0.00023078799770229186, + "loss": 0.0639, "step": 71490 }, { - "epoch": 0.77, - "learning_rate": 0.00018399636576026994, - "loss": 0.049, + "epoch": 0.46, + "learning_rate": 0.00023077831634793494, + "loss": 0.0565, "step": 71500 }, { - "epoch": 0.77, - "learning_rate": 0.0001839801414757609, - "loss": 0.0427, + "epoch": 0.46, + "learning_rate": 0.00023076863499357802, + "loss": 0.0606, "step": 71510 }, { - "epoch": 0.77, - "learning_rate": 0.00018396391719125184, - "loss": 0.0417, + "epoch": 0.46, + "learning_rate": 0.0002307589536392211, + "loss": 0.0562, "step": 71520 }, { - "epoch": 0.77, - "learning_rate": 0.0001839476929067428, - "loss": 0.0465, + "epoch": 0.46, + "learning_rate": 0.00023074927228486415, + "loss": 0.0536, "step": 71530 }, { - "epoch": 0.77, - "learning_rate": 0.00018393146862223374, - "loss": 0.056, + "epoch": 0.46, + "learning_rate": 0.00023073959093050723, + "loss": 0.0545, "step": 71540 }, { - "epoch": 0.77, - "learning_rate": 0.0001839152443377247, - "loss": 0.0509, + "epoch": 0.46, + "learning_rate": 0.00023072990957615029, + "loss": 0.0641, "step": 71550 }, { - "epoch": 0.77, - "learning_rate": 0.00018389902005321563, - "loss": 0.0508, + "epoch": 0.46, + "learning_rate": 0.00023072022822179334, + "loss": 0.0574, "step": 71560 }, { - "epoch": 0.77, - "learning_rate": 0.00018388279576870658, - "loss": 0.0481, + "epoch": 0.46, + "learning_rate": 0.00023071054686743642, + "loss": 0.0583, "step": 71570 }, { - "epoch": 0.77, - "learning_rate": 0.00018386657148419753, - "loss": 0.051, + "epoch": 0.46, + "learning_rate": 0.0002307008655130795, + "loss": 0.052, "step": 71580 }, { - "epoch": 0.77, - "learning_rate": 0.00018385034719968848, - "loss": 0.0521, + "epoch": 0.46, + "learning_rate": 0.00023069118415872258, + "loss": 0.0501, "step": 71590 }, { - "epoch": 0.77, - "learning_rate": 0.0001838341229151794, - "loss": 0.0384, + "epoch": 0.46, + "learning_rate": 0.00023068150280436563, + "loss": 0.0633, "step": 71600 }, { - "epoch": 0.77, - "learning_rate": 0.00018381789863067038, - "loss": 0.0448, + "epoch": 0.46, + "learning_rate": 0.0002306718214500087, + "loss": 0.0538, "step": 71610 }, { - "epoch": 0.77, - "learning_rate": 0.0001838016743461613, - "loss": 0.0517, + "epoch": 0.46, + "learning_rate": 0.00023066214009565174, + "loss": 0.0529, "step": 71620 }, { - "epoch": 0.77, - "learning_rate": 0.00018378545006165228, - "loss": 0.0504, + "epoch": 0.46, + "learning_rate": 0.00023065245874129482, + "loss": 0.0532, "step": 71630 }, { - "epoch": 0.77, - "learning_rate": 0.0001837692257771432, - "loss": 0.0431, + "epoch": 0.46, + "learning_rate": 0.0002306427773869379, + "loss": 0.0538, "step": 71640 }, { - "epoch": 0.77, - "learning_rate": 0.00018375300149263416, - "loss": 0.0496, + "epoch": 0.46, + "learning_rate": 0.00023063309603258097, + "loss": 0.0625, "step": 71650 }, { - "epoch": 0.78, - "learning_rate": 0.0001837367772081251, - "loss": 0.0546, + "epoch": 0.46, + "learning_rate": 0.00023062341467822403, + "loss": 0.0589, "step": 71660 }, { - "epoch": 0.78, - "learning_rate": 0.00018372055292361606, - "loss": 0.0493, + "epoch": 0.46, + "learning_rate": 0.0002306137333238671, + "loss": 0.0583, "step": 71670 }, { - "epoch": 0.78, - "learning_rate": 0.00018370432863910698, - "loss": 0.0468, + "epoch": 0.46, + "learning_rate": 0.0002306040519695102, + "loss": 0.0579, "step": 71680 }, { - "epoch": 0.78, - "learning_rate": 0.00018368810435459795, - "loss": 0.063, + "epoch": 0.46, + "learning_rate": 0.0002305943706151532, + "loss": 0.0568, "step": 71690 }, { - "epoch": 0.78, - "learning_rate": 0.00018367188007008888, - "loss": 0.0416, + "epoch": 0.46, + "learning_rate": 0.0002305846892607963, + "loss": 0.0635, "step": 71700 }, { - "epoch": 0.78, - "learning_rate": 0.00018365565578557985, - "loss": 0.054, + "epoch": 0.46, + "learning_rate": 0.00023057500790643937, + "loss": 0.0594, "step": 71710 }, { - "epoch": 0.78, - "learning_rate": 0.00018363943150107078, - "loss": 0.0533, + "epoch": 0.46, + "learning_rate": 0.00023056532655208245, + "loss": 0.0556, "step": 71720 }, { - "epoch": 0.78, - "learning_rate": 0.00018362320721656175, - "loss": 0.0471, + "epoch": 0.46, + "learning_rate": 0.0002305556451977255, + "loss": 0.0531, "step": 71730 }, { - "epoch": 0.78, - "learning_rate": 0.00018360698293205268, - "loss": 0.0443, + "epoch": 0.46, + "learning_rate": 0.00023054596384336858, + "loss": 0.0506, "step": 71740 }, { - "epoch": 0.78, - "learning_rate": 0.00018359075864754363, - "loss": 0.0557, + "epoch": 0.46, + "learning_rate": 0.00023053628248901166, + "loss": 0.0668, "step": 71750 }, { - "epoch": 0.78, - "learning_rate": 0.00018357453436303458, - "loss": 0.0504, + "epoch": 0.46, + "learning_rate": 0.0002305266011346547, + "loss": 0.0539, "step": 71760 }, { - "epoch": 0.78, - "learning_rate": 0.00018355831007852553, - "loss": 0.0485, + "epoch": 0.46, + "learning_rate": 0.00023051691978029777, + "loss": 0.0624, "step": 71770 }, { - "epoch": 0.78, - "learning_rate": 0.00018354208579401645, - "loss": 0.0472, + "epoch": 0.46, + "learning_rate": 0.00023050723842594085, + "loss": 0.0541, "step": 71780 }, { - "epoch": 0.78, - "learning_rate": 0.00018352586150950743, - "loss": 0.0469, + "epoch": 0.46, + "learning_rate": 0.00023049755707158393, + "loss": 0.0552, "step": 71790 }, { - "epoch": 0.78, - "learning_rate": 0.00018350963722499835, - "loss": 0.0431, + "epoch": 0.46, + "learning_rate": 0.00023048787571722698, + "loss": 0.0531, "step": 71800 }, { - "epoch": 0.78, - "learning_rate": 0.00018349341294048932, - "loss": 0.0527, + "epoch": 0.46, + "learning_rate": 0.00023047819436287006, + "loss": 0.0567, "step": 71810 }, { - "epoch": 0.78, - "learning_rate": 0.00018347718865598025, - "loss": 0.0432, + "epoch": 0.46, + "learning_rate": 0.00023046851300851314, + "loss": 0.052, "step": 71820 }, { - "epoch": 0.78, - "learning_rate": 0.0001834609643714712, - "loss": 0.0407, + "epoch": 0.46, + "learning_rate": 0.00023045883165415617, + "loss": 0.0567, "step": 71830 }, { - "epoch": 0.78, - "learning_rate": 0.00018344474008696215, - "loss": 0.0417, + "epoch": 0.46, + "learning_rate": 0.00023044915029979925, + "loss": 0.0542, "step": 71840 }, { - "epoch": 0.78, - "learning_rate": 0.0001834285158024531, - "loss": 0.0447, + "epoch": 0.46, + "learning_rate": 0.00023043946894544233, + "loss": 0.0518, "step": 71850 }, { - "epoch": 0.78, - "learning_rate": 0.00018341229151794402, - "loss": 0.0445, + "epoch": 0.46, + "learning_rate": 0.00023042978759108538, + "loss": 0.0619, "step": 71860 }, { - "epoch": 0.78, - "learning_rate": 0.000183396067233435, - "loss": 0.0511, + "epoch": 0.46, + "learning_rate": 0.00023042010623672846, + "loss": 0.0566, "step": 71870 }, { - "epoch": 0.78, - "learning_rate": 0.00018337984294892592, - "loss": 0.0557, + "epoch": 0.46, + "learning_rate": 0.00023041042488237154, + "loss": 0.0594, "step": 71880 }, { - "epoch": 0.78, - "learning_rate": 0.0001833636186644169, - "loss": 0.0451, + "epoch": 0.46, + "learning_rate": 0.00023040074352801462, + "loss": 0.0562, "step": 71890 }, { - "epoch": 0.78, - "learning_rate": 0.00018334739437990782, - "loss": 0.0493, + "epoch": 0.46, + "learning_rate": 0.00023039106217365764, + "loss": 0.0554, "step": 71900 }, { - "epoch": 0.78, - "learning_rate": 0.0001833311700953988, - "loss": 0.0475, + "epoch": 0.46, + "learning_rate": 0.00023038138081930072, + "loss": 0.058, "step": 71910 }, { - "epoch": 0.78, - "learning_rate": 0.00018331494581088972, - "loss": 0.045, + "epoch": 0.46, + "learning_rate": 0.0002303716994649438, + "loss": 0.0522, "step": 71920 }, { - "epoch": 0.78, - "learning_rate": 0.00018329872152638067, - "loss": 0.048, + "epoch": 0.46, + "learning_rate": 0.00023036201811058686, + "loss": 0.0547, "step": 71930 }, { - "epoch": 0.78, - "learning_rate": 0.00018328249724187162, - "loss": 0.0457, + "epoch": 0.46, + "learning_rate": 0.00023035233675622994, + "loss": 0.0472, "step": 71940 }, { - "epoch": 0.78, - "learning_rate": 0.00018326627295736257, - "loss": 0.0507, + "epoch": 0.46, + "learning_rate": 0.00023034265540187302, + "loss": 0.0513, "step": 71950 }, { - "epoch": 0.78, - "learning_rate": 0.0001832500486728535, - "loss": 0.0452, + "epoch": 0.46, + "learning_rate": 0.0002303329740475161, + "loss": 0.0505, "step": 71960 }, { - "epoch": 0.78, - "learning_rate": 0.00018323382438834447, - "loss": 0.0513, + "epoch": 0.46, + "learning_rate": 0.00023032329269315912, + "loss": 0.0546, "step": 71970 }, { - "epoch": 0.78, - "learning_rate": 0.0001832176001038354, - "loss": 0.0425, + "epoch": 0.46, + "learning_rate": 0.0002303136113388022, + "loss": 0.0683, "step": 71980 }, { - "epoch": 0.78, - "learning_rate": 0.00018320137581932637, - "loss": 0.0466, + "epoch": 0.46, + "learning_rate": 0.00023030392998444528, + "loss": 0.0547, "step": 71990 }, { - "epoch": 0.78, - "learning_rate": 0.0001831851515348173, - "loss": 0.0437, + "epoch": 0.46, + "learning_rate": 0.00023029424863008833, + "loss": 0.0529, "step": 72000 }, { - "epoch": 0.78, - "eval_cer": 0.9211596261801142, - "eval_loss": 0.033371277153491974, - "eval_runtime": 118.9108, - "eval_samples_per_second": 16.819, - "eval_steps_per_second": 4.205, + "epoch": 0.46, + "eval_cer": 0.9200415772229127, + "eval_loss": 0.03651151433587074, + "eval_runtime": 120.2459, + "eval_samples_per_second": 16.633, + "eval_steps_per_second": 4.158, "step": 72000 }, { - "epoch": 0.78, - "learning_rate": 0.00018316892725030824, - "loss": 0.0473, + "epoch": 0.46, + "learning_rate": 0.00023028456727573141, + "loss": 0.056, "step": 72010 }, { - "epoch": 0.78, - "learning_rate": 0.0001831527029657992, - "loss": 0.0473, + "epoch": 0.46, + "learning_rate": 0.0002302748859213745, + "loss": 0.062, "step": 72020 }, { - "epoch": 0.78, - "learning_rate": 0.00018313647868129014, - "loss": 0.0399, + "epoch": 0.46, + "learning_rate": 0.00023026520456701755, + "loss": 0.0505, "step": 72030 }, { - "epoch": 0.78, - "learning_rate": 0.00018312025439678106, - "loss": 0.0457, + "epoch": 0.46, + "learning_rate": 0.0002302555232126606, + "loss": 0.0575, "step": 72040 }, { - "epoch": 0.78, - "learning_rate": 0.00018310403011227204, - "loss": 0.0505, + "epoch": 0.47, + "learning_rate": 0.00023024584185830368, + "loss": 0.0597, "step": 72050 }, { - "epoch": 0.78, - "learning_rate": 0.00018308780582776296, - "loss": 0.0409, + "epoch": 0.47, + "learning_rate": 0.00023023616050394673, + "loss": 0.0579, "step": 72060 }, { - "epoch": 0.78, - "learning_rate": 0.00018307158154325394, - "loss": 0.0519, + "epoch": 0.47, + "learning_rate": 0.0002302264791495898, + "loss": 0.0499, "step": 72070 }, { - "epoch": 0.78, - "learning_rate": 0.00018305535725874486, - "loss": 0.0464, + "epoch": 0.47, + "learning_rate": 0.0002302167977952329, + "loss": 0.0533, "step": 72080 }, { - "epoch": 0.78, - "learning_rate": 0.00018303913297423584, - "loss": 0.0543, + "epoch": 0.47, + "learning_rate": 0.00023020711644087597, + "loss": 0.0536, "step": 72090 }, { - "epoch": 0.78, - "learning_rate": 0.00018302290868972676, - "loss": 0.0484, + "epoch": 0.47, + "learning_rate": 0.00023019743508651902, + "loss": 0.0576, "step": 72100 }, { - "epoch": 0.78, - "learning_rate": 0.0001830066844052177, - "loss": 0.0464, + "epoch": 0.47, + "learning_rate": 0.00023018775373216208, + "loss": 0.0574, "step": 72110 }, { - "epoch": 0.78, - "learning_rate": 0.00018299046012070866, - "loss": 0.0507, + "epoch": 0.47, + "learning_rate": 0.00023017807237780516, + "loss": 0.0566, "step": 72120 }, { - "epoch": 0.78, - "learning_rate": 0.0001829742358361996, - "loss": 0.0773, + "epoch": 0.47, + "learning_rate": 0.0002301683910234482, + "loss": 0.0541, "step": 72130 }, { - "epoch": 0.78, - "learning_rate": 0.00018295801155169053, - "loss": 0.0538, + "epoch": 0.47, + "learning_rate": 0.0002301587096690913, + "loss": 0.0581, "step": 72140 }, { - "epoch": 0.78, - "learning_rate": 0.0001829417872671815, - "loss": 0.0551, + "epoch": 0.47, + "learning_rate": 0.00023014902831473437, + "loss": 0.0504, "step": 72150 }, { - "epoch": 0.78, - "learning_rate": 0.00018292556298267243, - "loss": 0.0463, + "epoch": 0.47, + "learning_rate": 0.00023013934696037745, + "loss": 0.0574, "step": 72160 }, { - "epoch": 0.78, - "learning_rate": 0.0001829093386981634, - "loss": 0.0505, + "epoch": 0.47, + "learning_rate": 0.0002301296656060205, + "loss": 0.0599, "step": 72170 }, { - "epoch": 0.78, - "learning_rate": 0.00018289311441365433, - "loss": 0.055, + "epoch": 0.47, + "learning_rate": 0.00023011998425166355, + "loss": 0.0518, "step": 72180 }, { - "epoch": 0.78, - "learning_rate": 0.00018287689012914528, - "loss": 0.0525, + "epoch": 0.47, + "learning_rate": 0.00023011030289730663, + "loss": 0.0582, "step": 72190 }, { - "epoch": 0.78, - "learning_rate": 0.00018286066584463623, - "loss": 0.0481, + "epoch": 0.47, + "learning_rate": 0.00023010062154294969, + "loss": 0.0464, "step": 72200 }, { - "epoch": 0.78, - "learning_rate": 0.00018284444156012718, - "loss": 0.0452, + "epoch": 0.47, + "learning_rate": 0.00023009094018859277, + "loss": 0.0564, "step": 72210 }, { - "epoch": 0.78, - "learning_rate": 0.00018282821727561813, - "loss": 0.0459, + "epoch": 0.47, + "learning_rate": 0.00023008125883423585, + "loss": 0.0642, "step": 72220 }, { - "epoch": 0.78, - "learning_rate": 0.00018281199299110908, - "loss": 0.0412, + "epoch": 0.47, + "learning_rate": 0.0002300715774798789, + "loss": 0.0532, "step": 72230 }, { - "epoch": 0.78, - "learning_rate": 0.0001827957687066, - "loss": 0.0483, + "epoch": 0.47, + "learning_rate": 0.00023006189612552198, + "loss": 0.0499, "step": 72240 }, { - "epoch": 0.78, - "learning_rate": 0.00018277954442209098, - "loss": 0.0436, + "epoch": 0.47, + "learning_rate": 0.00023005221477116503, + "loss": 0.0542, "step": 72250 }, { - "epoch": 0.78, - "learning_rate": 0.0001827633201375819, - "loss": 0.0487, + "epoch": 0.47, + "learning_rate": 0.00023004253341680808, + "loss": 0.0539, "step": 72260 }, { - "epoch": 0.78, - "learning_rate": 0.00018274709585307288, - "loss": 0.0426, + "epoch": 0.47, + "learning_rate": 0.00023003285206245116, + "loss": 0.0526, "step": 72270 }, { - "epoch": 0.78, - "learning_rate": 0.0001827308715685638, - "loss": 0.046, + "epoch": 0.47, + "learning_rate": 0.00023002317070809424, + "loss": 0.0582, "step": 72280 }, { - "epoch": 0.78, - "learning_rate": 0.00018271464728405475, - "loss": 0.0479, + "epoch": 0.47, + "learning_rate": 0.00023001348935373732, + "loss": 0.0513, "step": 72290 }, { - "epoch": 0.78, - "learning_rate": 0.0001826984229995457, - "loss": 0.0441, + "epoch": 0.47, + "learning_rate": 0.00023000380799938038, + "loss": 0.0534, "step": 72300 }, { - "epoch": 0.78, - "learning_rate": 0.00018268219871503665, - "loss": 0.0489, + "epoch": 0.47, + "learning_rate": 0.00022999412664502343, + "loss": 0.0594, "step": 72310 }, { - "epoch": 0.78, - "learning_rate": 0.00018266597443052757, - "loss": 0.0491, + "epoch": 0.47, + "learning_rate": 0.0002299844452906665, + "loss": 0.0601, "step": 72320 }, { - "epoch": 0.78, - "learning_rate": 0.00018264975014601855, - "loss": 0.0512, + "epoch": 0.47, + "learning_rate": 0.00022997476393630956, + "loss": 0.0608, "step": 72330 }, { - "epoch": 0.78, - "learning_rate": 0.00018263352586150947, - "loss": 0.0517, + "epoch": 0.47, + "learning_rate": 0.00022996508258195264, + "loss": 0.0512, "step": 72340 }, { - "epoch": 0.78, - "learning_rate": 0.00018261730157700045, - "loss": 0.053, + "epoch": 0.47, + "learning_rate": 0.00022995540122759572, + "loss": 0.0533, "step": 72350 }, { - "epoch": 0.78, - "learning_rate": 0.00018260107729249137, - "loss": 0.0522, + "epoch": 0.47, + "learning_rate": 0.0002299457198732388, + "loss": 0.0526, "step": 72360 }, { - "epoch": 0.78, - "learning_rate": 0.00018258485300798232, - "loss": 0.043, + "epoch": 0.47, + "learning_rate": 0.00022993603851888185, + "loss": 0.0543, "step": 72370 }, { - "epoch": 0.78, - "learning_rate": 0.00018256862872347327, - "loss": 0.0459, + "epoch": 0.47, + "learning_rate": 0.0002299263571645249, + "loss": 0.0566, "step": 72380 }, { - "epoch": 0.78, - "learning_rate": 0.00018255240443896422, - "loss": 0.0474, + "epoch": 0.47, + "learning_rate": 0.00022991667581016799, + "loss": 0.057, "step": 72390 }, { - "epoch": 0.78, - "learning_rate": 0.00018253618015445517, - "loss": 0.0467, + "epoch": 0.47, + "learning_rate": 0.00022990699445581104, + "loss": 0.0539, "step": 72400 }, { - "epoch": 0.78, - "learning_rate": 0.00018251995586994612, - "loss": 0.0486, + "epoch": 0.47, + "learning_rate": 0.00022989731310145412, + "loss": 0.0599, "step": 72410 }, { - "epoch": 0.78, - "learning_rate": 0.00018250373158543704, - "loss": 0.0479, + "epoch": 0.47, + "learning_rate": 0.0002298876317470972, + "loss": 0.0522, "step": 72420 }, { - "epoch": 0.78, - "learning_rate": 0.00018248750730092802, - "loss": 0.0434, + "epoch": 0.47, + "learning_rate": 0.00022987795039274025, + "loss": 0.0536, "step": 72430 }, { - "epoch": 0.78, - "learning_rate": 0.00018247128301641894, - "loss": 0.0422, + "epoch": 0.47, + "learning_rate": 0.00022986826903838333, + "loss": 0.0568, "step": 72440 }, { - "epoch": 0.78, - "learning_rate": 0.00018245505873190992, - "loss": 0.049, + "epoch": 0.47, + "learning_rate": 0.00022985858768402638, + "loss": 0.0569, "step": 72450 }, { - "epoch": 0.78, - "learning_rate": 0.00018243883444740084, - "loss": 0.0414, + "epoch": 0.47, + "learning_rate": 0.00022984890632966944, + "loss": 0.0658, "step": 72460 }, { - "epoch": 0.78, - "learning_rate": 0.0001824226101628918, - "loss": 0.049, + "epoch": 0.47, + "learning_rate": 0.00022983922497531251, + "loss": 0.0612, "step": 72470 }, { - "epoch": 0.78, - "learning_rate": 0.00018240638587838274, - "loss": 0.0527, + "epoch": 0.47, + "learning_rate": 0.0002298295436209556, + "loss": 0.0571, "step": 72480 }, { - "epoch": 0.78, - "learning_rate": 0.0001823901615938737, - "loss": 0.0459, + "epoch": 0.47, + "learning_rate": 0.00022981986226659867, + "loss": 0.0618, "step": 72490 }, { - "epoch": 0.78, - "learning_rate": 0.00018237393730936461, - "loss": 0.0552, + "epoch": 0.47, + "learning_rate": 0.00022981018091224173, + "loss": 0.06, "step": 72500 }, { - "epoch": 0.78, - "learning_rate": 0.0001823577130248556, - "loss": 0.0513, + "epoch": 0.47, + "learning_rate": 0.0002298004995578848, + "loss": 0.0605, "step": 72510 }, { - "epoch": 0.78, - "learning_rate": 0.00018234148874034651, - "loss": 0.0454, + "epoch": 0.47, + "learning_rate": 0.00022979081820352786, + "loss": 0.065, "step": 72520 }, { - "epoch": 0.78, - "learning_rate": 0.0001823252644558375, - "loss": 0.0477, + "epoch": 0.47, + "learning_rate": 0.0002297811368491709, + "loss": 0.0487, "step": 72530 }, { - "epoch": 0.78, - "learning_rate": 0.00018230904017132841, - "loss": 0.0509, + "epoch": 0.47, + "learning_rate": 0.000229771455494814, + "loss": 0.0484, "step": 72540 }, { - "epoch": 0.78, - "learning_rate": 0.00018229281588681936, - "loss": 0.0521, + "epoch": 0.47, + "learning_rate": 0.00022976177414045707, + "loss": 0.0555, "step": 72550 }, { - "epoch": 0.78, - "learning_rate": 0.00018227659160231031, - "loss": 0.0415, + "epoch": 0.47, + "learning_rate": 0.00022975209278610015, + "loss": 0.0566, "step": 72560 }, { - "epoch": 0.78, - "learning_rate": 0.00018226036731780126, - "loss": 0.0494, + "epoch": 0.47, + "learning_rate": 0.0002297424114317432, + "loss": 0.0582, "step": 72570 }, { - "epoch": 0.79, - "learning_rate": 0.0001822441430332922, - "loss": 0.049, + "epoch": 0.47, + "learning_rate": 0.00022973273007738628, + "loss": 0.0624, "step": 72580 }, { - "epoch": 0.79, - "learning_rate": 0.00018222791874878316, - "loss": 0.0453, + "epoch": 0.47, + "learning_rate": 0.00022972304872302934, + "loss": 0.0596, "step": 72590 }, { - "epoch": 0.79, - "learning_rate": 0.00018221169446427409, - "loss": 0.0449, + "epoch": 0.47, + "learning_rate": 0.0002297133673686724, + "loss": 0.0572, "step": 72600 }, { - "epoch": 0.79, - "learning_rate": 0.00018219547017976506, - "loss": 0.0414, + "epoch": 0.47, + "learning_rate": 0.00022970368601431547, + "loss": 0.0622, "step": 72610 }, { - "epoch": 0.79, - "learning_rate": 0.00018217924589525599, - "loss": 0.05, + "epoch": 0.47, + "learning_rate": 0.00022969400465995855, + "loss": 0.0559, "step": 72620 }, { - "epoch": 0.79, - "learning_rate": 0.00018216302161074696, - "loss": 0.0483, + "epoch": 0.47, + "learning_rate": 0.0002296843233056016, + "loss": 0.0525, "step": 72630 }, { - "epoch": 0.79, - "learning_rate": 0.00018214679732623788, - "loss": 0.0444, + "epoch": 0.47, + "learning_rate": 0.00022967464195124468, + "loss": 0.0496, "step": 72640 }, { - "epoch": 0.79, - "learning_rate": 0.00018213057304172883, - "loss": 0.0506, + "epoch": 0.47, + "learning_rate": 0.00022966496059688776, + "loss": 0.0578, "step": 72650 }, { - "epoch": 0.79, - "learning_rate": 0.00018211434875721978, - "loss": 0.0485, + "epoch": 0.47, + "learning_rate": 0.0002296552792425308, + "loss": 0.0526, "step": 72660 }, { - "epoch": 0.79, - "learning_rate": 0.00018209812447271073, - "loss": 0.0461, + "epoch": 0.47, + "learning_rate": 0.00022964559788817387, + "loss": 0.0591, "step": 72670 }, { - "epoch": 0.79, - "learning_rate": 0.00018208190018820166, - "loss": 0.0492, + "epoch": 0.47, + "learning_rate": 0.00022963591653381695, + "loss": 0.0564, "step": 72680 }, { - "epoch": 0.79, - "learning_rate": 0.00018206567590369263, - "loss": 0.0425, + "epoch": 0.47, + "learning_rate": 0.00022962623517946003, + "loss": 0.0615, "step": 72690 }, { - "epoch": 0.79, - "learning_rate": 0.00018204945161918356, - "loss": 0.0523, + "epoch": 0.47, + "learning_rate": 0.00022961655382510308, + "loss": 0.0569, "step": 72700 }, { - "epoch": 0.79, - "learning_rate": 0.00018203322733467453, - "loss": 0.0484, + "epoch": 0.47, + "learning_rate": 0.00022960687247074616, + "loss": 0.0525, "step": 72710 }, { - "epoch": 0.79, - "learning_rate": 0.00018201700305016546, - "loss": 0.0455, + "epoch": 0.47, + "learning_rate": 0.00022959719111638924, + "loss": 0.0549, "step": 72720 }, { - "epoch": 0.79, - "learning_rate": 0.0001820007787656564, - "loss": 0.0441, + "epoch": 0.47, + "learning_rate": 0.00022958750976203226, + "loss": 0.0541, "step": 72730 }, { - "epoch": 0.79, - "learning_rate": 0.00018198455448114736, - "loss": 0.0478, + "epoch": 0.47, + "learning_rate": 0.00022957782840767534, + "loss": 0.0602, "step": 72740 }, { - "epoch": 0.79, - "learning_rate": 0.0001819683301966383, - "loss": 0.0507, + "epoch": 0.47, + "learning_rate": 0.00022956814705331842, + "loss": 0.0546, "step": 72750 }, { - "epoch": 0.79, - "learning_rate": 0.00018195210591212928, - "loss": 0.0443, + "epoch": 0.47, + "learning_rate": 0.0002295584656989615, + "loss": 0.0625, "step": 72760 }, { - "epoch": 0.79, - "learning_rate": 0.0001819358816276202, - "loss": 0.0519, + "epoch": 0.47, + "learning_rate": 0.00022954878434460456, + "loss": 0.0555, "step": 72770 }, { - "epoch": 0.79, - "learning_rate": 0.00018191965734311118, - "loss": 0.0436, + "epoch": 0.47, + "learning_rate": 0.00022953910299024764, + "loss": 0.0528, "step": 72780 }, { - "epoch": 0.79, - "learning_rate": 0.0001819034330586021, - "loss": 0.0528, + "epoch": 0.47, + "learning_rate": 0.00022952942163589072, + "loss": 0.0603, "step": 72790 }, { - "epoch": 0.79, - "learning_rate": 0.00018188720877409305, - "loss": 0.0449, + "epoch": 0.47, + "learning_rate": 0.00022951974028153374, + "loss": 0.0531, "step": 72800 }, { - "epoch": 0.79, - "learning_rate": 0.000181870984489584, - "loss": 0.0489, + "epoch": 0.47, + "learning_rate": 0.00022951005892717682, + "loss": 0.0485, "step": 72810 }, { - "epoch": 0.79, - "learning_rate": 0.00018185476020507495, - "loss": 0.0527, + "epoch": 0.47, + "learning_rate": 0.0002295003775728199, + "loss": 0.0647, "step": 72820 }, { - "epoch": 0.79, - "learning_rate": 0.00018183853592056588, - "loss": 0.0443, + "epoch": 0.47, + "learning_rate": 0.00022949069621846295, + "loss": 0.0544, "step": 72830 }, { - "epoch": 0.79, - "learning_rate": 0.00018182231163605685, - "loss": 0.0448, + "epoch": 0.47, + "learning_rate": 0.00022948101486410603, + "loss": 0.0639, "step": 72840 }, { - "epoch": 0.79, - "learning_rate": 0.00018180608735154778, - "loss": 0.0484, + "epoch": 0.47, + "learning_rate": 0.0002294713335097491, + "loss": 0.0526, "step": 72850 }, { - "epoch": 0.79, - "learning_rate": 0.00018178986306703875, - "loss": 0.0531, + "epoch": 0.47, + "learning_rate": 0.0002294616521553922, + "loss": 0.0506, "step": 72860 }, { - "epoch": 0.79, - "learning_rate": 0.00018177363878252968, - "loss": 0.0432, + "epoch": 0.47, + "learning_rate": 0.00022945197080103522, + "loss": 0.0544, "step": 72870 }, { - "epoch": 0.79, - "learning_rate": 0.00018175741449802062, - "loss": 0.0512, + "epoch": 0.47, + "learning_rate": 0.0002294422894466783, + "loss": 0.0527, "step": 72880 }, { - "epoch": 0.79, - "learning_rate": 0.00018174119021351157, - "loss": 0.0463, + "epoch": 0.47, + "learning_rate": 0.00022943260809232138, + "loss": 0.0586, "step": 72890 }, { - "epoch": 0.79, - "learning_rate": 0.00018172496592900252, - "loss": 0.0415, + "epoch": 0.47, + "learning_rate": 0.00022942292673796443, + "loss": 0.0535, "step": 72900 }, { - "epoch": 0.79, - "learning_rate": 0.00018170874164449347, - "loss": 0.0468, + "epoch": 0.47, + "learning_rate": 0.0002294132453836075, + "loss": 0.0593, "step": 72910 }, { - "epoch": 0.79, - "learning_rate": 0.00018169251735998442, - "loss": 0.0432, + "epoch": 0.47, + "learning_rate": 0.0002294035640292506, + "loss": 0.0504, "step": 72920 }, { - "epoch": 0.79, - "learning_rate": 0.00018167629307547535, - "loss": 0.0455, + "epoch": 0.47, + "learning_rate": 0.00022939388267489367, + "loss": 0.0581, "step": 72930 }, { - "epoch": 0.79, - "learning_rate": 0.00018166006879096632, - "loss": 0.049, + "epoch": 0.47, + "learning_rate": 0.0002293842013205367, + "loss": 0.0551, "step": 72940 }, { - "epoch": 0.79, - "learning_rate": 0.00018164384450645725, - "loss": 0.0488, + "epoch": 0.47, + "learning_rate": 0.00022937451996617978, + "loss": 0.0517, "step": 72950 }, { - "epoch": 0.79, - "learning_rate": 0.00018162762022194822, - "loss": 0.0479, + "epoch": 0.47, + "learning_rate": 0.00022936483861182286, + "loss": 0.0536, "step": 72960 }, { - "epoch": 0.79, - "learning_rate": 0.00018161139593743915, - "loss": 0.0467, + "epoch": 0.47, + "learning_rate": 0.0002293551572574659, + "loss": 0.0549, "step": 72970 }, { - "epoch": 0.79, - "learning_rate": 0.0001815951716529301, - "loss": 0.0489, + "epoch": 0.47, + "learning_rate": 0.000229345475903109, + "loss": 0.0565, "step": 72980 }, { - "epoch": 0.79, - "learning_rate": 0.00018157894736842105, - "loss": 0.0499, + "epoch": 0.47, + "learning_rate": 0.00022933579454875207, + "loss": 0.0582, "step": 72990 }, { - "epoch": 0.79, - "learning_rate": 0.000181562723083912, - "loss": 0.05, + "epoch": 0.47, + "learning_rate": 0.00022932611319439512, + "loss": 0.0504, "step": 73000 }, { - "epoch": 0.79, - "eval_cer": 0.9212656442986107, - "eval_loss": 0.033203139901161194, - "eval_runtime": 119.0919, - "eval_samples_per_second": 16.794, - "eval_steps_per_second": 4.198, + "epoch": 0.47, + "eval_cer": 0.9200831544458253, + "eval_loss": 0.03714871034026146, + "eval_runtime": 120.0036, + "eval_samples_per_second": 16.666, + "eval_steps_per_second": 4.167, "step": 73000 }, { - "epoch": 0.79, - "learning_rate": 0.00018154649879940292, - "loss": 0.0472, + "epoch": 0.47, + "learning_rate": 0.00022931643184003817, + "loss": 0.0522, "step": 73010 }, { - "epoch": 0.79, - "learning_rate": 0.0001815302745148939, - "loss": 0.051, + "epoch": 0.47, + "learning_rate": 0.00022930675048568125, + "loss": 0.047, "step": 73020 }, { - "epoch": 0.79, - "learning_rate": 0.00018151405023038482, - "loss": 0.0522, + "epoch": 0.47, + "learning_rate": 0.0002292970691313243, + "loss": 0.069, "step": 73030 }, { - "epoch": 0.79, - "learning_rate": 0.0001814978259458758, - "loss": 0.0507, + "epoch": 0.47, + "learning_rate": 0.00022928738777696739, + "loss": 0.0583, "step": 73040 }, { - "epoch": 0.79, - "learning_rate": 0.00018148160166136672, - "loss": 0.0524, + "epoch": 0.47, + "learning_rate": 0.00022927770642261047, + "loss": 0.0568, "step": 73050 }, { - "epoch": 0.79, - "learning_rate": 0.00018146537737685767, - "loss": 0.0505, + "epoch": 0.47, + "learning_rate": 0.00022926802506825355, + "loss": 0.0563, "step": 73060 }, { - "epoch": 0.79, - "learning_rate": 0.00018144915309234862, - "loss": 0.0495, + "epoch": 0.47, + "learning_rate": 0.0002292583437138966, + "loss": 0.051, "step": 73070 }, { - "epoch": 0.79, - "learning_rate": 0.00018143292880783957, - "loss": 0.0435, + "epoch": 0.47, + "learning_rate": 0.00022924866235953965, + "loss": 0.057, "step": 73080 }, { - "epoch": 0.79, - "learning_rate": 0.00018141670452333052, - "loss": 0.0529, + "epoch": 0.47, + "learning_rate": 0.00022923898100518273, + "loss": 0.0505, "step": 73090 }, { - "epoch": 0.79, - "learning_rate": 0.00018140048023882147, - "loss": 0.0508, + "epoch": 0.47, + "learning_rate": 0.00022922929965082578, + "loss": 0.0515, "step": 73100 }, { - "epoch": 0.79, - "learning_rate": 0.0001813842559543124, - "loss": 0.0524, + "epoch": 0.47, + "learning_rate": 0.00022921961829646886, + "loss": 0.0597, "step": 73110 }, { - "epoch": 0.79, - "learning_rate": 0.00018136803166980337, - "loss": 0.0437, + "epoch": 0.47, + "learning_rate": 0.00022920993694211194, + "loss": 0.0588, "step": 73120 }, { - "epoch": 0.79, - "learning_rate": 0.0001813518073852943, - "loss": 0.0445, + "epoch": 0.47, + "learning_rate": 0.00022920025558775502, + "loss": 0.0573, "step": 73130 }, { - "epoch": 0.79, - "learning_rate": 0.00018133558310078526, - "loss": 0.047, + "epoch": 0.47, + "learning_rate": 0.00022919057423339807, + "loss": 0.0538, "step": 73140 }, { - "epoch": 0.79, - "learning_rate": 0.0001813193588162762, - "loss": 0.048, + "epoch": 0.47, + "learning_rate": 0.00022918089287904113, + "loss": 0.0539, "step": 73150 }, { - "epoch": 0.79, - "learning_rate": 0.00018130313453176714, - "loss": 0.0503, + "epoch": 0.47, + "learning_rate": 0.0002291712115246842, + "loss": 0.0555, "step": 73160 }, { - "epoch": 0.79, - "learning_rate": 0.0001812869102472581, - "loss": 0.0477, + "epoch": 0.47, + "learning_rate": 0.00022916153017032726, + "loss": 0.0577, "step": 73170 }, { - "epoch": 0.79, - "learning_rate": 0.00018127068596274904, - "loss": 0.049, + "epoch": 0.47, + "learning_rate": 0.00022915184881597034, + "loss": 0.0501, "step": 73180 }, { - "epoch": 0.79, - "learning_rate": 0.00018125446167823996, - "loss": 0.0432, + "epoch": 0.47, + "learning_rate": 0.00022914216746161342, + "loss": 0.057, "step": 73190 }, { - "epoch": 0.79, - "learning_rate": 0.00018123823739373094, - "loss": 0.0463, + "epoch": 0.47, + "learning_rate": 0.00022913248610725647, + "loss": 0.0595, "step": 73200 }, { - "epoch": 0.79, - "learning_rate": 0.00018122201310922186, - "loss": 0.0496, + "epoch": 0.47, + "learning_rate": 0.00022912280475289955, + "loss": 0.0502, "step": 73210 }, { - "epoch": 0.79, - "learning_rate": 0.00018120578882471284, - "loss": 0.0487, + "epoch": 0.47, + "learning_rate": 0.0002291131233985426, + "loss": 0.0549, "step": 73220 }, { - "epoch": 0.79, - "learning_rate": 0.00018118956454020376, - "loss": 0.0457, + "epoch": 0.47, + "learning_rate": 0.00022910344204418566, + "loss": 0.0526, "step": 73230 }, { - "epoch": 0.79, - "learning_rate": 0.0001811733402556947, - "loss": 0.0445, + "epoch": 0.47, + "learning_rate": 0.00022909376068982874, + "loss": 0.0544, "step": 73240 }, { - "epoch": 0.79, - "learning_rate": 0.00018115711597118566, - "loss": 0.0557, + "epoch": 0.47, + "learning_rate": 0.00022908407933547182, + "loss": 0.0554, "step": 73250 }, { - "epoch": 0.79, - "learning_rate": 0.0001811408916866766, - "loss": 0.0456, + "epoch": 0.47, + "learning_rate": 0.0002290743979811149, + "loss": 0.061, "step": 73260 }, { - "epoch": 0.79, - "learning_rate": 0.00018112466740216756, - "loss": 0.0489, + "epoch": 0.47, + "learning_rate": 0.00022906471662675795, + "loss": 0.0521, "step": 73270 }, { - "epoch": 0.79, - "learning_rate": 0.0001811084431176585, - "loss": 0.0462, + "epoch": 0.47, + "learning_rate": 0.00022905503527240103, + "loss": 0.0577, "step": 73280 }, { - "epoch": 0.79, - "learning_rate": 0.00018109221883314943, - "loss": 0.0438, + "epoch": 0.47, + "learning_rate": 0.00022904535391804408, + "loss": 0.0544, "step": 73290 }, { - "epoch": 0.79, - "learning_rate": 0.0001810759945486404, - "loss": 0.042, + "epoch": 0.47, + "learning_rate": 0.00022903567256368713, + "loss": 0.0482, "step": 73300 }, { - "epoch": 0.79, - "learning_rate": 0.00018105977026413133, - "loss": 0.047, + "epoch": 0.47, + "learning_rate": 0.00022902599120933021, + "loss": 0.0535, "step": 73310 }, { - "epoch": 0.79, - "learning_rate": 0.0001810435459796223, - "loss": 0.0434, + "epoch": 0.47, + "learning_rate": 0.0002290163098549733, + "loss": 0.0539, "step": 73320 }, { - "epoch": 0.79, - "learning_rate": 0.00018102732169511323, - "loss": 0.0453, + "epoch": 0.47, + "learning_rate": 0.00022900662850061637, + "loss": 0.0538, "step": 73330 }, { - "epoch": 0.79, - "learning_rate": 0.00018101109741060418, - "loss": 0.0386, + "epoch": 0.47, + "learning_rate": 0.00022899694714625943, + "loss": 0.0542, "step": 73340 }, { - "epoch": 0.79, - "learning_rate": 0.00018099487312609513, - "loss": 0.0439, + "epoch": 0.47, + "learning_rate": 0.0002289872657919025, + "loss": 0.0544, "step": 73350 }, { - "epoch": 0.79, - "learning_rate": 0.00018097864884158608, - "loss": 0.0488, + "epoch": 0.47, + "learning_rate": 0.00022897758443754556, + "loss": 0.0509, "step": 73360 }, { - "epoch": 0.79, - "learning_rate": 0.000180962424557077, - "loss": 0.0485, + "epoch": 0.47, + "learning_rate": 0.0002289679030831886, + "loss": 0.0563, "step": 73370 }, { - "epoch": 0.79, - "learning_rate": 0.00018094620027256798, - "loss": 0.0497, + "epoch": 0.47, + "learning_rate": 0.0002289582217288317, + "loss": 0.0514, "step": 73380 }, { - "epoch": 0.79, - "learning_rate": 0.0001809299759880589, - "loss": 0.0521, + "epoch": 0.47, + "learning_rate": 0.00022894854037447477, + "loss": 0.058, "step": 73390 }, { - "epoch": 0.79, - "learning_rate": 0.00018091375170354988, - "loss": 0.0483, + "epoch": 0.47, + "learning_rate": 0.00022893885902011782, + "loss": 0.0521, "step": 73400 }, { - "epoch": 0.79, - "learning_rate": 0.0001808975274190408, - "loss": 0.0479, + "epoch": 0.47, + "learning_rate": 0.0002289291776657609, + "loss": 0.0498, "step": 73410 }, { - "epoch": 0.79, - "learning_rate": 0.00018088130313453175, - "loss": 0.049, + "epoch": 0.47, + "learning_rate": 0.00022891949631140398, + "loss": 0.0536, "step": 73420 }, { - "epoch": 0.79, - "learning_rate": 0.0001808650788500227, - "loss": 0.0469, + "epoch": 0.47, + "learning_rate": 0.000228909814957047, + "loss": 0.0515, "step": 73430 }, { - "epoch": 0.79, - "learning_rate": 0.00018084885456551365, - "loss": 0.0484, + "epoch": 0.47, + "learning_rate": 0.0002289001336026901, + "loss": 0.0557, "step": 73440 }, { - "epoch": 0.79, - "learning_rate": 0.0001808326302810046, - "loss": 0.0457, + "epoch": 0.47, + "learning_rate": 0.00022889045224833317, + "loss": 0.0576, "step": 73450 }, { - "epoch": 0.79, - "learning_rate": 0.00018081640599649555, - "loss": 0.0475, + "epoch": 0.47, + "learning_rate": 0.00022888077089397625, + "loss": 0.0558, "step": 73460 }, { - "epoch": 0.79, - "learning_rate": 0.00018080018171198647, - "loss": 0.0436, + "epoch": 0.47, + "learning_rate": 0.0002288710895396193, + "loss": 0.058, "step": 73470 }, { - "epoch": 0.79, - "learning_rate": 0.00018078395742747745, - "loss": 0.0461, + "epoch": 0.47, + "learning_rate": 0.00022886140818526238, + "loss": 0.0501, "step": 73480 }, { - "epoch": 0.79, - "learning_rate": 0.00018076773314296837, - "loss": 0.0463, + "epoch": 0.47, + "learning_rate": 0.00022885172683090546, + "loss": 0.0569, "step": 73490 }, { - "epoch": 0.79, - "learning_rate": 0.00018075150885845935, - "loss": 0.0496, + "epoch": 0.47, + "learning_rate": 0.0002288420454765485, + "loss": 0.0584, "step": 73500 }, { - "epoch": 0.8, - "learning_rate": 0.00018073528457395027, - "loss": 0.045, + "epoch": 0.47, + "learning_rate": 0.00022883236412219157, + "loss": 0.0484, "step": 73510 }, { - "epoch": 0.8, - "learning_rate": 0.00018071906028944122, - "loss": 0.043, + "epoch": 0.47, + "learning_rate": 0.00022882268276783465, + "loss": 0.0548, "step": 73520 }, { - "epoch": 0.8, - "learning_rate": 0.00018070283600493217, - "loss": 0.046, + "epoch": 0.47, + "learning_rate": 0.00022881300141347773, + "loss": 0.0526, "step": 73530 }, { - "epoch": 0.8, - "learning_rate": 0.00018068661172042312, - "loss": 0.0418, + "epoch": 0.47, + "learning_rate": 0.00022880332005912078, + "loss": 0.0553, "step": 73540 }, { - "epoch": 0.8, - "learning_rate": 0.00018067038743591404, - "loss": 0.0545, + "epoch": 0.47, + "learning_rate": 0.00022879363870476386, + "loss": 0.0583, "step": 73550 }, { - "epoch": 0.8, - "learning_rate": 0.00018065416315140502, - "loss": 0.0499, + "epoch": 0.47, + "learning_rate": 0.00022878395735040694, + "loss": 0.0491, "step": 73560 }, { - "epoch": 0.8, - "learning_rate": 0.00018063793886689594, - "loss": 0.0486, + "epoch": 0.47, + "learning_rate": 0.00022877427599604996, + "loss": 0.0562, "step": 73570 }, { - "epoch": 0.8, - "learning_rate": 0.00018062171458238692, - "loss": 0.0462, + "epoch": 0.47, + "learning_rate": 0.00022876459464169304, + "loss": 0.0551, "step": 73580 }, { - "epoch": 0.8, - "learning_rate": 0.00018060549029787784, - "loss": 0.048, + "epoch": 0.47, + "learning_rate": 0.00022875491328733612, + "loss": 0.0545, "step": 73590 }, { - "epoch": 0.8, - "learning_rate": 0.00018058926601336882, - "loss": 0.0504, + "epoch": 0.48, + "learning_rate": 0.00022874523193297918, + "loss": 0.048, "step": 73600 }, { - "epoch": 0.8, - "learning_rate": 0.00018057304172885974, - "loss": 0.0512, + "epoch": 0.48, + "learning_rate": 0.00022873555057862226, + "loss": 0.057, "step": 73610 }, { - "epoch": 0.8, - "learning_rate": 0.0001805568174443507, - "loss": 0.0494, + "epoch": 0.48, + "learning_rate": 0.00022872586922426534, + "loss": 0.0571, "step": 73620 }, { - "epoch": 0.8, - "learning_rate": 0.00018054059315984164, - "loss": 0.0563, + "epoch": 0.48, + "learning_rate": 0.00022871618786990842, + "loss": 0.0631, "step": 73630 }, { - "epoch": 0.8, - "learning_rate": 0.0001805243688753326, - "loss": 0.0525, + "epoch": 0.48, + "learning_rate": 0.00022870650651555144, + "loss": 0.0541, "step": 73640 }, { - "epoch": 0.8, - "learning_rate": 0.0001805081445908235, - "loss": 0.0496, + "epoch": 0.48, + "learning_rate": 0.00022869682516119452, + "loss": 0.0573, "step": 73650 }, { - "epoch": 0.8, - "learning_rate": 0.0001804919203063145, - "loss": 0.0484, + "epoch": 0.48, + "learning_rate": 0.0002286871438068376, + "loss": 0.0491, "step": 73660 }, { - "epoch": 0.8, - "learning_rate": 0.0001804756960218054, - "loss": 0.0381, + "epoch": 0.48, + "learning_rate": 0.00022867746245248065, + "loss": 0.0582, "step": 73670 }, { - "epoch": 0.8, - "learning_rate": 0.0001804594717372964, - "loss": 0.0569, + "epoch": 0.48, + "learning_rate": 0.00022866778109812373, + "loss": 0.063, "step": 73680 }, { - "epoch": 0.8, - "learning_rate": 0.0001804432474527873, - "loss": 0.0448, + "epoch": 0.48, + "learning_rate": 0.0002286580997437668, + "loss": 0.0554, "step": 73690 }, { - "epoch": 0.8, - "learning_rate": 0.00018042702316827826, - "loss": 0.0394, + "epoch": 0.48, + "learning_rate": 0.0002286484183894099, + "loss": 0.0561, "step": 73700 }, { - "epoch": 0.8, - "learning_rate": 0.0001804107988837692, - "loss": 0.0441, + "epoch": 0.48, + "learning_rate": 0.00022863873703505292, + "loss": 0.0544, "step": 73710 }, { - "epoch": 0.8, - "learning_rate": 0.00018039457459926016, - "loss": 0.0476, + "epoch": 0.48, + "learning_rate": 0.000228629055680696, + "loss": 0.054, "step": 73720 }, { - "epoch": 0.8, - "learning_rate": 0.00018037835031475108, - "loss": 0.0475, + "epoch": 0.48, + "learning_rate": 0.00022861937432633908, + "loss": 0.0543, "step": 73730 }, { - "epoch": 0.8, - "learning_rate": 0.00018036212603024206, - "loss": 0.0442, + "epoch": 0.48, + "learning_rate": 0.00022860969297198213, + "loss": 0.0499, "step": 73740 }, { - "epoch": 0.8, - "learning_rate": 0.00018034590174573298, - "loss": 0.0472, + "epoch": 0.48, + "learning_rate": 0.0002286000116176252, + "loss": 0.0584, "step": 73750 }, { - "epoch": 0.8, - "learning_rate": 0.00018032967746122396, - "loss": 0.0478, + "epoch": 0.48, + "learning_rate": 0.0002285903302632683, + "loss": 0.0535, "step": 73760 }, { - "epoch": 0.8, - "learning_rate": 0.00018031345317671488, - "loss": 0.0524, + "epoch": 0.48, + "learning_rate": 0.00022858064890891137, + "loss": 0.0472, "step": 73770 }, { - "epoch": 0.8, - "learning_rate": 0.00018029722889220586, - "loss": 0.0483, + "epoch": 0.48, + "learning_rate": 0.0002285709675545544, + "loss": 0.0563, "step": 73780 }, { - "epoch": 0.8, - "learning_rate": 0.00018028100460769678, - "loss": 0.0444, + "epoch": 0.48, + "learning_rate": 0.00022856128620019748, + "loss": 0.0524, "step": 73790 }, { - "epoch": 0.8, - "learning_rate": 0.00018026478032318773, - "loss": 0.048, + "epoch": 0.48, + "learning_rate": 0.00022855160484584053, + "loss": 0.0512, "step": 73800 }, { - "epoch": 0.8, - "learning_rate": 0.00018024855603867868, - "loss": 0.0533, + "epoch": 0.48, + "learning_rate": 0.0002285419234914836, + "loss": 0.0581, "step": 73810 }, { - "epoch": 0.8, - "learning_rate": 0.00018023233175416963, - "loss": 0.0446, + "epoch": 0.48, + "learning_rate": 0.0002285322421371267, + "loss": 0.051, "step": 73820 }, { - "epoch": 0.8, - "learning_rate": 0.00018021610746966055, - "loss": 0.0408, + "epoch": 0.48, + "learning_rate": 0.00022852256078276977, + "loss": 0.057, "step": 73830 }, { - "epoch": 0.8, - "learning_rate": 0.00018019988318515153, - "loss": 0.0406, + "epoch": 0.48, + "learning_rate": 0.00022851287942841282, + "loss": 0.0451, "step": 73840 }, { - "epoch": 0.8, - "learning_rate": 0.00018018365890064245, - "loss": 0.0523, + "epoch": 0.48, + "learning_rate": 0.00022850319807405587, + "loss": 0.0518, "step": 73850 }, { - "epoch": 0.8, - "learning_rate": 0.00018016743461613343, - "loss": 0.044, + "epoch": 0.48, + "learning_rate": 0.00022849351671969895, + "loss": 0.0568, "step": 73860 }, { - "epoch": 0.8, - "learning_rate": 0.00018015121033162435, - "loss": 0.0396, + "epoch": 0.48, + "learning_rate": 0.000228483835365342, + "loss": 0.0531, "step": 73870 }, { - "epoch": 0.8, - "learning_rate": 0.0001801349860471153, - "loss": 0.0442, + "epoch": 0.48, + "learning_rate": 0.00022847415401098509, + "loss": 0.0546, "step": 73880 }, { - "epoch": 0.8, - "learning_rate": 0.00018011876176260625, - "loss": 0.0514, + "epoch": 0.48, + "learning_rate": 0.00022846447265662816, + "loss": 0.0586, "step": 73890 }, { - "epoch": 0.8, - "learning_rate": 0.0001801025374780972, - "loss": 0.0489, + "epoch": 0.48, + "learning_rate": 0.00022845479130227124, + "loss": 0.0475, "step": 73900 }, { - "epoch": 0.8, - "learning_rate": 0.00018008631319358813, - "loss": 0.0438, + "epoch": 0.48, + "learning_rate": 0.0002284451099479143, + "loss": 0.0598, "step": 73910 }, { - "epoch": 0.8, - "learning_rate": 0.0001800700889090791, - "loss": 0.0438, + "epoch": 0.48, + "learning_rate": 0.00022843542859355735, + "loss": 0.0513, "step": 73920 }, { - "epoch": 0.8, - "learning_rate": 0.00018005386462457003, - "loss": 0.0442, + "epoch": 0.48, + "learning_rate": 0.00022842574723920043, + "loss": 0.0524, "step": 73930 }, { - "epoch": 0.8, - "learning_rate": 0.000180037640340061, - "loss": 0.0477, + "epoch": 0.48, + "learning_rate": 0.00022841606588484348, + "loss": 0.0587, "step": 73940 }, { - "epoch": 0.8, - "learning_rate": 0.00018002141605555193, - "loss": 0.0462, + "epoch": 0.48, + "learning_rate": 0.00022840638453048656, + "loss": 0.0553, "step": 73950 }, { - "epoch": 0.8, - "learning_rate": 0.0001800051917710429, - "loss": 0.0406, + "epoch": 0.48, + "learning_rate": 0.00022839670317612964, + "loss": 0.0563, "step": 73960 }, { - "epoch": 0.8, - "learning_rate": 0.00017998896748653382, - "loss": 0.0506, + "epoch": 0.48, + "learning_rate": 0.00022838702182177272, + "loss": 0.0698, "step": 73970 }, { - "epoch": 0.8, - "learning_rate": 0.00017997274320202477, - "loss": 0.0438, + "epoch": 0.48, + "learning_rate": 0.00022837734046741577, + "loss": 0.0551, "step": 73980 }, { - "epoch": 0.8, - "learning_rate": 0.00017995651891751572, - "loss": 0.0546, + "epoch": 0.48, + "learning_rate": 0.00022836765911305883, + "loss": 0.0566, "step": 73990 }, { - "epoch": 0.8, - "learning_rate": 0.00017994029463300667, - "loss": 0.043, + "epoch": 0.48, + "learning_rate": 0.00022835797775870188, + "loss": 0.0499, "step": 74000 }, { - "epoch": 0.8, - "eval_cer": 0.9211852472254175, - "eval_loss": 0.03291938826441765, - "eval_runtime": 118.8661, - "eval_samples_per_second": 16.826, - "eval_steps_per_second": 4.206, + "epoch": 0.48, + "eval_cer": 0.9200479041916167, + "eval_loss": 0.037295423448085785, + "eval_runtime": 120.0199, + "eval_samples_per_second": 16.664, + "eval_steps_per_second": 4.166, "step": 74000 }, { - "epoch": 0.8, - "learning_rate": 0.0001799240703484976, - "loss": 0.0495, + "epoch": 0.48, + "learning_rate": 0.00022834829640434496, + "loss": 0.056, "step": 74010 }, { - "epoch": 0.8, - "learning_rate": 0.00017990784606398857, - "loss": 0.0487, + "epoch": 0.48, + "learning_rate": 0.00022833861504998804, + "loss": 0.0527, "step": 74020 }, { - "epoch": 0.8, - "learning_rate": 0.0001798916217794795, - "loss": 0.0439, + "epoch": 0.48, + "learning_rate": 0.00022832893369563112, + "loss": 0.0605, "step": 74030 }, { - "epoch": 0.8, - "learning_rate": 0.00017987539749497047, - "loss": 0.0427, + "epoch": 0.48, + "learning_rate": 0.00022831925234127417, + "loss": 0.0535, "step": 74040 }, { - "epoch": 0.8, - "learning_rate": 0.0001798591732104614, - "loss": 0.0498, + "epoch": 0.48, + "learning_rate": 0.00022830957098691725, + "loss": 0.0577, "step": 74050 }, { - "epoch": 0.8, - "learning_rate": 0.00017984294892595235, - "loss": 0.0421, + "epoch": 0.48, + "learning_rate": 0.0002282998896325603, + "loss": 0.0545, "step": 74060 }, { - "epoch": 0.8, - "learning_rate": 0.0001798267246414433, - "loss": 0.0426, + "epoch": 0.48, + "learning_rate": 0.00022829020827820336, + "loss": 0.0498, "step": 74070 }, { - "epoch": 0.8, - "learning_rate": 0.00017981050035693425, - "loss": 0.0516, + "epoch": 0.48, + "learning_rate": 0.00022828052692384644, + "loss": 0.0526, "step": 74080 }, { - "epoch": 0.8, - "learning_rate": 0.00017979427607242517, - "loss": 0.0466, + "epoch": 0.48, + "learning_rate": 0.00022827084556948952, + "loss": 0.0513, "step": 74090 }, { - "epoch": 0.8, - "learning_rate": 0.00017977805178791614, - "loss": 0.0424, + "epoch": 0.48, + "learning_rate": 0.0002282611642151326, + "loss": 0.0534, "step": 74100 }, { - "epoch": 0.8, - "learning_rate": 0.00017976182750340707, - "loss": 0.038, + "epoch": 0.48, + "learning_rate": 0.00022825148286077565, + "loss": 0.0566, "step": 74110 }, { - "epoch": 0.8, - "learning_rate": 0.00017974560321889804, - "loss": 0.0527, + "epoch": 0.48, + "learning_rate": 0.00022824180150641873, + "loss": 0.0504, "step": 74120 }, { - "epoch": 0.8, - "learning_rate": 0.00017972937893438897, - "loss": 0.0408, + "epoch": 0.48, + "learning_rate": 0.00022823212015206178, + "loss": 0.0545, "step": 74130 }, { - "epoch": 0.8, - "learning_rate": 0.00017971315464987994, - "loss": 0.0445, + "epoch": 0.48, + "learning_rate": 0.00022822243879770483, + "loss": 0.0491, "step": 74140 }, { - "epoch": 0.8, - "learning_rate": 0.00017969693036537087, - "loss": 0.0535, + "epoch": 0.48, + "learning_rate": 0.00022821275744334791, + "loss": 0.0527, "step": 74150 }, { - "epoch": 0.8, - "learning_rate": 0.00017968070608086182, - "loss": 0.0488, + "epoch": 0.48, + "learning_rate": 0.000228203076088991, + "loss": 0.0575, "step": 74160 }, { - "epoch": 0.8, - "learning_rate": 0.00017966448179635277, - "loss": 0.0442, + "epoch": 0.48, + "learning_rate": 0.00022819339473463407, + "loss": 0.0536, "step": 74170 }, { - "epoch": 0.8, - "learning_rate": 0.00017964825751184372, - "loss": 0.0432, + "epoch": 0.48, + "learning_rate": 0.00022818371338027713, + "loss": 0.0563, "step": 74180 }, { - "epoch": 0.8, - "learning_rate": 0.00017963203322733464, - "loss": 0.0452, + "epoch": 0.48, + "learning_rate": 0.0002281740320259202, + "loss": 0.0539, "step": 74190 }, { - "epoch": 0.8, - "learning_rate": 0.00017961580894282562, - "loss": 0.0466, + "epoch": 0.48, + "learning_rate": 0.00022816435067156323, + "loss": 0.0556, "step": 74200 }, { - "epoch": 0.8, - "learning_rate": 0.00017959958465831654, - "loss": 0.0489, + "epoch": 0.48, + "learning_rate": 0.0002281546693172063, + "loss": 0.0612, "step": 74210 }, { - "epoch": 0.8, - "learning_rate": 0.00017958336037380751, - "loss": 0.0456, + "epoch": 0.48, + "learning_rate": 0.0002281449879628494, + "loss": 0.0517, "step": 74220 }, { - "epoch": 0.8, - "learning_rate": 0.00017956713608929844, - "loss": 0.0421, + "epoch": 0.48, + "learning_rate": 0.00022813530660849247, + "loss": 0.0478, "step": 74230 }, { - "epoch": 0.8, - "learning_rate": 0.0001795509118047894, - "loss": 0.0504, + "epoch": 0.48, + "learning_rate": 0.00022812562525413552, + "loss": 0.0531, "step": 74240 }, { - "epoch": 0.8, - "learning_rate": 0.00017953468752028034, - "loss": 0.0448, + "epoch": 0.48, + "learning_rate": 0.0002281159438997786, + "loss": 0.0596, "step": 74250 }, { - "epoch": 0.8, - "learning_rate": 0.0001795184632357713, - "loss": 0.0411, + "epoch": 0.48, + "learning_rate": 0.00022810626254542168, + "loss": 0.0456, "step": 74260 }, { - "epoch": 0.8, - "learning_rate": 0.0001795022389512622, - "loss": 0.0546, + "epoch": 0.48, + "learning_rate": 0.0002280965811910647, + "loss": 0.0545, "step": 74270 }, { - "epoch": 0.8, - "learning_rate": 0.00017948601466675319, - "loss": 0.0466, + "epoch": 0.48, + "learning_rate": 0.0002280868998367078, + "loss": 0.049, "step": 74280 }, { - "epoch": 0.8, - "learning_rate": 0.0001794697903822441, - "loss": 0.0383, + "epoch": 0.48, + "learning_rate": 0.00022807721848235087, + "loss": 0.0517, "step": 74290 }, { - "epoch": 0.8, - "learning_rate": 0.00017945356609773509, - "loss": 0.0429, + "epoch": 0.48, + "learning_rate": 0.00022806753712799395, + "loss": 0.0546, "step": 74300 }, { - "epoch": 0.8, - "learning_rate": 0.000179437341813226, - "loss": 0.045, + "epoch": 0.48, + "learning_rate": 0.000228057855773637, + "loss": 0.049, "step": 74310 }, { - "epoch": 0.8, - "learning_rate": 0.00017942111752871699, - "loss": 0.049, + "epoch": 0.48, + "learning_rate": 0.00022804817441928008, + "loss": 0.051, "step": 74320 }, { - "epoch": 0.8, - "learning_rate": 0.0001794048932442079, - "loss": 0.0483, + "epoch": 0.48, + "learning_rate": 0.00022803849306492316, + "loss": 0.0512, "step": 74330 }, { - "epoch": 0.8, - "learning_rate": 0.00017938866895969886, - "loss": 0.0402, + "epoch": 0.48, + "learning_rate": 0.00022802881171056619, + "loss": 0.0483, "step": 74340 }, { - "epoch": 0.8, - "learning_rate": 0.0001793724446751898, - "loss": 0.0404, + "epoch": 0.48, + "learning_rate": 0.00022801913035620927, + "loss": 0.0562, "step": 74350 }, { - "epoch": 0.8, - "learning_rate": 0.00017935622039068076, - "loss": 0.0455, + "epoch": 0.48, + "learning_rate": 0.00022800944900185235, + "loss": 0.0539, "step": 74360 }, { - "epoch": 0.8, - "learning_rate": 0.00017933999610617168, - "loss": 0.0476, + "epoch": 0.48, + "learning_rate": 0.00022799976764749543, + "loss": 0.0572, "step": 74370 }, { - "epoch": 0.8, - "learning_rate": 0.00017932377182166266, - "loss": 0.0438, + "epoch": 0.48, + "learning_rate": 0.00022799008629313848, + "loss": 0.0554, "step": 74380 }, { - "epoch": 0.8, - "learning_rate": 0.00017930754753715358, - "loss": 0.0451, + "epoch": 0.48, + "learning_rate": 0.00022798040493878156, + "loss": 0.0524, "step": 74390 }, { - "epoch": 0.8, - "learning_rate": 0.00017929132325264456, - "loss": 0.0531, + "epoch": 0.48, + "learning_rate": 0.00022797072358442464, + "loss": 0.052, "step": 74400 }, { - "epoch": 0.8, - "learning_rate": 0.00017927509896813548, - "loss": 0.0435, + "epoch": 0.48, + "learning_rate": 0.00022796104223006766, + "loss": 0.0541, "step": 74410 }, { - "epoch": 0.8, - "learning_rate": 0.00017925887468362643, - "loss": 0.0437, + "epoch": 0.48, + "learning_rate": 0.00022795136087571074, + "loss": 0.0567, "step": 74420 }, { - "epoch": 0.81, - "learning_rate": 0.00017924265039911738, - "loss": 0.0499, + "epoch": 0.48, + "learning_rate": 0.00022794167952135382, + "loss": 0.06, "step": 74430 }, { - "epoch": 0.81, - "learning_rate": 0.00017922642611460833, - "loss": 0.0491, + "epoch": 0.48, + "learning_rate": 0.00022793199816699688, + "loss": 0.0455, "step": 74440 }, { - "epoch": 0.81, - "learning_rate": 0.00017921020183009928, - "loss": 0.0445, + "epoch": 0.48, + "learning_rate": 0.00022792231681263996, + "loss": 0.0548, "step": 74450 }, { - "epoch": 0.81, - "learning_rate": 0.00017919397754559023, - "loss": 0.0509, + "epoch": 0.48, + "learning_rate": 0.00022791263545828304, + "loss": 0.0501, "step": 74460 }, { - "epoch": 0.81, - "learning_rate": 0.00017917775326108115, - "loss": 0.0458, + "epoch": 0.48, + "learning_rate": 0.00022790295410392612, + "loss": 0.053, "step": 74470 }, { - "epoch": 0.81, - "learning_rate": 0.00017916152897657213, - "loss": 0.0441, + "epoch": 0.48, + "learning_rate": 0.00022789327274956914, + "loss": 0.0502, "step": 74480 }, { - "epoch": 0.81, - "learning_rate": 0.00017914530469206305, - "loss": 0.049, + "epoch": 0.48, + "learning_rate": 0.00022788359139521222, + "loss": 0.0553, "step": 74490 }, { - "epoch": 0.81, - "learning_rate": 0.00017912908040755403, - "loss": 0.0401, + "epoch": 0.48, + "learning_rate": 0.0002278739100408553, + "loss": 0.0483, "step": 74500 }, { - "epoch": 0.81, - "learning_rate": 0.00017911285612304495, - "loss": 0.0505, + "epoch": 0.48, + "learning_rate": 0.00022786422868649835, + "loss": 0.0596, "step": 74510 }, { - "epoch": 0.81, - "learning_rate": 0.0001790966318385359, - "loss": 0.0526, + "epoch": 0.48, + "learning_rate": 0.00022785454733214143, + "loss": 0.0538, "step": 74520 }, { - "epoch": 0.81, - "learning_rate": 0.00017908040755402685, - "loss": 0.0498, + "epoch": 0.48, + "learning_rate": 0.0002278448659777845, + "loss": 0.0546, "step": 74530 }, { - "epoch": 0.81, - "learning_rate": 0.0001790641832695178, - "loss": 0.0432, + "epoch": 0.48, + "learning_rate": 0.0002278351846234276, + "loss": 0.061, "step": 74540 }, { - "epoch": 0.81, - "learning_rate": 0.00017904795898500872, - "loss": 0.0472, + "epoch": 0.48, + "learning_rate": 0.00022782550326907062, + "loss": 0.0527, "step": 74550 }, { - "epoch": 0.81, - "learning_rate": 0.0001790317347004997, - "loss": 0.048, + "epoch": 0.48, + "learning_rate": 0.0002278158219147137, + "loss": 0.0546, "step": 74560 }, { - "epoch": 0.81, - "learning_rate": 0.00017901551041599062, - "loss": 0.0403, + "epoch": 0.48, + "learning_rate": 0.00022780614056035678, + "loss": 0.0523, "step": 74570 }, { - "epoch": 0.81, - "learning_rate": 0.0001789992861314816, - "loss": 0.047, + "epoch": 0.48, + "learning_rate": 0.00022779645920599983, + "loss": 0.055, "step": 74580 }, { - "epoch": 0.81, - "learning_rate": 0.00017898306184697252, - "loss": 0.0417, + "epoch": 0.48, + "learning_rate": 0.0002277867778516429, + "loss": 0.0479, "step": 74590 }, { - "epoch": 0.81, - "learning_rate": 0.00017896683756246347, - "loss": 0.0463, + "epoch": 0.48, + "learning_rate": 0.000227777096497286, + "loss": 0.0514, "step": 74600 }, { - "epoch": 0.81, - "learning_rate": 0.00017895061327795442, - "loss": 0.0514, + "epoch": 0.48, + "learning_rate": 0.00022776741514292904, + "loss": 0.0563, "step": 74610 }, { - "epoch": 0.81, - "learning_rate": 0.00017893438899344537, - "loss": 0.05, + "epoch": 0.48, + "learning_rate": 0.0002277577337885721, + "loss": 0.0494, "step": 74620 }, { - "epoch": 0.81, - "learning_rate": 0.00017891816470893632, - "loss": 0.0498, + "epoch": 0.48, + "learning_rate": 0.00022774805243421517, + "loss": 0.0484, "step": 74630 }, { - "epoch": 0.81, - "learning_rate": 0.00017890194042442727, - "loss": 0.0514, + "epoch": 0.48, + "learning_rate": 0.00022773837107985823, + "loss": 0.0515, "step": 74640 }, { - "epoch": 0.81, - "learning_rate": 0.0001788857161399182, - "loss": 0.051, + "epoch": 0.48, + "learning_rate": 0.0002277286897255013, + "loss": 0.0615, "step": 74650 }, { - "epoch": 0.81, - "learning_rate": 0.00017886949185540917, - "loss": 0.0487, + "epoch": 0.48, + "learning_rate": 0.0002277190083711444, + "loss": 0.0649, "step": 74660 }, { - "epoch": 0.81, - "learning_rate": 0.0001788532675709001, - "loss": 0.0452, + "epoch": 0.48, + "learning_rate": 0.00022770932701678747, + "loss": 0.0555, "step": 74670 }, { - "epoch": 0.81, - "learning_rate": 0.00017883704328639107, - "loss": 0.043, + "epoch": 0.48, + "learning_rate": 0.00022769964566243052, + "loss": 0.0526, "step": 74680 }, { - "epoch": 0.81, - "learning_rate": 0.000178820819001882, - "loss": 0.0499, + "epoch": 0.48, + "learning_rate": 0.00022768996430807357, + "loss": 0.0501, "step": 74690 }, { - "epoch": 0.81, - "learning_rate": 0.00017880459471737294, - "loss": 0.0441, + "epoch": 0.48, + "learning_rate": 0.00022768028295371665, + "loss": 0.0533, "step": 74700 }, { - "epoch": 0.81, - "learning_rate": 0.0001787883704328639, - "loss": 0.0517, + "epoch": 0.48, + "learning_rate": 0.0002276706015993597, + "loss": 0.0597, "step": 74710 }, { - "epoch": 0.81, - "learning_rate": 0.00017877214614835484, - "loss": 0.0459, + "epoch": 0.48, + "learning_rate": 0.00022766092024500278, + "loss": 0.0533, "step": 74720 }, { - "epoch": 0.81, - "learning_rate": 0.00017875592186384576, - "loss": 0.0412, + "epoch": 0.48, + "learning_rate": 0.00022765123889064586, + "loss": 0.0506, "step": 74730 }, { - "epoch": 0.81, - "learning_rate": 0.00017873969757933674, - "loss": 0.0444, + "epoch": 0.48, + "learning_rate": 0.00022764155753628894, + "loss": 0.0579, "step": 74740 }, { - "epoch": 0.81, - "learning_rate": 0.00017872347329482766, - "loss": 0.0542, + "epoch": 0.48, + "learning_rate": 0.000227631876181932, + "loss": 0.0513, "step": 74750 }, { - "epoch": 0.81, - "learning_rate": 0.00017870724901031864, - "loss": 0.0464, + "epoch": 0.48, + "learning_rate": 0.00022762219482757505, + "loss": 0.0523, "step": 74760 }, { - "epoch": 0.81, - "learning_rate": 0.00017869102472580956, - "loss": 0.0502, + "epoch": 0.48, + "learning_rate": 0.00022761251347321813, + "loss": 0.0526, "step": 74770 }, { - "epoch": 0.81, - "learning_rate": 0.0001786748004413005, - "loss": 0.0511, + "epoch": 0.48, + "learning_rate": 0.00022760283211886118, + "loss": 0.0562, "step": 74780 }, { - "epoch": 0.81, - "learning_rate": 0.00017865857615679146, - "loss": 0.048, + "epoch": 0.48, + "learning_rate": 0.00022759315076450426, + "loss": 0.0546, "step": 74790 }, { - "epoch": 0.81, - "learning_rate": 0.0001786423518722824, - "loss": 0.0478, + "epoch": 0.48, + "learning_rate": 0.00022758346941014734, + "loss": 0.0556, "step": 74800 }, { - "epoch": 0.81, - "learning_rate": 0.00017862612758777336, - "loss": 0.0458, + "epoch": 0.48, + "learning_rate": 0.0002275737880557904, + "loss": 0.0593, "step": 74810 }, { - "epoch": 0.81, - "learning_rate": 0.0001786099033032643, - "loss": 0.0491, + "epoch": 0.48, + "learning_rate": 0.00022756410670143347, + "loss": 0.0618, "step": 74820 }, { - "epoch": 0.81, - "learning_rate": 0.00017859367901875523, - "loss": 0.0525, + "epoch": 0.48, + "learning_rate": 0.00022755442534707653, + "loss": 0.0563, "step": 74830 }, { - "epoch": 0.81, - "learning_rate": 0.0001785774547342462, - "loss": 0.0422, + "epoch": 0.48, + "learning_rate": 0.00022754474399271958, + "loss": 0.0459, "step": 74840 }, { - "epoch": 0.81, - "learning_rate": 0.00017856123044973713, - "loss": 0.0416, + "epoch": 0.48, + "learning_rate": 0.00022753506263836266, + "loss": 0.0519, "step": 74850 }, { - "epoch": 0.81, - "learning_rate": 0.0001785450061652281, - "loss": 0.0573, + "epoch": 0.48, + "learning_rate": 0.00022752538128400574, + "loss": 0.0538, "step": 74860 }, { - "epoch": 0.81, - "learning_rate": 0.00017852878188071903, - "loss": 0.0443, + "epoch": 0.48, + "learning_rate": 0.00022751569992964882, + "loss": 0.056, "step": 74870 }, { - "epoch": 0.81, - "learning_rate": 0.00017851255759620998, - "loss": 0.041, + "epoch": 0.48, + "learning_rate": 0.00022750601857529187, + "loss": 0.0611, "step": 74880 }, { - "epoch": 0.81, - "learning_rate": 0.00017849633331170093, - "loss": 0.0402, + "epoch": 0.48, + "learning_rate": 0.00022749633722093495, + "loss": 0.0579, "step": 74890 }, { - "epoch": 0.81, - "learning_rate": 0.00017848010902719188, - "loss": 0.0437, + "epoch": 0.48, + "learning_rate": 0.000227486655866578, + "loss": 0.0526, "step": 74900 }, { - "epoch": 0.81, - "learning_rate": 0.0001784638847426828, - "loss": 0.0505, + "epoch": 0.48, + "learning_rate": 0.00022747697451222106, + "loss": 0.0614, "step": 74910 }, { - "epoch": 0.81, - "learning_rate": 0.00017844766045817378, - "loss": 0.0435, + "epoch": 0.48, + "learning_rate": 0.00022746729315786414, + "loss": 0.0516, "step": 74920 }, { - "epoch": 0.81, - "learning_rate": 0.0001784314361736647, - "loss": 0.0495, + "epoch": 0.48, + "learning_rate": 0.00022745761180350722, + "loss": 0.0579, "step": 74930 }, { - "epoch": 0.81, - "learning_rate": 0.00017841521188915568, - "loss": 0.0511, + "epoch": 0.48, + "learning_rate": 0.0002274479304491503, + "loss": 0.0581, "step": 74940 }, { - "epoch": 0.81, - "learning_rate": 0.0001783989876046466, - "loss": 0.0457, + "epoch": 0.48, + "learning_rate": 0.00022743824909479335, + "loss": 0.055, "step": 74950 }, { - "epoch": 0.81, - "learning_rate": 0.00017838276332013755, - "loss": 0.0449, + "epoch": 0.48, + "learning_rate": 0.00022742856774043643, + "loss": 0.0524, "step": 74960 }, { - "epoch": 0.81, - "learning_rate": 0.0001783665390356285, - "loss": 0.0432, + "epoch": 0.48, + "learning_rate": 0.00022741888638607948, + "loss": 0.0572, "step": 74970 }, { - "epoch": 0.81, - "learning_rate": 0.00017835031475111945, - "loss": 0.0499, + "epoch": 0.48, + "learning_rate": 0.00022740920503172253, + "loss": 0.0502, "step": 74980 }, { - "epoch": 0.81, - "learning_rate": 0.0001783340904666104, - "loss": 0.0485, + "epoch": 0.48, + "learning_rate": 0.00022739952367736561, + "loss": 0.0566, "step": 74990 }, { - "epoch": 0.81, - "learning_rate": 0.00017831786618210135, - "loss": 0.0554, + "epoch": 0.48, + "learning_rate": 0.0002273898423230087, + "loss": 0.0578, "step": 75000 }, { - "epoch": 0.81, - "eval_cer": 0.9211613931487558, - "eval_loss": 0.032306186854839325, - "eval_runtime": 118.8578, - "eval_samples_per_second": 16.827, - "eval_steps_per_second": 4.207, + "epoch": 0.48, + "eval_cer": 0.9199900576206078, + "eval_loss": 0.03665885701775551, + "eval_runtime": 120.0194, + "eval_samples_per_second": 16.664, + "eval_steps_per_second": 4.166, "step": 75000 }, { - "epoch": 0.81, - "learning_rate": 0.00017830164189759228, - "loss": 0.0474, + "epoch": 0.48, + "learning_rate": 0.00022738016096865175, + "loss": 0.054, "step": 75010 }, { - "epoch": 0.81, - "learning_rate": 0.00017828541761308325, - "loss": 0.0421, + "epoch": 0.48, + "learning_rate": 0.00022737047961429483, + "loss": 0.0585, "step": 75020 }, { - "epoch": 0.81, - "learning_rate": 0.00017826919332857418, - "loss": 0.0474, + "epoch": 0.48, + "learning_rate": 0.0002273607982599379, + "loss": 0.0547, "step": 75030 }, { - "epoch": 0.81, - "learning_rate": 0.00017825296904406515, - "loss": 0.0517, + "epoch": 0.48, + "learning_rate": 0.00022735111690558093, + "loss": 0.0516, "step": 75040 }, { - "epoch": 0.81, - "learning_rate": 0.00017823674475955607, - "loss": 0.0455, + "epoch": 0.48, + "learning_rate": 0.000227341435551224, + "loss": 0.0554, "step": 75050 }, { - "epoch": 0.81, - "learning_rate": 0.00017822052047504702, - "loss": 0.0402, + "epoch": 0.48, + "learning_rate": 0.0002273317541968671, + "loss": 0.0527, "step": 75060 }, { - "epoch": 0.81, - "learning_rate": 0.00017820429619053797, - "loss": 0.0494, + "epoch": 0.48, + "learning_rate": 0.00022732207284251017, + "loss": 0.054, "step": 75070 }, { - "epoch": 0.81, - "learning_rate": 0.00017818807190602892, - "loss": 0.0406, + "epoch": 0.48, + "learning_rate": 0.00022731239148815322, + "loss": 0.049, "step": 75080 }, { - "epoch": 0.81, - "learning_rate": 0.0001781718476215199, - "loss": 0.0487, + "epoch": 0.48, + "learning_rate": 0.0002273027101337963, + "loss": 0.0559, "step": 75090 }, { - "epoch": 0.81, - "learning_rate": 0.00017815562333701082, - "loss": 0.0504, + "epoch": 0.48, + "learning_rate": 0.00022729302877943938, + "loss": 0.0572, "step": 75100 }, { - "epoch": 0.81, - "learning_rate": 0.00017813939905250177, - "loss": 0.0462, + "epoch": 0.48, + "learning_rate": 0.0002272833474250824, + "loss": 0.0595, "step": 75110 }, { - "epoch": 0.81, - "learning_rate": 0.00017812317476799272, - "loss": 0.0537, + "epoch": 0.48, + "learning_rate": 0.0002272736660707255, + "loss": 0.0503, "step": 75120 }, { - "epoch": 0.81, - "learning_rate": 0.00017810695048348367, - "loss": 0.0479, + "epoch": 0.48, + "learning_rate": 0.00022726398471636857, + "loss": 0.051, "step": 75130 }, { - "epoch": 0.81, - "learning_rate": 0.00017809072619897462, - "loss": 0.0556, + "epoch": 0.48, + "learning_rate": 0.00022725430336201165, + "loss": 0.0582, "step": 75140 }, { - "epoch": 0.81, - "learning_rate": 0.00017807450191446557, - "loss": 0.0553, + "epoch": 0.49, + "learning_rate": 0.0002272446220076547, + "loss": 0.0549, "step": 75150 }, { - "epoch": 0.81, - "learning_rate": 0.0001780582776299565, - "loss": 0.0513, + "epoch": 0.49, + "learning_rate": 0.00022723494065329778, + "loss": 0.0525, "step": 75160 }, { - "epoch": 0.81, - "learning_rate": 0.00017804205334544747, - "loss": 0.0468, + "epoch": 0.49, + "learning_rate": 0.00022722525929894086, + "loss": 0.0538, "step": 75170 }, { - "epoch": 0.81, - "learning_rate": 0.0001780258290609384, - "loss": 0.0501, + "epoch": 0.49, + "learning_rate": 0.00022721557794458389, + "loss": 0.0595, "step": 75180 }, { - "epoch": 0.81, - "learning_rate": 0.00017800960477642937, - "loss": 0.0477, + "epoch": 0.49, + "learning_rate": 0.00022720589659022697, + "loss": 0.0555, "step": 75190 }, { - "epoch": 0.81, - "learning_rate": 0.0001779933804919203, - "loss": 0.0569, + "epoch": 0.49, + "learning_rate": 0.00022719621523587005, + "loss": 0.0495, "step": 75200 }, { - "epoch": 0.81, - "learning_rate": 0.00017797715620741124, - "loss": 0.0503, + "epoch": 0.49, + "learning_rate": 0.0002271865338815131, + "loss": 0.059, "step": 75210 }, { - "epoch": 0.81, - "learning_rate": 0.0001779609319229022, - "loss": 0.0448, + "epoch": 0.49, + "learning_rate": 0.00022717685252715618, + "loss": 0.0558, "step": 75220 }, { - "epoch": 0.81, - "learning_rate": 0.00017794470763839314, - "loss": 0.0466, + "epoch": 0.49, + "learning_rate": 0.00022716717117279926, + "loss": 0.0543, "step": 75230 }, { - "epoch": 0.81, - "learning_rate": 0.00017792848335388407, - "loss": 0.0432, + "epoch": 0.49, + "learning_rate": 0.00022715748981844234, + "loss": 0.1502, "step": 75240 }, { - "epoch": 0.81, - "learning_rate": 0.00017791225906937504, - "loss": 0.0468, + "epoch": 0.49, + "learning_rate": 0.00022714780846408536, + "loss": 0.0914, "step": 75250 }, { - "epoch": 0.81, - "learning_rate": 0.00017789603478486597, - "loss": 0.0423, + "epoch": 0.49, + "learning_rate": 0.00022713812710972844, + "loss": 0.0557, "step": 75260 }, { - "epoch": 0.81, - "learning_rate": 0.00017787981050035694, - "loss": 0.04, + "epoch": 0.49, + "learning_rate": 0.00022712844575537152, + "loss": 0.059, "step": 75270 }, { - "epoch": 0.81, - "learning_rate": 0.00017786358621584787, - "loss": 0.044, + "epoch": 0.49, + "learning_rate": 0.00022711876440101458, + "loss": 0.0474, "step": 75280 }, { - "epoch": 0.81, - "learning_rate": 0.00017784736193133881, - "loss": 0.0443, + "epoch": 0.49, + "learning_rate": 0.00022710908304665766, + "loss": 0.0485, "step": 75290 }, { - "epoch": 0.81, - "learning_rate": 0.00017783113764682976, - "loss": 0.0417, + "epoch": 0.49, + "learning_rate": 0.00022709940169230073, + "loss": 0.0537, "step": 75300 }, { - "epoch": 0.81, - "learning_rate": 0.00017781491336232071, - "loss": 0.0442, + "epoch": 0.49, + "learning_rate": 0.00022708972033794381, + "loss": 0.0533, "step": 75310 }, { - "epoch": 0.81, - "learning_rate": 0.00017779868907781166, - "loss": 0.0508, + "epoch": 0.49, + "learning_rate": 0.00022708003898358684, + "loss": 0.0551, "step": 75320 }, { - "epoch": 0.81, - "learning_rate": 0.00017778246479330261, - "loss": 0.0405, + "epoch": 0.49, + "learning_rate": 0.00022707035762922992, + "loss": 0.0549, "step": 75330 }, { - "epoch": 0.81, - "learning_rate": 0.00017776624050879354, - "loss": 0.043, + "epoch": 0.49, + "learning_rate": 0.000227060676274873, + "loss": 0.0545, "step": 75340 }, { - "epoch": 0.81, - "learning_rate": 0.0001777500162242845, - "loss": 0.0528, + "epoch": 0.49, + "learning_rate": 0.00022705099492051605, + "loss": 0.058, "step": 75350 }, { - "epoch": 0.82, - "learning_rate": 0.00017773379193977544, - "loss": 0.0444, + "epoch": 0.49, + "learning_rate": 0.00022704131356615913, + "loss": 0.0496, "step": 75360 }, { - "epoch": 0.82, - "learning_rate": 0.0001777175676552664, - "loss": 0.0448, + "epoch": 0.49, + "learning_rate": 0.0002270316322118022, + "loss": 0.0504, "step": 75370 }, { - "epoch": 0.82, - "learning_rate": 0.00017770134337075734, - "loss": 0.0526, + "epoch": 0.49, + "learning_rate": 0.00022702195085744526, + "loss": 0.0562, "step": 75380 }, { - "epoch": 0.82, - "learning_rate": 0.00017768511908624829, - "loss": 0.0507, + "epoch": 0.49, + "learning_rate": 0.00022701226950308832, + "loss": 0.0649, "step": 75390 }, { - "epoch": 0.82, - "learning_rate": 0.00017766889480173924, - "loss": 0.048, + "epoch": 0.49, + "learning_rate": 0.0002270025881487314, + "loss": 0.0511, "step": 75400 }, { - "epoch": 0.82, - "learning_rate": 0.00017765267051723019, - "loss": 0.0469, + "epoch": 0.49, + "learning_rate": 0.00022699290679437445, + "loss": 0.0562, "step": 75410 }, { - "epoch": 0.82, - "learning_rate": 0.0001776364462327211, - "loss": 0.0457, + "epoch": 0.49, + "learning_rate": 0.00022698322544001753, + "loss": 0.056, "step": 75420 }, { - "epoch": 0.82, - "learning_rate": 0.00017762022194821208, - "loss": 0.0441, + "epoch": 0.49, + "learning_rate": 0.0002269735440856606, + "loss": 0.054, "step": 75430 }, { - "epoch": 0.82, - "learning_rate": 0.000177603997663703, - "loss": 0.0487, + "epoch": 0.49, + "learning_rate": 0.0002269638627313037, + "loss": 0.0617, "step": 75440 }, { - "epoch": 0.82, - "learning_rate": 0.00017758777337919398, - "loss": 0.0437, + "epoch": 0.49, + "learning_rate": 0.00022695418137694674, + "loss": 0.046, "step": 75450 }, { - "epoch": 0.82, - "learning_rate": 0.0001775715490946849, - "loss": 0.0402, + "epoch": 0.49, + "learning_rate": 0.0002269445000225898, + "loss": 0.0556, "step": 75460 }, { - "epoch": 0.82, - "learning_rate": 0.00017755532481017586, - "loss": 0.046, + "epoch": 0.49, + "learning_rate": 0.00022693481866823287, + "loss": 0.0519, "step": 75470 }, { - "epoch": 0.82, - "learning_rate": 0.0001775391005256668, - "loss": 0.0449, + "epoch": 0.49, + "learning_rate": 0.00022692513731387593, + "loss": 0.0494, "step": 75480 }, { - "epoch": 0.82, - "learning_rate": 0.00017752287624115776, - "loss": 0.0519, + "epoch": 0.49, + "learning_rate": 0.000226915455959519, + "loss": 0.059, "step": 75490 }, { - "epoch": 0.82, - "learning_rate": 0.0001775066519566487, - "loss": 0.0418, + "epoch": 0.49, + "learning_rate": 0.0002269057746051621, + "loss": 0.0546, "step": 75500 }, { - "epoch": 0.82, - "learning_rate": 0.00017749042767213966, - "loss": 0.0431, + "epoch": 0.49, + "learning_rate": 0.00022689609325080517, + "loss": 0.0557, "step": 75510 }, { - "epoch": 0.82, - "learning_rate": 0.00017747420338763058, - "loss": 0.0555, + "epoch": 0.49, + "learning_rate": 0.00022688641189644822, + "loss": 0.0471, "step": 75520 }, { - "epoch": 0.82, - "learning_rate": 0.00017745797910312156, - "loss": 0.0435, + "epoch": 0.49, + "learning_rate": 0.00022687673054209127, + "loss": 0.0625, "step": 75530 }, { - "epoch": 0.82, - "learning_rate": 0.00017744175481861248, - "loss": 0.0458, + "epoch": 0.49, + "learning_rate": 0.00022686704918773435, + "loss": 0.059, "step": 75540 }, { - "epoch": 0.82, - "learning_rate": 0.00017742553053410345, - "loss": 0.0425, + "epoch": 0.49, + "learning_rate": 0.0002268573678333774, + "loss": 0.0604, "step": 75550 }, { - "epoch": 0.82, - "learning_rate": 0.00017740930624959438, - "loss": 0.0497, + "epoch": 0.49, + "learning_rate": 0.00022684768647902048, + "loss": 0.0501, "step": 75560 }, { - "epoch": 0.82, - "learning_rate": 0.00017739308196508533, - "loss": 0.047, + "epoch": 0.49, + "learning_rate": 0.00022683800512466356, + "loss": 0.0523, "step": 75570 }, { - "epoch": 0.82, - "learning_rate": 0.00017737685768057628, - "loss": 0.0447, + "epoch": 0.49, + "learning_rate": 0.00022682832377030662, + "loss": 0.0476, "step": 75580 }, { - "epoch": 0.82, - "learning_rate": 0.00017736063339606723, - "loss": 0.0455, + "epoch": 0.49, + "learning_rate": 0.0002268186424159497, + "loss": 0.0518, "step": 75590 }, { - "epoch": 0.82, - "learning_rate": 0.00017734440911155815, - "loss": 0.0416, + "epoch": 0.49, + "learning_rate": 0.00022680896106159275, + "loss": 0.0602, "step": 75600 }, { - "epoch": 0.82, - "learning_rate": 0.00017732818482704913, - "loss": 0.0419, + "epoch": 0.49, + "learning_rate": 0.0002267992797072358, + "loss": 0.0623, "step": 75610 }, { - "epoch": 0.82, - "learning_rate": 0.00017731196054254005, - "loss": 0.0423, + "epoch": 0.49, + "learning_rate": 0.00022678959835287888, + "loss": 0.0676, "step": 75620 }, { - "epoch": 0.82, - "learning_rate": 0.00017729573625803103, - "loss": 0.046, + "epoch": 0.49, + "learning_rate": 0.00022677991699852196, + "loss": 0.0532, "step": 75630 }, { - "epoch": 0.82, - "learning_rate": 0.00017727951197352195, - "loss": 0.039, + "epoch": 0.49, + "learning_rate": 0.00022677023564416504, + "loss": 0.0595, "step": 75640 }, { - "epoch": 0.82, - "learning_rate": 0.0001772632876890129, - "loss": 0.0512, + "epoch": 0.49, + "learning_rate": 0.0002267605542898081, + "loss": 0.0545, "step": 75650 }, { - "epoch": 0.82, - "learning_rate": 0.00017724706340450385, - "loss": 0.0413, + "epoch": 0.49, + "learning_rate": 0.00022675087293545117, + "loss": 0.0576, "step": 75660 }, { - "epoch": 0.82, - "learning_rate": 0.0001772308391199948, - "loss": 0.0441, + "epoch": 0.49, + "learning_rate": 0.00022674119158109423, + "loss": 0.0677, "step": 75670 }, { - "epoch": 0.82, - "learning_rate": 0.00017721461483548575, - "loss": 0.0438, + "epoch": 0.49, + "learning_rate": 0.00022673151022673728, + "loss": 0.0574, "step": 75680 }, { - "epoch": 0.82, - "learning_rate": 0.0001771983905509767, - "loss": 0.0468, + "epoch": 0.49, + "learning_rate": 0.00022672182887238036, + "loss": 0.054, "step": 75690 }, { - "epoch": 0.82, - "learning_rate": 0.00017718216626646762, - "loss": 0.0432, + "epoch": 0.49, + "learning_rate": 0.00022671214751802344, + "loss": 0.0568, "step": 75700 }, { - "epoch": 0.82, - "learning_rate": 0.0001771659419819586, - "loss": 0.0441, + "epoch": 0.49, + "learning_rate": 0.00022670246616366652, + "loss": 0.0578, "step": 75710 }, { - "epoch": 0.82, - "learning_rate": 0.00017714971769744952, - "loss": 0.0403, + "epoch": 0.49, + "learning_rate": 0.00022669278480930957, + "loss": 0.056, "step": 75720 }, { - "epoch": 0.82, - "learning_rate": 0.0001771334934129405, - "loss": 0.0489, + "epoch": 0.49, + "learning_rate": 0.00022668310345495265, + "loss": 0.0456, "step": 75730 }, { - "epoch": 0.82, - "learning_rate": 0.00017711726912843142, - "loss": 0.0494, + "epoch": 0.49, + "learning_rate": 0.0002266734221005957, + "loss": 0.0558, "step": 75740 }, { - "epoch": 0.82, - "learning_rate": 0.00017710104484392237, - "loss": 0.0418, + "epoch": 0.49, + "learning_rate": 0.00022666374074623876, + "loss": 0.0599, "step": 75750 }, { - "epoch": 0.82, - "learning_rate": 0.00017708482055941332, - "loss": 0.0652, + "epoch": 0.49, + "learning_rate": 0.00022665405939188184, + "loss": 0.0534, "step": 75760 }, { - "epoch": 0.82, - "learning_rate": 0.00017706859627490427, - "loss": 0.0471, + "epoch": 0.49, + "learning_rate": 0.00022664437803752492, + "loss": 0.0601, "step": 75770 }, { - "epoch": 0.82, - "learning_rate": 0.0001770523719903952, - "loss": 0.046, + "epoch": 0.49, + "learning_rate": 0.000226634696683168, + "loss": 0.0504, "step": 75780 }, { - "epoch": 0.82, - "learning_rate": 0.00017703614770588617, - "loss": 0.0486, + "epoch": 0.49, + "learning_rate": 0.00022662501532881105, + "loss": 0.0577, "step": 75790 }, { - "epoch": 0.82, - "learning_rate": 0.0001770199234213771, - "loss": 0.0556, + "epoch": 0.49, + "learning_rate": 0.00022661533397445413, + "loss": 0.058, "step": 75800 }, { - "epoch": 0.82, - "learning_rate": 0.00017700369913686807, - "loss": 0.0554, + "epoch": 0.49, + "learning_rate": 0.00022660565262009715, + "loss": 0.0499, "step": 75810 }, { - "epoch": 0.82, - "learning_rate": 0.000176987474852359, - "loss": 0.0444, + "epoch": 0.49, + "learning_rate": 0.00022659597126574023, + "loss": 0.0529, "step": 75820 }, { - "epoch": 0.82, - "learning_rate": 0.00017697125056784997, - "loss": 0.0441, + "epoch": 0.49, + "learning_rate": 0.0002265862899113833, + "loss": 0.0497, "step": 75830 }, { - "epoch": 0.82, - "learning_rate": 0.0001769550262833409, - "loss": 0.048, + "epoch": 0.49, + "learning_rate": 0.0002265766085570264, + "loss": 0.0536, "step": 75840 }, { - "epoch": 0.82, - "learning_rate": 0.00017693880199883184, - "loss": 0.0489, + "epoch": 0.49, + "learning_rate": 0.00022656692720266945, + "loss": 0.0493, "step": 75850 }, { - "epoch": 0.82, - "learning_rate": 0.0001769225777143228, - "loss": 0.0427, + "epoch": 0.49, + "learning_rate": 0.00022655724584831253, + "loss": 0.0541, "step": 75860 }, { - "epoch": 0.82, - "learning_rate": 0.00017690635342981374, - "loss": 0.0442, + "epoch": 0.49, + "learning_rate": 0.0002265475644939556, + "loss": 0.0526, "step": 75870 }, { - "epoch": 0.82, - "learning_rate": 0.00017689012914530466, - "loss": 0.0458, + "epoch": 0.49, + "learning_rate": 0.00022653788313959863, + "loss": 0.0482, "step": 75880 }, { - "epoch": 0.82, - "learning_rate": 0.00017687390486079564, - "loss": 0.0552, + "epoch": 0.49, + "learning_rate": 0.0002265282017852417, + "loss": 0.0564, "step": 75890 }, { - "epoch": 0.82, - "learning_rate": 0.00017685768057628656, - "loss": 0.0434, + "epoch": 0.49, + "learning_rate": 0.0002265185204308848, + "loss": 0.0581, "step": 75900 }, { - "epoch": 0.82, - "learning_rate": 0.00017684145629177754, - "loss": 0.0486, + "epoch": 0.49, + "learning_rate": 0.00022650883907652787, + "loss": 0.0593, "step": 75910 }, { - "epoch": 0.82, - "learning_rate": 0.00017682523200726846, - "loss": 0.0423, + "epoch": 0.49, + "learning_rate": 0.00022649915772217092, + "loss": 0.0515, "step": 75920 }, { - "epoch": 0.82, - "learning_rate": 0.0001768090077227594, - "loss": 0.0427, + "epoch": 0.49, + "learning_rate": 0.000226489476367814, + "loss": 0.0597, "step": 75930 }, { - "epoch": 0.82, - "learning_rate": 0.00017679278343825036, - "loss": 0.0535, + "epoch": 0.49, + "learning_rate": 0.00022647979501345708, + "loss": 0.0484, "step": 75940 }, { - "epoch": 0.82, - "learning_rate": 0.0001767765591537413, - "loss": 0.0435, + "epoch": 0.49, + "learning_rate": 0.0002264701136591001, + "loss": 0.0507, "step": 75950 }, { - "epoch": 0.82, - "learning_rate": 0.00017676033486923223, - "loss": 0.0365, + "epoch": 0.49, + "learning_rate": 0.0002264604323047432, + "loss": 0.0467, "step": 75960 }, { - "epoch": 0.82, - "learning_rate": 0.0001767441105847232, - "loss": 0.0487, + "epoch": 0.49, + "learning_rate": 0.00022645075095038627, + "loss": 0.0555, "step": 75970 }, { - "epoch": 0.82, - "learning_rate": 0.00017672788630021413, - "loss": 0.0536, + "epoch": 0.49, + "learning_rate": 0.00022644106959602935, + "loss": 0.0618, "step": 75980 }, { - "epoch": 0.82, - "learning_rate": 0.0001767116620157051, - "loss": 0.0433, + "epoch": 0.49, + "learning_rate": 0.0002264313882416724, + "loss": 0.0501, "step": 75990 }, { - "epoch": 0.82, - "learning_rate": 0.00017669543773119603, - "loss": 0.0418, + "epoch": 0.49, + "learning_rate": 0.00022642170688731548, + "loss": 0.0545, "step": 76000 }, { - "epoch": 0.82, - "eval_cer": 0.9211799463194926, - "eval_loss": 0.03262558951973915, - "eval_runtime": 118.8732, - "eval_samples_per_second": 16.825, - "eval_steps_per_second": 4.206, + "epoch": 0.49, + "eval_cer": 0.9200289232855045, + "eval_loss": 0.03558797389268875, + "eval_runtime": 119.9372, + "eval_samples_per_second": 16.675, + "eval_steps_per_second": 4.169, "step": 76000 }, { - "epoch": 0.82, - "learning_rate": 0.000176679213446687, - "loss": 0.0426, + "epoch": 0.49, + "learning_rate": 0.00022641202553295856, + "loss": 0.0543, "step": 76010 }, { - "epoch": 0.82, - "learning_rate": 0.00017666298916217793, - "loss": 0.0451, + "epoch": 0.49, + "learning_rate": 0.00022640234417860159, + "loss": 0.0621, "step": 76020 }, { - "epoch": 0.82, - "learning_rate": 0.00017664676487766888, - "loss": 0.0426, + "epoch": 0.49, + "learning_rate": 0.00022639266282424467, + "loss": 0.0504, "step": 76030 }, { - "epoch": 0.82, - "learning_rate": 0.00017663054059315983, - "loss": 0.0464, + "epoch": 0.49, + "learning_rate": 0.00022638298146988775, + "loss": 0.0534, "step": 76040 }, { - "epoch": 0.82, - "learning_rate": 0.00017661431630865078, - "loss": 0.0385, + "epoch": 0.49, + "learning_rate": 0.0002263733001155308, + "loss": 0.0491, "step": 76050 }, { - "epoch": 0.82, - "learning_rate": 0.0001765980920241417, - "loss": 0.0429, + "epoch": 0.49, + "learning_rate": 0.00022636361876117388, + "loss": 0.049, "step": 76060 }, { - "epoch": 0.82, - "learning_rate": 0.00017658186773963268, - "loss": 0.0437, + "epoch": 0.49, + "learning_rate": 0.00022635393740681696, + "loss": 0.0533, "step": 76070 }, { - "epoch": 0.82, - "learning_rate": 0.0001765656434551236, - "loss": 0.0399, + "epoch": 0.49, + "learning_rate": 0.00022634425605246004, + "loss": 0.0558, "step": 76080 }, { - "epoch": 0.82, - "learning_rate": 0.00017654941917061458, - "loss": 0.0428, + "epoch": 0.49, + "learning_rate": 0.00022633457469810306, + "loss": 0.0512, "step": 76090 }, { - "epoch": 0.82, - "learning_rate": 0.0001765331948861055, - "loss": 0.0439, + "epoch": 0.49, + "learning_rate": 0.00022632489334374614, + "loss": 0.0539, "step": 76100 }, { - "epoch": 0.82, - "learning_rate": 0.00017651697060159645, - "loss": 0.0457, + "epoch": 0.49, + "learning_rate": 0.00022631521198938922, + "loss": 0.0552, "step": 76110 }, { - "epoch": 0.82, - "learning_rate": 0.0001765007463170874, - "loss": 0.0464, + "epoch": 0.49, + "learning_rate": 0.00022630553063503228, + "loss": 0.0526, "step": 76120 }, { - "epoch": 0.82, - "learning_rate": 0.00017648452203257835, - "loss": 0.0374, + "epoch": 0.49, + "learning_rate": 0.00022629584928067535, + "loss": 0.0588, "step": 76130 }, { - "epoch": 0.82, - "learning_rate": 0.00017646829774806927, - "loss": 0.0396, + "epoch": 0.49, + "learning_rate": 0.00022628616792631843, + "loss": 0.072, "step": 76140 }, { - "epoch": 0.82, - "learning_rate": 0.00017645207346356025, - "loss": 0.0469, + "epoch": 0.49, + "learning_rate": 0.00022627648657196151, + "loss": 0.0562, "step": 76150 }, { - "epoch": 0.82, - "learning_rate": 0.00017643584917905117, - "loss": 0.0432, + "epoch": 0.49, + "learning_rate": 0.00022626680521760454, + "loss": 0.0586, "step": 76160 }, { - "epoch": 0.82, - "learning_rate": 0.00017641962489454215, - "loss": 0.0501, + "epoch": 0.49, + "learning_rate": 0.00022625712386324762, + "loss": 0.0588, "step": 76170 }, { - "epoch": 0.82, - "learning_rate": 0.00017640340061003307, - "loss": 0.0424, + "epoch": 0.49, + "learning_rate": 0.0002262474425088907, + "loss": 0.056, "step": 76180 }, { - "epoch": 0.82, - "learning_rate": 0.00017638717632552405, - "loss": 0.0404, + "epoch": 0.49, + "learning_rate": 0.00022623776115453375, + "loss": 0.0603, "step": 76190 }, { - "epoch": 0.82, - "learning_rate": 0.00017637095204101497, - "loss": 0.0412, + "epoch": 0.49, + "learning_rate": 0.00022622807980017683, + "loss": 0.0538, "step": 76200 }, { - "epoch": 0.82, - "learning_rate": 0.00017635472775650592, - "loss": 0.0461, + "epoch": 0.49, + "learning_rate": 0.0002262183984458199, + "loss": 0.0555, "step": 76210 }, { - "epoch": 0.82, - "learning_rate": 0.00017633850347199687, - "loss": 0.0471, + "epoch": 0.49, + "learning_rate": 0.00022620871709146296, + "loss": 0.056, "step": 76220 }, { - "epoch": 0.82, - "learning_rate": 0.00017632227918748782, - "loss": 0.0457, + "epoch": 0.49, + "learning_rate": 0.00022619903573710602, + "loss": 0.0541, "step": 76230 }, { - "epoch": 0.82, - "learning_rate": 0.00017630605490297874, - "loss": 0.0419, + "epoch": 0.49, + "learning_rate": 0.0002261893543827491, + "loss": 0.0484, "step": 76240 }, { - "epoch": 0.82, - "learning_rate": 0.00017628983061846972, - "loss": 0.0499, + "epoch": 0.49, + "learning_rate": 0.00022617967302839215, + "loss": 0.0491, "step": 76250 }, { - "epoch": 0.82, - "learning_rate": 0.00017627360633396064, - "loss": 0.0463, + "epoch": 0.49, + "learning_rate": 0.00022616999167403523, + "loss": 0.0569, "step": 76260 }, { - "epoch": 0.82, - "learning_rate": 0.00017625738204945162, - "loss": 0.0417, + "epoch": 0.49, + "learning_rate": 0.0002261603103196783, + "loss": 0.0563, "step": 76270 }, { - "epoch": 0.83, - "learning_rate": 0.00017624115776494254, - "loss": 0.0461, + "epoch": 0.49, + "learning_rate": 0.0002261506289653214, + "loss": 0.0526, "step": 76280 }, { - "epoch": 0.83, - "learning_rate": 0.0001762249334804335, - "loss": 0.0485, + "epoch": 0.49, + "learning_rate": 0.00022614094761096444, + "loss": 0.0548, "step": 76290 }, { - "epoch": 0.83, - "learning_rate": 0.00017620870919592444, - "loss": 0.0463, + "epoch": 0.49, + "learning_rate": 0.0002261312662566075, + "loss": 0.057, "step": 76300 }, { - "epoch": 0.83, - "learning_rate": 0.0001761924849114154, - "loss": 0.051, + "epoch": 0.49, + "learning_rate": 0.00022612158490225057, + "loss": 0.0477, "step": 76310 }, { - "epoch": 0.83, - "learning_rate": 0.00017617626062690632, - "loss": 0.0417, + "epoch": 0.49, + "learning_rate": 0.00022611190354789363, + "loss": 0.0554, "step": 76320 }, { - "epoch": 0.83, - "learning_rate": 0.0001761600363423973, - "loss": 0.0405, + "epoch": 0.49, + "learning_rate": 0.0002261022221935367, + "loss": 0.055, "step": 76330 }, { - "epoch": 0.83, - "learning_rate": 0.00017614381205788822, - "loss": 0.0503, + "epoch": 0.49, + "learning_rate": 0.0002260925408391798, + "loss": 0.0539, "step": 76340 }, { - "epoch": 0.83, - "learning_rate": 0.0001761275877733792, - "loss": 0.05, + "epoch": 0.49, + "learning_rate": 0.00022608285948482287, + "loss": 0.0511, "step": 76350 }, { - "epoch": 0.83, - "learning_rate": 0.00017611136348887012, - "loss": 0.0425, + "epoch": 0.49, + "learning_rate": 0.00022607317813046592, + "loss": 0.059, "step": 76360 }, { - "epoch": 0.83, - "learning_rate": 0.0001760951392043611, - "loss": 0.0413, + "epoch": 0.49, + "learning_rate": 0.00022606349677610897, + "loss": 0.0528, "step": 76370 }, { - "epoch": 0.83, - "learning_rate": 0.00017607891491985201, - "loss": 0.05, + "epoch": 0.49, + "learning_rate": 0.00022605381542175205, + "loss": 0.0517, "step": 76380 }, { - "epoch": 0.83, - "learning_rate": 0.00017606269063534296, - "loss": 0.0537, + "epoch": 0.49, + "learning_rate": 0.0002260441340673951, + "loss": 0.0514, "step": 76390 }, { - "epoch": 0.83, - "learning_rate": 0.00017604646635083391, - "loss": 0.0549, + "epoch": 0.49, + "learning_rate": 0.00022603445271303818, + "loss": 0.0495, "step": 76400 }, { - "epoch": 0.83, - "learning_rate": 0.00017603024206632486, - "loss": 0.0486, + "epoch": 0.49, + "learning_rate": 0.00022602477135868126, + "loss": 0.0522, "step": 76410 }, { - "epoch": 0.83, - "learning_rate": 0.0001760140177818158, - "loss": 0.0418, + "epoch": 0.49, + "learning_rate": 0.00022601509000432432, + "loss": 0.0545, "step": 76420 }, { - "epoch": 0.83, - "learning_rate": 0.00017599779349730676, - "loss": 0.0468, + "epoch": 0.49, + "learning_rate": 0.0002260054086499674, + "loss": 0.056, "step": 76430 }, { - "epoch": 0.83, - "learning_rate": 0.00017598156921279769, - "loss": 0.0452, + "epoch": 0.49, + "learning_rate": 0.00022599572729561045, + "loss": 0.0689, "step": 76440 }, { - "epoch": 0.83, - "learning_rate": 0.00017596534492828866, - "loss": 0.0451, + "epoch": 0.49, + "learning_rate": 0.0002259860459412535, + "loss": 0.0554, "step": 76450 }, { - "epoch": 0.83, - "learning_rate": 0.00017594912064377959, - "loss": 0.0486, + "epoch": 0.49, + "learning_rate": 0.00022597636458689658, + "loss": 0.058, "step": 76460 }, { - "epoch": 0.83, - "learning_rate": 0.00017593289635927054, - "loss": 0.0452, + "epoch": 0.49, + "learning_rate": 0.00022596668323253966, + "loss": 0.0557, "step": 76470 }, { - "epoch": 0.83, - "learning_rate": 0.00017591667207476149, - "loss": 0.0486, + "epoch": 0.49, + "learning_rate": 0.00022595700187818274, + "loss": 0.0617, "step": 76480 }, { - "epoch": 0.83, - "learning_rate": 0.00017590044779025244, - "loss": 0.0529, + "epoch": 0.49, + "learning_rate": 0.0002259473205238258, + "loss": 0.0552, "step": 76490 }, { - "epoch": 0.83, - "learning_rate": 0.00017588422350574338, - "loss": 0.0483, + "epoch": 0.49, + "learning_rate": 0.00022593763916946887, + "loss": 0.0612, "step": 76500 }, { - "epoch": 0.83, - "learning_rate": 0.00017586799922123433, - "loss": 0.045, + "epoch": 0.49, + "learning_rate": 0.00022592795781511193, + "loss": 0.0526, "step": 76510 }, { - "epoch": 0.83, - "learning_rate": 0.00017585177493672526, - "loss": 0.0437, + "epoch": 0.49, + "learning_rate": 0.00022591827646075498, + "loss": 0.0536, "step": 76520 }, { - "epoch": 0.83, - "learning_rate": 0.00017583555065221623, - "loss": 0.0501, + "epoch": 0.49, + "learning_rate": 0.00022590859510639806, + "loss": 0.0617, "step": 76530 }, { - "epoch": 0.83, - "learning_rate": 0.00017581932636770716, - "loss": 0.0544, + "epoch": 0.49, + "learning_rate": 0.00022589891375204114, + "loss": 0.0522, "step": 76540 }, { - "epoch": 0.83, - "learning_rate": 0.00017580310208319813, - "loss": 0.0497, + "epoch": 0.49, + "learning_rate": 0.00022588923239768422, + "loss": 0.0505, "step": 76550 }, { - "epoch": 0.83, - "learning_rate": 0.00017578687779868906, - "loss": 0.0499, + "epoch": 0.49, + "learning_rate": 0.00022587955104332727, + "loss": 0.0578, "step": 76560 }, { - "epoch": 0.83, - "learning_rate": 0.00017577065351418, - "loss": 0.0504, + "epoch": 0.49, + "learning_rate": 0.00022586986968897035, + "loss": 0.057, "step": 76570 }, { - "epoch": 0.83, - "learning_rate": 0.00017575442922967096, - "loss": 0.0393, + "epoch": 0.49, + "learning_rate": 0.0002258601883346134, + "loss": 0.0523, "step": 76580 }, { - "epoch": 0.83, - "learning_rate": 0.0001757382049451619, - "loss": 0.0527, + "epoch": 0.49, + "learning_rate": 0.00022585050698025646, + "loss": 0.0553, "step": 76590 }, { - "epoch": 0.83, - "learning_rate": 0.00017572198066065283, - "loss": 0.0465, + "epoch": 0.49, + "learning_rate": 0.00022584082562589954, + "loss": 0.0615, "step": 76600 }, { - "epoch": 0.83, - "learning_rate": 0.0001757057563761438, - "loss": 0.0417, + "epoch": 0.49, + "learning_rate": 0.00022583114427154262, + "loss": 0.0545, "step": 76610 }, { - "epoch": 0.83, - "learning_rate": 0.00017568953209163473, - "loss": 0.0481, + "epoch": 0.49, + "learning_rate": 0.00022582146291718567, + "loss": 0.0537, "step": 76620 }, { - "epoch": 0.83, - "learning_rate": 0.0001756733078071257, - "loss": 0.055, + "epoch": 0.49, + "learning_rate": 0.00022581178156282875, + "loss": 0.0532, "step": 76630 }, { - "epoch": 0.83, - "learning_rate": 0.00017565708352261663, - "loss": 0.044, + "epoch": 0.49, + "learning_rate": 0.00022580210020847183, + "loss": 0.0609, "step": 76640 }, { - "epoch": 0.83, - "learning_rate": 0.00017564085923810758, - "loss": 0.0498, + "epoch": 0.49, + "learning_rate": 0.00022579241885411485, + "loss": 0.0489, "step": 76650 }, { - "epoch": 0.83, - "learning_rate": 0.00017562463495359853, - "loss": 0.0405, + "epoch": 0.49, + "learning_rate": 0.00022578273749975793, + "loss": 0.0487, "step": 76660 }, { - "epoch": 0.83, - "learning_rate": 0.00017560841066908948, - "loss": 0.0434, + "epoch": 0.49, + "learning_rate": 0.000225773056145401, + "loss": 0.0557, "step": 76670 }, { - "epoch": 0.83, - "learning_rate": 0.00017559218638458043, - "loss": 0.046, + "epoch": 0.49, + "learning_rate": 0.0002257633747910441, + "loss": 0.0538, "step": 76680 }, { - "epoch": 0.83, - "learning_rate": 0.00017557596210007138, - "loss": 0.0461, + "epoch": 0.49, + "learning_rate": 0.00022575369343668715, + "loss": 0.0593, "step": 76690 }, { - "epoch": 0.83, - "learning_rate": 0.0001755597378155623, - "loss": 0.0502, + "epoch": 0.5, + "learning_rate": 0.00022574401208233023, + "loss": 0.0544, "step": 76700 }, { - "epoch": 0.83, - "learning_rate": 0.00017554351353105328, - "loss": 0.0373, + "epoch": 0.5, + "learning_rate": 0.0002257343307279733, + "loss": 0.058, "step": 76710 }, { - "epoch": 0.83, - "learning_rate": 0.0001755272892465442, - "loss": 0.0493, + "epoch": 0.5, + "learning_rate": 0.00022572464937361633, + "loss": 0.0564, "step": 76720 }, { - "epoch": 0.83, - "learning_rate": 0.00017551106496203518, - "loss": 0.0409, + "epoch": 0.5, + "learning_rate": 0.0002257149680192594, + "loss": 0.0499, "step": 76730 }, { - "epoch": 0.83, - "learning_rate": 0.0001754948406775261, - "loss": 0.0502, + "epoch": 0.5, + "learning_rate": 0.0002257052866649025, + "loss": 0.0558, "step": 76740 }, { - "epoch": 0.83, - "learning_rate": 0.00017547861639301705, - "loss": 0.0459, + "epoch": 0.5, + "learning_rate": 0.00022569560531054557, + "loss": 0.0538, "step": 76750 }, { - "epoch": 0.83, - "learning_rate": 0.000175462392108508, - "loss": 0.0471, + "epoch": 0.5, + "learning_rate": 0.00022568592395618862, + "loss": 0.0591, "step": 76760 }, { - "epoch": 0.83, - "learning_rate": 0.00017544616782399895, - "loss": 0.0438, + "epoch": 0.5, + "learning_rate": 0.0002256762426018317, + "loss": 0.0547, "step": 76770 }, { - "epoch": 0.83, - "learning_rate": 0.00017542994353948987, - "loss": 0.0462, + "epoch": 0.5, + "learning_rate": 0.00022566656124747478, + "loss": 0.054, "step": 76780 }, { - "epoch": 0.83, - "learning_rate": 0.00017541371925498085, - "loss": 0.0481, + "epoch": 0.5, + "learning_rate": 0.0002256568798931178, + "loss": 0.0555, "step": 76790 }, { - "epoch": 0.83, - "learning_rate": 0.00017539749497047177, - "loss": 0.0551, + "epoch": 0.5, + "learning_rate": 0.0002256471985387609, + "loss": 0.0576, "step": 76800 }, { - "epoch": 0.83, - "learning_rate": 0.00017538127068596275, - "loss": 0.0498, + "epoch": 0.5, + "learning_rate": 0.00022563751718440397, + "loss": 0.0504, "step": 76810 }, { - "epoch": 0.83, - "learning_rate": 0.00017536504640145367, - "loss": 0.0418, + "epoch": 0.5, + "learning_rate": 0.00022562783583004702, + "loss": 0.0558, "step": 76820 }, { - "epoch": 0.83, - "learning_rate": 0.00017534882211694462, - "loss": 0.0444, + "epoch": 0.5, + "learning_rate": 0.0002256181544756901, + "loss": 0.0621, "step": 76830 }, { - "epoch": 0.83, - "learning_rate": 0.00017533259783243557, - "loss": 0.0442, + "epoch": 0.5, + "learning_rate": 0.00022560847312133318, + "loss": 0.0476, "step": 76840 }, { - "epoch": 0.83, - "learning_rate": 0.00017531637354792652, - "loss": 0.0392, + "epoch": 0.5, + "learning_rate": 0.00022559879176697626, + "loss": 0.0575, "step": 76850 }, { - "epoch": 0.83, - "learning_rate": 0.00017530014926341747, - "loss": 0.0439, + "epoch": 0.5, + "learning_rate": 0.00022558911041261929, + "loss": 0.055, "step": 76860 }, { - "epoch": 0.83, - "learning_rate": 0.00017528392497890842, - "loss": 0.0448, + "epoch": 0.5, + "learning_rate": 0.00022557942905826236, + "loss": 0.0576, "step": 76870 }, { - "epoch": 0.83, - "learning_rate": 0.00017526770069439934, - "loss": 0.0455, + "epoch": 0.5, + "learning_rate": 0.00022556974770390544, + "loss": 0.0578, "step": 76880 }, { - "epoch": 0.83, - "learning_rate": 0.00017525147640989032, - "loss": 0.0487, + "epoch": 0.5, + "learning_rate": 0.0002255600663495485, + "loss": 0.056, "step": 76890 }, { - "epoch": 0.83, - "learning_rate": 0.00017523525212538124, - "loss": 0.0415, + "epoch": 0.5, + "learning_rate": 0.00022555038499519158, + "loss": 0.0536, "step": 76900 }, { - "epoch": 0.83, - "learning_rate": 0.00017521902784087222, - "loss": 0.043, + "epoch": 0.5, + "learning_rate": 0.00022554070364083466, + "loss": 0.0541, "step": 76910 }, { - "epoch": 0.83, - "learning_rate": 0.00017520280355636314, - "loss": 0.0436, + "epoch": 0.5, + "learning_rate": 0.00022553102228647774, + "loss": 0.0534, "step": 76920 }, { - "epoch": 0.83, - "learning_rate": 0.0001751865792718541, - "loss": 0.043, + "epoch": 0.5, + "learning_rate": 0.00022552134093212076, + "loss": 0.0511, "step": 76930 }, { - "epoch": 0.83, - "learning_rate": 0.00017517035498734504, - "loss": 0.0445, + "epoch": 0.5, + "learning_rate": 0.00022551165957776384, + "loss": 0.0543, "step": 76940 }, { - "epoch": 0.83, - "learning_rate": 0.000175154130702836, - "loss": 0.0563, + "epoch": 0.5, + "learning_rate": 0.00022550197822340692, + "loss": 0.0615, "step": 76950 }, { - "epoch": 0.83, - "learning_rate": 0.0001751379064183269, - "loss": 0.0467, + "epoch": 0.5, + "learning_rate": 0.00022549229686904997, + "loss": 0.0624, "step": 76960 }, { - "epoch": 0.83, - "learning_rate": 0.0001751216821338179, - "loss": 0.0468, + "epoch": 0.5, + "learning_rate": 0.00022548261551469305, + "loss": 0.0485, "step": 76970 }, { - "epoch": 0.83, - "learning_rate": 0.0001751054578493088, - "loss": 0.0493, + "epoch": 0.5, + "learning_rate": 0.00022547293416033613, + "loss": 0.0648, "step": 76980 }, { - "epoch": 0.83, - "learning_rate": 0.0001750892335647998, - "loss": 0.0452, + "epoch": 0.5, + "learning_rate": 0.0002254632528059792, + "loss": 0.0631, "step": 76990 }, { - "epoch": 0.83, - "learning_rate": 0.0001750730092802907, - "loss": 0.0461, + "epoch": 0.5, + "learning_rate": 0.00022545357145162224, + "loss": 0.0527, "step": 77000 }, { - "epoch": 0.83, - "eval_cer": 0.9212444406749113, - "eval_loss": 0.03261556476354599, - "eval_runtime": 118.8475, - "eval_samples_per_second": 16.828, - "eval_steps_per_second": 4.207, + "epoch": 0.5, + "eval_cer": 0.9199611343351034, + "eval_loss": 0.03577205166220665, + "eval_runtime": 120.0009, + "eval_samples_per_second": 16.667, + "eval_steps_per_second": 4.167, "step": 77000 }, { - "epoch": 0.83, - "learning_rate": 0.00017505678499578166, - "loss": 0.0491, + "epoch": 0.5, + "learning_rate": 0.00022544389009726532, + "loss": 0.0537, "step": 77010 }, { - "epoch": 0.83, - "learning_rate": 0.0001750405607112726, - "loss": 0.0407, + "epoch": 0.5, + "learning_rate": 0.00022543420874290837, + "loss": 0.0506, "step": 77020 }, { - "epoch": 0.83, - "learning_rate": 0.00017502433642676356, - "loss": 0.0446, + "epoch": 0.5, + "learning_rate": 0.00022542452738855145, + "loss": 0.0523, "step": 77030 }, { - "epoch": 0.83, - "learning_rate": 0.0001750081121422545, - "loss": 0.0489, + "epoch": 0.5, + "learning_rate": 0.00022541484603419453, + "loss": 0.0516, "step": 77040 }, { - "epoch": 0.83, - "learning_rate": 0.00017499188785774546, - "loss": 0.0445, + "epoch": 0.5, + "learning_rate": 0.0002254051646798376, + "loss": 0.048, "step": 77050 }, { - "epoch": 0.83, - "learning_rate": 0.00017497566357323638, - "loss": 0.0477, + "epoch": 0.5, + "learning_rate": 0.00022539548332548066, + "loss": 0.0593, "step": 77060 }, { - "epoch": 0.83, - "learning_rate": 0.00017495943928872736, - "loss": 0.0464, + "epoch": 0.5, + "learning_rate": 0.00022538580197112372, + "loss": 0.0545, "step": 77070 }, { - "epoch": 0.83, - "learning_rate": 0.00017494321500421828, - "loss": 0.0393, + "epoch": 0.5, + "learning_rate": 0.0002253761206167668, + "loss": 0.0482, "step": 77080 }, { - "epoch": 0.83, - "learning_rate": 0.00017492699071970926, - "loss": 0.0484, + "epoch": 0.5, + "learning_rate": 0.00022536643926240985, + "loss": 0.0561, "step": 77090 }, { - "epoch": 0.83, - "learning_rate": 0.00017491076643520018, - "loss": 0.0556, + "epoch": 0.5, + "learning_rate": 0.00022535675790805293, + "loss": 0.052, "step": 77100 }, { - "epoch": 0.83, - "learning_rate": 0.00017489454215069113, - "loss": 0.0517, + "epoch": 0.5, + "learning_rate": 0.000225347076553696, + "loss": 0.0526, "step": 77110 }, { - "epoch": 0.83, - "learning_rate": 0.00017487831786618208, - "loss": 0.0432, + "epoch": 0.5, + "learning_rate": 0.0002253373951993391, + "loss": 0.0482, "step": 77120 }, { - "epoch": 0.83, - "learning_rate": 0.00017486209358167303, - "loss": 0.0535, + "epoch": 0.5, + "learning_rate": 0.00022532771384498214, + "loss": 0.0563, "step": 77130 }, { - "epoch": 0.83, - "learning_rate": 0.00017484586929716395, - "loss": 0.0484, + "epoch": 0.5, + "learning_rate": 0.0002253180324906252, + "loss": 0.0539, "step": 77140 }, { - "epoch": 0.83, - "learning_rate": 0.00017482964501265493, - "loss": 0.0499, + "epoch": 0.5, + "learning_rate": 0.00022530835113626827, + "loss": 0.0481, "step": 77150 }, { - "epoch": 0.83, - "learning_rate": 0.00017481342072814585, - "loss": 0.0456, + "epoch": 0.5, + "learning_rate": 0.00022529866978191133, + "loss": 0.0489, "step": 77160 }, { - "epoch": 0.83, - "learning_rate": 0.00017479719644363683, - "loss": 0.0421, + "epoch": 0.5, + "learning_rate": 0.0002252889884275544, + "loss": 0.0543, "step": 77170 }, { - "epoch": 0.83, - "learning_rate": 0.00017478097215912775, - "loss": 0.0414, + "epoch": 0.5, + "learning_rate": 0.00022527930707319749, + "loss": 0.0615, "step": 77180 }, { - "epoch": 0.83, - "learning_rate": 0.00017476474787461873, - "loss": 0.0482, + "epoch": 0.5, + "learning_rate": 0.00022526962571884054, + "loss": 0.0543, "step": 77190 }, { - "epoch": 0.84, - "learning_rate": 0.00017474852359010965, - "loss": 0.0468, + "epoch": 0.5, + "learning_rate": 0.00022525994436448362, + "loss": 0.0532, "step": 77200 }, { - "epoch": 0.84, - "learning_rate": 0.0001747322993056006, - "loss": 0.0449, + "epoch": 0.5, + "learning_rate": 0.00022525026301012667, + "loss": 0.0538, "step": 77210 }, { - "epoch": 0.84, - "learning_rate": 0.00017471607502109155, - "loss": 0.0426, + "epoch": 0.5, + "learning_rate": 0.00022524058165576972, + "loss": 0.0543, "step": 77220 }, { - "epoch": 0.84, - "learning_rate": 0.0001746998507365825, - "loss": 0.0541, + "epoch": 0.5, + "learning_rate": 0.0002252309003014128, + "loss": 0.054, "step": 77230 }, { - "epoch": 0.84, - "learning_rate": 0.00017468362645207342, - "loss": 0.0441, + "epoch": 0.5, + "learning_rate": 0.00022522121894705588, + "loss": 0.0475, "step": 77240 }, { - "epoch": 0.84, - "learning_rate": 0.0001746674021675644, - "loss": 0.0424, + "epoch": 0.5, + "learning_rate": 0.00022521153759269896, + "loss": 0.0579, "step": 77250 }, { - "epoch": 0.84, - "learning_rate": 0.00017465117788305532, - "loss": 0.049, + "epoch": 0.5, + "learning_rate": 0.00022520185623834202, + "loss": 0.0516, "step": 77260 }, { - "epoch": 0.84, - "learning_rate": 0.0001746349535985463, - "loss": 0.0422, + "epoch": 0.5, + "learning_rate": 0.0002251921748839851, + "loss": 0.047, "step": 77270 }, { - "epoch": 0.84, - "learning_rate": 0.00017461872931403722, - "loss": 0.0422, + "epoch": 0.5, + "learning_rate": 0.00022518249352962815, + "loss": 0.0545, "step": 77280 }, { - "epoch": 0.84, - "learning_rate": 0.00017460250502952817, - "loss": 0.043, + "epoch": 0.5, + "learning_rate": 0.0002251728121752712, + "loss": 0.0613, "step": 77290 }, { - "epoch": 0.84, - "learning_rate": 0.00017458628074501912, - "loss": 0.0464, + "epoch": 0.5, + "learning_rate": 0.00022516313082091428, + "loss": 0.0527, "step": 77300 }, { - "epoch": 0.84, - "learning_rate": 0.00017457005646051007, - "loss": 0.0415, + "epoch": 0.5, + "learning_rate": 0.00022515344946655736, + "loss": 0.0531, "step": 77310 }, { - "epoch": 0.84, - "learning_rate": 0.000174553832176001, - "loss": 0.0393, + "epoch": 0.5, + "learning_rate": 0.00022514376811220044, + "loss": 0.0541, "step": 77320 }, { - "epoch": 0.84, - "learning_rate": 0.00017453760789149197, - "loss": 0.0469, + "epoch": 0.5, + "learning_rate": 0.0002251340867578435, + "loss": 0.0523, "step": 77330 }, { - "epoch": 0.84, - "learning_rate": 0.0001745213836069829, - "loss": 0.0411, + "epoch": 0.5, + "learning_rate": 0.00022512440540348657, + "loss": 0.0531, "step": 77340 }, { - "epoch": 0.84, - "learning_rate": 0.00017450515932247387, - "loss": 0.049, + "epoch": 0.5, + "learning_rate": 0.00022511472404912963, + "loss": 0.0526, "step": 77350 }, { - "epoch": 0.84, - "learning_rate": 0.0001744889350379648, - "loss": 0.0442, + "epoch": 0.5, + "learning_rate": 0.00022510504269477268, + "loss": 0.0547, "step": 77360 }, { - "epoch": 0.84, - "learning_rate": 0.00017447271075345577, - "loss": 0.0488, + "epoch": 0.5, + "learning_rate": 0.00022509536134041576, + "loss": 0.0492, "step": 77370 }, { - "epoch": 0.84, - "learning_rate": 0.0001744564864689467, - "loss": 0.0434, + "epoch": 0.5, + "learning_rate": 0.00022508567998605884, + "loss": 0.0518, "step": 77380 }, { - "epoch": 0.84, - "learning_rate": 0.00017444026218443764, - "loss": 0.0446, + "epoch": 0.5, + "learning_rate": 0.0002250759986317019, + "loss": 0.0508, "step": 77390 }, { - "epoch": 0.84, - "learning_rate": 0.0001744240378999286, - "loss": 0.0439, + "epoch": 0.5, + "learning_rate": 0.00022506631727734497, + "loss": 0.0573, "step": 77400 }, { - "epoch": 0.84, - "learning_rate": 0.00017440781361541954, - "loss": 0.0407, + "epoch": 0.5, + "learning_rate": 0.00022505663592298805, + "loss": 0.0528, "step": 77410 }, { - "epoch": 0.84, - "learning_rate": 0.00017439158933091047, - "loss": 0.0402, + "epoch": 0.5, + "learning_rate": 0.00022504695456863108, + "loss": 0.049, "step": 77420 }, { - "epoch": 0.84, - "learning_rate": 0.00017437536504640144, - "loss": 0.0424, + "epoch": 0.5, + "learning_rate": 0.00022503727321427416, + "loss": 0.0501, "step": 77430 }, { - "epoch": 0.84, - "learning_rate": 0.0001743591407618924, - "loss": 0.0424, + "epoch": 0.5, + "learning_rate": 0.00022502759185991724, + "loss": 0.054, "step": 77440 }, { - "epoch": 0.84, - "learning_rate": 0.00017434291647738334, - "loss": 0.0444, + "epoch": 0.5, + "learning_rate": 0.00022501791050556032, + "loss": 0.0543, "step": 77450 }, { - "epoch": 0.84, - "learning_rate": 0.0001743266921928743, - "loss": 0.0571, + "epoch": 0.5, + "learning_rate": 0.00022500822915120337, + "loss": 0.0494, "step": 77460 }, { - "epoch": 0.84, - "learning_rate": 0.00017431046790836521, - "loss": 0.0565, + "epoch": 0.5, + "learning_rate": 0.00022499854779684645, + "loss": 0.0514, "step": 77470 }, { - "epoch": 0.84, - "learning_rate": 0.0001742942436238562, - "loss": 0.044, + "epoch": 0.5, + "learning_rate": 0.00022498886644248953, + "loss": 0.0611, "step": 77480 }, { - "epoch": 0.84, - "learning_rate": 0.00017427801933934711, - "loss": 0.0497, + "epoch": 0.5, + "learning_rate": 0.00022497918508813255, + "loss": 0.0496, "step": 77490 }, { - "epoch": 0.84, - "learning_rate": 0.0001742617950548381, - "loss": 0.0446, + "epoch": 0.5, + "learning_rate": 0.00022496950373377563, + "loss": 0.0527, "step": 77500 }, { - "epoch": 0.84, - "learning_rate": 0.000174245570770329, - "loss": 0.0462, + "epoch": 0.5, + "learning_rate": 0.0002249598223794187, + "loss": 0.0531, "step": 77510 }, { - "epoch": 0.84, - "learning_rate": 0.00017422934648581996, - "loss": 0.0488, + "epoch": 0.5, + "learning_rate": 0.0002249501410250618, + "loss": 0.0581, "step": 77520 }, { - "epoch": 0.84, - "learning_rate": 0.0001742131222013109, - "loss": 0.0426, + "epoch": 0.5, + "learning_rate": 0.00022494045967070485, + "loss": 0.0553, "step": 77530 }, { - "epoch": 0.84, - "learning_rate": 0.00017419689791680186, - "loss": 0.0488, + "epoch": 0.5, + "learning_rate": 0.00022493077831634792, + "loss": 0.0548, "step": 77540 }, { - "epoch": 0.84, - "learning_rate": 0.0001741806736322928, - "loss": 0.0433, + "epoch": 0.5, + "learning_rate": 0.000224921096961991, + "loss": 0.0529, "step": 77550 }, { - "epoch": 0.84, - "learning_rate": 0.00017416444934778376, - "loss": 0.0489, + "epoch": 0.5, + "learning_rate": 0.00022491141560763403, + "loss": 0.0521, "step": 77560 }, { - "epoch": 0.84, - "learning_rate": 0.00017414822506327468, - "loss": 0.0479, + "epoch": 0.5, + "learning_rate": 0.0002249017342532771, + "loss": 0.0496, "step": 77570 }, { - "epoch": 0.84, - "learning_rate": 0.00017413200077876566, - "loss": 0.0455, + "epoch": 0.5, + "learning_rate": 0.0002248920528989202, + "loss": 0.0515, "step": 77580 }, { - "epoch": 0.84, - "learning_rate": 0.00017411577649425658, - "loss": 0.0435, + "epoch": 0.5, + "learning_rate": 0.00022488237154456324, + "loss": 0.0498, "step": 77590 }, { - "epoch": 0.84, - "learning_rate": 0.00017409955220974756, - "loss": 0.043, + "epoch": 0.5, + "learning_rate": 0.00022487269019020632, + "loss": 0.0521, "step": 77600 }, { - "epoch": 0.84, - "learning_rate": 0.00017408332792523848, - "loss": 0.05, + "epoch": 0.5, + "learning_rate": 0.0002248630088358494, + "loss": 0.053, "step": 77610 }, { - "epoch": 0.84, - "learning_rate": 0.00017406710364072943, - "loss": 0.0477, + "epoch": 0.5, + "learning_rate": 0.00022485332748149248, + "loss": 0.0591, "step": 77620 }, { - "epoch": 0.84, - "learning_rate": 0.00017405087935622038, - "loss": 0.0488, + "epoch": 0.5, + "learning_rate": 0.0002248436461271355, + "loss": 0.0555, "step": 77630 }, { - "epoch": 0.84, - "learning_rate": 0.00017403465507171133, - "loss": 0.0458, + "epoch": 0.5, + "learning_rate": 0.0002248339647727786, + "loss": 0.0499, "step": 77640 }, { - "epoch": 0.84, - "learning_rate": 0.00017401843078720226, - "loss": 0.0455, + "epoch": 0.5, + "learning_rate": 0.00022482428341842167, + "loss": 0.0634, "step": 77650 }, { - "epoch": 0.84, - "learning_rate": 0.00017400220650269323, - "loss": 0.0411, + "epoch": 0.5, + "learning_rate": 0.00022481460206406472, + "loss": 0.0507, "step": 77660 }, { - "epoch": 0.84, - "learning_rate": 0.00017398598221818416, - "loss": 0.0524, + "epoch": 0.5, + "learning_rate": 0.0002248049207097078, + "loss": 0.0571, "step": 77670 }, { - "epoch": 0.84, - "learning_rate": 0.00017396975793367513, - "loss": 0.043, + "epoch": 0.5, + "learning_rate": 0.00022479523935535088, + "loss": 0.0535, "step": 77680 }, { - "epoch": 0.84, - "learning_rate": 0.00017395353364916606, - "loss": 0.0542, + "epoch": 0.5, + "learning_rate": 0.00022478555800099396, + "loss": 0.0557, "step": 77690 }, { - "epoch": 0.84, - "learning_rate": 0.000173937309364657, - "loss": 0.0478, + "epoch": 0.5, + "learning_rate": 0.00022477587664663698, + "loss": 0.0524, "step": 77700 }, { - "epoch": 0.84, - "learning_rate": 0.00017392108508014795, - "loss": 0.0501, + "epoch": 0.5, + "learning_rate": 0.00022476619529228006, + "loss": 0.0552, "step": 77710 }, { - "epoch": 0.84, - "learning_rate": 0.0001739048607956389, - "loss": 0.0479, + "epoch": 0.5, + "learning_rate": 0.00022475651393792314, + "loss": 0.0572, "step": 77720 }, { - "epoch": 0.84, - "learning_rate": 0.00017388863651112985, - "loss": 0.0423, + "epoch": 0.5, + "learning_rate": 0.0002247468325835662, + "loss": 0.0541, "step": 77730 }, { - "epoch": 0.84, - "learning_rate": 0.0001738724122266208, - "loss": 0.0405, + "epoch": 0.5, + "learning_rate": 0.00022473715122920928, + "loss": 0.062, "step": 77740 }, { - "epoch": 0.84, - "learning_rate": 0.00017385618794211173, - "loss": 0.0478, + "epoch": 0.5, + "learning_rate": 0.00022472746987485236, + "loss": 0.0582, "step": 77750 }, { - "epoch": 0.84, - "learning_rate": 0.0001738399636576027, - "loss": 0.0433, + "epoch": 0.5, + "learning_rate": 0.00022471778852049544, + "loss": 0.0499, "step": 77760 }, { - "epoch": 0.84, - "learning_rate": 0.00017382373937309363, - "loss": 0.0582, + "epoch": 0.5, + "learning_rate": 0.00022470810716613846, + "loss": 0.0595, "step": 77770 }, { - "epoch": 0.84, - "learning_rate": 0.0001738075150885846, - "loss": 0.0461, + "epoch": 0.5, + "learning_rate": 0.00022469842581178154, + "loss": 0.05, "step": 77780 }, { - "epoch": 0.84, - "learning_rate": 0.00017379129080407553, - "loss": 0.0474, + "epoch": 0.5, + "learning_rate": 0.0002246887444574246, + "loss": 0.0532, "step": 77790 }, { - "epoch": 0.84, - "learning_rate": 0.00017377506651956648, - "loss": 0.0456, + "epoch": 0.5, + "learning_rate": 0.00022467906310306767, + "loss": 0.0506, "step": 77800 }, { - "epoch": 0.84, - "learning_rate": 0.00017375884223505743, - "loss": 0.05, + "epoch": 0.5, + "learning_rate": 0.00022466938174871075, + "loss": 0.0598, "step": 77810 }, { - "epoch": 0.84, - "learning_rate": 0.00017374261795054838, - "loss": 0.0502, + "epoch": 0.5, + "learning_rate": 0.00022465970039435383, + "loss": 0.055, "step": 77820 }, { - "epoch": 0.84, - "learning_rate": 0.0001737263936660393, - "loss": 0.0428, + "epoch": 0.5, + "learning_rate": 0.0002246500190399969, + "loss": 0.0481, "step": 77830 }, { - "epoch": 0.84, - "learning_rate": 0.00017371016938153027, - "loss": 0.0473, + "epoch": 0.5, + "learning_rate": 0.00022464033768563994, + "loss": 0.0557, "step": 77840 }, { - "epoch": 0.84, - "learning_rate": 0.0001736939450970212, - "loss": 0.0443, + "epoch": 0.5, + "learning_rate": 0.00022463065633128302, + "loss": 0.058, "step": 77850 }, { - "epoch": 0.84, - "learning_rate": 0.00017367772081251217, - "loss": 0.0438, + "epoch": 0.5, + "learning_rate": 0.00022462097497692607, + "loss": 0.0509, "step": 77860 }, { - "epoch": 0.84, - "learning_rate": 0.0001736614965280031, - "loss": 0.0436, + "epoch": 0.5, + "learning_rate": 0.00022461129362256915, + "loss": 0.0435, "step": 77870 }, { - "epoch": 0.84, - "learning_rate": 0.00017364527224349407, - "loss": 0.0472, + "epoch": 0.5, + "learning_rate": 0.00022460161226821223, + "loss": 0.0584, "step": 77880 }, { - "epoch": 0.84, - "learning_rate": 0.000173629047958985, - "loss": 0.0434, + "epoch": 0.5, + "learning_rate": 0.0002245919309138553, + "loss": 0.062, "step": 77890 }, { - "epoch": 0.84, - "learning_rate": 0.00017361282367447595, - "loss": 0.0426, + "epoch": 0.5, + "learning_rate": 0.00022458224955949836, + "loss": 0.0557, "step": 77900 }, { - "epoch": 0.84, - "learning_rate": 0.0001735965993899669, - "loss": 0.0467, + "epoch": 0.5, + "learning_rate": 0.00022457256820514142, + "loss": 0.0621, "step": 77910 }, { - "epoch": 0.84, - "learning_rate": 0.00017358037510545785, - "loss": 0.0529, + "epoch": 0.5, + "learning_rate": 0.0002245628868507845, + "loss": 0.0515, "step": 77920 }, { - "epoch": 0.84, - "learning_rate": 0.00017356415082094877, - "loss": 0.046, + "epoch": 0.5, + "learning_rate": 0.00022455320549642755, + "loss": 0.0485, "step": 77930 }, { - "epoch": 0.84, - "learning_rate": 0.00017354792653643975, - "loss": 0.05, + "epoch": 0.5, + "learning_rate": 0.00022454352414207063, + "loss": 0.0491, "step": 77940 }, { - "epoch": 0.84, - "learning_rate": 0.00017353170225193067, - "loss": 0.0493, + "epoch": 0.5, + "learning_rate": 0.0002245338427877137, + "loss": 0.0563, "step": 77950 }, { - "epoch": 0.84, - "learning_rate": 0.00017351547796742164, - "loss": 0.0528, + "epoch": 0.5, + "learning_rate": 0.0002245241614333568, + "loss": 0.0542, "step": 77960 }, { - "epoch": 0.84, - "learning_rate": 0.00017349925368291257, - "loss": 0.0511, + "epoch": 0.5, + "learning_rate": 0.00022451448007899984, + "loss": 0.0547, "step": 77970 }, { - "epoch": 0.84, - "learning_rate": 0.00017348302939840352, - "loss": 0.0534, + "epoch": 0.5, + "learning_rate": 0.0002245047987246429, + "loss": 0.0487, "step": 77980 }, { - "epoch": 0.84, - "learning_rate": 0.00017346680511389447, - "loss": 0.0514, + "epoch": 0.5, + "learning_rate": 0.00022449511737028595, + "loss": 0.0508, "step": 77990 }, { - "epoch": 0.84, - "learning_rate": 0.00017345058082938542, - "loss": 0.0435, + "epoch": 0.5, + "learning_rate": 0.00022448543601592903, + "loss": 0.0464, "step": 78000 }, { - "epoch": 0.84, - "eval_cer": 0.9211976160059088, - "eval_loss": 0.03189348429441452, - "eval_runtime": 119.1171, - "eval_samples_per_second": 16.79, - "eval_steps_per_second": 4.198, + "epoch": 0.5, + "eval_cer": 0.9201102700259858, + "eval_loss": 0.03538144752383232, + "eval_runtime": 120.2717, + "eval_samples_per_second": 16.629, + "eval_steps_per_second": 4.157, "step": 78000 }, { - "epoch": 0.84, - "learning_rate": 0.00017343435654487634, - "loss": 0.0413, + "epoch": 0.5, + "learning_rate": 0.0002244757546615721, + "loss": 0.0577, "step": 78010 }, { - "epoch": 0.84, - "learning_rate": 0.00017341813226036732, - "loss": 0.0451, + "epoch": 0.5, + "learning_rate": 0.00022446607330721519, + "loss": 0.0517, "step": 78020 }, { - "epoch": 0.84, - "learning_rate": 0.00017340190797585824, - "loss": 0.0432, + "epoch": 0.5, + "learning_rate": 0.00022445639195285824, + "loss": 0.0542, "step": 78030 }, { - "epoch": 0.84, - "learning_rate": 0.00017338568369134922, - "loss": 0.0504, + "epoch": 0.5, + "learning_rate": 0.00022444671059850132, + "loss": 0.0448, "step": 78040 }, { - "epoch": 0.84, - "learning_rate": 0.00017336945940684014, - "loss": 0.0476, + "epoch": 0.5, + "learning_rate": 0.00022443702924414437, + "loss": 0.0612, "step": 78050 }, { - "epoch": 0.84, - "learning_rate": 0.00017335323512233112, - "loss": 0.047, + "epoch": 0.5, + "learning_rate": 0.00022442734788978742, + "loss": 0.0519, "step": 78060 }, { - "epoch": 0.84, - "learning_rate": 0.00017333701083782204, - "loss": 0.0408, + "epoch": 0.5, + "learning_rate": 0.0002244176665354305, + "loss": 0.0493, "step": 78070 }, { - "epoch": 0.84, - "learning_rate": 0.000173320786553313, - "loss": 0.0486, + "epoch": 0.5, + "learning_rate": 0.00022440798518107358, + "loss": 0.054, "step": 78080 }, { - "epoch": 0.84, - "learning_rate": 0.00017330456226880394, - "loss": 0.046, + "epoch": 0.5, + "learning_rate": 0.00022439830382671666, + "loss": 0.049, "step": 78090 }, { - "epoch": 0.84, - "learning_rate": 0.0001732883379842949, - "loss": 0.0438, + "epoch": 0.5, + "learning_rate": 0.00022438862247235972, + "loss": 0.0589, "step": 78100 }, { - "epoch": 0.84, - "learning_rate": 0.0001732721136997858, - "loss": 0.0441, + "epoch": 0.5, + "learning_rate": 0.0002243789411180028, + "loss": 0.0572, "step": 78110 }, { - "epoch": 0.84, - "learning_rate": 0.0001732558894152768, - "loss": 0.0447, + "epoch": 0.5, + "learning_rate": 0.00022436925976364585, + "loss": 0.0501, "step": 78120 }, { - "epoch": 0.85, - "learning_rate": 0.0001732396651307677, - "loss": 0.0467, + "epoch": 0.5, + "learning_rate": 0.0002243595784092889, + "loss": 0.0516, "step": 78130 }, { - "epoch": 0.85, - "learning_rate": 0.00017322344084625869, - "loss": 0.0514, + "epoch": 0.5, + "learning_rate": 0.00022434989705493198, + "loss": 0.0522, "step": 78140 }, { - "epoch": 0.85, - "learning_rate": 0.0001732072165617496, - "loss": 0.0453, + "epoch": 0.5, + "learning_rate": 0.00022434021570057506, + "loss": 0.0517, "step": 78150 }, { - "epoch": 0.85, - "learning_rate": 0.00017319099227724056, - "loss": 0.0491, + "epoch": 0.5, + "learning_rate": 0.00022433053434621814, + "loss": 0.0571, "step": 78160 }, { - "epoch": 0.85, - "learning_rate": 0.0001731747679927315, - "loss": 0.0464, + "epoch": 0.5, + "learning_rate": 0.0002243208529918612, + "loss": 0.0476, "step": 78170 }, { - "epoch": 0.85, - "learning_rate": 0.00017315854370822246, - "loss": 0.0557, + "epoch": 0.5, + "learning_rate": 0.00022431117163750427, + "loss": 0.0594, "step": 78180 }, { - "epoch": 0.85, - "learning_rate": 0.00017314231942371338, - "loss": 0.0527, + "epoch": 0.5, + "learning_rate": 0.0002243014902831473, + "loss": 0.0538, "step": 78190 }, { - "epoch": 0.85, - "learning_rate": 0.00017312609513920436, - "loss": 0.0458, + "epoch": 0.5, + "learning_rate": 0.00022429180892879038, + "loss": 0.051, "step": 78200 }, { - "epoch": 0.85, - "learning_rate": 0.00017310987085469528, - "loss": 0.0596, + "epoch": 0.5, + "learning_rate": 0.00022428212757443346, + "loss": 0.0528, "step": 78210 }, { - "epoch": 0.85, - "learning_rate": 0.00017309364657018626, - "loss": 0.0453, + "epoch": 0.5, + "learning_rate": 0.00022427244622007654, + "loss": 0.0524, "step": 78220 }, { - "epoch": 0.85, - "learning_rate": 0.00017307742228567718, - "loss": 0.0406, + "epoch": 0.5, + "learning_rate": 0.0002242627648657196, + "loss": 0.0595, "step": 78230 }, { - "epoch": 0.85, - "learning_rate": 0.00017306119800116816, - "loss": 0.0458, + "epoch": 0.5, + "learning_rate": 0.00022425308351136267, + "loss": 0.0519, "step": 78240 }, { - "epoch": 0.85, - "learning_rate": 0.00017304497371665908, - "loss": 0.0421, + "epoch": 0.51, + "learning_rate": 0.00022424340215700575, + "loss": 0.0504, "step": 78250 }, { - "epoch": 0.85, - "learning_rate": 0.00017302874943215003, - "loss": 0.047, + "epoch": 0.51, + "learning_rate": 0.00022423372080264878, + "loss": 0.0538, "step": 78260 }, { - "epoch": 0.85, - "learning_rate": 0.00017301252514764098, - "loss": 0.0442, + "epoch": 0.51, + "learning_rate": 0.00022422403944829186, + "loss": 0.0468, "step": 78270 }, { - "epoch": 0.85, - "learning_rate": 0.00017299630086313193, - "loss": 0.0447, + "epoch": 0.51, + "learning_rate": 0.00022421435809393494, + "loss": 0.0525, "step": 78280 }, { - "epoch": 0.85, - "learning_rate": 0.00017298007657862285, - "loss": 0.0447, + "epoch": 0.51, + "learning_rate": 0.00022420467673957801, + "loss": 0.0545, "step": 78290 }, { - "epoch": 0.85, - "learning_rate": 0.00017296385229411383, - "loss": 0.0491, + "epoch": 0.51, + "learning_rate": 0.00022419499538522107, + "loss": 0.0521, "step": 78300 }, { - "epoch": 0.85, - "learning_rate": 0.00017294762800960475, - "loss": 0.0493, + "epoch": 0.51, + "learning_rate": 0.00022418531403086415, + "loss": 0.0536, "step": 78310 }, { - "epoch": 0.85, - "learning_rate": 0.00017293140372509573, - "loss": 0.0419, + "epoch": 0.51, + "learning_rate": 0.00022417563267650723, + "loss": 0.0488, "step": 78320 }, { - "epoch": 0.85, - "learning_rate": 0.00017291517944058665, - "loss": 0.0426, + "epoch": 0.51, + "learning_rate": 0.00022416595132215025, + "loss": 0.0451, "step": 78330 }, { - "epoch": 0.85, - "learning_rate": 0.0001728989551560776, - "loss": 0.053, + "epoch": 0.51, + "learning_rate": 0.00022415626996779333, + "loss": 0.0559, "step": 78340 }, { - "epoch": 0.85, - "learning_rate": 0.00017288273087156855, - "loss": 0.0437, + "epoch": 0.51, + "learning_rate": 0.0002241465886134364, + "loss": 0.0551, "step": 78350 }, { - "epoch": 0.85, - "learning_rate": 0.0001728665065870595, - "loss": 0.0477, + "epoch": 0.51, + "learning_rate": 0.0002241369072590795, + "loss": 0.0514, "step": 78360 }, { - "epoch": 0.85, - "learning_rate": 0.00017285028230255042, - "loss": 0.0454, + "epoch": 0.51, + "learning_rate": 0.00022412722590472254, + "loss": 0.045, "step": 78370 }, { - "epoch": 0.85, - "learning_rate": 0.0001728340580180414, - "loss": 0.0459, + "epoch": 0.51, + "learning_rate": 0.00022411754455036562, + "loss": 0.054, "step": 78380 }, { - "epoch": 0.85, - "learning_rate": 0.00017281783373353232, - "loss": 0.0456, + "epoch": 0.51, + "learning_rate": 0.0002241078631960087, + "loss": 0.061, "step": 78390 }, { - "epoch": 0.85, - "learning_rate": 0.0001728016094490233, - "loss": 0.0428, + "epoch": 0.51, + "learning_rate": 0.00022409818184165173, + "loss": 0.053, "step": 78400 }, { - "epoch": 0.85, - "learning_rate": 0.00017278538516451422, - "loss": 0.0453, + "epoch": 0.51, + "learning_rate": 0.0002240885004872948, + "loss": 0.043, "step": 78410 }, { - "epoch": 0.85, - "learning_rate": 0.0001727691608800052, - "loss": 0.0458, + "epoch": 0.51, + "learning_rate": 0.0002240788191329379, + "loss": 0.0484, "step": 78420 }, { - "epoch": 0.85, - "learning_rate": 0.00017275293659549612, - "loss": 0.046, + "epoch": 0.51, + "learning_rate": 0.00022406913777858094, + "loss": 0.0541, "step": 78430 }, { - "epoch": 0.85, - "learning_rate": 0.00017273671231098707, - "loss": 0.0466, + "epoch": 0.51, + "learning_rate": 0.00022405945642422402, + "loss": 0.0464, "step": 78440 }, { - "epoch": 0.85, - "learning_rate": 0.00017272048802647802, - "loss": 0.0461, + "epoch": 0.51, + "learning_rate": 0.0002240497750698671, + "loss": 0.0536, "step": 78450 }, { - "epoch": 0.85, - "learning_rate": 0.00017270426374196897, - "loss": 0.0529, + "epoch": 0.51, + "learning_rate": 0.00022404009371551018, + "loss": 0.052, "step": 78460 }, { - "epoch": 0.85, - "learning_rate": 0.0001726880394574599, - "loss": 0.0555, + "epoch": 0.51, + "learning_rate": 0.0002240304123611532, + "loss": 0.048, "step": 78470 }, { - "epoch": 0.85, - "learning_rate": 0.00017267181517295087, - "loss": 0.0432, + "epoch": 0.51, + "learning_rate": 0.0002240207310067963, + "loss": 0.0559, "step": 78480 }, { - "epoch": 0.85, - "learning_rate": 0.0001726555908884418, - "loss": 0.0443, + "epoch": 0.51, + "learning_rate": 0.00022401104965243937, + "loss": 0.0714, "step": 78490 }, { - "epoch": 0.85, - "learning_rate": 0.00017263936660393277, - "loss": 0.0368, + "epoch": 0.51, + "learning_rate": 0.00022400136829808242, + "loss": 0.0551, "step": 78500 }, { - "epoch": 0.85, - "learning_rate": 0.0001726231423194237, - "loss": 0.0457, + "epoch": 0.51, + "learning_rate": 0.0002239916869437255, + "loss": 0.0511, "step": 78510 }, { - "epoch": 0.85, - "learning_rate": 0.00017260691803491464, - "loss": 0.0475, + "epoch": 0.51, + "learning_rate": 0.00022398200558936858, + "loss": 0.0507, "step": 78520 }, { - "epoch": 0.85, - "learning_rate": 0.0001725906937504056, - "loss": 0.0394, + "epoch": 0.51, + "learning_rate": 0.00022397232423501166, + "loss": 0.0467, "step": 78530 }, { - "epoch": 0.85, - "learning_rate": 0.00017257446946589654, - "loss": 0.0457, + "epoch": 0.51, + "learning_rate": 0.00022396264288065468, + "loss": 0.0608, "step": 78540 }, { - "epoch": 0.85, - "learning_rate": 0.00017255824518138746, - "loss": 0.0419, + "epoch": 0.51, + "learning_rate": 0.00022395296152629776, + "loss": 0.069, "step": 78550 }, { - "epoch": 0.85, - "learning_rate": 0.00017254202089687844, - "loss": 0.0396, + "epoch": 0.51, + "learning_rate": 0.00022394328017194084, + "loss": 0.049, "step": 78560 }, { - "epoch": 0.85, - "learning_rate": 0.00017252579661236936, - "loss": 0.041, + "epoch": 0.51, + "learning_rate": 0.0002239335988175839, + "loss": 0.0596, "step": 78570 }, { - "epoch": 0.85, - "learning_rate": 0.00017250957232786034, - "loss": 0.0508, + "epoch": 0.51, + "learning_rate": 0.00022392391746322698, + "loss": 0.0496, "step": 78580 }, { - "epoch": 0.85, - "learning_rate": 0.00017249334804335126, - "loss": 0.0489, + "epoch": 0.51, + "learning_rate": 0.00022391423610887006, + "loss": 0.0581, "step": 78590 }, { - "epoch": 0.85, - "learning_rate": 0.00017247712375884224, - "loss": 0.0416, + "epoch": 0.51, + "learning_rate": 0.0002239045547545131, + "loss": 0.0497, "step": 78600 }, { - "epoch": 0.85, - "learning_rate": 0.00017246089947433316, - "loss": 0.0449, + "epoch": 0.51, + "learning_rate": 0.00022389487340015616, + "loss": 0.0553, "step": 78610 }, { - "epoch": 0.85, - "learning_rate": 0.0001724446751898241, - "loss": 0.0378, + "epoch": 0.51, + "learning_rate": 0.00022388519204579924, + "loss": 0.045, "step": 78620 }, { - "epoch": 0.85, - "learning_rate": 0.00017242845090531506, - "loss": 0.0371, + "epoch": 0.51, + "learning_rate": 0.0002238755106914423, + "loss": 0.0527, "step": 78630 }, { - "epoch": 0.85, - "learning_rate": 0.000172412226620806, - "loss": 0.0394, + "epoch": 0.51, + "learning_rate": 0.00022386582933708537, + "loss": 0.0469, "step": 78640 }, { - "epoch": 0.85, - "learning_rate": 0.00017239600233629693, - "loss": 0.0433, + "epoch": 0.51, + "learning_rate": 0.00022385614798272845, + "loss": 0.0505, "step": 78650 }, { - "epoch": 0.85, - "learning_rate": 0.0001723797780517879, - "loss": 0.0478, + "epoch": 0.51, + "learning_rate": 0.00022384646662837153, + "loss": 0.0496, "step": 78660 }, { - "epoch": 0.85, - "learning_rate": 0.00017236355376727883, - "loss": 0.051, + "epoch": 0.51, + "learning_rate": 0.00022383678527401459, + "loss": 0.0486, "step": 78670 }, { - "epoch": 0.85, - "learning_rate": 0.0001723473294827698, - "loss": 0.0362, + "epoch": 0.51, + "learning_rate": 0.00022382710391965764, + "loss": 0.0517, "step": 78680 }, { - "epoch": 0.85, - "learning_rate": 0.00017233110519826073, - "loss": 0.0506, + "epoch": 0.51, + "learning_rate": 0.00022381742256530072, + "loss": 0.0552, "step": 78690 }, { - "epoch": 0.85, - "learning_rate": 0.00017231488091375168, - "loss": 0.0414, + "epoch": 0.51, + "learning_rate": 0.00022380774121094377, + "loss": 0.047, "step": 78700 }, { - "epoch": 0.85, - "learning_rate": 0.00017229865662924263, - "loss": 0.0466, + "epoch": 0.51, + "learning_rate": 0.00022379805985658685, + "loss": 0.0541, "step": 78710 }, { - "epoch": 0.85, - "learning_rate": 0.00017228243234473358, - "loss": 0.0441, + "epoch": 0.51, + "learning_rate": 0.00022378837850222993, + "loss": 0.0477, "step": 78720 }, { - "epoch": 0.85, - "learning_rate": 0.00017226620806022453, - "loss": 0.0431, + "epoch": 0.51, + "learning_rate": 0.000223778697147873, + "loss": 0.0499, "step": 78730 }, { - "epoch": 0.85, - "learning_rate": 0.00017224998377571548, - "loss": 0.0444, + "epoch": 0.51, + "learning_rate": 0.00022376901579351606, + "loss": 0.0534, "step": 78740 }, { - "epoch": 0.85, - "learning_rate": 0.0001722337594912064, - "loss": 0.0427, + "epoch": 0.51, + "learning_rate": 0.00022375933443915912, + "loss": 0.0534, "step": 78750 }, { - "epoch": 0.85, - "learning_rate": 0.00017221753520669738, - "loss": 0.0413, + "epoch": 0.51, + "learning_rate": 0.0002237496530848022, + "loss": 0.054, "step": 78760 }, { - "epoch": 0.85, - "learning_rate": 0.0001722013109221883, - "loss": 0.0448, + "epoch": 0.51, + "learning_rate": 0.00022373997173044525, + "loss": 0.0543, "step": 78770 }, { - "epoch": 0.85, - "learning_rate": 0.00017218508663767928, - "loss": 0.0475, + "epoch": 0.51, + "learning_rate": 0.00022373029037608833, + "loss": 0.0493, "step": 78780 }, { - "epoch": 0.85, - "learning_rate": 0.0001721688623531702, - "loss": 0.0508, + "epoch": 0.51, + "learning_rate": 0.0002237206090217314, + "loss": 0.0525, "step": 78790 }, { - "epoch": 0.85, - "learning_rate": 0.00017215263806866115, - "loss": 0.0432, + "epoch": 0.51, + "learning_rate": 0.00022371092766737446, + "loss": 0.0459, "step": 78800 }, { - "epoch": 0.85, - "learning_rate": 0.0001721364137841521, - "loss": 0.0425, + "epoch": 0.51, + "learning_rate": 0.00022370124631301754, + "loss": 0.0509, "step": 78810 }, { - "epoch": 0.85, - "learning_rate": 0.00017212018949964305, - "loss": 0.0513, + "epoch": 0.51, + "learning_rate": 0.0002236915649586606, + "loss": 0.0608, "step": 78820 }, { - "epoch": 0.85, - "learning_rate": 0.00017210396521513398, - "loss": 0.0426, + "epoch": 0.51, + "learning_rate": 0.00022368188360430365, + "loss": 0.0525, "step": 78830 }, { - "epoch": 0.85, - "learning_rate": 0.00017208774093062495, - "loss": 0.0487, + "epoch": 0.51, + "learning_rate": 0.00022367220224994673, + "loss": 0.0597, "step": 78840 }, { - "epoch": 0.85, - "learning_rate": 0.00017207151664611588, - "loss": 0.0472, + "epoch": 0.51, + "learning_rate": 0.0002236625208955898, + "loss": 0.0518, "step": 78850 }, { - "epoch": 0.85, - "learning_rate": 0.00017205529236160685, - "loss": 0.0496, + "epoch": 0.51, + "learning_rate": 0.00022365283954123289, + "loss": 0.0544, "step": 78860 }, { - "epoch": 0.85, - "learning_rate": 0.00017203906807709778, - "loss": 0.0493, + "epoch": 0.51, + "learning_rate": 0.00022364315818687594, + "loss": 0.0477, "step": 78870 }, { - "epoch": 0.85, - "learning_rate": 0.00017202284379258873, - "loss": 0.0457, + "epoch": 0.51, + "learning_rate": 0.00022363347683251902, + "loss": 0.0487, "step": 78880 }, { - "epoch": 0.85, - "learning_rate": 0.00017200661950807968, - "loss": 0.0449, + "epoch": 0.51, + "learning_rate": 0.00022362379547816207, + "loss": 0.0489, "step": 78890 }, { - "epoch": 0.85, - "learning_rate": 0.00017199039522357063, - "loss": 0.0502, + "epoch": 0.51, + "learning_rate": 0.00022361411412380512, + "loss": 0.0505, "step": 78900 }, { - "epoch": 0.85, - "learning_rate": 0.00017197417093906157, - "loss": 0.0392, + "epoch": 0.51, + "learning_rate": 0.0002236044327694482, + "loss": 0.0534, "step": 78910 }, { - "epoch": 0.85, - "learning_rate": 0.00017195794665455252, - "loss": 0.0443, + "epoch": 0.51, + "learning_rate": 0.00022359475141509128, + "loss": 0.0527, "step": 78920 }, { - "epoch": 0.85, - "learning_rate": 0.00017194172237004345, - "loss": 0.041, + "epoch": 0.51, + "learning_rate": 0.00022358507006073436, + "loss": 0.0519, "step": 78930 }, { - "epoch": 0.85, - "learning_rate": 0.00017192549808553442, - "loss": 0.0454, + "epoch": 0.51, + "learning_rate": 0.00022357538870637742, + "loss": 0.0493, "step": 78940 }, { - "epoch": 0.85, - "learning_rate": 0.00017190927380102535, - "loss": 0.0526, + "epoch": 0.51, + "learning_rate": 0.0002235657073520205, + "loss": 0.0545, "step": 78950 }, { - "epoch": 0.85, - "learning_rate": 0.00017189304951651632, - "loss": 0.0454, + "epoch": 0.51, + "learning_rate": 0.00022355602599766355, + "loss": 0.0523, "step": 78960 }, { - "epoch": 0.85, - "learning_rate": 0.00017187682523200725, - "loss": 0.0439, + "epoch": 0.51, + "learning_rate": 0.0002235463446433066, + "loss": 0.0512, "step": 78970 }, { - "epoch": 0.85, - "learning_rate": 0.0001718606009474982, - "loss": 0.0415, + "epoch": 0.51, + "learning_rate": 0.00022353666328894968, + "loss": 0.055, "step": 78980 }, { - "epoch": 0.85, - "learning_rate": 0.00017184437666298915, - "loss": 0.0479, + "epoch": 0.51, + "learning_rate": 0.00022352698193459276, + "loss": 0.0533, "step": 78990 }, { - "epoch": 0.85, - "learning_rate": 0.0001718281523784801, - "loss": 0.0453, + "epoch": 0.51, + "learning_rate": 0.0002235173005802358, + "loss": 0.0546, "step": 79000 }, { - "epoch": 0.85, - "eval_cer": 0.921160509664435, - "eval_loss": 0.031662482768297195, - "eval_runtime": 118.8073, - "eval_samples_per_second": 16.834, - "eval_steps_per_second": 4.208, + "epoch": 0.51, + "eval_cer": 0.9200325386961925, + "eval_loss": 0.0354156568646431, + "eval_runtime": 120.0383, + "eval_samples_per_second": 16.661, + "eval_steps_per_second": 4.165, "step": 79000 }, { - "epoch": 0.85, - "learning_rate": 0.00017181192809397102, - "loss": 0.0416, + "epoch": 0.51, + "learning_rate": 0.0002235076192258789, + "loss": 0.0533, "step": 79010 }, { - "epoch": 0.85, - "learning_rate": 0.000171795703809462, - "loss": 0.0394, + "epoch": 0.51, + "learning_rate": 0.00022349793787152197, + "loss": 0.0535, "step": 79020 }, { - "epoch": 0.85, - "learning_rate": 0.00017177947952495292, - "loss": 0.0499, + "epoch": 0.51, + "learning_rate": 0.000223488256517165, + "loss": 0.05, "step": 79030 }, { - "epoch": 0.85, - "learning_rate": 0.0001717632552404439, - "loss": 0.0434, + "epoch": 0.51, + "learning_rate": 0.00022347857516280808, + "loss": 0.0549, "step": 79040 }, { - "epoch": 0.86, - "learning_rate": 0.00017174703095593482, - "loss": 0.0471, + "epoch": 0.51, + "learning_rate": 0.00022346889380845116, + "loss": 0.0607, "step": 79050 }, { - "epoch": 0.86, - "learning_rate": 0.00017173080667142577, - "loss": 0.0421, + "epoch": 0.51, + "learning_rate": 0.00022345921245409424, + "loss": 0.0474, "step": 79060 }, { - "epoch": 0.86, - "learning_rate": 0.00017171458238691672, - "loss": 0.047, + "epoch": 0.51, + "learning_rate": 0.0002234495310997373, + "loss": 0.053, "step": 79070 }, { - "epoch": 0.86, - "learning_rate": 0.00017169835810240767, - "loss": 0.046, + "epoch": 0.51, + "learning_rate": 0.00022343984974538037, + "loss": 0.0514, "step": 79080 }, { - "epoch": 0.86, - "learning_rate": 0.00017168213381789862, - "loss": 0.043, + "epoch": 0.51, + "learning_rate": 0.00022343016839102345, + "loss": 0.1657, "step": 79090 }, { - "epoch": 0.86, - "learning_rate": 0.00017166590953338957, - "loss": 0.0458, + "epoch": 0.51, + "learning_rate": 0.00022342048703666648, + "loss": 0.057, "step": 79100 }, { - "epoch": 0.86, - "learning_rate": 0.0001716496852488805, - "loss": 0.0452, + "epoch": 0.51, + "learning_rate": 0.00022341080568230955, + "loss": 0.053, "step": 79110 }, { - "epoch": 0.86, - "learning_rate": 0.00017163346096437147, - "loss": 0.0447, + "epoch": 0.51, + "learning_rate": 0.00022340112432795263, + "loss": 0.0523, "step": 79120 }, { - "epoch": 0.86, - "learning_rate": 0.0001716172366798624, - "loss": 0.049, + "epoch": 0.51, + "learning_rate": 0.00022339144297359571, + "loss": 0.0527, "step": 79130 }, { - "epoch": 0.86, - "learning_rate": 0.00017160101239535337, - "loss": 0.0457, + "epoch": 0.51, + "learning_rate": 0.00022338176161923877, + "loss": 0.0567, "step": 79140 }, { - "epoch": 0.86, - "learning_rate": 0.0001715847881108443, - "loss": 0.0449, + "epoch": 0.51, + "learning_rate": 0.00022337208026488185, + "loss": 0.0542, "step": 79150 }, { - "epoch": 0.86, - "learning_rate": 0.00017156856382633524, - "loss": 0.0394, + "epoch": 0.51, + "learning_rate": 0.00022336239891052493, + "loss": 0.0516, "step": 79160 }, { - "epoch": 0.86, - "learning_rate": 0.0001715523395418262, - "loss": 0.0427, + "epoch": 0.51, + "learning_rate": 0.00022335271755616795, + "loss": 0.0525, "step": 79170 }, { - "epoch": 0.86, - "learning_rate": 0.00017153611525731714, - "loss": 0.0405, + "epoch": 0.51, + "learning_rate": 0.00022334303620181103, + "loss": 0.0508, "step": 79180 }, { - "epoch": 0.86, - "learning_rate": 0.00017151989097280806, - "loss": 0.0462, + "epoch": 0.51, + "learning_rate": 0.0002233333548474541, + "loss": 0.0457, "step": 79190 }, { - "epoch": 0.86, - "learning_rate": 0.00017150366668829904, - "loss": 0.0452, + "epoch": 0.51, + "learning_rate": 0.00022332367349309716, + "loss": 0.0472, "step": 79200 }, { - "epoch": 0.86, - "learning_rate": 0.00017148744240378996, - "loss": 0.0444, + "epoch": 0.51, + "learning_rate": 0.00022331399213874024, + "loss": 0.0512, "step": 79210 }, { - "epoch": 0.86, - "learning_rate": 0.00017147121811928094, - "loss": 0.0423, + "epoch": 0.51, + "learning_rate": 0.00022330431078438332, + "loss": 0.0524, "step": 79220 }, { - "epoch": 0.86, - "learning_rate": 0.00017145499383477186, - "loss": 0.0503, + "epoch": 0.51, + "learning_rate": 0.00022329462943002635, + "loss": 0.0473, "step": 79230 }, { - "epoch": 0.86, - "learning_rate": 0.0001714387695502628, - "loss": 0.0514, + "epoch": 0.51, + "learning_rate": 0.00022328494807566943, + "loss": 0.049, "step": 79240 }, { - "epoch": 0.86, - "learning_rate": 0.00017142254526575376, - "loss": 0.0515, + "epoch": 0.51, + "learning_rate": 0.0002232752667213125, + "loss": 0.0519, "step": 79250 }, { - "epoch": 0.86, - "learning_rate": 0.0001714063209812447, - "loss": 0.0394, + "epoch": 0.51, + "learning_rate": 0.0002232655853669556, + "loss": 0.0474, "step": 79260 }, { - "epoch": 0.86, - "learning_rate": 0.00017139009669673566, - "loss": 0.0464, + "epoch": 0.51, + "learning_rate": 0.00022325590401259864, + "loss": 0.0595, "step": 79270 }, { - "epoch": 0.86, - "learning_rate": 0.0001713738724122266, - "loss": 0.0437, + "epoch": 0.51, + "learning_rate": 0.00022324622265824172, + "loss": 0.05, "step": 79280 }, { - "epoch": 0.86, - "learning_rate": 0.00017135764812771753, - "loss": 0.0412, + "epoch": 0.51, + "learning_rate": 0.0002232365413038848, + "loss": 0.048, "step": 79290 }, { - "epoch": 0.86, - "learning_rate": 0.0001713414238432085, + "epoch": 0.51, + "learning_rate": 0.00022322685994952783, "loss": 0.0495, "step": 79300 }, { - "epoch": 0.86, - "learning_rate": 0.00017132519955869943, - "loss": 0.0464, + "epoch": 0.51, + "learning_rate": 0.0002232171785951709, + "loss": 0.0582, "step": 79310 }, { - "epoch": 0.86, - "learning_rate": 0.0001713089752741904, - "loss": 0.0519, + "epoch": 0.51, + "learning_rate": 0.000223207497240814, + "loss": 0.0521, "step": 79320 }, { - "epoch": 0.86, - "learning_rate": 0.00017129275098968133, - "loss": 0.0521, + "epoch": 0.51, + "learning_rate": 0.00022319781588645707, + "loss": 0.056, "step": 79330 }, { - "epoch": 0.86, - "learning_rate": 0.00017127652670517228, - "loss": 0.0524, + "epoch": 0.51, + "learning_rate": 0.00022318813453210012, + "loss": 0.0556, "step": 79340 }, { - "epoch": 0.86, - "learning_rate": 0.00017126030242066323, - "loss": 0.0413, + "epoch": 0.51, + "learning_rate": 0.0002231784531777432, + "loss": 0.0479, "step": 79350 }, { - "epoch": 0.86, - "learning_rate": 0.00017124407813615418, - "loss": 0.0483, + "epoch": 0.51, + "learning_rate": 0.00022316877182338628, + "loss": 0.0537, "step": 79360 }, { - "epoch": 0.86, - "learning_rate": 0.0001712278538516451, - "loss": 0.0515, + "epoch": 0.51, + "learning_rate": 0.0002231590904690293, + "loss": 0.0522, "step": 79370 }, { - "epoch": 0.86, - "learning_rate": 0.00017121162956713608, - "loss": 0.0471, + "epoch": 0.51, + "learning_rate": 0.00022314940911467238, + "loss": 0.0516, "step": 79380 }, { - "epoch": 0.86, - "learning_rate": 0.000171195405282627, - "loss": 0.0498, + "epoch": 0.51, + "learning_rate": 0.00022313972776031546, + "loss": 0.0595, "step": 79390 }, { - "epoch": 0.86, - "learning_rate": 0.00017117918099811798, - "loss": 0.046, + "epoch": 0.51, + "learning_rate": 0.00022313004640595852, + "loss": 0.059, "step": 79400 }, { - "epoch": 0.86, - "learning_rate": 0.0001711629567136089, - "loss": 0.0466, + "epoch": 0.51, + "learning_rate": 0.0002231203650516016, + "loss": 0.0542, "step": 79410 }, { - "epoch": 0.86, - "learning_rate": 0.00017114673242909988, - "loss": 0.0452, + "epoch": 0.51, + "learning_rate": 0.00022311068369724468, + "loss": 0.0505, "step": 79420 }, { - "epoch": 0.86, - "learning_rate": 0.0001711305081445908, - "loss": 0.0402, + "epoch": 0.51, + "learning_rate": 0.00022310100234288776, + "loss": 0.0521, "step": 79430 }, { - "epoch": 0.86, - "learning_rate": 0.00017111428386008175, - "loss": 0.0456, + "epoch": 0.51, + "learning_rate": 0.00022309132098853078, + "loss": 0.0479, "step": 79440 }, { - "epoch": 0.86, - "learning_rate": 0.0001710980595755727, - "loss": 0.0453, + "epoch": 0.51, + "learning_rate": 0.00022308163963417386, + "loss": 0.0508, "step": 79450 }, { - "epoch": 0.86, - "learning_rate": 0.00017108183529106365, - "loss": 0.0476, + "epoch": 0.51, + "learning_rate": 0.00022307195827981694, + "loss": 0.0486, "step": 79460 }, { - "epoch": 0.86, - "learning_rate": 0.00017106561100655457, - "loss": 0.0458, + "epoch": 0.51, + "learning_rate": 0.00022306227692546, + "loss": 0.052, "step": 79470 }, { - "epoch": 0.86, - "learning_rate": 0.00017104938672204555, - "loss": 0.0423, + "epoch": 0.51, + "learning_rate": 0.00022305259557110307, + "loss": 0.0506, "step": 79480 }, { - "epoch": 0.86, - "learning_rate": 0.00017103316243753647, - "loss": 0.0454, + "epoch": 0.51, + "learning_rate": 0.00022304291421674615, + "loss": 0.0499, "step": 79490 }, { - "epoch": 0.86, - "learning_rate": 0.00017101693815302745, - "loss": 0.0453, + "epoch": 0.51, + "learning_rate": 0.00022303323286238923, + "loss": 0.0534, "step": 79500 }, { - "epoch": 0.86, - "learning_rate": 0.00017100071386851837, - "loss": 0.0457, + "epoch": 0.51, + "learning_rate": 0.00022302355150803226, + "loss": 0.0503, "step": 79510 }, { - "epoch": 0.86, - "learning_rate": 0.00017098448958400932, - "loss": 0.0457, + "epoch": 0.51, + "learning_rate": 0.00022301387015367534, + "loss": 0.0561, "step": 79520 }, { - "epoch": 0.86, - "learning_rate": 0.00017096826529950027, - "loss": 0.045, + "epoch": 0.51, + "learning_rate": 0.00022300418879931842, + "loss": 0.0486, "step": 79530 }, { - "epoch": 0.86, - "learning_rate": 0.00017095204101499122, - "loss": 0.0546, + "epoch": 0.51, + "learning_rate": 0.00022299450744496147, + "loss": 0.0559, "step": 79540 }, { - "epoch": 0.86, - "learning_rate": 0.00017093581673048214, - "loss": 0.0453, + "epoch": 0.51, + "learning_rate": 0.00022298482609060455, + "loss": 0.0552, "step": 79550 }, { - "epoch": 0.86, - "learning_rate": 0.00017091959244597312, - "loss": 0.0499, + "epoch": 0.51, + "learning_rate": 0.00022297514473624763, + "loss": 0.0468, "step": 79560 }, { - "epoch": 0.86, - "learning_rate": 0.00017090336816146404, - "loss": 0.0457, + "epoch": 0.51, + "learning_rate": 0.00022296546338189068, + "loss": 0.0506, "step": 79570 }, { - "epoch": 0.86, - "learning_rate": 0.00017088714387695502, - "loss": 0.0445, + "epoch": 0.51, + "learning_rate": 0.00022295578202753374, + "loss": 0.0518, "step": 79580 }, { - "epoch": 0.86, - "learning_rate": 0.00017087091959244594, - "loss": 0.0451, + "epoch": 0.51, + "learning_rate": 0.00022294610067317682, + "loss": 0.0503, "step": 79590 }, { - "epoch": 0.86, - "learning_rate": 0.00017085469530793692, - "loss": 0.0443, + "epoch": 0.51, + "learning_rate": 0.00022293641931881987, + "loss": 0.0578, "step": 79600 }, { - "epoch": 0.86, - "learning_rate": 0.00017083847102342784, - "loss": 0.0397, + "epoch": 0.51, + "learning_rate": 0.00022292673796446295, + "loss": 0.0491, "step": 79610 }, { - "epoch": 0.86, - "learning_rate": 0.0001708222467389188, - "loss": 0.0438, + "epoch": 0.51, + "learning_rate": 0.00022291705661010603, + "loss": 0.0516, "step": 79620 }, { - "epoch": 0.86, - "learning_rate": 0.00017080602245440974, - "loss": 0.0497, + "epoch": 0.51, + "learning_rate": 0.0002229073752557491, + "loss": 0.0509, "step": 79630 }, { - "epoch": 0.86, - "learning_rate": 0.0001707897981699007, - "loss": 0.0437, + "epoch": 0.51, + "learning_rate": 0.00022289769390139216, + "loss": 0.0616, "step": 79640 }, { - "epoch": 0.86, - "learning_rate": 0.00017077357388539161, - "loss": 0.0468, + "epoch": 0.51, + "learning_rate": 0.0002228880125470352, + "loss": 0.0529, "step": 79650 }, { - "epoch": 0.86, - "learning_rate": 0.0001707573496008826, - "loss": 0.042, + "epoch": 0.51, + "learning_rate": 0.0002228783311926783, + "loss": 0.0625, "step": 79660 }, { - "epoch": 0.86, - "learning_rate": 0.0001707411253163735, - "loss": 0.048, + "epoch": 0.51, + "learning_rate": 0.00022286864983832135, + "loss": 0.069, "step": 79670 }, { - "epoch": 0.86, - "learning_rate": 0.0001707249010318645, - "loss": 0.046, + "epoch": 0.51, + "learning_rate": 0.00022285896848396443, + "loss": 0.0505, "step": 79680 }, { - "epoch": 0.86, - "learning_rate": 0.0001707086767473554, - "loss": 0.0398, + "epoch": 0.51, + "learning_rate": 0.0002228492871296075, + "loss": 0.0499, "step": 79690 }, { - "epoch": 0.86, - "learning_rate": 0.00017069245246284636, - "loss": 0.0394, + "epoch": 0.51, + "learning_rate": 0.00022283960577525058, + "loss": 0.0488, "step": 79700 }, { - "epoch": 0.86, - "learning_rate": 0.0001706762281783373, - "loss": 0.048, + "epoch": 0.51, + "learning_rate": 0.00022282992442089364, + "loss": 0.0491, "step": 79710 }, { - "epoch": 0.86, - "learning_rate": 0.00017066000389382826, - "loss": 0.0415, + "epoch": 0.51, + "learning_rate": 0.0002228202430665367, + "loss": 0.0606, "step": 79720 }, { - "epoch": 0.86, - "learning_rate": 0.00017064377960931918, - "loss": 0.0441, + "epoch": 0.51, + "learning_rate": 0.00022281056171217977, + "loss": 0.0573, "step": 79730 }, { - "epoch": 0.86, - "learning_rate": 0.00017062755532481016, - "loss": 0.0433, + "epoch": 0.51, + "learning_rate": 0.00022280088035782282, + "loss": 0.05, "step": 79740 }, { - "epoch": 0.86, - "learning_rate": 0.00017061133104030108, - "loss": 0.0491, + "epoch": 0.51, + "learning_rate": 0.0002227911990034659, + "loss": 0.0645, "step": 79750 }, { - "epoch": 0.86, - "learning_rate": 0.00017059510675579206, - "loss": 0.05, + "epoch": 0.51, + "learning_rate": 0.00022278151764910898, + "loss": 0.0572, "step": 79760 }, { - "epoch": 0.86, - "learning_rate": 0.00017057888247128298, - "loss": 0.0554, + "epoch": 0.51, + "learning_rate": 0.00022277183629475204, + "loss": 0.052, "step": 79770 }, { - "epoch": 0.86, - "learning_rate": 0.00017056265818677396, - "loss": 0.0541, + "epoch": 0.51, + "learning_rate": 0.00022276215494039511, + "loss": 0.0524, "step": 79780 }, { - "epoch": 0.86, - "learning_rate": 0.0001705464339022649, - "loss": 0.0477, + "epoch": 0.51, + "learning_rate": 0.00022275247358603817, + "loss": 0.0589, "step": 79790 }, { - "epoch": 0.86, - "learning_rate": 0.00017053020961775583, - "loss": 0.0416, + "epoch": 0.52, + "learning_rate": 0.00022274279223168122, + "loss": 0.0538, "step": 79800 }, { - "epoch": 0.86, - "learning_rate": 0.0001705139853332468, - "loss": 0.0387, + "epoch": 0.52, + "learning_rate": 0.0002227331108773243, + "loss": 0.0531, "step": 79810 }, { - "epoch": 0.86, - "learning_rate": 0.00017049776104873773, - "loss": 0.0415, + "epoch": 0.52, + "learning_rate": 0.00022272342952296738, + "loss": 0.0549, "step": 79820 }, { - "epoch": 0.86, - "learning_rate": 0.0001704815367642287, - "loss": 0.0493, + "epoch": 0.52, + "learning_rate": 0.00022271374816861046, + "loss": 0.0565, "step": 79830 }, { - "epoch": 0.86, - "learning_rate": 0.00017046531247971963, - "loss": 0.0447, + "epoch": 0.52, + "learning_rate": 0.0002227040668142535, + "loss": 0.057, "step": 79840 }, { - "epoch": 0.86, - "learning_rate": 0.00017044908819521058, - "loss": 0.0468, + "epoch": 0.52, + "learning_rate": 0.0002226943854598966, + "loss": 0.0609, "step": 79850 }, { - "epoch": 0.86, - "learning_rate": 0.00017043286391070153, - "loss": 0.0418, + "epoch": 0.52, + "learning_rate": 0.00022268470410553964, + "loss": 0.0578, "step": 79860 }, { - "epoch": 0.86, - "learning_rate": 0.00017041663962619248, - "loss": 0.0505, + "epoch": 0.52, + "learning_rate": 0.0002226750227511827, + "loss": 0.0512, "step": 79870 }, { - "epoch": 0.86, - "learning_rate": 0.0001704004153416834, - "loss": 0.0462, + "epoch": 0.52, + "learning_rate": 0.00022266534139682578, + "loss": 0.0577, "step": 79880 }, { - "epoch": 0.86, - "learning_rate": 0.00017038419105717438, - "loss": 0.0473, + "epoch": 0.52, + "learning_rate": 0.00022265566004246886, + "loss": 0.0538, "step": 79890 }, { - "epoch": 0.86, - "learning_rate": 0.0001703679667726653, - "loss": 0.0414, + "epoch": 0.52, + "learning_rate": 0.00022264597868811194, + "loss": 0.062, "step": 79900 }, { - "epoch": 0.86, - "learning_rate": 0.00017035174248815628, - "loss": 0.0448, + "epoch": 0.52, + "learning_rate": 0.000222636297333755, + "loss": 0.0553, "step": 79910 }, { - "epoch": 0.86, - "learning_rate": 0.0001703355182036472, - "loss": 0.0523, + "epoch": 0.52, + "learning_rate": 0.00022262661597939807, + "loss": 0.0476, "step": 79920 }, { - "epoch": 0.86, - "learning_rate": 0.00017031929391913815, - "loss": 0.0508, + "epoch": 0.52, + "learning_rate": 0.00022261693462504112, + "loss": 0.054, "step": 79930 }, { - "epoch": 0.86, - "learning_rate": 0.0001703030696346291, - "loss": 0.0464, + "epoch": 0.52, + "learning_rate": 0.00022260725327068417, + "loss": 0.0524, "step": 79940 }, { - "epoch": 0.86, - "learning_rate": 0.00017028684535012005, - "loss": 0.0442, + "epoch": 0.52, + "learning_rate": 0.00022259757191632725, + "loss": 0.0543, "step": 79950 }, { - "epoch": 0.86, - "learning_rate": 0.000170270621065611, - "loss": 0.0441, + "epoch": 0.52, + "learning_rate": 0.00022258789056197033, + "loss": 0.0609, "step": 79960 }, { - "epoch": 0.86, - "learning_rate": 0.00017025439678110195, - "loss": 0.0461, + "epoch": 0.52, + "learning_rate": 0.0002225782092076134, + "loss": 0.0496, "step": 79970 }, { - "epoch": 0.87, - "learning_rate": 0.00017023817249659287, - "loss": 0.0432, + "epoch": 0.52, + "learning_rate": 0.00022256852785325647, + "loss": 0.0477, "step": 79980 }, { - "epoch": 0.87, - "learning_rate": 0.00017022194821208385, - "loss": 0.0457, + "epoch": 0.52, + "learning_rate": 0.00022255884649889955, + "loss": 0.0562, "step": 79990 }, { - "epoch": 0.87, - "learning_rate": 0.00017020572392757477, - "loss": 0.0434, + "epoch": 0.52, + "learning_rate": 0.00022254916514454257, + "loss": 0.0536, "step": 80000 }, { - "epoch": 0.87, - "eval_cer": 0.9212356058317033, - "eval_loss": 0.03184312954545021, - "eval_runtime": 118.8761, - "eval_samples_per_second": 16.824, - "eval_steps_per_second": 4.206, + "epoch": 0.52, + "eval_cer": 0.9199647497457915, + "eval_loss": 0.03456534445285797, + "eval_runtime": 119.9236, + "eval_samples_per_second": 16.677, + "eval_steps_per_second": 4.169, "step": 80000 }, { - "epoch": 0.87, - "learning_rate": 0.00017018949964306575, - "loss": 0.0414, + "epoch": 0.52, + "learning_rate": 0.00022253948379018565, + "loss": 0.0641, "step": 80010 }, { - "epoch": 0.87, - "learning_rate": 0.00017017327535855667, - "loss": 0.0401, + "epoch": 0.52, + "learning_rate": 0.00022252980243582873, + "loss": 0.0488, "step": 80020 }, { - "epoch": 0.87, - "learning_rate": 0.00017015705107404762, - "loss": 0.0512, + "epoch": 0.52, + "learning_rate": 0.0002225201210814718, + "loss": 0.0487, "step": 80030 }, { - "epoch": 0.87, - "learning_rate": 0.00017014082678953857, - "loss": 0.0564, + "epoch": 0.52, + "learning_rate": 0.00022251043972711486, + "loss": 0.0517, "step": 80040 }, { - "epoch": 0.87, - "learning_rate": 0.00017012460250502952, - "loss": 0.0469, + "epoch": 0.52, + "learning_rate": 0.00022250075837275794, + "loss": 0.0533, "step": 80050 }, { - "epoch": 0.87, - "learning_rate": 0.00017010837822052045, - "loss": 0.0505, + "epoch": 0.52, + "learning_rate": 0.00022249107701840102, + "loss": 0.0528, "step": 80060 }, { - "epoch": 0.87, - "learning_rate": 0.00017009215393601142, - "loss": 0.0414, + "epoch": 0.52, + "learning_rate": 0.00022248139566404405, + "loss": 0.0473, "step": 80070 }, { - "epoch": 0.87, - "learning_rate": 0.00017007592965150235, - "loss": 0.0409, + "epoch": 0.52, + "learning_rate": 0.00022247171430968713, + "loss": 0.0528, "step": 80080 }, { - "epoch": 0.87, - "learning_rate": 0.00017005970536699332, - "loss": 0.0391, + "epoch": 0.52, + "learning_rate": 0.0002224620329553302, + "loss": 0.056, "step": 80090 }, { - "epoch": 0.87, - "learning_rate": 0.00017004348108248425, - "loss": 0.0423, + "epoch": 0.52, + "learning_rate": 0.0002224523516009733, + "loss": 0.0533, "step": 80100 }, { - "epoch": 0.87, - "learning_rate": 0.00017002725679797522, - "loss": 0.0452, + "epoch": 0.52, + "learning_rate": 0.00022244267024661634, + "loss": 0.0593, "step": 80110 }, { - "epoch": 0.87, - "learning_rate": 0.00017001103251346614, - "loss": 0.0439, + "epoch": 0.52, + "learning_rate": 0.00022243298889225942, + "loss": 0.0605, "step": 80120 }, { - "epoch": 0.87, - "learning_rate": 0.0001699948082289571, - "loss": 0.0472, + "epoch": 0.52, + "learning_rate": 0.0002224233075379025, + "loss": 0.0491, "step": 80130 }, { - "epoch": 0.87, - "learning_rate": 0.00016997858394444804, - "loss": 0.0433, + "epoch": 0.52, + "learning_rate": 0.00022241362618354553, + "loss": 0.051, "step": 80140 }, { - "epoch": 0.87, - "learning_rate": 0.000169962359659939, - "loss": 0.0445, + "epoch": 0.52, + "learning_rate": 0.0002224039448291886, + "loss": 0.0529, "step": 80150 }, { - "epoch": 0.87, - "learning_rate": 0.00016994613537542992, - "loss": 0.05, + "epoch": 0.52, + "learning_rate": 0.00022239426347483169, + "loss": 0.0556, "step": 80160 }, { - "epoch": 0.87, - "learning_rate": 0.0001699299110909209, - "loss": 0.0492, + "epoch": 0.52, + "learning_rate": 0.00022238458212047477, + "loss": 0.0517, "step": 80170 }, { - "epoch": 0.87, - "learning_rate": 0.00016991368680641182, - "loss": 0.0521, + "epoch": 0.52, + "learning_rate": 0.00022237490076611782, + "loss": 0.0646, "step": 80180 }, { - "epoch": 0.87, - "learning_rate": 0.0001698974625219028, - "loss": 0.0367, + "epoch": 0.52, + "learning_rate": 0.0002223652194117609, + "loss": 0.0545, "step": 80190 }, { - "epoch": 0.87, - "learning_rate": 0.00016988123823739372, - "loss": 0.0438, + "epoch": 0.52, + "learning_rate": 0.00022235553805740398, + "loss": 0.0488, "step": 80200 }, { - "epoch": 0.87, - "learning_rate": 0.00016986501395288467, - "loss": 0.0444, + "epoch": 0.52, + "learning_rate": 0.000222345856703047, + "loss": 0.0525, "step": 80210 }, { - "epoch": 0.87, - "learning_rate": 0.00016984878966837562, - "loss": 0.0407, + "epoch": 0.52, + "learning_rate": 0.00022233617534869008, + "loss": 0.0567, "step": 80220 }, { - "epoch": 0.87, - "learning_rate": 0.00016983256538386657, - "loss": 0.0468, + "epoch": 0.52, + "learning_rate": 0.00022232649399433316, + "loss": 0.0448, "step": 80230 }, { - "epoch": 0.87, - "learning_rate": 0.0001698163410993575, - "loss": 0.0385, + "epoch": 0.52, + "learning_rate": 0.00022231681263997622, + "loss": 0.0492, "step": 80240 }, { - "epoch": 0.87, - "learning_rate": 0.00016980011681484846, - "loss": 0.0472, + "epoch": 0.52, + "learning_rate": 0.0002223071312856193, + "loss": 0.051, "step": 80250 }, { - "epoch": 0.87, - "learning_rate": 0.0001697838925303394, - "loss": 0.0436, + "epoch": 0.52, + "learning_rate": 0.00022229744993126238, + "loss": 0.0451, "step": 80260 }, { - "epoch": 0.87, - "learning_rate": 0.00016976766824583036, - "loss": 0.0478, + "epoch": 0.52, + "learning_rate": 0.00022228776857690546, + "loss": 0.0485, "step": 80270 }, { - "epoch": 0.87, - "learning_rate": 0.0001697514439613213, - "loss": 0.0436, + "epoch": 0.52, + "learning_rate": 0.00022227808722254848, + "loss": 0.0519, "step": 80280 }, { - "epoch": 0.87, - "learning_rate": 0.00016973521967681226, - "loss": 0.0374, + "epoch": 0.52, + "learning_rate": 0.00022226840586819156, + "loss": 0.0552, "step": 80290 }, { - "epoch": 0.87, - "learning_rate": 0.00016971899539230319, - "loss": 0.0456, + "epoch": 0.52, + "learning_rate": 0.00022225872451383464, + "loss": 0.0598, "step": 80300 }, { - "epoch": 0.87, - "learning_rate": 0.00016970277110779414, - "loss": 0.0505, + "epoch": 0.52, + "learning_rate": 0.0002222490431594777, + "loss": 0.0481, "step": 80310 }, { - "epoch": 0.87, - "learning_rate": 0.00016968654682328509, - "loss": 0.0457, + "epoch": 0.52, + "learning_rate": 0.00022223936180512077, + "loss": 0.0521, "step": 80320 }, { - "epoch": 0.87, - "learning_rate": 0.00016967032253877604, - "loss": 0.0474, + "epoch": 0.52, + "learning_rate": 0.00022222968045076385, + "loss": 0.0528, "step": 80330 }, { - "epoch": 0.87, - "learning_rate": 0.00016965409825426696, - "loss": 0.0434, + "epoch": 0.52, + "learning_rate": 0.00022221999909640693, + "loss": 0.0475, "step": 80340 }, { - "epoch": 0.87, - "learning_rate": 0.00016963787396975794, - "loss": 0.046, + "epoch": 0.52, + "learning_rate": 0.00022221031774204996, + "loss": 0.0544, "step": 80350 }, { - "epoch": 0.87, - "learning_rate": 0.00016962164968524886, - "loss": 0.0376, + "epoch": 0.52, + "learning_rate": 0.00022220063638769304, + "loss": 0.061, "step": 80360 }, { - "epoch": 0.87, - "learning_rate": 0.00016960542540073983, - "loss": 0.0423, + "epoch": 0.52, + "learning_rate": 0.00022219095503333612, + "loss": 0.054, "step": 80370 }, { - "epoch": 0.87, - "learning_rate": 0.00016958920111623076, - "loss": 0.0452, + "epoch": 0.52, + "learning_rate": 0.00022218127367897917, + "loss": 0.0535, "step": 80380 }, { - "epoch": 0.87, - "learning_rate": 0.0001695729768317217, - "loss": 0.0498, + "epoch": 0.52, + "learning_rate": 0.00022217159232462225, + "loss": 0.0536, "step": 80390 }, { - "epoch": 0.87, - "learning_rate": 0.00016955675254721266, - "loss": 0.0477, + "epoch": 0.52, + "learning_rate": 0.00022216191097026533, + "loss": 0.05, "step": 80400 }, { - "epoch": 0.87, - "learning_rate": 0.0001695405282627036, - "loss": 0.0436, + "epoch": 0.52, + "learning_rate": 0.00022215222961590838, + "loss": 0.0475, "step": 80410 }, { - "epoch": 0.87, - "learning_rate": 0.00016952430397819453, - "loss": 0.0448, + "epoch": 0.52, + "learning_rate": 0.00022214254826155144, + "loss": 0.0543, "step": 80420 }, { - "epoch": 0.87, - "learning_rate": 0.0001695080796936855, - "loss": 0.045, + "epoch": 0.52, + "learning_rate": 0.00022213286690719452, + "loss": 0.0506, "step": 80430 }, { - "epoch": 0.87, - "learning_rate": 0.00016949185540917643, - "loss": 0.0389, + "epoch": 0.52, + "learning_rate": 0.00022212318555283757, + "loss": 0.0489, "step": 80440 }, { - "epoch": 0.87, - "learning_rate": 0.0001694756311246674, - "loss": 0.0482, + "epoch": 0.52, + "learning_rate": 0.00022211350419848065, + "loss": 0.0594, "step": 80450 }, { - "epoch": 0.87, - "learning_rate": 0.00016945940684015833, - "loss": 0.0383, + "epoch": 0.52, + "learning_rate": 0.00022210382284412373, + "loss": 0.0516, "step": 80460 }, { - "epoch": 0.87, - "learning_rate": 0.0001694431825556493, - "loss": 0.0507, + "epoch": 0.52, + "learning_rate": 0.0002220941414897668, + "loss": 0.0513, "step": 80470 }, { - "epoch": 0.87, - "learning_rate": 0.00016942695827114023, - "loss": 0.053, + "epoch": 0.52, + "learning_rate": 0.00022208446013540986, + "loss": 0.0563, "step": 80480 }, { - "epoch": 0.87, - "learning_rate": 0.00016941073398663118, - "loss": 0.0425, + "epoch": 0.52, + "learning_rate": 0.0002220747787810529, + "loss": 0.0568, "step": 80490 }, { - "epoch": 0.87, - "learning_rate": 0.00016939450970212213, - "loss": 0.048, + "epoch": 0.52, + "learning_rate": 0.000222065097426696, + "loss": 0.0532, "step": 80500 }, { - "epoch": 0.87, - "learning_rate": 0.00016937828541761308, - "loss": 0.0412, + "epoch": 0.52, + "learning_rate": 0.00022205541607233905, + "loss": 0.0533, "step": 80510 }, { - "epoch": 0.87, - "learning_rate": 0.000169362061133104, - "loss": 0.0447, + "epoch": 0.52, + "learning_rate": 0.00022204573471798212, + "loss": 0.064, "step": 80520 }, { - "epoch": 0.87, - "learning_rate": 0.00016934583684859498, - "loss": 0.0494, + "epoch": 0.52, + "learning_rate": 0.0002220360533636252, + "loss": 0.0501, "step": 80530 }, { - "epoch": 0.87, - "learning_rate": 0.0001693296125640859, - "loss": 0.0421, + "epoch": 0.52, + "learning_rate": 0.00022202637200926828, + "loss": 0.0591, "step": 80540 }, { - "epoch": 0.87, - "learning_rate": 0.00016931338827957688, - "loss": 0.0491, + "epoch": 0.52, + "learning_rate": 0.00022201669065491134, + "loss": 0.0454, "step": 80550 }, { - "epoch": 0.87, - "learning_rate": 0.0001692971639950678, - "loss": 0.037, + "epoch": 0.52, + "learning_rate": 0.0002220070093005544, + "loss": 0.0514, "step": 80560 }, { - "epoch": 0.87, - "learning_rate": 0.00016928093971055875, - "loss": 0.0514, + "epoch": 0.52, + "learning_rate": 0.00022199732794619747, + "loss": 0.0493, "step": 80570 }, { - "epoch": 0.87, - "learning_rate": 0.0001692647154260497, - "loss": 0.0429, + "epoch": 0.52, + "learning_rate": 0.00022198764659184052, + "loss": 0.0481, "step": 80580 }, { - "epoch": 0.87, - "learning_rate": 0.00016924849114154065, - "loss": 0.0432, + "epoch": 0.52, + "learning_rate": 0.0002219779652374836, + "loss": 0.0474, "step": 80590 }, { - "epoch": 0.87, - "learning_rate": 0.00016923226685703157, - "loss": 0.0393, + "epoch": 0.52, + "learning_rate": 0.00022196828388312668, + "loss": 0.05, "step": 80600 }, { - "epoch": 0.87, - "learning_rate": 0.00016921604257252255, - "loss": 0.05, + "epoch": 0.52, + "learning_rate": 0.00022195860252876973, + "loss": 0.0455, "step": 80610 }, { - "epoch": 0.87, - "learning_rate": 0.00016919981828801347, - "loss": 0.0425, + "epoch": 0.52, + "learning_rate": 0.00022194892117441281, + "loss": 0.0493, "step": 80620 }, { - "epoch": 0.87, - "learning_rate": 0.00016918359400350445, - "loss": 0.0495, + "epoch": 0.52, + "learning_rate": 0.00022193923982005587, + "loss": 0.0513, "step": 80630 }, { - "epoch": 0.87, - "learning_rate": 0.00016916736971899537, - "loss": 0.0408, + "epoch": 0.52, + "learning_rate": 0.00022192955846569892, + "loss": 0.0448, "step": 80640 }, { - "epoch": 0.87, - "learning_rate": 0.00016915114543448635, + "epoch": 0.52, + "learning_rate": 0.000221919877111342, "loss": 0.0461, "step": 80650 }, { - "epoch": 0.87, - "learning_rate": 0.00016913492114997727, - "loss": 0.0421, + "epoch": 0.52, + "learning_rate": 0.00022191019575698508, + "loss": 0.05, "step": 80660 }, { - "epoch": 0.87, - "learning_rate": 0.00016911869686546822, - "loss": 0.0463, + "epoch": 0.52, + "learning_rate": 0.00022190051440262816, + "loss": 0.0514, "step": 80670 }, { - "epoch": 0.87, - "learning_rate": 0.00016910247258095917, - "loss": 0.0408, + "epoch": 0.52, + "learning_rate": 0.0002218908330482712, + "loss": 0.0515, "step": 80680 }, { - "epoch": 0.87, - "learning_rate": 0.00016908624829645012, - "loss": 0.0401, + "epoch": 0.52, + "learning_rate": 0.0002218811516939143, + "loss": 0.0485, "step": 80690 }, { - "epoch": 0.87, - "learning_rate": 0.00016907002401194104, - "loss": 0.0401, + "epoch": 0.52, + "learning_rate": 0.00022187147033955734, + "loss": 0.049, "step": 80700 }, { - "epoch": 0.87, - "learning_rate": 0.00016905379972743202, - "loss": 0.0472, + "epoch": 0.52, + "learning_rate": 0.0002218617889852004, + "loss": 0.0489, "step": 80710 }, { - "epoch": 0.87, - "learning_rate": 0.00016903757544292294, - "loss": 0.0425, + "epoch": 0.52, + "learning_rate": 0.00022185210763084348, + "loss": 0.0537, "step": 80720 }, { - "epoch": 0.87, - "learning_rate": 0.00016902135115841392, - "loss": 0.0472, + "epoch": 0.52, + "learning_rate": 0.00022184242627648656, + "loss": 0.0529, "step": 80730 }, { - "epoch": 0.87, - "learning_rate": 0.00016900512687390484, - "loss": 0.0407, + "epoch": 0.52, + "learning_rate": 0.00022183274492212964, + "loss": 0.0562, "step": 80740 }, { - "epoch": 0.87, - "learning_rate": 0.0001689889025893958, - "loss": 0.0441, + "epoch": 0.52, + "learning_rate": 0.0002218230635677727, + "loss": 0.05, "step": 80750 }, { - "epoch": 0.87, - "learning_rate": 0.00016897267830488674, - "loss": 0.0438, + "epoch": 0.52, + "learning_rate": 0.00022181338221341577, + "loss": 0.0521, "step": 80760 }, { - "epoch": 0.87, - "learning_rate": 0.0001689564540203777, - "loss": 0.0426, + "epoch": 0.52, + "learning_rate": 0.00022180370085905882, + "loss": 0.0473, "step": 80770 }, { - "epoch": 0.87, - "learning_rate": 0.00016894022973586864, - "loss": 0.044, + "epoch": 0.52, + "learning_rate": 0.00022179401950470187, + "loss": 0.0475, "step": 80780 }, { - "epoch": 0.87, - "learning_rate": 0.0001689240054513596, - "loss": 0.0457, + "epoch": 0.52, + "learning_rate": 0.00022178433815034495, + "loss": 0.0504, "step": 80790 }, { - "epoch": 0.87, - "learning_rate": 0.0001689077811668505, - "loss": 0.0412, + "epoch": 0.52, + "learning_rate": 0.00022177465679598803, + "loss": 0.0516, "step": 80800 }, { - "epoch": 0.87, - "learning_rate": 0.0001688915568823415, - "loss": 0.042, + "epoch": 0.52, + "learning_rate": 0.0002217649754416311, + "loss": 0.0519, "step": 80810 }, { - "epoch": 0.87, - "learning_rate": 0.0001688753325978324, - "loss": 0.0442, + "epoch": 0.52, + "learning_rate": 0.00022175529408727417, + "loss": 0.0618, "step": 80820 }, { - "epoch": 0.87, - "learning_rate": 0.0001688591083133234, - "loss": 0.0403, + "epoch": 0.52, + "learning_rate": 0.00022174561273291725, + "loss": 0.0492, "step": 80830 }, { - "epoch": 0.87, - "learning_rate": 0.0001688428840288143, - "loss": 0.0462, + "epoch": 0.52, + "learning_rate": 0.00022173593137856027, + "loss": 0.0557, "step": 80840 }, { - "epoch": 0.87, - "learning_rate": 0.00016882665974430526, - "loss": 0.0491, + "epoch": 0.52, + "learning_rate": 0.00022172625002420335, + "loss": 0.0457, "step": 80850 }, { - "epoch": 0.87, - "learning_rate": 0.0001688104354597962, - "loss": 0.0407, + "epoch": 0.52, + "learning_rate": 0.00022171656866984643, + "loss": 0.0432, "step": 80860 }, { - "epoch": 0.87, - "learning_rate": 0.00016879421117528716, - "loss": 0.0406, + "epoch": 0.52, + "learning_rate": 0.0002217068873154895, + "loss": 0.0525, "step": 80870 }, { - "epoch": 0.87, - "learning_rate": 0.00016877798689077808, - "loss": 0.0439, + "epoch": 0.52, + "learning_rate": 0.00022169720596113256, + "loss": 0.0435, "step": 80880 }, { - "epoch": 0.87, - "learning_rate": 0.00016876176260626906, - "loss": 0.0357, + "epoch": 0.52, + "learning_rate": 0.00022168752460677564, + "loss": 0.0463, "step": 80890 }, { - "epoch": 0.88, - "learning_rate": 0.00016874553832175998, - "loss": 0.0436, + "epoch": 0.52, + "learning_rate": 0.00022167784325241872, + "loss": 0.0485, "step": 80900 }, { - "epoch": 0.88, - "learning_rate": 0.00016872931403725096, - "loss": 0.0459, + "epoch": 0.52, + "learning_rate": 0.00022166816189806175, + "loss": 0.0481, "step": 80910 }, { - "epoch": 0.88, - "learning_rate": 0.00016871308975274188, - "loss": 0.0548, + "epoch": 0.52, + "learning_rate": 0.00022165848054370483, + "loss": 0.0508, "step": 80920 }, { - "epoch": 0.88, - "learning_rate": 0.00016869686546823283, - "loss": 0.0445, + "epoch": 0.52, + "learning_rate": 0.0002216487991893479, + "loss": 0.0629, "step": 80930 }, { - "epoch": 0.88, - "learning_rate": 0.00016868064118372378, - "loss": 0.0461, + "epoch": 0.52, + "learning_rate": 0.000221639117834991, + "loss": 0.049, "step": 80940 }, { - "epoch": 0.88, - "learning_rate": 0.00016866441689921473, - "loss": 0.047, + "epoch": 0.52, + "learning_rate": 0.00022162943648063404, + "loss": 0.0491, "step": 80950 }, { - "epoch": 0.88, - "learning_rate": 0.00016864819261470568, - "loss": 0.0464, + "epoch": 0.52, + "learning_rate": 0.00022161975512627712, + "loss": 0.0483, "step": 80960 }, { - "epoch": 0.88, - "learning_rate": 0.00016863196833019663, - "loss": 0.0495, + "epoch": 0.52, + "learning_rate": 0.0002216100737719202, + "loss": 0.0541, "step": 80970 }, { - "epoch": 0.88, - "learning_rate": 0.00016861574404568755, - "loss": 0.0547, + "epoch": 0.52, + "learning_rate": 0.00022160039241756323, + "loss": 0.0552, "step": 80980 }, { - "epoch": 0.88, - "learning_rate": 0.00016859951976117853, - "loss": 0.0433, + "epoch": 0.52, + "learning_rate": 0.0002215907110632063, + "loss": 0.0471, "step": 80990 }, { - "epoch": 0.88, - "learning_rate": 0.00016858329547666945, - "loss": 0.0466, + "epoch": 0.52, + "learning_rate": 0.00022158102970884939, + "loss": 0.0568, "step": 81000 }, { - "epoch": 0.88, - "eval_cer": 0.9211613931487558, - "eval_loss": 0.03210368752479553, - "eval_runtime": 118.9204, - "eval_samples_per_second": 16.818, - "eval_steps_per_second": 4.204, + "epoch": 0.52, + "eval_cer": 0.9199439611343351, + "eval_loss": 0.0355331152677536, + "eval_runtime": 120.0549, + "eval_samples_per_second": 16.659, + "eval_steps_per_second": 4.165, "step": 81000 }, { - "epoch": 0.88, - "learning_rate": 0.00016856707119216043, - "loss": 0.0493, + "epoch": 0.52, + "learning_rate": 0.00022157134835449244, + "loss": 0.0538, "step": 81010 }, { - "epoch": 0.88, - "learning_rate": 0.00016855084690765135, - "loss": 0.0448, + "epoch": 0.52, + "learning_rate": 0.00022156166700013552, + "loss": 0.0606, "step": 81020 }, { - "epoch": 0.88, - "learning_rate": 0.0001685346226231423, - "loss": 0.0408, + "epoch": 0.52, + "learning_rate": 0.0002215519856457786, + "loss": 0.0529, "step": 81030 }, { - "epoch": 0.88, - "learning_rate": 0.00016851839833863325, - "loss": 0.0561, + "epoch": 0.52, + "learning_rate": 0.00022154230429142168, + "loss": 0.0556, "step": 81040 }, { - "epoch": 0.88, - "learning_rate": 0.0001685021740541242, - "loss": 0.0508, + "epoch": 0.52, + "learning_rate": 0.0002215326229370647, + "loss": 0.0502, "step": 81050 }, { - "epoch": 0.88, - "learning_rate": 0.00016848594976961512, - "loss": 0.045, + "epoch": 0.52, + "learning_rate": 0.00022152294158270778, + "loss": 0.0505, "step": 81060 }, { - "epoch": 0.88, - "learning_rate": 0.0001684697254851061, - "loss": 0.0457, + "epoch": 0.52, + "learning_rate": 0.00022151326022835086, + "loss": 0.053, "step": 81070 }, { - "epoch": 0.88, - "learning_rate": 0.00016845350120059702, - "loss": 0.0521, + "epoch": 0.52, + "learning_rate": 0.00022150357887399392, + "loss": 0.0491, "step": 81080 }, { - "epoch": 0.88, - "learning_rate": 0.000168437276916088, - "loss": 0.0428, + "epoch": 0.52, + "learning_rate": 0.000221493897519637, + "loss": 0.0528, "step": 81090 }, { - "epoch": 0.88, - "learning_rate": 0.00016842105263157892, - "loss": 0.0447, + "epoch": 0.52, + "learning_rate": 0.00022148421616528008, + "loss": 0.0614, "step": 81100 }, { - "epoch": 0.88, - "learning_rate": 0.00016840482834706987, - "loss": 0.0454, + "epoch": 0.52, + "learning_rate": 0.00022147453481092316, + "loss": 0.0537, "step": 81110 }, { - "epoch": 0.88, - "learning_rate": 0.00016838860406256082, - "loss": 0.0408, + "epoch": 0.52, + "learning_rate": 0.00022146485345656618, + "loss": 0.0541, "step": 81120 }, { - "epoch": 0.88, - "learning_rate": 0.00016837237977805177, - "loss": 0.039, + "epoch": 0.52, + "learning_rate": 0.00022145517210220926, + "loss": 0.0515, "step": 81130 }, { - "epoch": 0.88, - "learning_rate": 0.00016835615549354272, - "loss": 0.0388, + "epoch": 0.52, + "learning_rate": 0.00022144549074785234, + "loss": 0.051, "step": 81140 }, { - "epoch": 0.88, - "learning_rate": 0.00016833993120903367, - "loss": 0.048, + "epoch": 0.52, + "learning_rate": 0.0002214358093934954, + "loss": 0.0531, "step": 81150 }, { - "epoch": 0.88, - "learning_rate": 0.0001683237069245246, - "loss": 0.0443, + "epoch": 0.52, + "learning_rate": 0.00022142612803913847, + "loss": 0.0615, "step": 81160 }, { - "epoch": 0.88, - "learning_rate": 0.00016830748264001557, - "loss": 0.0396, + "epoch": 0.52, + "learning_rate": 0.00022141644668478155, + "loss": 0.053, "step": 81170 }, { - "epoch": 0.88, - "learning_rate": 0.0001682912583555065, - "loss": 0.0476, + "epoch": 0.52, + "learning_rate": 0.0002214067653304246, + "loss": 0.0436, "step": 81180 }, { - "epoch": 0.88, - "learning_rate": 0.00016827503407099747, - "loss": 0.0466, + "epoch": 0.52, + "learning_rate": 0.00022139708397606766, + "loss": 0.0557, "step": 81190 }, { - "epoch": 0.88, - "learning_rate": 0.0001682588097864884, - "loss": 0.042, + "epoch": 0.52, + "learning_rate": 0.00022138740262171074, + "loss": 0.0536, "step": 81200 }, { - "epoch": 0.88, - "learning_rate": 0.00016824258550197934, - "loss": 0.0473, + "epoch": 0.52, + "learning_rate": 0.0002213777212673538, + "loss": 0.0523, "step": 81210 }, { - "epoch": 0.88, - "learning_rate": 0.0001682263612174703, - "loss": 0.0422, + "epoch": 0.52, + "learning_rate": 0.00022136803991299687, + "loss": 0.0515, "step": 81220 }, { - "epoch": 0.88, - "learning_rate": 0.00016821013693296124, - "loss": 0.0446, + "epoch": 0.52, + "learning_rate": 0.00022135835855863995, + "loss": 0.0515, "step": 81230 }, { - "epoch": 0.88, - "learning_rate": 0.00016819391264845217, - "loss": 0.0399, + "epoch": 0.52, + "learning_rate": 0.00022134867720428303, + "loss": 0.0524, "step": 81240 }, { - "epoch": 0.88, - "learning_rate": 0.00016817768836394314, - "loss": 0.049, + "epoch": 0.52, + "learning_rate": 0.00022133899584992608, + "loss": 0.0498, "step": 81250 }, { - "epoch": 0.88, - "learning_rate": 0.00016816146407943407, - "loss": 0.0461, + "epoch": 0.52, + "learning_rate": 0.00022132931449556914, + "loss": 0.0462, "step": 81260 }, { - "epoch": 0.88, - "learning_rate": 0.00016814523979492504, - "loss": 0.0486, + "epoch": 0.52, + "learning_rate": 0.00022131963314121221, + "loss": 0.0487, "step": 81270 }, { - "epoch": 0.88, - "learning_rate": 0.00016812901551041597, - "loss": 0.0481, + "epoch": 0.52, + "learning_rate": 0.00022130995178685527, + "loss": 0.0525, "step": 81280 }, { - "epoch": 0.88, - "learning_rate": 0.00016811279122590692, - "loss": 0.0557, + "epoch": 0.52, + "learning_rate": 0.00022130027043249835, + "loss": 0.0481, "step": 81290 }, { - "epoch": 0.88, - "learning_rate": 0.00016809656694139787, - "loss": 0.0427, + "epoch": 0.52, + "learning_rate": 0.00022129058907814143, + "loss": 0.0568, "step": 81300 }, { - "epoch": 0.88, - "learning_rate": 0.00016808034265688882, - "loss": 0.0421, + "epoch": 0.52, + "learning_rate": 0.0002212809077237845, + "loss": 0.0516, "step": 81310 }, { - "epoch": 0.88, - "learning_rate": 0.00016806411837237976, - "loss": 0.0425, + "epoch": 0.52, + "learning_rate": 0.00022127122636942756, + "loss": 0.0519, "step": 81320 }, { - "epoch": 0.88, - "learning_rate": 0.00016804789408787071, - "loss": 0.0502, + "epoch": 0.52, + "learning_rate": 0.0002212615450150706, + "loss": 0.0561, "step": 81330 }, { - "epoch": 0.88, - "learning_rate": 0.00016803166980336164, - "loss": 0.0493, + "epoch": 0.52, + "learning_rate": 0.0002212518636607137, + "loss": 0.0487, "step": 81340 }, { - "epoch": 0.88, - "learning_rate": 0.00016801544551885261, - "loss": 0.0402, + "epoch": 0.53, + "learning_rate": 0.00022124218230635674, + "loss": 0.0579, "step": 81350 }, { - "epoch": 0.88, - "learning_rate": 0.00016799922123434354, - "loss": 0.0456, + "epoch": 0.53, + "learning_rate": 0.00022123250095199982, + "loss": 0.0523, "step": 81360 }, { - "epoch": 0.88, - "learning_rate": 0.00016798299694983451, - "loss": 0.0483, + "epoch": 0.53, + "learning_rate": 0.0002212228195976429, + "loss": 0.0571, "step": 81370 }, { - "epoch": 0.88, - "learning_rate": 0.00016796677266532544, - "loss": 0.0456, + "epoch": 0.53, + "learning_rate": 0.00022121313824328596, + "loss": 0.0454, "step": 81380 }, { - "epoch": 0.88, - "learning_rate": 0.00016795054838081639, - "loss": 0.0411, + "epoch": 0.53, + "learning_rate": 0.00022120345688892904, + "loss": 0.0458, "step": 81390 }, { - "epoch": 0.88, - "learning_rate": 0.00016793432409630734, - "loss": 0.0438, + "epoch": 0.53, + "learning_rate": 0.0002211937755345721, + "loss": 0.0607, "step": 81400 }, { - "epoch": 0.88, - "learning_rate": 0.00016791809981179829, - "loss": 0.0417, + "epoch": 0.53, + "learning_rate": 0.00022118409418021514, + "loss": 0.0487, "step": 81410 }, { - "epoch": 0.88, - "learning_rate": 0.0001679018755272892, - "loss": 0.0396, + "epoch": 0.53, + "learning_rate": 0.00022117441282585822, + "loss": 0.0519, "step": 81420 }, { - "epoch": 0.88, - "learning_rate": 0.00016788565124278019, - "loss": 0.0422, + "epoch": 0.53, + "learning_rate": 0.0002211647314715013, + "loss": 0.0634, "step": 81430 }, { - "epoch": 0.88, - "learning_rate": 0.0001678694269582711, - "loss": 0.0555, + "epoch": 0.53, + "learning_rate": 0.00022115505011714438, + "loss": 0.0475, "step": 81440 }, { - "epoch": 0.88, - "learning_rate": 0.00016785320267376208, - "loss": 0.0453, + "epoch": 0.53, + "learning_rate": 0.00022114536876278743, + "loss": 0.0577, "step": 81450 }, { - "epoch": 0.88, - "learning_rate": 0.000167836978389253, - "loss": 0.0498, + "epoch": 0.53, + "learning_rate": 0.00022113568740843051, + "loss": 0.0516, "step": 81460 }, { - "epoch": 0.88, - "learning_rate": 0.00016782075410474398, - "loss": 0.0409, + "epoch": 0.53, + "learning_rate": 0.00022112600605407357, + "loss": 0.0603, "step": 81470 }, { - "epoch": 0.88, - "learning_rate": 0.0001678045298202349, - "loss": 0.0411, + "epoch": 0.53, + "learning_rate": 0.00022111632469971662, + "loss": 0.0465, "step": 81480 }, { - "epoch": 0.88, - "learning_rate": 0.00016778830553572586, - "loss": 0.0496, + "epoch": 0.53, + "learning_rate": 0.0002211066433453597, + "loss": 0.0478, "step": 81490 }, { - "epoch": 0.88, - "learning_rate": 0.0001677720812512168, - "loss": 0.0461, + "epoch": 0.53, + "learning_rate": 0.00022109696199100278, + "loss": 0.0497, "step": 81500 }, { - "epoch": 0.88, - "learning_rate": 0.00016775585696670776, - "loss": 0.0436, + "epoch": 0.53, + "learning_rate": 0.00022108728063664586, + "loss": 0.0535, "step": 81510 }, { - "epoch": 0.88, - "learning_rate": 0.00016773963268219868, - "loss": 0.0425, + "epoch": 0.53, + "learning_rate": 0.0002210775992822889, + "loss": 0.0523, "step": 81520 }, { - "epoch": 0.88, - "learning_rate": 0.00016772340839768966, - "loss": 0.0455, + "epoch": 0.53, + "learning_rate": 0.000221067917927932, + "loss": 0.0639, "step": 81530 }, { - "epoch": 0.88, - "learning_rate": 0.00016770718411318058, - "loss": 0.0419, + "epoch": 0.53, + "learning_rate": 0.00022105823657357504, + "loss": 0.0515, "step": 81540 }, { - "epoch": 0.88, - "learning_rate": 0.00016769095982867156, - "loss": 0.0427, + "epoch": 0.53, + "learning_rate": 0.0002210485552192181, + "loss": 0.0516, "step": 81550 }, { - "epoch": 0.88, - "learning_rate": 0.00016767473554416248, - "loss": 0.0417, + "epoch": 0.53, + "learning_rate": 0.00022103887386486118, + "loss": 0.0494, "step": 81560 }, { - "epoch": 0.88, - "learning_rate": 0.00016765851125965343, - "loss": 0.0446, + "epoch": 0.53, + "learning_rate": 0.00022102919251050426, + "loss": 0.0496, "step": 81570 }, { - "epoch": 0.88, - "learning_rate": 0.00016764228697514438, - "loss": 0.0429, + "epoch": 0.53, + "learning_rate": 0.0002210195111561473, + "loss": 0.0542, "step": 81580 }, { - "epoch": 0.88, - "learning_rate": 0.00016762606269063533, - "loss": 0.0474, + "epoch": 0.53, + "learning_rate": 0.0002210098298017904, + "loss": 0.0542, "step": 81590 }, { - "epoch": 0.88, - "learning_rate": 0.00016760983840612625, - "loss": 0.0478, + "epoch": 0.53, + "learning_rate": 0.00022100014844743347, + "loss": 0.0519, "step": 81600 }, { - "epoch": 0.88, - "learning_rate": 0.00016759361412161723, - "loss": 0.042, + "epoch": 0.53, + "learning_rate": 0.0002209904670930765, + "loss": 0.0476, "step": 81610 }, { - "epoch": 0.88, - "learning_rate": 0.00016757738983710815, - "loss": 0.0409, + "epoch": 0.53, + "learning_rate": 0.00022098078573871957, + "loss": 0.0527, "step": 81620 }, { - "epoch": 0.88, - "learning_rate": 0.00016756116555259913, - "loss": 0.0401, + "epoch": 0.53, + "learning_rate": 0.00022097110438436265, + "loss": 0.0481, "step": 81630 }, { - "epoch": 0.88, - "learning_rate": 0.00016754494126809005, - "loss": 0.0431, + "epoch": 0.53, + "learning_rate": 0.00022096142303000573, + "loss": 0.0486, "step": 81640 }, { - "epoch": 0.88, - "learning_rate": 0.00016752871698358103, - "loss": 0.0444, + "epoch": 0.53, + "learning_rate": 0.00022095174167564879, + "loss": 0.0584, "step": 81650 }, { - "epoch": 0.88, - "learning_rate": 0.00016751249269907195, - "loss": 0.0406, + "epoch": 0.53, + "learning_rate": 0.00022094206032129187, + "loss": 0.0502, "step": 81660 }, { - "epoch": 0.88, - "learning_rate": 0.0001674962684145629, - "loss": 0.0415, + "epoch": 0.53, + "learning_rate": 0.00022093237896693495, + "loss": 0.0488, "step": 81670 }, { - "epoch": 0.88, - "learning_rate": 0.00016748004413005385, - "loss": 0.0463, + "epoch": 0.53, + "learning_rate": 0.00022092269761257797, + "loss": 0.0529, "step": 81680 }, { - "epoch": 0.88, - "learning_rate": 0.0001674638198455448, - "loss": 0.0416, + "epoch": 0.53, + "learning_rate": 0.00022091301625822105, + "loss": 0.0493, "step": 81690 }, { - "epoch": 0.88, - "learning_rate": 0.00016744759556103572, - "loss": 0.0398, + "epoch": 0.53, + "learning_rate": 0.00022090333490386413, + "loss": 0.0492, "step": 81700 }, { - "epoch": 0.88, - "learning_rate": 0.0001674313712765267, - "loss": 0.0436, + "epoch": 0.53, + "learning_rate": 0.0002208936535495072, + "loss": 0.0502, "step": 81710 }, { - "epoch": 0.88, - "learning_rate": 0.00016741514699201762, - "loss": 0.046, + "epoch": 0.53, + "learning_rate": 0.00022088397219515026, + "loss": 0.0567, "step": 81720 }, { - "epoch": 0.88, - "learning_rate": 0.0001673989227075086, - "loss": 0.0396, + "epoch": 0.53, + "learning_rate": 0.00022087429084079334, + "loss": 0.0524, "step": 81730 }, { - "epoch": 0.88, - "learning_rate": 0.00016738269842299952, - "loss": 0.0426, + "epoch": 0.53, + "learning_rate": 0.00022086460948643642, + "loss": 0.054, "step": 81740 }, { - "epoch": 0.88, - "learning_rate": 0.00016736647413849047, - "loss": 0.0468, + "epoch": 0.53, + "learning_rate": 0.00022085492813207945, + "loss": 0.0536, "step": 81750 }, { - "epoch": 0.88, - "learning_rate": 0.00016735024985398142, - "loss": 0.0417, + "epoch": 0.53, + "learning_rate": 0.00022084524677772253, + "loss": 0.0531, "step": 81760 }, { - "epoch": 0.88, - "learning_rate": 0.00016733402556947237, - "loss": 0.0465, + "epoch": 0.53, + "learning_rate": 0.0002208355654233656, + "loss": 0.0686, "step": 81770 }, { - "epoch": 0.88, - "learning_rate": 0.0001673178012849633, - "loss": 0.0416, + "epoch": 0.53, + "learning_rate": 0.00022082588406900866, + "loss": 0.0572, "step": 81780 }, { - "epoch": 0.88, - "learning_rate": 0.00016730157700045427, - "loss": 0.0428, + "epoch": 0.53, + "learning_rate": 0.00022081620271465174, + "loss": 0.0511, "step": 81790 }, { - "epoch": 0.88, - "learning_rate": 0.0001672853527159452, - "loss": 0.0464, + "epoch": 0.53, + "learning_rate": 0.00022080652136029482, + "loss": 0.0511, "step": 81800 }, { - "epoch": 0.88, - "learning_rate": 0.00016726912843143617, - "loss": 0.0442, + "epoch": 0.53, + "learning_rate": 0.0002207968400059379, + "loss": 0.0528, "step": 81810 }, { - "epoch": 0.88, - "learning_rate": 0.0001672529041469271, - "loss": 0.041, + "epoch": 0.53, + "learning_rate": 0.00022078715865158093, + "loss": 0.0476, "step": 81820 }, { - "epoch": 0.89, - "learning_rate": 0.00016723667986241807, - "loss": 0.0487, + "epoch": 0.53, + "learning_rate": 0.000220777477297224, + "loss": 0.055, "step": 81830 }, { - "epoch": 0.89, - "learning_rate": 0.000167220455577909, - "loss": 0.0464, + "epoch": 0.53, + "learning_rate": 0.00022076779594286709, + "loss": 0.0526, "step": 81840 }, { - "epoch": 0.89, - "learning_rate": 0.00016720423129339994, - "loss": 0.0479, + "epoch": 0.53, + "learning_rate": 0.00022075811458851014, + "loss": 0.048, "step": 81850 }, { - "epoch": 0.89, - "learning_rate": 0.0001671880070088909, - "loss": 0.0457, + "epoch": 0.53, + "learning_rate": 0.00022074843323415322, + "loss": 0.0499, "step": 81860 }, { - "epoch": 0.89, - "learning_rate": 0.00016717178272438184, - "loss": 0.0451, + "epoch": 0.53, + "learning_rate": 0.0002207387518797963, + "loss": 0.0472, "step": 81870 }, { - "epoch": 0.89, - "learning_rate": 0.00016715555843987276, - "loss": 0.045, + "epoch": 0.53, + "learning_rate": 0.00022072907052543938, + "loss": 0.0528, "step": 81880 }, { - "epoch": 0.89, - "learning_rate": 0.00016713933415536374, - "loss": 0.0447, + "epoch": 0.53, + "learning_rate": 0.0002207193891710824, + "loss": 0.0472, "step": 81890 }, { - "epoch": 0.89, - "learning_rate": 0.00016712310987085466, - "loss": 0.0492, + "epoch": 0.53, + "learning_rate": 0.00022070970781672548, + "loss": 0.0523, "step": 81900 }, { - "epoch": 0.89, - "learning_rate": 0.00016710688558634564, - "loss": 0.0499, + "epoch": 0.53, + "learning_rate": 0.00022070002646236856, + "loss": 0.0604, "step": 81910 }, { - "epoch": 0.89, - "learning_rate": 0.00016709066130183656, - "loss": 0.0398, + "epoch": 0.53, + "learning_rate": 0.00022069034510801162, + "loss": 0.05, "step": 81920 }, { - "epoch": 0.89, - "learning_rate": 0.0001670744370173275, - "loss": 0.0491, + "epoch": 0.53, + "learning_rate": 0.0002206806637536547, + "loss": 0.0501, "step": 81930 }, { - "epoch": 0.89, - "learning_rate": 0.00016705821273281846, - "loss": 0.049, + "epoch": 0.53, + "learning_rate": 0.00022067098239929777, + "loss": 0.0475, "step": 81940 }, { - "epoch": 0.89, - "learning_rate": 0.0001670419884483094, - "loss": 0.0472, + "epoch": 0.53, + "learning_rate": 0.00022066130104494085, + "loss": 0.0499, "step": 81950 }, { - "epoch": 0.89, - "learning_rate": 0.00016702576416380033, - "loss": 0.0401, + "epoch": 0.53, + "learning_rate": 0.00022065161969058388, + "loss": 0.056, "step": 81960 }, { - "epoch": 0.89, - "learning_rate": 0.0001670095398792913, - "loss": 0.046, + "epoch": 0.53, + "learning_rate": 0.00022064193833622696, + "loss": 0.0471, "step": 81970 }, { - "epoch": 0.89, - "learning_rate": 0.00016699331559478223, - "loss": 0.0486, + "epoch": 0.53, + "learning_rate": 0.00022063225698187, + "loss": 0.0555, "step": 81980 }, { - "epoch": 0.89, - "learning_rate": 0.0001669770913102732, - "loss": 0.0537, + "epoch": 0.53, + "learning_rate": 0.0002206225756275131, + "loss": 0.0568, "step": 81990 }, { - "epoch": 0.89, - "learning_rate": 0.00016696086702576413, - "loss": 0.0461, + "epoch": 0.53, + "learning_rate": 0.00022061289427315617, + "loss": 0.0486, "step": 82000 }, { - "epoch": 0.89, - "eval_cer": 0.9211675775390015, - "eval_loss": 0.031568411737680435, - "eval_runtime": 118.9166, - "eval_samples_per_second": 16.819, - "eval_steps_per_second": 4.205, + "epoch": 0.53, + "eval_cer": 0.9199421534289911, + "eval_loss": 0.03461761400103569, + "eval_runtime": 120.0302, + "eval_samples_per_second": 16.662, + "eval_steps_per_second": 4.166, "step": 82000 }, { - "epoch": 0.89, - "learning_rate": 0.0001669446427412551, - "loss": 0.047, + "epoch": 0.53, + "learning_rate": 0.00022060321291879925, + "loss": 0.0555, "step": 82010 }, { - "epoch": 0.89, - "learning_rate": 0.00016692841845674603, - "loss": 0.0487, + "epoch": 0.53, + "learning_rate": 0.0002205935315644423, + "loss": 0.0497, "step": 82020 }, { - "epoch": 0.89, - "learning_rate": 0.00016691219417223698, - "loss": 0.0407, + "epoch": 0.53, + "learning_rate": 0.00022058385021008536, + "loss": 0.0472, "step": 82030 }, { - "epoch": 0.89, - "learning_rate": 0.00016689596988772793, - "loss": 0.0437, + "epoch": 0.53, + "learning_rate": 0.00022057416885572844, + "loss": 0.0553, "step": 82040 }, { - "epoch": 0.89, - "learning_rate": 0.00016687974560321888, - "loss": 0.0449, + "epoch": 0.53, + "learning_rate": 0.0002205644875013715, + "loss": 0.062, "step": 82050 }, { - "epoch": 0.89, - "learning_rate": 0.0001668635213187098, - "loss": 0.0479, + "epoch": 0.53, + "learning_rate": 0.00022055480614701457, + "loss": 0.0539, "step": 82060 }, { - "epoch": 0.89, - "learning_rate": 0.00016684729703420078, - "loss": 0.0477, + "epoch": 0.53, + "learning_rate": 0.00022054512479265765, + "loss": 0.0505, "step": 82070 }, { - "epoch": 0.89, - "learning_rate": 0.0001668310727496917, - "loss": 0.0472, + "epoch": 0.53, + "learning_rate": 0.00022053544343830073, + "loss": 0.0493, "step": 82080 }, { - "epoch": 0.89, - "learning_rate": 0.00016681484846518268, - "loss": 0.0453, + "epoch": 0.53, + "learning_rate": 0.00022052576208394378, + "loss": 0.0463, "step": 82090 }, { - "epoch": 0.89, - "learning_rate": 0.0001667986241806736, - "loss": 0.0397, + "epoch": 0.53, + "learning_rate": 0.00022051608072958683, + "loss": 0.0541, "step": 82100 }, { - "epoch": 0.89, - "learning_rate": 0.00016678239989616455, - "loss": 0.0417, + "epoch": 0.53, + "learning_rate": 0.00022050639937522991, + "loss": 0.0531, "step": 82110 }, { - "epoch": 0.89, - "learning_rate": 0.0001667661756116555, - "loss": 0.0389, + "epoch": 0.53, + "learning_rate": 0.00022049671802087297, + "loss": 0.0475, "step": 82120 }, { - "epoch": 0.89, - "learning_rate": 0.00016674995132714645, - "loss": 0.041, + "epoch": 0.53, + "learning_rate": 0.00022048703666651605, + "loss": 0.0541, "step": 82130 }, { - "epoch": 0.89, - "learning_rate": 0.00016673372704263743, - "loss": 0.0415, + "epoch": 0.53, + "learning_rate": 0.00022047735531215913, + "loss": 0.0505, "step": 82140 }, { - "epoch": 0.89, - "learning_rate": 0.00016671750275812835, - "loss": 0.0501, + "epoch": 0.53, + "learning_rate": 0.0002204676739578022, + "loss": 0.0497, "step": 82150 }, { - "epoch": 0.89, - "learning_rate": 0.00016670127847361933, - "loss": 0.0388, + "epoch": 0.53, + "learning_rate": 0.00022045799260344526, + "loss": 0.0507, "step": 82160 }, { - "epoch": 0.89, - "learning_rate": 0.00016668505418911025, - "loss": 0.0461, + "epoch": 0.53, + "learning_rate": 0.0002204483112490883, + "loss": 0.0551, "step": 82170 }, { - "epoch": 0.89, - "learning_rate": 0.0001666688299046012, - "loss": 0.0449, + "epoch": 0.53, + "learning_rate": 0.00022043862989473136, + "loss": 0.0481, "step": 82180 }, { - "epoch": 0.89, - "learning_rate": 0.00016665260562009215, - "loss": 0.0476, + "epoch": 0.53, + "learning_rate": 0.00022042894854037444, + "loss": 0.046, "step": 82190 }, { - "epoch": 0.89, - "learning_rate": 0.0001666363813355831, - "loss": 0.0493, + "epoch": 0.53, + "learning_rate": 0.00022041926718601752, + "loss": 0.0567, "step": 82200 }, { - "epoch": 0.89, - "learning_rate": 0.00016662015705107402, - "loss": 0.0458, + "epoch": 0.53, + "learning_rate": 0.0002204095858316606, + "loss": 0.0481, "step": 82210 }, { - "epoch": 0.89, - "learning_rate": 0.000166603932766565, - "loss": 0.0424, + "epoch": 0.53, + "learning_rate": 0.00022039990447730366, + "loss": 0.0495, "step": 82220 }, { - "epoch": 0.89, - "learning_rate": 0.00016658770848205592, - "loss": 0.0567, + "epoch": 0.53, + "learning_rate": 0.00022039022312294674, + "loss": 0.057, "step": 82230 }, { - "epoch": 0.89, - "learning_rate": 0.0001665714841975469, - "loss": 0.0475, + "epoch": 0.53, + "learning_rate": 0.0002203805417685898, + "loss": 0.051, "step": 82240 }, { - "epoch": 0.89, - "learning_rate": 0.00016655525991303782, - "loss": 0.0443, + "epoch": 0.53, + "learning_rate": 0.00022037086041423284, + "loss": 0.0546, "step": 82250 }, { - "epoch": 0.89, - "learning_rate": 0.00016653903562852877, - "loss": 0.043, + "epoch": 0.53, + "learning_rate": 0.00022036117905987592, + "loss": 0.0457, "step": 82260 }, { - "epoch": 0.89, - "learning_rate": 0.00016652281134401972, - "loss": 0.0417, + "epoch": 0.53, + "learning_rate": 0.000220351497705519, + "loss": 0.0463, "step": 82270 }, { - "epoch": 0.89, - "learning_rate": 0.00016650658705951067, - "loss": 0.0395, + "epoch": 0.53, + "learning_rate": 0.00022034181635116208, + "loss": 0.048, "step": 82280 }, { - "epoch": 0.89, - "learning_rate": 0.0001664903627750016, - "loss": 0.0457, + "epoch": 0.53, + "learning_rate": 0.00022033213499680513, + "loss": 0.0486, "step": 82290 }, { - "epoch": 0.89, - "learning_rate": 0.00016647413849049257, - "loss": 0.0468, + "epoch": 0.53, + "learning_rate": 0.00022032245364244821, + "loss": 0.0541, "step": 82300 }, { - "epoch": 0.89, - "learning_rate": 0.0001664579142059835, - "loss": 0.0416, + "epoch": 0.53, + "learning_rate": 0.00022031277228809127, + "loss": 0.0569, "step": 82310 }, { - "epoch": 0.89, - "learning_rate": 0.00016644168992147447, - "loss": 0.0436, + "epoch": 0.53, + "learning_rate": 0.00022030309093373432, + "loss": 0.0471, "step": 82320 }, { - "epoch": 0.89, - "learning_rate": 0.0001664254656369654, - "loss": 0.0424, + "epoch": 0.53, + "learning_rate": 0.0002202934095793774, + "loss": 0.0494, "step": 82330 }, { - "epoch": 0.89, - "learning_rate": 0.00016640924135245637, - "loss": 0.0423, + "epoch": 0.53, + "learning_rate": 0.00022028372822502048, + "loss": 0.0527, "step": 82340 }, { - "epoch": 0.89, - "learning_rate": 0.0001663930170679473, - "loss": 0.0425, + "epoch": 0.53, + "learning_rate": 0.00022027404687066356, + "loss": 0.0513, "step": 82350 }, { - "epoch": 0.89, - "learning_rate": 0.00016637679278343824, - "loss": 0.0394, + "epoch": 0.53, + "learning_rate": 0.0002202643655163066, + "loss": 0.0551, "step": 82360 }, { - "epoch": 0.89, - "learning_rate": 0.0001663605684989292, - "loss": 0.0393, + "epoch": 0.53, + "learning_rate": 0.0002202546841619497, + "loss": 0.045, "step": 82370 }, { - "epoch": 0.89, - "learning_rate": 0.00016634434421442014, - "loss": 0.0446, + "epoch": 0.53, + "learning_rate": 0.00022024500280759272, + "loss": 0.0513, "step": 82380 }, { - "epoch": 0.89, - "learning_rate": 0.00016632811992991107, - "loss": 0.0412, + "epoch": 0.53, + "learning_rate": 0.0002202353214532358, + "loss": 0.0455, "step": 82390 }, { - "epoch": 0.89, - "learning_rate": 0.00016631189564540204, - "loss": 0.0421, + "epoch": 0.53, + "learning_rate": 0.00022022564009887888, + "loss": 0.0472, "step": 82400 }, { - "epoch": 0.89, - "learning_rate": 0.00016629567136089296, - "loss": 0.0379, + "epoch": 0.53, + "learning_rate": 0.00022021595874452196, + "loss": 0.0485, "step": 82410 }, { - "epoch": 0.89, - "learning_rate": 0.00016627944707638394, - "loss": 0.044, + "epoch": 0.53, + "learning_rate": 0.000220206277390165, + "loss": 0.0503, "step": 82420 }, { - "epoch": 0.89, - "learning_rate": 0.00016626322279187486, - "loss": 0.0366, + "epoch": 0.53, + "learning_rate": 0.0002201965960358081, + "loss": 0.051, "step": 82430 }, { - "epoch": 0.89, - "learning_rate": 0.00016624699850736581, - "loss": 0.0422, + "epoch": 0.53, + "learning_rate": 0.00022018691468145117, + "loss": 0.0496, "step": 82440 }, { - "epoch": 0.89, - "learning_rate": 0.00016623077422285676, - "loss": 0.0458, + "epoch": 0.53, + "learning_rate": 0.0002201772333270942, + "loss": 0.0435, "step": 82450 }, { - "epoch": 0.89, - "learning_rate": 0.0001662145499383477, - "loss": 0.0411, + "epoch": 0.53, + "learning_rate": 0.00022016755197273727, + "loss": 0.0535, "step": 82460 }, { - "epoch": 0.89, - "learning_rate": 0.00016619832565383864, - "loss": 0.0494, + "epoch": 0.53, + "learning_rate": 0.00022015787061838035, + "loss": 0.0479, "step": 82470 }, { - "epoch": 0.89, - "learning_rate": 0.0001661821013693296, - "loss": 0.0458, + "epoch": 0.53, + "learning_rate": 0.00022014818926402343, + "loss": 0.0654, "step": 82480 }, { - "epoch": 0.89, - "learning_rate": 0.00016616587708482054, - "loss": 0.0463, + "epoch": 0.53, + "learning_rate": 0.00022013850790966649, + "loss": 0.0512, "step": 82490 }, { - "epoch": 0.89, - "learning_rate": 0.0001661496528003115, - "loss": 0.0396, + "epoch": 0.53, + "learning_rate": 0.00022012882655530957, + "loss": 0.0513, "step": 82500 }, { - "epoch": 0.89, - "learning_rate": 0.00016613342851580244, - "loss": 0.0403, + "epoch": 0.53, + "learning_rate": 0.00022011914520095265, + "loss": 0.046, "step": 82510 }, { - "epoch": 0.89, - "learning_rate": 0.0001661172042312934, - "loss": 0.0415, + "epoch": 0.53, + "learning_rate": 0.00022010946384659567, + "loss": 0.0514, "step": 82520 }, { - "epoch": 0.89, - "learning_rate": 0.00016610097994678433, - "loss": 0.0484, + "epoch": 0.53, + "learning_rate": 0.00022009978249223875, + "loss": 0.0524, "step": 82530 }, { - "epoch": 0.89, - "learning_rate": 0.00016608475566227528, - "loss": 0.0508, + "epoch": 0.53, + "learning_rate": 0.00022009010113788183, + "loss": 0.0562, "step": 82540 }, { - "epoch": 0.89, - "learning_rate": 0.00016606853137776623, - "loss": 0.0424, + "epoch": 0.53, + "learning_rate": 0.0002200804197835249, + "loss": 0.0465, "step": 82550 }, { - "epoch": 0.89, - "learning_rate": 0.00016605230709325718, - "loss": 0.0479, + "epoch": 0.53, + "learning_rate": 0.00022007073842916796, + "loss": 0.0454, "step": 82560 }, { - "epoch": 0.89, - "learning_rate": 0.0001660360828087481, - "loss": 0.0438, + "epoch": 0.53, + "learning_rate": 0.00022006105707481104, + "loss": 0.0541, "step": 82570 }, { - "epoch": 0.89, - "learning_rate": 0.00016601985852423908, - "loss": 0.0468, + "epoch": 0.53, + "learning_rate": 0.00022005137572045412, + "loss": 0.0517, "step": 82580 }, { - "epoch": 0.89, - "learning_rate": 0.00016600363423973, - "loss": 0.0499, + "epoch": 0.53, + "learning_rate": 0.00022004169436609715, + "loss": 0.0503, "step": 82590 }, { - "epoch": 0.89, - "learning_rate": 0.00016598740995522098, - "loss": 0.0443, + "epoch": 0.53, + "learning_rate": 0.00022003201301174023, + "loss": 0.0578, "step": 82600 }, { - "epoch": 0.89, - "learning_rate": 0.0001659711856707119, - "loss": 0.0381, + "epoch": 0.53, + "learning_rate": 0.0002200223316573833, + "loss": 0.0613, "step": 82610 }, { - "epoch": 0.89, - "learning_rate": 0.00016595496138620286, - "loss": 0.0423, + "epoch": 0.53, + "learning_rate": 0.00022001265030302636, + "loss": 0.0479, "step": 82620 }, { - "epoch": 0.89, - "learning_rate": 0.0001659387371016938, - "loss": 0.0438, + "epoch": 0.53, + "learning_rate": 0.00022000296894866944, + "loss": 0.0515, "step": 82630 }, { - "epoch": 0.89, - "learning_rate": 0.00016592251281718476, - "loss": 0.0469, + "epoch": 0.53, + "learning_rate": 0.00021999328759431252, + "loss": 0.0479, "step": 82640 }, { - "epoch": 0.89, - "learning_rate": 0.00016590628853267568, - "loss": 0.0479, + "epoch": 0.53, + "learning_rate": 0.0002199836062399556, + "loss": 0.0486, "step": 82650 }, { - "epoch": 0.89, - "learning_rate": 0.00016589006424816665, - "loss": 0.0508, + "epoch": 0.53, + "learning_rate": 0.00021997392488559863, + "loss": 0.0481, "step": 82660 }, { - "epoch": 0.89, - "learning_rate": 0.00016587383996365758, - "loss": 0.0411, + "epoch": 0.53, + "learning_rate": 0.0002199642435312417, + "loss": 0.0601, "step": 82670 }, { - "epoch": 0.89, - "learning_rate": 0.00016585761567914855, - "loss": 0.0454, + "epoch": 0.53, + "learning_rate": 0.00021995456217688478, + "loss": 0.0491, "step": 82680 }, { - "epoch": 0.89, - "learning_rate": 0.00016584139139463948, - "loss": 0.0438, + "epoch": 0.53, + "learning_rate": 0.00021994488082252784, + "loss": 0.0525, "step": 82690 }, { - "epoch": 0.89, - "learning_rate": 0.00016582516711013045, - "loss": 0.0408, + "epoch": 0.53, + "learning_rate": 0.00021993519946817092, + "loss": 0.0461, "step": 82700 }, { - "epoch": 0.89, - "learning_rate": 0.00016580894282562138, - "loss": 0.0433, + "epoch": 0.53, + "learning_rate": 0.000219925518113814, + "loss": 0.0514, "step": 82710 }, { - "epoch": 0.89, - "learning_rate": 0.00016579271854111233, - "loss": 0.0438, + "epoch": 0.53, + "learning_rate": 0.00021991583675945708, + "loss": 0.0481, "step": 82720 }, { - "epoch": 0.89, - "learning_rate": 0.00016577649425660328, - "loss": 0.048, + "epoch": 0.53, + "learning_rate": 0.0002199061554051001, + "loss": 0.0513, "step": 82730 }, { - "epoch": 0.89, - "learning_rate": 0.00016576026997209423, - "loss": 0.0423, + "epoch": 0.53, + "learning_rate": 0.00021989647405074318, + "loss": 0.0565, "step": 82740 }, { - "epoch": 0.9, - "learning_rate": 0.00016574404568758515, - "loss": 0.0439, + "epoch": 0.53, + "learning_rate": 0.00021988679269638626, + "loss": 0.0498, "step": 82750 }, { - "epoch": 0.9, - "learning_rate": 0.00016572782140307613, - "loss": 0.0413, + "epoch": 0.53, + "learning_rate": 0.00021987711134202931, + "loss": 0.0535, "step": 82760 }, { - "epoch": 0.9, - "learning_rate": 0.00016571159711856705, - "loss": 0.0408, + "epoch": 0.53, + "learning_rate": 0.0002198674299876724, + "loss": 0.0527, "step": 82770 }, { - "epoch": 0.9, - "learning_rate": 0.00016569537283405802, - "loss": 0.0416, + "epoch": 0.53, + "learning_rate": 0.00021985774863331547, + "loss": 0.0526, "step": 82780 }, { - "epoch": 0.9, - "learning_rate": 0.00016567914854954895, - "loss": 0.0366, + "epoch": 0.53, + "learning_rate": 0.00021984806727895853, + "loss": 0.0515, "step": 82790 }, { - "epoch": 0.9, - "learning_rate": 0.0001656629242650399, - "loss": 0.0423, + "epoch": 0.53, + "learning_rate": 0.00021983838592460158, + "loss": 0.0483, "step": 82800 }, { - "epoch": 0.9, - "learning_rate": 0.00016564669998053085, - "loss": 0.0403, + "epoch": 0.53, + "learning_rate": 0.00021982870457024466, + "loss": 0.0538, "step": 82810 }, { - "epoch": 0.9, - "learning_rate": 0.0001656304756960218, - "loss": 0.0403, + "epoch": 0.53, + "learning_rate": 0.0002198190232158877, + "loss": 0.0535, "step": 82820 }, { - "epoch": 0.9, - "learning_rate": 0.00016561425141151272, - "loss": 0.0437, + "epoch": 0.53, + "learning_rate": 0.0002198093418615308, + "loss": 0.0515, "step": 82830 }, { - "epoch": 0.9, - "learning_rate": 0.0001655980271270037, - "loss": 0.0443, + "epoch": 0.53, + "learning_rate": 0.00021979966050717387, + "loss": 0.0505, "step": 82840 }, { - "epoch": 0.9, - "learning_rate": 0.00016558180284249462, - "loss": 0.0413, + "epoch": 0.53, + "learning_rate": 0.00021978997915281695, + "loss": 0.0555, "step": 82850 }, { - "epoch": 0.9, - "learning_rate": 0.0001655655785579856, - "loss": 0.0406, + "epoch": 0.53, + "learning_rate": 0.00021978029779846, + "loss": 0.0534, "step": 82860 }, { - "epoch": 0.9, - "learning_rate": 0.00016554935427347652, - "loss": 0.0417, + "epoch": 0.53, + "learning_rate": 0.00021977061644410306, + "loss": 0.0493, "step": 82870 }, { - "epoch": 0.9, - "learning_rate": 0.0001655331299889675, - "loss": 0.0398, + "epoch": 0.53, + "learning_rate": 0.00021976093508974614, + "loss": 0.0505, "step": 82880 }, { - "epoch": 0.9, - "learning_rate": 0.00016551690570445842, - "loss": 0.0418, + "epoch": 0.53, + "learning_rate": 0.0002197512537353892, + "loss": 0.0492, "step": 82890 }, { - "epoch": 0.9, - "learning_rate": 0.00016550068141994937, - "loss": 0.0382, + "epoch": 0.54, + "learning_rate": 0.00021974157238103227, + "loss": 0.049, "step": 82900 }, { - "epoch": 0.9, - "learning_rate": 0.00016548445713544032, - "loss": 0.0461, + "epoch": 0.54, + "learning_rate": 0.00021973189102667535, + "loss": 0.0492, "step": 82910 }, { - "epoch": 0.9, - "learning_rate": 0.00016546823285093127, - "loss": 0.0384, + "epoch": 0.54, + "learning_rate": 0.00021972220967231843, + "loss": 0.0491, "step": 82920 }, { - "epoch": 0.9, - "learning_rate": 0.0001654520085664222, - "loss": 0.0482, + "epoch": 0.54, + "learning_rate": 0.00021971252831796148, + "loss": 0.0528, "step": 82930 }, { - "epoch": 0.9, - "learning_rate": 0.00016543578428191317, - "loss": 0.0533, + "epoch": 0.54, + "learning_rate": 0.00021970284696360453, + "loss": 0.0541, "step": 82940 }, { - "epoch": 0.9, - "learning_rate": 0.0001654195599974041, - "loss": 0.0377, + "epoch": 0.54, + "learning_rate": 0.00021969316560924761, + "loss": 0.0519, "step": 82950 }, { - "epoch": 0.9, - "learning_rate": 0.00016540333571289507, - "loss": 0.0479, + "epoch": 0.54, + "learning_rate": 0.00021968348425489067, + "loss": 0.0515, "step": 82960 }, { - "epoch": 0.9, - "learning_rate": 0.000165387111428386, - "loss": 0.0473, + "epoch": 0.54, + "learning_rate": 0.00021967380290053375, + "loss": 0.0549, "step": 82970 }, { - "epoch": 0.9, - "learning_rate": 0.00016537088714387694, - "loss": 0.0521, + "epoch": 0.54, + "learning_rate": 0.00021966412154617683, + "loss": 0.0527, "step": 82980 }, { - "epoch": 0.9, - "learning_rate": 0.0001653546628593679, - "loss": 0.0401, + "epoch": 0.54, + "learning_rate": 0.00021965444019181988, + "loss": 0.0502, "step": 82990 }, { - "epoch": 0.9, - "learning_rate": 0.00016533843857485884, - "loss": 0.0381, + "epoch": 0.54, + "learning_rate": 0.00021964475883746296, + "loss": 0.0571, "step": 83000 }, { - "epoch": 0.9, - "eval_cer": 0.9212983332184804, - "eval_loss": 0.03114171512424946, - "eval_runtime": 119.1404, - "eval_samples_per_second": 16.787, - "eval_steps_per_second": 4.197, + "epoch": 0.54, + "eval_cer": 0.9200235001694724, + "eval_loss": 0.03383234888315201, + "eval_runtime": 120.0102, + "eval_samples_per_second": 16.665, + "eval_steps_per_second": 4.166, "step": 83000 }, { - "epoch": 0.9, - "learning_rate": 0.0001653222142903498, - "loss": 0.0454, + "epoch": 0.54, + "learning_rate": 0.000219635077483106, + "loss": 0.0469, "step": 83010 }, { - "epoch": 0.9, - "learning_rate": 0.00016530599000584074, - "loss": 0.0421, + "epoch": 0.54, + "learning_rate": 0.00021962539612874906, + "loss": 0.0574, "step": 83020 }, { - "epoch": 0.9, - "learning_rate": 0.00016528976572133166, - "loss": 0.0409, + "epoch": 0.54, + "learning_rate": 0.00021961571477439214, + "loss": 0.0527, "step": 83030 }, { - "epoch": 0.9, - "learning_rate": 0.00016527354143682264, - "loss": 0.0415, + "epoch": 0.54, + "learning_rate": 0.00021960603342003522, + "loss": 0.0436, "step": 83040 }, { - "epoch": 0.9, - "learning_rate": 0.00016525731715231356, - "loss": 0.0434, + "epoch": 0.54, + "learning_rate": 0.0002195963520656783, + "loss": 0.0538, "step": 83050 }, { - "epoch": 0.9, - "learning_rate": 0.00016524109286780454, - "loss": 0.0474, + "epoch": 0.54, + "learning_rate": 0.00021958667071132136, + "loss": 0.049, "step": 83060 }, { - "epoch": 0.9, - "learning_rate": 0.00016522486858329546, - "loss": 0.0475, + "epoch": 0.54, + "learning_rate": 0.00021957698935696444, + "loss": 0.0495, "step": 83070 }, { - "epoch": 0.9, - "learning_rate": 0.0001652086442987864, - "loss": 0.0445, + "epoch": 0.54, + "learning_rate": 0.0002195673080026075, + "loss": 0.0481, "step": 83080 }, { - "epoch": 0.9, - "learning_rate": 0.00016519242001427736, - "loss": 0.0445, + "epoch": 0.54, + "learning_rate": 0.00021955762664825054, + "loss": 0.0503, "step": 83090 }, { - "epoch": 0.9, - "learning_rate": 0.0001651761957297683, - "loss": 0.0444, + "epoch": 0.54, + "learning_rate": 0.00021954794529389362, + "loss": 0.0495, "step": 83100 }, { - "epoch": 0.9, - "learning_rate": 0.00016515997144525923, - "loss": 0.048, + "epoch": 0.54, + "learning_rate": 0.0002195382639395367, + "loss": 0.0428, "step": 83110 }, { - "epoch": 0.9, - "learning_rate": 0.0001651437471607502, - "loss": 0.0426, + "epoch": 0.54, + "learning_rate": 0.00021952858258517978, + "loss": 0.0496, "step": 83120 }, { - "epoch": 0.9, - "learning_rate": 0.00016512752287624113, - "loss": 0.0415, + "epoch": 0.54, + "learning_rate": 0.00021951890123082283, + "loss": 0.0514, "step": 83130 }, { - "epoch": 0.9, - "learning_rate": 0.0001651112985917321, - "loss": 0.046, + "epoch": 0.54, + "learning_rate": 0.0002195092198764659, + "loss": 0.0517, "step": 83140 }, { - "epoch": 0.9, - "learning_rate": 0.00016509507430722303, - "loss": 0.0415, + "epoch": 0.54, + "learning_rate": 0.00021949953852210897, + "loss": 0.0597, "step": 83150 }, { - "epoch": 0.9, - "learning_rate": 0.00016507885002271398, - "loss": 0.0467, + "epoch": 0.54, + "learning_rate": 0.00021948985716775202, + "loss": 0.0489, "step": 83160 }, { - "epoch": 0.9, - "learning_rate": 0.00016506262573820493, - "loss": 0.0436, + "epoch": 0.54, + "learning_rate": 0.0002194801758133951, + "loss": 0.0569, "step": 83170 }, { - "epoch": 0.9, - "learning_rate": 0.00016504640145369588, - "loss": 0.0442, + "epoch": 0.54, + "learning_rate": 0.00021947049445903818, + "loss": 0.0459, "step": 83180 }, { - "epoch": 0.9, - "learning_rate": 0.00016503017716918683, - "loss": 0.0423, + "epoch": 0.54, + "learning_rate": 0.00021946081310468123, + "loss": 0.0603, "step": 83190 }, { - "epoch": 0.9, - "learning_rate": 0.00016501395288467778, - "loss": 0.0457, + "epoch": 0.54, + "learning_rate": 0.0002194511317503243, + "loss": 0.0538, "step": 83200 }, { - "epoch": 0.9, - "learning_rate": 0.0001649977286001687, - "loss": 0.0418, + "epoch": 0.54, + "learning_rate": 0.0002194414503959674, + "loss": 0.0531, "step": 83210 }, { - "epoch": 0.9, - "learning_rate": 0.00016498150431565968, - "loss": 0.0488, + "epoch": 0.54, + "learning_rate": 0.00021943176904161042, + "loss": 0.0453, "step": 83220 }, { - "epoch": 0.9, - "learning_rate": 0.0001649652800311506, - "loss": 0.0442, + "epoch": 0.54, + "learning_rate": 0.0002194220876872535, + "loss": 0.046, "step": 83230 }, { - "epoch": 0.9, - "learning_rate": 0.00016494905574664158, - "loss": 0.0417, + "epoch": 0.54, + "learning_rate": 0.00021941240633289658, + "loss": 0.0528, "step": 83240 }, { - "epoch": 0.9, - "learning_rate": 0.0001649328314621325, - "loss": 0.043, + "epoch": 0.54, + "learning_rate": 0.00021940272497853966, + "loss": 0.0551, "step": 83250 }, { - "epoch": 0.9, - "learning_rate": 0.00016491660717762345, - "loss": 0.0355, + "epoch": 0.54, + "learning_rate": 0.0002193930436241827, + "loss": 0.0547, "step": 83260 }, { - "epoch": 0.9, - "learning_rate": 0.0001649003828931144, - "loss": 0.0453, + "epoch": 0.54, + "learning_rate": 0.0002193833622698258, + "loss": 0.0514, "step": 83270 }, { - "epoch": 0.9, - "learning_rate": 0.00016488415860860535, - "loss": 0.0406, + "epoch": 0.54, + "learning_rate": 0.00021937368091546887, + "loss": 0.0462, "step": 83280 }, { - "epoch": 0.9, - "learning_rate": 0.00016486793432409627, - "loss": 0.0455, + "epoch": 0.54, + "learning_rate": 0.0002193639995611119, + "loss": 0.0453, "step": 83290 }, { - "epoch": 0.9, - "learning_rate": 0.00016485171003958725, - "loss": 0.0451, + "epoch": 0.54, + "learning_rate": 0.00021935431820675497, + "loss": 0.0458, "step": 83300 }, { - "epoch": 0.9, - "learning_rate": 0.00016483548575507817, - "loss": 0.0465, + "epoch": 0.54, + "learning_rate": 0.00021934463685239805, + "loss": 0.0518, "step": 83310 }, { - "epoch": 0.9, - "learning_rate": 0.00016481926147056915, - "loss": 0.0427, + "epoch": 0.54, + "learning_rate": 0.00021933495549804113, + "loss": 0.0552, "step": 83320 }, { - "epoch": 0.9, - "learning_rate": 0.00016480303718606007, - "loss": 0.0502, + "epoch": 0.54, + "learning_rate": 0.00021932527414368419, + "loss": 0.0596, "step": 83330 }, { - "epoch": 0.9, - "learning_rate": 0.00016478681290155102, - "loss": 0.0393, + "epoch": 0.54, + "learning_rate": 0.00021931559278932727, + "loss": 0.0502, "step": 83340 }, { - "epoch": 0.9, - "learning_rate": 0.00016477058861704197, - "loss": 0.045, + "epoch": 0.54, + "learning_rate": 0.00021930591143497034, + "loss": 0.0516, "step": 83350 }, { - "epoch": 0.9, - "learning_rate": 0.00016475436433253292, - "loss": 0.0447, + "epoch": 0.54, + "learning_rate": 0.00021929623008061337, + "loss": 0.0501, "step": 83360 }, { - "epoch": 0.9, - "learning_rate": 0.00016473814004802387, - "loss": 0.0382, + "epoch": 0.54, + "learning_rate": 0.00021928654872625645, + "loss": 0.0517, "step": 83370 }, { - "epoch": 0.9, - "learning_rate": 0.00016472191576351482, - "loss": 0.0484, + "epoch": 0.54, + "learning_rate": 0.00021927686737189953, + "loss": 0.0552, "step": 83380 }, { - "epoch": 0.9, - "learning_rate": 0.00016470569147900574, - "loss": 0.0383, + "epoch": 0.54, + "learning_rate": 0.00021926718601754258, + "loss": 0.0559, "step": 83390 }, { - "epoch": 0.9, - "learning_rate": 0.00016468946719449672, - "loss": 0.0449, + "epoch": 0.54, + "learning_rate": 0.00021925750466318566, + "loss": 0.0575, "step": 83400 }, { - "epoch": 0.9, - "learning_rate": 0.00016467324290998764, - "loss": 0.047, + "epoch": 0.54, + "learning_rate": 0.00021924782330882874, + "loss": 0.0473, "step": 83410 }, { - "epoch": 0.9, - "learning_rate": 0.00016465701862547862, - "loss": 0.0459, + "epoch": 0.54, + "learning_rate": 0.00021923814195447182, + "loss": 0.0526, "step": 83420 }, { - "epoch": 0.9, - "learning_rate": 0.00016464079434096954, - "loss": 0.0418, + "epoch": 0.54, + "learning_rate": 0.00021922846060011485, + "loss": 0.0553, "step": 83430 }, { - "epoch": 0.9, - "learning_rate": 0.0001646245700564605, - "loss": 0.0433, + "epoch": 0.54, + "learning_rate": 0.00021921877924575793, + "loss": 0.0532, "step": 83440 }, { - "epoch": 0.9, - "learning_rate": 0.00016460834577195144, - "loss": 0.0438, + "epoch": 0.54, + "learning_rate": 0.000219209097891401, + "loss": 0.0499, "step": 83450 }, { - "epoch": 0.9, - "learning_rate": 0.0001645921214874424, - "loss": 0.0546, + "epoch": 0.54, + "learning_rate": 0.00021919941653704406, + "loss": 0.0603, "step": 83460 }, { - "epoch": 0.9, - "learning_rate": 0.00016457589720293331, - "loss": 0.0414, + "epoch": 0.54, + "learning_rate": 0.00021918973518268714, + "loss": 0.053, "step": 83470 }, { - "epoch": 0.9, - "learning_rate": 0.0001645596729184243, - "loss": 0.0445, + "epoch": 0.54, + "learning_rate": 0.00021918005382833022, + "loss": 0.0525, "step": 83480 }, { - "epoch": 0.9, - "learning_rate": 0.00016454344863391521, - "loss": 0.0554, + "epoch": 0.54, + "learning_rate": 0.0002191703724739733, + "loss": 0.0548, "step": 83490 }, { - "epoch": 0.9, - "learning_rate": 0.0001645272243494062, - "loss": 0.0496, + "epoch": 0.54, + "learning_rate": 0.00021916069111961633, + "loss": 0.0545, "step": 83500 }, { - "epoch": 0.9, - "learning_rate": 0.00016451100006489711, - "loss": 0.0474, + "epoch": 0.54, + "learning_rate": 0.0002191510097652594, + "loss": 0.0479, "step": 83510 }, { - "epoch": 0.9, - "learning_rate": 0.00016449477578038806, - "loss": 0.0489, + "epoch": 0.54, + "learning_rate": 0.00021914132841090248, + "loss": 0.05, "step": 83520 }, { - "epoch": 0.9, - "learning_rate": 0.00016447855149587901, - "loss": 0.0387, + "epoch": 0.54, + "learning_rate": 0.00021913164705654554, + "loss": 0.0489, "step": 83530 }, { - "epoch": 0.9, - "learning_rate": 0.00016446232721136996, - "loss": 0.0401, + "epoch": 0.54, + "learning_rate": 0.00021912196570218862, + "loss": 0.0486, "step": 83540 }, { - "epoch": 0.9, - "learning_rate": 0.0001644461029268609, - "loss": 0.05, + "epoch": 0.54, + "learning_rate": 0.0002191122843478317, + "loss": 0.048, "step": 83550 }, { - "epoch": 0.9, - "learning_rate": 0.00016442987864235186, - "loss": 0.0427, + "epoch": 0.54, + "learning_rate": 0.00021910260299347475, + "loss": 0.0514, "step": 83560 }, { - "epoch": 0.9, - "learning_rate": 0.00016441365435784279, - "loss": 0.0489, + "epoch": 0.54, + "learning_rate": 0.0002190929216391178, + "loss": 0.0538, "step": 83570 }, { - "epoch": 0.9, - "learning_rate": 0.00016439743007333376, - "loss": 0.0459, + "epoch": 0.54, + "learning_rate": 0.00021908324028476088, + "loss": 0.0485, "step": 83580 }, { - "epoch": 0.9, - "learning_rate": 0.00016438120578882469, - "loss": 0.0424, + "epoch": 0.54, + "learning_rate": 0.00021907355893040393, + "loss": 0.0593, "step": 83590 }, { - "epoch": 0.9, - "learning_rate": 0.00016436498150431566, - "loss": 0.0395, + "epoch": 0.54, + "learning_rate": 0.00021906387757604701, + "loss": 0.0515, "step": 83600 }, { - "epoch": 0.9, - "learning_rate": 0.00016434875721980658, - "loss": 0.0416, + "epoch": 0.54, + "learning_rate": 0.0002190541962216901, + "loss": 0.0563, "step": 83610 }, { - "epoch": 0.9, - "learning_rate": 0.00016433253293529753, - "loss": 0.0489, + "epoch": 0.54, + "learning_rate": 0.00021904451486733317, + "loss": 0.0499, "step": 83620 }, { - "epoch": 0.9, - "learning_rate": 0.00016431630865078848, - "loss": 0.0546, + "epoch": 0.54, + "learning_rate": 0.00021903483351297623, + "loss": 0.0497, "step": 83630 }, { - "epoch": 0.9, - "learning_rate": 0.00016430008436627943, - "loss": 0.0384, + "epoch": 0.54, + "learning_rate": 0.00021902515215861928, + "loss": 0.0542, "step": 83640 }, { - "epoch": 0.9, - "learning_rate": 0.00016428386008177036, - "loss": 0.0376, + "epoch": 0.54, + "learning_rate": 0.00021901547080426236, + "loss": 0.0476, "step": 83650 }, { - "epoch": 0.9, - "learning_rate": 0.00016426763579726133, - "loss": 0.0459, + "epoch": 0.54, + "learning_rate": 0.0002190057894499054, + "loss": 0.0495, "step": 83660 }, { - "epoch": 0.9, - "learning_rate": 0.00016425141151275226, - "loss": 0.0425, + "epoch": 0.54, + "learning_rate": 0.0002189961080955485, + "loss": 0.0506, "step": 83670 }, { - "epoch": 0.91, - "learning_rate": 0.00016423518722824323, - "loss": 0.0404, + "epoch": 0.54, + "learning_rate": 0.00021898642674119157, + "loss": 0.0467, "step": 83680 }, { - "epoch": 0.91, - "learning_rate": 0.00016421896294373416, - "loss": 0.0404, + "epoch": 0.54, + "learning_rate": 0.00021897674538683465, + "loss": 0.0505, "step": 83690 }, { - "epoch": 0.91, - "learning_rate": 0.00016420273865922513, - "loss": 0.0351, + "epoch": 0.54, + "learning_rate": 0.0002189670640324777, + "loss": 0.0426, "step": 83700 }, { - "epoch": 0.91, - "learning_rate": 0.00016418651437471606, - "loss": 0.0417, + "epoch": 0.54, + "learning_rate": 0.00021895738267812076, + "loss": 0.0519, "step": 83710 }, { - "epoch": 0.91, - "learning_rate": 0.000164170290090207, - "loss": 0.0471, + "epoch": 0.54, + "learning_rate": 0.00021894770132376384, + "loss": 0.0476, "step": 83720 }, { - "epoch": 0.91, - "learning_rate": 0.00016415406580569795, - "loss": 0.0416, + "epoch": 0.54, + "learning_rate": 0.0002189380199694069, + "loss": 0.0551, "step": 83730 }, { - "epoch": 0.91, - "learning_rate": 0.0001641378415211889, - "loss": 0.0394, + "epoch": 0.54, + "learning_rate": 0.00021892833861504997, + "loss": 0.0504, "step": 83740 }, { - "epoch": 0.91, - "learning_rate": 0.00016412161723667983, - "loss": 0.0481, + "epoch": 0.54, + "learning_rate": 0.00021891865726069305, + "loss": 0.0487, "step": 83750 }, { - "epoch": 0.91, - "learning_rate": 0.0001641053929521708, - "loss": 0.0589, + "epoch": 0.54, + "learning_rate": 0.0002189089759063361, + "loss": 0.0481, "step": 83760 }, { - "epoch": 0.91, - "learning_rate": 0.00016408916866766173, - "loss": 0.0489, + "epoch": 0.54, + "learning_rate": 0.00021889929455197918, + "loss": 0.0518, "step": 83770 }, { - "epoch": 0.91, - "learning_rate": 0.0001640729443831527, - "loss": 0.0402, + "epoch": 0.54, + "learning_rate": 0.00021888961319762223, + "loss": 0.0488, "step": 83780 }, { - "epoch": 0.91, - "learning_rate": 0.00016405672009864363, - "loss": 0.0409, + "epoch": 0.54, + "learning_rate": 0.0002188799318432653, + "loss": 0.0567, "step": 83790 }, { - "epoch": 0.91, - "learning_rate": 0.00016404049581413458, - "loss": 0.0498, + "epoch": 0.54, + "learning_rate": 0.00021887025048890837, + "loss": 0.047, "step": 83800 }, { - "epoch": 0.91, - "learning_rate": 0.00016402427152962553, - "loss": 0.044, + "epoch": 0.54, + "learning_rate": 0.00021886056913455145, + "loss": 0.0571, "step": 83810 }, { - "epoch": 0.91, - "learning_rate": 0.00016400804724511648, - "loss": 0.0401, + "epoch": 0.54, + "learning_rate": 0.00021885088778019453, + "loss": 0.0588, "step": 83820 }, { - "epoch": 0.91, - "learning_rate": 0.0001639918229606074, - "loss": 0.042, + "epoch": 0.54, + "learning_rate": 0.00021884120642583758, + "loss": 0.0546, "step": 83830 }, { - "epoch": 0.91, - "learning_rate": 0.00016397559867609838, - "loss": 0.0379, + "epoch": 0.54, + "learning_rate": 0.00021883152507148066, + "loss": 0.054, "step": 83840 }, { - "epoch": 0.91, - "learning_rate": 0.0001639593743915893, - "loss": 0.0408, + "epoch": 0.54, + "learning_rate": 0.0002188218437171237, + "loss": 0.052, "step": 83850 }, { - "epoch": 0.91, - "learning_rate": 0.00016394315010708027, - "loss": 0.0469, + "epoch": 0.54, + "learning_rate": 0.00021881216236276676, + "loss": 0.0539, "step": 83860 }, { - "epoch": 0.91, - "learning_rate": 0.0001639269258225712, - "loss": 0.0423, + "epoch": 0.54, + "learning_rate": 0.00021880248100840984, + "loss": 0.0576, "step": 83870 }, { - "epoch": 0.91, - "learning_rate": 0.00016391070153806217, - "loss": 0.0417, + "epoch": 0.54, + "learning_rate": 0.00021879279965405292, + "loss": 0.0533, "step": 83880 }, { - "epoch": 0.91, - "learning_rate": 0.0001638944772535531, - "loss": 0.0411, + "epoch": 0.54, + "learning_rate": 0.000218783118299696, + "loss": 0.0493, "step": 83890 }, { - "epoch": 0.91, - "learning_rate": 0.00016387825296904405, - "loss": 0.0424, + "epoch": 0.54, + "learning_rate": 0.00021877343694533906, + "loss": 0.0488, "step": 83900 }, { - "epoch": 0.91, - "learning_rate": 0.000163862028684535, - "loss": 0.0369, + "epoch": 0.54, + "learning_rate": 0.00021876375559098214, + "loss": 0.0507, "step": 83910 }, { - "epoch": 0.91, - "learning_rate": 0.00016384580440002595, - "loss": 0.0384, + "epoch": 0.54, + "learning_rate": 0.0002187540742366252, + "loss": 0.0512, "step": 83920 }, { - "epoch": 0.91, - "learning_rate": 0.00016382958011551687, - "loss": 0.0411, + "epoch": 0.54, + "learning_rate": 0.00021874439288226824, + "loss": 0.061, "step": 83930 }, { - "epoch": 0.91, - "learning_rate": 0.00016381335583100785, - "loss": 0.0447, + "epoch": 0.54, + "learning_rate": 0.00021873471152791132, + "loss": 0.0542, "step": 83940 }, { - "epoch": 0.91, - "learning_rate": 0.00016379713154649877, - "loss": 0.0507, + "epoch": 0.54, + "learning_rate": 0.0002187250301735544, + "loss": 0.0523, "step": 83950 }, { - "epoch": 0.91, - "learning_rate": 0.00016378090726198975, - "loss": 0.0449, + "epoch": 0.54, + "learning_rate": 0.00021871534881919745, + "loss": 0.0485, "step": 83960 }, { - "epoch": 0.91, - "learning_rate": 0.00016376468297748067, - "loss": 0.0446, + "epoch": 0.54, + "learning_rate": 0.00021870566746484053, + "loss": 0.0475, "step": 83970 }, { - "epoch": 0.91, - "learning_rate": 0.00016374845869297162, - "loss": 0.0512, + "epoch": 0.54, + "learning_rate": 0.0002186959861104836, + "loss": 0.0459, "step": 83980 }, { - "epoch": 0.91, - "learning_rate": 0.00016373223440846257, - "loss": 0.0452, + "epoch": 0.54, + "learning_rate": 0.00021868630475612664, + "loss": 0.0504, "step": 83990 }, { - "epoch": 0.91, - "learning_rate": 0.00016371601012395352, - "loss": 0.0455, + "epoch": 0.54, + "learning_rate": 0.00021867662340176972, + "loss": 0.0526, "step": 84000 }, { - "epoch": 0.91, - "eval_cer": 0.9212364893160241, - "eval_loss": 0.03061256743967533, - "eval_runtime": 118.8872, - "eval_samples_per_second": 16.823, - "eval_steps_per_second": 4.206, + "epoch": 0.54, + "eval_cer": 0.9200343464015366, + "eval_loss": 0.033935271203517914, + "eval_runtime": 120.0158, + "eval_samples_per_second": 16.664, + "eval_steps_per_second": 4.166, "step": 84000 }, { - "epoch": 0.91, - "learning_rate": 0.00016369978583944444, - "loss": 0.05, + "epoch": 0.54, + "learning_rate": 0.0002186669420474128, + "loss": 0.0611, "step": 84010 }, { - "epoch": 0.91, - "learning_rate": 0.00016368356155493542, - "loss": 0.0413, + "epoch": 0.54, + "learning_rate": 0.00021865726069305588, + "loss": 0.0523, "step": 84020 }, { - "epoch": 0.91, - "learning_rate": 0.00016366733727042634, - "loss": 0.0431, + "epoch": 0.54, + "learning_rate": 0.00021864757933869893, + "loss": 0.047, "step": 84030 }, { - "epoch": 0.91, - "learning_rate": 0.00016365111298591732, - "loss": 0.041, + "epoch": 0.54, + "learning_rate": 0.000218637897984342, + "loss": 0.0557, "step": 84040 }, { - "epoch": 0.91, - "learning_rate": 0.00016363488870140824, - "loss": 0.0453, + "epoch": 0.54, + "learning_rate": 0.0002186282166299851, + "loss": 0.0476, "step": 84050 }, { - "epoch": 0.91, - "learning_rate": 0.00016361866441689922, - "loss": 0.038, + "epoch": 0.54, + "learning_rate": 0.00021861853527562812, + "loss": 0.0577, "step": 84060 }, { - "epoch": 0.91, - "learning_rate": 0.00016360244013239014, - "loss": 0.0426, + "epoch": 0.54, + "learning_rate": 0.0002186088539212712, + "loss": 0.0547, "step": 84070 }, { - "epoch": 0.91, - "learning_rate": 0.0001635862158478811, - "loss": 0.0402, + "epoch": 0.54, + "learning_rate": 0.00021859917256691428, + "loss": 0.0524, "step": 84080 }, { - "epoch": 0.91, - "learning_rate": 0.00016356999156337204, - "loss": 0.0461, + "epoch": 0.54, + "learning_rate": 0.00021858949121255736, + "loss": 0.049, "step": 84090 }, { - "epoch": 0.91, - "learning_rate": 0.000163553767278863, - "loss": 0.0409, + "epoch": 0.54, + "learning_rate": 0.0002185798098582004, + "loss": 0.0487, "step": 84100 }, { - "epoch": 0.91, - "learning_rate": 0.0001635375429943539, - "loss": 0.0415, + "epoch": 0.54, + "learning_rate": 0.0002185701285038435, + "loss": 0.0493, "step": 84110 }, { - "epoch": 0.91, - "learning_rate": 0.0001635213187098449, - "loss": 0.0536, + "epoch": 0.54, + "learning_rate": 0.00021856044714948657, + "loss": 0.0487, "step": 84120 }, { - "epoch": 0.91, - "learning_rate": 0.0001635050944253358, - "loss": 0.0381, + "epoch": 0.54, + "learning_rate": 0.0002185507657951296, + "loss": 0.0519, "step": 84130 }, { - "epoch": 0.91, - "learning_rate": 0.0001634888701408268, - "loss": 0.04, + "epoch": 0.54, + "learning_rate": 0.00021854108444077267, + "loss": 0.0542, "step": 84140 }, { - "epoch": 0.91, - "learning_rate": 0.0001634726458563177, - "loss": 0.0442, + "epoch": 0.54, + "learning_rate": 0.00021853140308641575, + "loss": 0.048, "step": 84150 }, { - "epoch": 0.91, - "learning_rate": 0.00016345642157180866, - "loss": 0.0407, + "epoch": 0.54, + "learning_rate": 0.0002185217217320588, + "loss": 0.0484, "step": 84160 }, { - "epoch": 0.91, - "learning_rate": 0.0001634401972872996, - "loss": 0.0411, + "epoch": 0.54, + "learning_rate": 0.00021851204037770189, + "loss": 0.0466, "step": 84170 }, { - "epoch": 0.91, - "learning_rate": 0.00016342397300279056, - "loss": 0.0386, + "epoch": 0.54, + "learning_rate": 0.00021850235902334496, + "loss": 0.0492, "step": 84180 }, { - "epoch": 0.91, - "learning_rate": 0.00016340774871828148, - "loss": 0.0428, + "epoch": 0.54, + "learning_rate": 0.00021849267766898804, + "loss": 0.0482, "step": 84190 }, { - "epoch": 0.91, - "learning_rate": 0.00016339152443377246, - "loss": 0.044, + "epoch": 0.54, + "learning_rate": 0.00021848299631463107, + "loss": 0.0551, "step": 84200 }, { - "epoch": 0.91, - "learning_rate": 0.00016337530014926338, - "loss": 0.0497, + "epoch": 0.54, + "learning_rate": 0.00021847331496027415, + "loss": 0.0535, "step": 84210 }, { - "epoch": 0.91, - "learning_rate": 0.00016335907586475436, - "loss": 0.0477, + "epoch": 0.54, + "learning_rate": 0.00021846363360591723, + "loss": 0.0534, "step": 84220 }, { - "epoch": 0.91, - "learning_rate": 0.00016334285158024528, - "loss": 0.0458, + "epoch": 0.54, + "learning_rate": 0.00021845395225156028, + "loss": 0.0467, "step": 84230 }, { - "epoch": 0.91, - "learning_rate": 0.00016332662729573626, - "loss": 0.044, + "epoch": 0.54, + "learning_rate": 0.00021844427089720336, + "loss": 0.0582, "step": 84240 }, { - "epoch": 0.91, - "learning_rate": 0.00016331040301122718, - "loss": 0.0402, + "epoch": 0.54, + "learning_rate": 0.00021843458954284644, + "loss": 0.0562, "step": 84250 }, { - "epoch": 0.91, - "learning_rate": 0.00016329417872671813, - "loss": 0.0487, + "epoch": 0.54, + "learning_rate": 0.00021842490818848952, + "loss": 0.0523, "step": 84260 }, { - "epoch": 0.91, - "learning_rate": 0.00016327795444220908, - "loss": 0.0409, + "epoch": 0.54, + "learning_rate": 0.00021841522683413255, + "loss": 0.0611, "step": 84270 }, { - "epoch": 0.91, - "learning_rate": 0.00016326173015770003, - "loss": 0.0446, + "epoch": 0.54, + "learning_rate": 0.00021840554547977563, + "loss": 0.053, "step": 84280 }, { - "epoch": 0.91, - "learning_rate": 0.00016324550587319095, - "loss": 0.0474, + "epoch": 0.54, + "learning_rate": 0.0002183958641254187, + "loss": 0.0504, "step": 84290 }, { - "epoch": 0.91, - "learning_rate": 0.00016322928158868193, - "loss": 0.0482, + "epoch": 0.54, + "learning_rate": 0.00021838618277106176, + "loss": 0.0468, "step": 84300 }, { - "epoch": 0.91, - "learning_rate": 0.00016321305730417285, - "loss": 0.0411, + "epoch": 0.54, + "learning_rate": 0.00021837650141670484, + "loss": 0.057, "step": 84310 }, { - "epoch": 0.91, - "learning_rate": 0.00016319683301966383, - "loss": 0.0515, + "epoch": 0.54, + "learning_rate": 0.00021836682006234792, + "loss": 0.0475, "step": 84320 }, { - "epoch": 0.91, - "learning_rate": 0.00016318060873515475, - "loss": 0.0422, + "epoch": 0.54, + "learning_rate": 0.000218357138707991, + "loss": 0.056, "step": 84330 }, { - "epoch": 0.91, - "learning_rate": 0.0001631643844506457, - "loss": 0.0453, + "epoch": 0.54, + "learning_rate": 0.00021834745735363402, + "loss": 0.0429, "step": 84340 }, { - "epoch": 0.91, - "learning_rate": 0.00016314816016613665, - "loss": 0.0457, + "epoch": 0.54, + "learning_rate": 0.0002183377759992771, + "loss": 0.0516, "step": 84350 }, { - "epoch": 0.91, - "learning_rate": 0.0001631319358816276, - "loss": 0.043, + "epoch": 0.54, + "learning_rate": 0.00021832809464492018, + "loss": 0.0547, "step": 84360 }, { - "epoch": 0.91, - "learning_rate": 0.00016311571159711855, - "loss": 0.0424, + "epoch": 0.54, + "learning_rate": 0.00021831841329056324, + "loss": 0.0452, "step": 84370 }, { - "epoch": 0.91, - "learning_rate": 0.0001630994873126095, - "loss": 0.0439, + "epoch": 0.54, + "learning_rate": 0.00021830873193620632, + "loss": 0.0489, "step": 84380 }, { - "epoch": 0.91, - "learning_rate": 0.00016308326302810042, - "loss": 0.0387, + "epoch": 0.54, + "learning_rate": 0.0002182990505818494, + "loss": 0.0506, "step": 84390 }, { - "epoch": 0.91, - "learning_rate": 0.0001630670387435914, - "loss": 0.0446, + "epoch": 0.54, + "learning_rate": 0.00021828936922749245, + "loss": 0.0589, "step": 84400 }, { - "epoch": 0.91, - "learning_rate": 0.00016305081445908232, - "loss": 0.0546, + "epoch": 0.54, + "learning_rate": 0.0002182796878731355, + "loss": 0.0479, "step": 84410 }, { - "epoch": 0.91, - "learning_rate": 0.0001630345901745733, - "loss": 0.042, + "epoch": 0.54, + "learning_rate": 0.00021827000651877858, + "loss": 0.0445, "step": 84420 }, { - "epoch": 0.91, - "learning_rate": 0.00016301836589006422, - "loss": 0.038, + "epoch": 0.54, + "learning_rate": 0.00021826032516442163, + "loss": 0.0492, "step": 84430 }, { - "epoch": 0.91, - "learning_rate": 0.00016300214160555517, - "loss": 0.0416, + "epoch": 0.54, + "learning_rate": 0.00021825064381006471, + "loss": 0.048, "step": 84440 }, { - "epoch": 0.91, - "learning_rate": 0.00016298591732104612, - "loss": 0.0374, + "epoch": 0.55, + "learning_rate": 0.0002182409624557078, + "loss": 0.0515, "step": 84450 }, { - "epoch": 0.91, - "learning_rate": 0.00016296969303653707, - "loss": 0.0408, + "epoch": 0.55, + "learning_rate": 0.00021823128110135087, + "loss": 0.0533, "step": 84460 }, { - "epoch": 0.91, - "learning_rate": 0.000162953468752028, - "loss": 0.0455, + "epoch": 0.55, + "learning_rate": 0.00021822159974699393, + "loss": 0.05, "step": 84470 }, { - "epoch": 0.91, - "learning_rate": 0.00016293724446751897, - "loss": 0.0463, + "epoch": 0.55, + "learning_rate": 0.00021821191839263698, + "loss": 0.0503, "step": 84480 }, { - "epoch": 0.91, - "learning_rate": 0.00016292102018300992, - "loss": 0.0414, + "epoch": 0.55, + "learning_rate": 0.00021820223703828006, + "loss": 0.0515, "step": 84490 }, { - "epoch": 0.91, - "learning_rate": 0.00016290479589850087, - "loss": 0.0425, + "epoch": 0.55, + "learning_rate": 0.0002181925556839231, + "loss": 0.05, "step": 84500 }, { - "epoch": 0.91, - "learning_rate": 0.00016288857161399182, - "loss": 0.0359, + "epoch": 0.55, + "learning_rate": 0.0002181828743295662, + "loss": 0.0513, "step": 84510 }, { - "epoch": 0.91, - "learning_rate": 0.00016287234732948274, - "loss": 0.0411, + "epoch": 0.55, + "learning_rate": 0.00021817319297520927, + "loss": 0.054, "step": 84520 }, { - "epoch": 0.91, - "learning_rate": 0.00016285612304497372, - "loss": 0.0524, + "epoch": 0.55, + "learning_rate": 0.00021816351162085235, + "loss": 0.0498, "step": 84530 }, { - "epoch": 0.91, - "learning_rate": 0.00016283989876046464, - "loss": 0.0507, + "epoch": 0.55, + "learning_rate": 0.0002181538302664954, + "loss": 0.0545, "step": 84540 }, { - "epoch": 0.91, - "learning_rate": 0.00016282367447595562, - "loss": 0.0444, + "epoch": 0.55, + "learning_rate": 0.00021814414891213846, + "loss": 0.048, "step": 84550 }, { - "epoch": 0.91, - "learning_rate": 0.00016280745019144654, - "loss": 0.0473, + "epoch": 0.55, + "learning_rate": 0.00021813446755778154, + "loss": 0.0543, "step": 84560 }, { - "epoch": 0.91, - "learning_rate": 0.00016279122590693752, - "loss": 0.0433, + "epoch": 0.55, + "learning_rate": 0.0002181247862034246, + "loss": 0.0533, "step": 84570 }, { - "epoch": 0.91, - "learning_rate": 0.00016277500162242844, - "loss": 0.0392, + "epoch": 0.55, + "learning_rate": 0.00021811510484906767, + "loss": 0.0518, "step": 84580 }, { - "epoch": 0.91, - "learning_rate": 0.0001627587773379194, - "loss": 0.0447, + "epoch": 0.55, + "learning_rate": 0.00021810542349471075, + "loss": 0.061, "step": 84590 }, { - "epoch": 0.92, - "learning_rate": 0.00016274255305341034, - "loss": 0.0439, + "epoch": 0.55, + "learning_rate": 0.0002180957421403538, + "loss": 0.0457, "step": 84600 }, { - "epoch": 0.92, - "learning_rate": 0.0001627263287689013, - "loss": 0.0355, + "epoch": 0.55, + "learning_rate": 0.00021808606078599688, + "loss": 0.0518, "step": 84610 }, { - "epoch": 0.92, - "learning_rate": 0.0001627101044843922, - "loss": 0.0354, + "epoch": 0.55, + "learning_rate": 0.00021807637943163993, + "loss": 0.0532, "step": 84620 }, { - "epoch": 0.92, - "learning_rate": 0.0001626938801998832, - "loss": 0.0377, + "epoch": 0.55, + "learning_rate": 0.00021806669807728299, + "loss": 0.0514, "step": 84630 }, { - "epoch": 0.92, - "learning_rate": 0.0001626776559153741, - "loss": 0.0363, + "epoch": 0.55, + "learning_rate": 0.00021805701672292607, + "loss": 0.0516, "step": 84640 }, { - "epoch": 0.92, - "learning_rate": 0.0001626614316308651, - "loss": 0.0369, + "epoch": 0.55, + "learning_rate": 0.00021804733536856915, + "loss": 0.0442, "step": 84650 }, { - "epoch": 0.92, - "learning_rate": 0.000162645207346356, - "loss": 0.037, + "epoch": 0.55, + "learning_rate": 0.00021803765401421223, + "loss": 0.0509, "step": 84660 }, { - "epoch": 0.92, - "learning_rate": 0.00016262898306184696, - "loss": 0.0417, + "epoch": 0.55, + "learning_rate": 0.00021802797265985528, + "loss": 0.0482, "step": 84670 }, { - "epoch": 0.92, - "learning_rate": 0.0001626127587773379, - "loss": 0.036, + "epoch": 0.55, + "learning_rate": 0.00021801829130549836, + "loss": 0.0477, "step": 84680 }, { - "epoch": 0.92, - "learning_rate": 0.00016259653449282886, - "loss": 0.0514, + "epoch": 0.55, + "learning_rate": 0.0002180086099511414, + "loss": 0.0531, "step": 84690 }, { - "epoch": 0.92, - "learning_rate": 0.00016258031020831978, - "loss": 0.0442, + "epoch": 0.55, + "learning_rate": 0.00021799892859678446, + "loss": 0.0505, "step": 84700 }, { - "epoch": 0.92, - "learning_rate": 0.00016256408592381076, - "loss": 0.0473, + "epoch": 0.55, + "learning_rate": 0.00021798924724242754, + "loss": 0.0487, "step": 84710 }, { - "epoch": 0.92, - "learning_rate": 0.00016254786163930168, - "loss": 0.0418, + "epoch": 0.55, + "learning_rate": 0.00021797956588807062, + "loss": 0.0457, "step": 84720 }, { - "epoch": 0.92, - "learning_rate": 0.00016253163735479266, - "loss": 0.0437, + "epoch": 0.55, + "learning_rate": 0.0002179698845337137, + "loss": 0.0519, "step": 84730 }, { - "epoch": 0.92, - "learning_rate": 0.00016251541307028358, - "loss": 0.0421, + "epoch": 0.55, + "learning_rate": 0.00021796020317935676, + "loss": 0.0497, "step": 84740 }, { - "epoch": 0.92, - "learning_rate": 0.00016249918878577456, - "loss": 0.0442, + "epoch": 0.55, + "learning_rate": 0.00021795052182499984, + "loss": 0.0474, "step": 84750 }, { - "epoch": 0.92, - "learning_rate": 0.00016248296450126548, - "loss": 0.0424, + "epoch": 0.55, + "learning_rate": 0.0002179408404706429, + "loss": 0.0611, "step": 84760 }, { - "epoch": 0.92, - "learning_rate": 0.00016246674021675643, - "loss": 0.0456, + "epoch": 0.55, + "learning_rate": 0.00021793115911628594, + "loss": 0.0519, "step": 84770 }, { - "epoch": 0.92, - "learning_rate": 0.00016245051593224738, - "loss": 0.0478, + "epoch": 0.55, + "learning_rate": 0.00021792147776192902, + "loss": 0.0521, "step": 84780 }, { - "epoch": 0.92, - "learning_rate": 0.00016243429164773833, - "loss": 0.0435, + "epoch": 0.55, + "learning_rate": 0.0002179117964075721, + "loss": 0.0488, "step": 84790 }, { - "epoch": 0.92, - "learning_rate": 0.00016241806736322926, - "loss": 0.0452, + "epoch": 0.55, + "learning_rate": 0.00021790211505321515, + "loss": 0.049, "step": 84800 }, { - "epoch": 0.92, - "learning_rate": 0.00016240184307872023, - "loss": 0.0403, + "epoch": 0.55, + "learning_rate": 0.00021789243369885823, + "loss": 0.0504, "step": 84810 }, { - "epoch": 0.92, - "learning_rate": 0.00016238561879421115, - "loss": 0.0404, + "epoch": 0.55, + "learning_rate": 0.0002178827523445013, + "loss": 0.0447, "step": 84820 }, { - "epoch": 0.92, - "learning_rate": 0.00016236939450970213, - "loss": 0.0363, + "epoch": 0.55, + "learning_rate": 0.00021787307099014434, + "loss": 0.0485, "step": 84830 }, { - "epoch": 0.92, - "learning_rate": 0.00016235317022519305, - "loss": 0.0425, + "epoch": 0.55, + "learning_rate": 0.00021786338963578742, + "loss": 0.0443, "step": 84840 }, { - "epoch": 0.92, - "learning_rate": 0.000162336945940684, - "loss": 0.0398, + "epoch": 0.55, + "learning_rate": 0.0002178537082814305, + "loss": 0.0549, "step": 84850 }, { - "epoch": 0.92, - "learning_rate": 0.00016232072165617495, - "loss": 0.0453, + "epoch": 0.55, + "learning_rate": 0.00021784402692707358, + "loss": 0.0551, "step": 84860 }, { - "epoch": 0.92, - "learning_rate": 0.0001623044973716659, - "loss": 0.0442, + "epoch": 0.55, + "learning_rate": 0.00021783434557271663, + "loss": 0.0572, "step": 84870 }, { - "epoch": 0.92, - "learning_rate": 0.00016228827308715683, - "loss": 0.0453, + "epoch": 0.55, + "learning_rate": 0.0002178246642183597, + "loss": 0.045, "step": 84880 }, { - "epoch": 0.92, - "learning_rate": 0.0001622720488026478, - "loss": 0.0455, + "epoch": 0.55, + "learning_rate": 0.0002178149828640028, + "loss": 0.0578, "step": 84890 }, { - "epoch": 0.92, - "learning_rate": 0.00016225582451813873, - "loss": 0.0469, + "epoch": 0.55, + "learning_rate": 0.00021780530150964582, + "loss": 0.055, "step": 84900 }, { - "epoch": 0.92, - "learning_rate": 0.0001622396002336297, - "loss": 0.0362, + "epoch": 0.55, + "learning_rate": 0.0002177956201552889, + "loss": 0.0549, "step": 84910 }, { - "epoch": 0.92, - "learning_rate": 0.00016222337594912063, - "loss": 0.041, + "epoch": 0.55, + "learning_rate": 0.00021778593880093197, + "loss": 0.0457, "step": 84920 }, { - "epoch": 0.92, - "learning_rate": 0.0001622071516646116, - "loss": 0.0404, + "epoch": 0.55, + "learning_rate": 0.00021777625744657505, + "loss": 0.0565, "step": 84930 }, { - "epoch": 0.92, - "learning_rate": 0.00016219092738010252, - "loss": 0.0412, + "epoch": 0.55, + "learning_rate": 0.0002177665760922181, + "loss": 0.0468, "step": 84940 }, { - "epoch": 0.92, - "learning_rate": 0.00016217470309559347, - "loss": 0.0463, + "epoch": 0.55, + "learning_rate": 0.0002177568947378612, + "loss": 0.0526, "step": 84950 }, { - "epoch": 0.92, - "learning_rate": 0.00016215847881108442, - "loss": 0.043, + "epoch": 0.55, + "learning_rate": 0.00021774721338350427, + "loss": 0.0502, "step": 84960 }, { - "epoch": 0.92, - "learning_rate": 0.00016214225452657537, - "loss": 0.061, + "epoch": 0.55, + "learning_rate": 0.0002177375320291473, + "loss": 0.0627, "step": 84970 }, { - "epoch": 0.92, - "learning_rate": 0.0001621260302420663, - "loss": 0.0454, + "epoch": 0.55, + "learning_rate": 0.00021772785067479037, + "loss": 0.0537, "step": 84980 }, { - "epoch": 0.92, - "learning_rate": 0.00016210980595755727, - "loss": 0.0409, + "epoch": 0.55, + "learning_rate": 0.00021771816932043345, + "loss": 0.0468, "step": 84990 }, { - "epoch": 0.92, - "learning_rate": 0.0001620935816730482, - "loss": 0.0446, + "epoch": 0.55, + "learning_rate": 0.0002177084879660765, + "loss": 0.0485, "step": 85000 }, { - "epoch": 0.92, - "eval_cer": 0.9211984994902296, - "eval_loss": 0.03149057552218437, - "eval_runtime": 118.9244, - "eval_samples_per_second": 16.817, - "eval_steps_per_second": 4.204, + "epoch": 0.55, + "eval_cer": 0.9199746921251836, + "eval_loss": 0.033818814903497696, + "eval_runtime": 120.0068, + "eval_samples_per_second": 16.666, + "eval_steps_per_second": 4.166, "step": 85000 }, { - "epoch": 0.92, - "learning_rate": 0.00016207735738853917, - "loss": 0.0435, + "epoch": 0.55, + "learning_rate": 0.00021769880661171958, + "loss": 0.0553, "step": 85010 }, { - "epoch": 0.92, - "learning_rate": 0.0001620611331040301, - "loss": 0.0405, + "epoch": 0.55, + "learning_rate": 0.00021768912525736266, + "loss": 0.0487, "step": 85020 }, { - "epoch": 0.92, - "learning_rate": 0.00016204490881952105, - "loss": 0.047, + "epoch": 0.55, + "learning_rate": 0.00021767944390300574, + "loss": 0.0495, "step": 85030 }, { - "epoch": 0.92, - "learning_rate": 0.000162028684535012, - "loss": 0.0429, + "epoch": 0.55, + "learning_rate": 0.00021766976254864877, + "loss": 0.0514, "step": 85040 }, { - "epoch": 0.92, - "learning_rate": 0.00016201246025050295, - "loss": 0.0355, + "epoch": 0.55, + "learning_rate": 0.00021766008119429185, + "loss": 0.0576, "step": 85050 }, { - "epoch": 0.92, - "learning_rate": 0.0001619962359659939, - "loss": 0.047, + "epoch": 0.55, + "learning_rate": 0.00021765039983993493, + "loss": 0.0525, "step": 85060 }, { - "epoch": 0.92, - "learning_rate": 0.00016198001168148484, - "loss": 0.0428, + "epoch": 0.55, + "learning_rate": 0.00021764071848557798, + "loss": 0.0502, "step": 85070 }, { - "epoch": 0.92, - "learning_rate": 0.00016196378739697577, - "loss": 0.0427, + "epoch": 0.55, + "learning_rate": 0.00021763103713122106, + "loss": 0.0519, "step": 85080 }, { - "epoch": 0.92, - "learning_rate": 0.00016194756311246674, - "loss": 0.0446, + "epoch": 0.55, + "learning_rate": 0.00021762135577686414, + "loss": 0.0524, "step": 85090 }, { - "epoch": 0.92, - "learning_rate": 0.00016193133882795767, - "loss": 0.0467, + "epoch": 0.55, + "learning_rate": 0.00021761167442250722, + "loss": 0.0583, "step": 85100 }, { - "epoch": 0.92, - "learning_rate": 0.00016191511454344864, - "loss": 0.0404, + "epoch": 0.55, + "learning_rate": 0.00021760199306815025, + "loss": 0.0433, "step": 85110 }, { - "epoch": 0.92, - "learning_rate": 0.00016189889025893957, - "loss": 0.0444, + "epoch": 0.55, + "learning_rate": 0.00021759231171379333, + "loss": 0.0537, "step": 85120 }, { - "epoch": 0.92, - "learning_rate": 0.00016188266597443052, - "loss": 0.045, + "epoch": 0.55, + "learning_rate": 0.0002175826303594364, + "loss": 0.0552, "step": 85130 }, { - "epoch": 0.92, - "learning_rate": 0.00016186644168992147, - "loss": 0.0426, + "epoch": 0.55, + "learning_rate": 0.00021757294900507946, + "loss": 0.0569, "step": 85140 }, { - "epoch": 0.92, - "learning_rate": 0.00016185021740541242, - "loss": 0.0458, + "epoch": 0.55, + "learning_rate": 0.00021756326765072254, + "loss": 0.0494, "step": 85150 }, { - "epoch": 0.92, - "learning_rate": 0.00016183399312090334, - "loss": 0.0428, + "epoch": 0.55, + "learning_rate": 0.00021755358629636562, + "loss": 0.0748, "step": 85160 }, { - "epoch": 0.92, - "learning_rate": 0.00016181776883639432, - "loss": 0.0441, + "epoch": 0.55, + "learning_rate": 0.00021754390494200867, + "loss": 0.0764, "step": 85170 }, { - "epoch": 0.92, - "learning_rate": 0.00016180154455188524, - "loss": 0.0427, + "epoch": 0.55, + "learning_rate": 0.00021753422358765172, + "loss": 0.0512, "step": 85180 }, { - "epoch": 0.92, - "learning_rate": 0.00016178532026737621, - "loss": 0.0402, + "epoch": 0.55, + "learning_rate": 0.0002175245422332948, + "loss": 0.049, "step": 85190 }, { - "epoch": 0.92, - "learning_rate": 0.00016176909598286714, - "loss": 0.0446, + "epoch": 0.55, + "learning_rate": 0.00021751486087893786, + "loss": 0.054, "step": 85200 }, { - "epoch": 0.92, - "learning_rate": 0.0001617528716983581, - "loss": 0.0469, + "epoch": 0.55, + "learning_rate": 0.00021750517952458094, + "loss": 0.0496, "step": 85210 }, { - "epoch": 0.92, - "learning_rate": 0.00016173664741384904, - "loss": 0.0367, + "epoch": 0.55, + "learning_rate": 0.00021749549817022402, + "loss": 0.0595, "step": 85220 }, { - "epoch": 0.92, - "learning_rate": 0.00016172042312934, - "loss": 0.0384, + "epoch": 0.55, + "learning_rate": 0.0002174858168158671, + "loss": 0.0558, "step": 85230 }, { - "epoch": 0.92, - "learning_rate": 0.00016170419884483094, - "loss": 0.0412, + "epoch": 0.55, + "learning_rate": 0.00021747613546151015, + "loss": 0.0496, "step": 85240 }, { - "epoch": 0.92, - "learning_rate": 0.00016168797456032189, - "loss": 0.0414, + "epoch": 0.55, + "learning_rate": 0.0002174664541071532, + "loss": 0.0486, "step": 85250 }, { - "epoch": 0.92, - "learning_rate": 0.0001616717502758128, - "loss": 0.0398, + "epoch": 0.55, + "learning_rate": 0.00021745677275279628, + "loss": 0.0558, "step": 85260 }, { - "epoch": 0.92, - "learning_rate": 0.00016165552599130379, - "loss": 0.0438, + "epoch": 0.55, + "learning_rate": 0.00021744709139843933, + "loss": 0.0515, "step": 85270 }, { - "epoch": 0.92, - "learning_rate": 0.0001616393017067947, - "loss": 0.0402, + "epoch": 0.55, + "learning_rate": 0.00021743741004408241, + "loss": 0.053, "step": 85280 }, { - "epoch": 0.92, - "learning_rate": 0.00016162307742228569, - "loss": 0.0526, + "epoch": 0.55, + "learning_rate": 0.0002174277286897255, + "loss": 0.0518, "step": 85290 }, { - "epoch": 0.92, - "learning_rate": 0.0001616068531377766, - "loss": 0.0512, + "epoch": 0.55, + "learning_rate": 0.00021741804733536857, + "loss": 0.0567, "step": 85300 }, { - "epoch": 0.92, - "learning_rate": 0.00016159062885326756, - "loss": 0.0449, + "epoch": 0.55, + "learning_rate": 0.00021740836598101163, + "loss": 0.0505, "step": 85310 }, { - "epoch": 0.92, - "learning_rate": 0.0001615744045687585, - "loss": 0.0453, + "epoch": 0.55, + "learning_rate": 0.00021739868462665468, + "loss": 0.0476, "step": 85320 }, { - "epoch": 0.92, - "learning_rate": 0.00016155818028424946, - "loss": 0.0491, + "epoch": 0.55, + "learning_rate": 0.00021738900327229776, + "loss": 0.0489, "step": 85330 }, { - "epoch": 0.92, - "learning_rate": 0.00016154195599974038, - "loss": 0.0425, + "epoch": 0.55, + "learning_rate": 0.0002173793219179408, + "loss": 0.0532, "step": 85340 }, { - "epoch": 0.92, - "learning_rate": 0.00016152573171523136, - "loss": 0.0379, + "epoch": 0.55, + "learning_rate": 0.0002173696405635839, + "loss": 0.0627, "step": 85350 }, { - "epoch": 0.92, - "learning_rate": 0.00016150950743072228, - "loss": 0.0429, + "epoch": 0.55, + "learning_rate": 0.00021735995920922697, + "loss": 0.0552, "step": 85360 }, { - "epoch": 0.92, - "learning_rate": 0.00016149328314621326, - "loss": 0.0494, + "epoch": 0.55, + "learning_rate": 0.00021735027785487002, + "loss": 0.0488, "step": 85370 }, { - "epoch": 0.92, - "learning_rate": 0.00016147705886170418, - "loss": 0.046, + "epoch": 0.55, + "learning_rate": 0.0002173405965005131, + "loss": 0.0508, "step": 85380 }, { - "epoch": 0.92, - "learning_rate": 0.00016146083457719513, - "loss": 0.049, + "epoch": 0.55, + "learning_rate": 0.00021733091514615616, + "loss": 0.0501, "step": 85390 }, { - "epoch": 0.92, - "learning_rate": 0.00016144461029268608, - "loss": 0.0454, + "epoch": 0.55, + "learning_rate": 0.0002173212337917992, + "loss": 0.0459, "step": 85400 }, { - "epoch": 0.92, - "learning_rate": 0.00016142838600817703, - "loss": 0.0418, + "epoch": 0.55, + "learning_rate": 0.0002173115524374423, + "loss": 0.0444, "step": 85410 }, { - "epoch": 0.92, - "learning_rate": 0.00016141216172366798, - "loss": 0.0441, + "epoch": 0.55, + "learning_rate": 0.00021730187108308537, + "loss": 0.0494, "step": 85420 }, { - "epoch": 0.92, - "learning_rate": 0.00016139593743915893, - "loss": 0.0407, + "epoch": 0.55, + "learning_rate": 0.00021729218972872845, + "loss": 0.05, "step": 85430 }, { - "epoch": 0.92, - "learning_rate": 0.00016137971315464985, - "loss": 0.0475, + "epoch": 0.55, + "learning_rate": 0.0002172825083743715, + "loss": 0.0483, "step": 85440 }, { - "epoch": 0.92, - "learning_rate": 0.00016136348887014083, - "loss": 0.0461, + "epoch": 0.55, + "learning_rate": 0.00021727282702001458, + "loss": 0.0509, "step": 85450 }, { - "epoch": 0.92, - "learning_rate": 0.00016134726458563175, - "loss": 0.0481, + "epoch": 0.55, + "learning_rate": 0.00021726314566565763, + "loss": 0.0536, "step": 85460 }, { - "epoch": 0.92, - "learning_rate": 0.00016133104030112273, - "loss": 0.047, + "epoch": 0.55, + "learning_rate": 0.00021725346431130069, + "loss": 0.0496, "step": 85470 }, { - "epoch": 0.92, - "learning_rate": 0.00016131481601661365, - "loss": 0.0523, + "epoch": 0.55, + "learning_rate": 0.00021724378295694377, + "loss": 0.0559, "step": 85480 }, { - "epoch": 0.92, - "learning_rate": 0.0001612985917321046, - "loss": 0.0607, + "epoch": 0.55, + "learning_rate": 0.00021723410160258685, + "loss": 0.0507, "step": 85490 }, { - "epoch": 0.92, - "learning_rate": 0.00016128236744759555, - "loss": 0.0465, + "epoch": 0.55, + "learning_rate": 0.00021722442024822993, + "loss": 0.0461, "step": 85500 }, { - "epoch": 0.92, - "learning_rate": 0.0001612661431630865, - "loss": 0.0466, + "epoch": 0.55, + "learning_rate": 0.00021721473889387298, + "loss": 0.0538, "step": 85510 }, { - "epoch": 0.92, - "learning_rate": 0.00016124991887857742, - "loss": 0.0439, + "epoch": 0.55, + "learning_rate": 0.00021720505753951606, + "loss": 0.0473, "step": 85520 }, { - "epoch": 0.93, - "learning_rate": 0.0001612336945940684, - "loss": 0.048, + "epoch": 0.55, + "learning_rate": 0.0002171953761851591, + "loss": 0.0594, "step": 85530 }, { - "epoch": 0.93, - "learning_rate": 0.00016121747030955932, - "loss": 0.0489, + "epoch": 0.55, + "learning_rate": 0.00021718569483080216, + "loss": 0.0496, "step": 85540 }, { - "epoch": 0.93, - "learning_rate": 0.0001612012460250503, - "loss": 0.0448, + "epoch": 0.55, + "learning_rate": 0.00021717601347644524, + "loss": 0.047, "step": 85550 }, { - "epoch": 0.93, - "learning_rate": 0.00016118502174054122, - "loss": 0.041, + "epoch": 0.55, + "learning_rate": 0.00021716633212208832, + "loss": 0.0606, "step": 85560 }, { - "epoch": 0.93, - "learning_rate": 0.00016116879745603217, - "loss": 0.0405, + "epoch": 0.55, + "learning_rate": 0.00021715665076773138, + "loss": 0.0481, "step": 85570 }, { - "epoch": 0.93, - "learning_rate": 0.00016115257317152312, - "loss": 0.0433, + "epoch": 0.55, + "learning_rate": 0.00021714696941337446, + "loss": 0.0475, "step": 85580 }, { - "epoch": 0.93, - "learning_rate": 0.00016113634888701407, - "loss": 0.0412, + "epoch": 0.55, + "learning_rate": 0.00021713728805901753, + "loss": 0.0449, "step": 85590 }, { - "epoch": 0.93, - "learning_rate": 0.00016112012460250502, - "loss": 0.0473, + "epoch": 0.55, + "learning_rate": 0.00021712760670466056, + "loss": 0.0537, "step": 85600 }, { - "epoch": 0.93, - "learning_rate": 0.00016110390031799597, - "loss": 0.0399, + "epoch": 0.55, + "learning_rate": 0.00021711792535030364, + "loss": 0.0509, "step": 85610 }, { - "epoch": 0.93, - "learning_rate": 0.0001610876760334869, - "loss": 0.0428, + "epoch": 0.55, + "learning_rate": 0.00021710824399594672, + "loss": 0.0452, "step": 85620 }, { - "epoch": 0.93, - "learning_rate": 0.00016107145174897787, - "loss": 0.0406, + "epoch": 0.55, + "learning_rate": 0.0002170985626415898, + "loss": 0.0518, "step": 85630 }, { - "epoch": 0.93, - "learning_rate": 0.0001610552274644688, - "loss": 0.0512, + "epoch": 0.55, + "learning_rate": 0.00021708888128723285, + "loss": 0.047, "step": 85640 }, { - "epoch": 0.93, - "learning_rate": 0.00016103900317995977, - "loss": 0.0396, + "epoch": 0.55, + "learning_rate": 0.00021707919993287593, + "loss": 0.0594, "step": 85650 }, { - "epoch": 0.93, - "learning_rate": 0.0001610227788954507, - "loss": 0.0429, + "epoch": 0.55, + "learning_rate": 0.000217069518578519, + "loss": 0.0538, "step": 85660 }, { - "epoch": 0.93, - "learning_rate": 0.00016100655461094164, - "loss": 0.0466, + "epoch": 0.55, + "learning_rate": 0.00021705983722416204, + "loss": 0.0504, "step": 85670 }, { - "epoch": 0.93, - "learning_rate": 0.0001609903303264326, - "loss": 0.0436, + "epoch": 0.55, + "learning_rate": 0.00021705015586980512, + "loss": 0.0524, "step": 85680 }, { - "epoch": 0.93, - "learning_rate": 0.00016097410604192354, - "loss": 0.0479, + "epoch": 0.55, + "learning_rate": 0.0002170404745154482, + "loss": 0.0551, "step": 85690 }, { - "epoch": 0.93, - "learning_rate": 0.00016095788175741446, - "loss": 0.0453, + "epoch": 0.55, + "learning_rate": 0.00021703079316109128, + "loss": 0.0479, "step": 85700 }, { - "epoch": 0.93, - "learning_rate": 0.00016094165747290544, - "loss": 0.0403, + "epoch": 0.55, + "learning_rate": 0.00021702111180673433, + "loss": 0.0482, "step": 85710 }, { - "epoch": 0.93, - "learning_rate": 0.00016092543318839636, - "loss": 0.0439, + "epoch": 0.55, + "learning_rate": 0.0002170114304523774, + "loss": 0.0489, "step": 85720 }, { - "epoch": 0.93, - "learning_rate": 0.00016090920890388734, - "loss": 0.0492, + "epoch": 0.55, + "learning_rate": 0.0002170017490980205, + "loss": 0.0482, "step": 85730 }, { - "epoch": 0.93, - "learning_rate": 0.00016089298461937826, - "loss": 0.0428, + "epoch": 0.55, + "learning_rate": 0.00021699206774366351, + "loss": 0.0493, "step": 85740 }, { - "epoch": 0.93, - "learning_rate": 0.00016087676033486924, - "loss": 0.0358, + "epoch": 0.55, + "learning_rate": 0.0002169823863893066, + "loss": 0.05, "step": 85750 }, { - "epoch": 0.93, - "learning_rate": 0.00016086053605036016, - "loss": 0.0464, + "epoch": 0.55, + "learning_rate": 0.00021697270503494967, + "loss": 0.0474, "step": 85760 }, { - "epoch": 0.93, - "learning_rate": 0.0001608443117658511, - "loss": 0.0452, + "epoch": 0.55, + "learning_rate": 0.00021696302368059273, + "loss": 0.0458, "step": 85770 }, { - "epoch": 0.93, - "learning_rate": 0.00016082808748134206, - "loss": 0.0399, + "epoch": 0.55, + "learning_rate": 0.0002169533423262358, + "loss": 0.052, "step": 85780 }, { - "epoch": 0.93, - "learning_rate": 0.000160811863196833, - "loss": 0.0399, + "epoch": 0.55, + "learning_rate": 0.0002169436609718789, + "loss": 0.0481, "step": 85790 }, { - "epoch": 0.93, - "learning_rate": 0.00016079563891232393, - "loss": 0.0427, + "epoch": 0.55, + "learning_rate": 0.00021693397961752197, + "loss": 0.0524, "step": 85800 }, { - "epoch": 0.93, - "learning_rate": 0.0001607794146278149, - "loss": 0.0457, + "epoch": 0.55, + "learning_rate": 0.000216924298263165, + "loss": 0.0546, "step": 85810 }, { - "epoch": 0.93, - "learning_rate": 0.00016076319034330583, - "loss": 0.036, + "epoch": 0.55, + "learning_rate": 0.00021691461690880807, + "loss": 0.0483, "step": 85820 }, { - "epoch": 0.93, - "learning_rate": 0.0001607469660587968, - "loss": 0.0448, + "epoch": 0.55, + "learning_rate": 0.00021690493555445115, + "loss": 0.0513, "step": 85830 }, { - "epoch": 0.93, - "learning_rate": 0.00016073074177428773, - "loss": 0.0411, + "epoch": 0.55, + "learning_rate": 0.0002168952542000942, + "loss": 0.0491, "step": 85840 }, { - "epoch": 0.93, - "learning_rate": 0.00016071451748977868, - "loss": 0.0413, + "epoch": 0.55, + "learning_rate": 0.00021688557284573728, + "loss": 0.0507, "step": 85850 }, { - "epoch": 0.93, - "learning_rate": 0.00016069829320526963, - "loss": 0.0465, + "epoch": 0.55, + "learning_rate": 0.00021687589149138036, + "loss": 0.0519, "step": 85860 }, { - "epoch": 0.93, - "learning_rate": 0.00016068206892076058, - "loss": 0.0438, + "epoch": 0.55, + "learning_rate": 0.00021686621013702344, + "loss": 0.0507, "step": 85870 }, { - "epoch": 0.93, - "learning_rate": 0.0001606658446362515, - "loss": 0.0421, + "epoch": 0.55, + "learning_rate": 0.00021685652878266647, + "loss": 0.0459, "step": 85880 }, { - "epoch": 0.93, - "learning_rate": 0.00016064962035174248, - "loss": 0.0417, + "epoch": 0.55, + "learning_rate": 0.00021684684742830955, + "loss": 0.059, "step": 85890 }, { - "epoch": 0.93, - "learning_rate": 0.0001606333960672334, - "loss": 0.0388, + "epoch": 0.55, + "learning_rate": 0.00021683716607395263, + "loss": 0.0446, "step": 85900 }, { - "epoch": 0.93, - "learning_rate": 0.00016061717178272438, - "loss": 0.0411, + "epoch": 0.55, + "learning_rate": 0.00021682748471959568, + "loss": 0.0495, "step": 85910 }, { - "epoch": 0.93, - "learning_rate": 0.0001606009474982153, - "loss": 0.0428, + "epoch": 0.55, + "learning_rate": 0.00021681780336523876, + "loss": 0.0519, "step": 85920 }, { - "epoch": 0.93, - "learning_rate": 0.00016058472321370628, - "loss": 0.0384, + "epoch": 0.55, + "learning_rate": 0.00021680812201088184, + "loss": 0.0582, "step": 85930 }, { - "epoch": 0.93, - "learning_rate": 0.0001605684989291972, - "loss": 0.0395, + "epoch": 0.55, + "learning_rate": 0.00021679844065652492, + "loss": 0.0511, "step": 85940 }, { - "epoch": 0.93, - "learning_rate": 0.00016055227464468815, - "loss": 0.0406, + "epoch": 0.55, + "learning_rate": 0.00021678875930216795, + "loss": 0.0464, "step": 85950 }, { - "epoch": 0.93, - "learning_rate": 0.0001605360503601791, - "loss": 0.0415, + "epoch": 0.55, + "learning_rate": 0.00021677907794781103, + "loss": 0.048, "step": 85960 }, { - "epoch": 0.93, - "learning_rate": 0.00016051982607567005, - "loss": 0.0529, + "epoch": 0.55, + "learning_rate": 0.00021676939659345408, + "loss": 0.0539, "step": 85970 }, { - "epoch": 0.93, - "learning_rate": 0.00016050360179116098, - "loss": 0.0458, + "epoch": 0.55, + "learning_rate": 0.00021675971523909716, + "loss": 0.0509, "step": 85980 }, { - "epoch": 0.93, - "learning_rate": 0.00016048737750665195, - "loss": 0.0512, + "epoch": 0.55, + "learning_rate": 0.00021675003388474024, + "loss": 0.0466, "step": 85990 }, { - "epoch": 0.93, - "learning_rate": 0.00016047115322214288, - "loss": 0.0532, + "epoch": 0.56, + "learning_rate": 0.00021674035253038332, + "loss": 0.0489, "step": 86000 }, { - "epoch": 0.93, - "eval_cer": 0.9211993829745504, - "eval_loss": 0.030498242005705833, - "eval_runtime": 118.8053, - "eval_samples_per_second": 16.834, - "eval_steps_per_second": 4.209, + "epoch": 0.56, + "eval_cer": 0.9199322110495989, + "eval_loss": 0.03454515337944031, + "eval_runtime": 120.4354, + "eval_samples_per_second": 16.606, + "eval_steps_per_second": 4.152, "step": 86000 }, { - "epoch": 0.93, - "learning_rate": 0.00016045492893763385, - "loss": 0.0428, + "epoch": 0.56, + "learning_rate": 0.00021673067117602637, + "loss": 0.0495, "step": 86010 }, { - "epoch": 0.93, - "learning_rate": 0.00016043870465312477, - "loss": 0.0552, + "epoch": 0.56, + "learning_rate": 0.00021672098982166942, + "loss": 0.0477, "step": 86020 }, { - "epoch": 0.93, - "learning_rate": 0.00016042248036861572, - "loss": 0.044, + "epoch": 0.56, + "learning_rate": 0.0002167113084673125, + "loss": 0.0555, "step": 86030 }, { - "epoch": 0.93, - "learning_rate": 0.00016040625608410667, - "loss": 0.0458, + "epoch": 0.56, + "learning_rate": 0.00021670162711295556, + "loss": 0.0603, "step": 86040 }, { - "epoch": 0.93, - "learning_rate": 0.00016039003179959762, + "epoch": 0.56, + "learning_rate": 0.00021669194575859864, "loss": 0.049, "step": 86050 }, { - "epoch": 0.93, - "learning_rate": 0.00016037380751508855, - "loss": 0.0477, + "epoch": 0.56, + "learning_rate": 0.00021668226440424172, + "loss": 0.0533, "step": 86060 }, { - "epoch": 0.93, - "learning_rate": 0.00016035758323057952, - "loss": 0.0386, + "epoch": 0.56, + "learning_rate": 0.0002166725830498848, + "loss": 0.0547, "step": 86070 }, { - "epoch": 0.93, - "learning_rate": 0.00016034135894607045, - "loss": 0.0343, + "epoch": 0.56, + "learning_rate": 0.00021666290169552782, + "loss": 0.0583, "step": 86080 }, { - "epoch": 0.93, - "learning_rate": 0.00016032513466156142, - "loss": 0.0439, + "epoch": 0.56, + "learning_rate": 0.0002166532203411709, + "loss": 0.0493, "step": 86090 }, { - "epoch": 0.93, - "learning_rate": 0.00016030891037705235, - "loss": 0.0425, + "epoch": 0.56, + "learning_rate": 0.00021664353898681398, + "loss": 0.0558, "step": 86100 }, { - "epoch": 0.93, - "learning_rate": 0.00016029268609254332, - "loss": 0.0393, + "epoch": 0.56, + "learning_rate": 0.00021663385763245703, + "loss": 0.0515, "step": 86110 }, { - "epoch": 0.93, - "learning_rate": 0.00016027646180803425, - "loss": 0.0418, + "epoch": 0.56, + "learning_rate": 0.0002166241762781001, + "loss": 0.0532, "step": 86120 }, { - "epoch": 0.93, - "learning_rate": 0.0001602602375235252, - "loss": 0.0421, + "epoch": 0.56, + "learning_rate": 0.0002166144949237432, + "loss": 0.0486, "step": 86130 }, { - "epoch": 0.93, - "learning_rate": 0.00016024401323901614, - "loss": 0.0399, + "epoch": 0.56, + "learning_rate": 0.00021660481356938627, + "loss": 0.0521, "step": 86140 }, { - "epoch": 0.93, - "learning_rate": 0.0001602277889545071, - "loss": 0.0447, + "epoch": 0.56, + "learning_rate": 0.0002165951322150293, + "loss": 0.0427, "step": 86150 }, { - "epoch": 0.93, - "learning_rate": 0.00016021156466999802, - "loss": 0.0409, + "epoch": 0.56, + "learning_rate": 0.00021658545086067238, + "loss": 0.0454, "step": 86160 }, { - "epoch": 0.93, - "learning_rate": 0.000160195340385489, - "loss": 0.0484, + "epoch": 0.56, + "learning_rate": 0.00021657576950631543, + "loss": 0.049, "step": 86170 }, { - "epoch": 0.93, - "learning_rate": 0.00016017911610097992, - "loss": 0.0488, + "epoch": 0.56, + "learning_rate": 0.0002165660881519585, + "loss": 0.052, "step": 86180 }, { - "epoch": 0.93, - "learning_rate": 0.0001601628918164709, - "loss": 0.0447, + "epoch": 0.56, + "learning_rate": 0.0002165564067976016, + "loss": 0.0552, "step": 86190 }, { - "epoch": 0.93, - "learning_rate": 0.00016014666753196182, - "loss": 0.045, + "epoch": 0.56, + "learning_rate": 0.00021654672544324467, + "loss": 0.0474, "step": 86200 }, { - "epoch": 0.93, - "learning_rate": 0.00016013044324745277, - "loss": 0.0446, + "epoch": 0.56, + "learning_rate": 0.00021653704408888772, + "loss": 0.0553, "step": 86210 }, { - "epoch": 0.93, - "learning_rate": 0.00016011421896294372, - "loss": 0.0392, + "epoch": 0.56, + "learning_rate": 0.00021652736273453078, + "loss": 0.0538, "step": 86220 }, { - "epoch": 0.93, - "learning_rate": 0.00016009799467843467, - "loss": 0.0395, + "epoch": 0.56, + "learning_rate": 0.00021651768138017386, + "loss": 0.0544, "step": 86230 }, { - "epoch": 0.93, - "learning_rate": 0.0001600817703939256, - "loss": 0.0443, + "epoch": 0.56, + "learning_rate": 0.0002165080000258169, + "loss": 0.0511, "step": 86240 }, { - "epoch": 0.93, - "learning_rate": 0.00016006554610941657, - "loss": 0.0468, + "epoch": 0.56, + "learning_rate": 0.00021649831867146, + "loss": 0.05, "step": 86250 }, { - "epoch": 0.93, - "learning_rate": 0.0001600493218249075, - "loss": 0.0506, + "epoch": 0.56, + "learning_rate": 0.00021648863731710307, + "loss": 0.0489, "step": 86260 }, { - "epoch": 0.93, - "learning_rate": 0.00016003309754039846, - "loss": 0.0437, + "epoch": 0.56, + "learning_rate": 0.00021647895596274615, + "loss": 0.05, "step": 86270 }, { - "epoch": 0.93, - "learning_rate": 0.0001600168732558894, - "loss": 0.0395, + "epoch": 0.56, + "learning_rate": 0.0002164692746083892, + "loss": 0.0531, "step": 86280 }, { - "epoch": 0.93, - "learning_rate": 0.00016000064897138036, - "loss": 0.0386, + "epoch": 0.56, + "learning_rate": 0.00021645959325403225, + "loss": 0.0489, "step": 86290 }, { - "epoch": 0.93, - "learning_rate": 0.0001599844246868713, - "loss": 0.0426, + "epoch": 0.56, + "learning_rate": 0.00021644991189967533, + "loss": 0.0526, "step": 86300 }, { - "epoch": 0.93, - "learning_rate": 0.00015996820040236224, - "loss": 0.0403, + "epoch": 0.56, + "learning_rate": 0.00021644023054531839, + "loss": 0.0482, "step": 86310 }, { - "epoch": 0.93, - "learning_rate": 0.0001599519761178532, - "loss": 0.0446, + "epoch": 0.56, + "learning_rate": 0.00021643054919096147, + "loss": 0.0488, "step": 86320 }, { - "epoch": 0.93, - "learning_rate": 0.00015993575183334414, - "loss": 0.038, + "epoch": 0.56, + "learning_rate": 0.00021642086783660455, + "loss": 0.0475, "step": 86330 }, { - "epoch": 0.93, - "learning_rate": 0.00015991952754883506, - "loss": 0.0392, + "epoch": 0.56, + "learning_rate": 0.00021641118648224762, + "loss": 0.0588, "step": 86340 }, { - "epoch": 0.93, - "learning_rate": 0.00015990330326432604, - "loss": 0.0434, + "epoch": 0.56, + "learning_rate": 0.00021640150512789068, + "loss": 0.0484, "step": 86350 }, { - "epoch": 0.93, - "learning_rate": 0.00015988707897981696, - "loss": 0.0476, + "epoch": 0.56, + "learning_rate": 0.00021639182377353373, + "loss": 0.0564, "step": 86360 }, { - "epoch": 0.93, - "learning_rate": 0.00015987085469530794, - "loss": 0.0442, + "epoch": 0.56, + "learning_rate": 0.00021638214241917678, + "loss": 0.0518, "step": 86370 }, { - "epoch": 0.93, - "learning_rate": 0.00015985463041079886, - "loss": 0.0369, + "epoch": 0.56, + "learning_rate": 0.00021637246106481986, + "loss": 0.0489, "step": 86380 }, { - "epoch": 0.93, - "learning_rate": 0.0001598384061262898, - "loss": 0.0419, + "epoch": 0.56, + "learning_rate": 0.00021636277971046294, + "loss": 0.0516, "step": 86390 }, { - "epoch": 0.93, - "learning_rate": 0.00015982218184178076, - "loss": 0.04, + "epoch": 0.56, + "learning_rate": 0.00021635309835610602, + "loss": 0.0605, "step": 86400 }, { - "epoch": 0.93, - "learning_rate": 0.0001598059575572717, - "loss": 0.0449, + "epoch": 0.56, + "learning_rate": 0.00021634341700174907, + "loss": 0.0553, "step": 86410 }, { - "epoch": 0.93, - "learning_rate": 0.00015978973327276263, - "loss": 0.0436, + "epoch": 0.56, + "learning_rate": 0.00021633373564739215, + "loss": 0.0513, "step": 86420 }, { - "epoch": 0.93, - "learning_rate": 0.0001597735089882536, - "loss": 0.051, + "epoch": 0.56, + "learning_rate": 0.0002163240542930352, + "loss": 0.0614, "step": 86430 }, { - "epoch": 0.93, - "learning_rate": 0.00015975728470374453, - "loss": 0.0351, + "epoch": 0.56, + "learning_rate": 0.00021631437293867826, + "loss": 0.05, "step": 86440 }, { - "epoch": 0.94, - "learning_rate": 0.0001597410604192355, - "loss": 0.0393, + "epoch": 0.56, + "learning_rate": 0.00021630469158432134, + "loss": 0.0498, "step": 86450 }, { - "epoch": 0.94, - "learning_rate": 0.00015972483613472643, - "loss": 0.0425, + "epoch": 0.56, + "learning_rate": 0.00021629501022996442, + "loss": 0.0491, "step": 86460 }, { - "epoch": 0.94, - "learning_rate": 0.0001597086118502174, - "loss": 0.0418, + "epoch": 0.56, + "learning_rate": 0.0002162853288756075, + "loss": 0.048, "step": 86470 }, { - "epoch": 0.94, - "learning_rate": 0.00015969238756570833, - "loss": 0.0341, + "epoch": 0.56, + "learning_rate": 0.00021627564752125055, + "loss": 0.046, "step": 86480 }, { - "epoch": 0.94, - "learning_rate": 0.00015967616328119928, - "loss": 0.0463, + "epoch": 0.56, + "learning_rate": 0.00021626596616689363, + "loss": 0.0525, "step": 86490 }, { - "epoch": 0.94, - "learning_rate": 0.00015965993899669023, - "loss": 0.0427, + "epoch": 0.56, + "learning_rate": 0.00021625628481253668, + "loss": 0.0489, "step": 86500 }, { - "epoch": 0.94, - "learning_rate": 0.00015964371471218118, - "loss": 0.0428, + "epoch": 0.56, + "learning_rate": 0.00021624660345817974, + "loss": 0.0513, "step": 86510 }, { - "epoch": 0.94, - "learning_rate": 0.0001596274904276721, - "loss": 0.0372, + "epoch": 0.56, + "learning_rate": 0.00021623692210382282, + "loss": 0.0522, "step": 86520 }, { - "epoch": 0.94, - "learning_rate": 0.00015961126614316308, - "loss": 0.0445, + "epoch": 0.56, + "learning_rate": 0.0002162272407494659, + "loss": 0.0497, "step": 86530 }, { - "epoch": 0.94, - "learning_rate": 0.000159595041858654, - "loss": 0.046, + "epoch": 0.56, + "learning_rate": 0.00021621755939510898, + "loss": 0.0504, "step": 86540 }, { - "epoch": 0.94, - "learning_rate": 0.00015957881757414498, - "loss": 0.0404, + "epoch": 0.56, + "learning_rate": 0.00021620787804075203, + "loss": 0.0493, "step": 86550 }, { - "epoch": 0.94, - "learning_rate": 0.0001595625932896359, - "loss": 0.0452, + "epoch": 0.56, + "learning_rate": 0.0002161981966863951, + "loss": 0.0474, "step": 86560 }, { - "epoch": 0.94, - "learning_rate": 0.00015954636900512685, - "loss": 0.0428, + "epoch": 0.56, + "learning_rate": 0.00021618851533203813, + "loss": 0.0484, "step": 86570 }, { - "epoch": 0.94, - "learning_rate": 0.0001595301447206178, - "loss": 0.036, + "epoch": 0.56, + "learning_rate": 0.00021617883397768121, + "loss": 0.0512, "step": 86580 }, { - "epoch": 0.94, - "learning_rate": 0.00015951392043610875, - "loss": 0.0404, + "epoch": 0.56, + "learning_rate": 0.0002161691526233243, + "loss": 0.0484, "step": 86590 }, { - "epoch": 0.94, - "learning_rate": 0.0001594976961515997, - "loss": 0.0381, + "epoch": 0.56, + "learning_rate": 0.00021615947126896737, + "loss": 0.0402, "step": 86600 }, { - "epoch": 0.94, - "learning_rate": 0.00015948147186709065, - "loss": 0.0439, + "epoch": 0.56, + "learning_rate": 0.00021614978991461043, + "loss": 0.0515, "step": 86610 }, { - "epoch": 0.94, - "learning_rate": 0.00015946524758258157, - "loss": 0.0409, + "epoch": 0.56, + "learning_rate": 0.0002161401085602535, + "loss": 0.0487, "step": 86620 }, { - "epoch": 0.94, - "learning_rate": 0.00015944902329807255, - "loss": 0.0418, + "epoch": 0.56, + "learning_rate": 0.00021613042720589659, + "loss": 0.0471, "step": 86630 }, { - "epoch": 0.94, - "learning_rate": 0.00015943279901356347, - "loss": 0.0421, + "epoch": 0.56, + "learning_rate": 0.0002161207458515396, + "loss": 0.048, "step": 86640 }, { - "epoch": 0.94, - "learning_rate": 0.00015941657472905445, - "loss": 0.0397, + "epoch": 0.56, + "learning_rate": 0.0002161110644971827, + "loss": 0.0538, "step": 86650 }, { - "epoch": 0.94, - "learning_rate": 0.00015940035044454537, - "loss": 0.0451, + "epoch": 0.56, + "learning_rate": 0.00021610138314282577, + "loss": 0.0447, "step": 86660 }, { - "epoch": 0.94, - "learning_rate": 0.00015938412616003632, - "loss": 0.0373, + "epoch": 0.56, + "learning_rate": 0.00021609170178846885, + "loss": 0.0562, "step": 86670 }, { - "epoch": 0.94, - "learning_rate": 0.00015936790187552727, - "loss": 0.0365, + "epoch": 0.56, + "learning_rate": 0.0002160820204341119, + "loss": 0.0494, "step": 86680 }, { - "epoch": 0.94, - "learning_rate": 0.00015935167759101822, - "loss": 0.0391, + "epoch": 0.56, + "learning_rate": 0.00021607233907975498, + "loss": 0.0509, "step": 86690 }, { - "epoch": 0.94, - "learning_rate": 0.00015933545330650914, - "loss": 0.0372, + "epoch": 0.56, + "learning_rate": 0.00021606265772539806, + "loss": 0.0541, "step": 86700 }, { - "epoch": 0.94, - "learning_rate": 0.00015931922902200012, - "loss": 0.0391, + "epoch": 0.56, + "learning_rate": 0.0002160529763710411, + "loss": 0.0454, "step": 86710 }, { - "epoch": 0.94, - "learning_rate": 0.00015930300473749104, - "loss": 0.0453, + "epoch": 0.56, + "learning_rate": 0.00021604329501668417, + "loss": 0.054, "step": 86720 }, { - "epoch": 0.94, - "learning_rate": 0.00015928678045298202, - "loss": 0.051, + "epoch": 0.56, + "learning_rate": 0.00021603361366232725, + "loss": 0.0613, "step": 86730 }, { - "epoch": 0.94, - "learning_rate": 0.00015927055616847294, - "loss": 0.048, + "epoch": 0.56, + "learning_rate": 0.00021602393230797033, + "loss": 0.0486, "step": 86740 }, { - "epoch": 0.94, - "learning_rate": 0.0001592543318839639, - "loss": 0.0381, + "epoch": 0.56, + "learning_rate": 0.00021601425095361338, + "loss": 0.0711, "step": 86750 }, { - "epoch": 0.94, - "learning_rate": 0.00015923810759945484, - "loss": 0.0482, + "epoch": 0.56, + "learning_rate": 0.00021600456959925646, + "loss": 0.0554, "step": 86760 }, { - "epoch": 0.94, - "learning_rate": 0.0001592218833149458, - "loss": 0.0479, + "epoch": 0.56, + "learning_rate": 0.00021599488824489954, + "loss": 0.049, "step": 86770 }, { - "epoch": 0.94, - "learning_rate": 0.00015920565903043674, - "loss": 0.039, + "epoch": 0.56, + "learning_rate": 0.00021598520689054257, + "loss": 0.0465, "step": 86780 }, { - "epoch": 0.94, - "learning_rate": 0.0001591894347459277, - "loss": 0.0391, + "epoch": 0.56, + "learning_rate": 0.00021597552553618565, + "loss": 0.0499, "step": 86790 }, { - "epoch": 0.94, - "learning_rate": 0.0001591732104614186, - "loss": 0.043, + "epoch": 0.56, + "learning_rate": 0.00021596584418182873, + "loss": 0.0487, "step": 86800 }, { - "epoch": 0.94, - "learning_rate": 0.0001591569861769096, - "loss": 0.0427, + "epoch": 0.56, + "learning_rate": 0.00021595616282747178, + "loss": 0.0516, "step": 86810 }, { - "epoch": 0.94, - "learning_rate": 0.0001591407618924005, - "loss": 0.0443, + "epoch": 0.56, + "learning_rate": 0.00021594648147311486, + "loss": 0.0486, "step": 86820 }, { - "epoch": 0.94, - "learning_rate": 0.0001591245376078915, - "loss": 0.0507, + "epoch": 0.56, + "learning_rate": 0.00021593680011875794, + "loss": 0.0545, "step": 86830 }, { - "epoch": 0.94, - "learning_rate": 0.00015910831332338244, - "loss": 0.045, + "epoch": 0.56, + "learning_rate": 0.00021592711876440102, + "loss": 0.0491, "step": 86840 }, { - "epoch": 0.94, - "learning_rate": 0.00015909208903887336, - "loss": 0.0401, + "epoch": 0.56, + "learning_rate": 0.00021591743741004404, + "loss": 0.057, "step": 86850 }, { - "epoch": 0.94, - "learning_rate": 0.00015907586475436434, - "loss": 0.0475, + "epoch": 0.56, + "learning_rate": 0.00021590775605568712, + "loss": 0.0519, "step": 86860 }, { - "epoch": 0.94, - "learning_rate": 0.00015905964046985526, - "loss": 0.0472, + "epoch": 0.56, + "learning_rate": 0.0002158980747013302, + "loss": 0.0481, "step": 86870 }, { - "epoch": 0.94, - "learning_rate": 0.00015904341618534624, - "loss": 0.0452, + "epoch": 0.56, + "learning_rate": 0.00021588839334697326, + "loss": 0.055, "step": 86880 }, { - "epoch": 0.94, - "learning_rate": 0.00015902719190083716, - "loss": 0.0388, + "epoch": 0.56, + "learning_rate": 0.00021587871199261634, + "loss": 0.0504, "step": 86890 }, { - "epoch": 0.94, - "learning_rate": 0.0001590109676163281, - "loss": 0.0373, + "epoch": 0.56, + "learning_rate": 0.00021586903063825942, + "loss": 0.0538, "step": 86900 }, { - "epoch": 0.94, - "learning_rate": 0.00015899474333181906, - "loss": 0.0382, + "epoch": 0.56, + "learning_rate": 0.0002158593492839025, + "loss": 0.0548, "step": 86910 }, { - "epoch": 0.94, - "learning_rate": 0.00015897851904731, - "loss": 0.0479, + "epoch": 0.56, + "learning_rate": 0.00021584966792954552, + "loss": 0.0528, "step": 86920 }, { - "epoch": 0.94, - "learning_rate": 0.00015896229476280093, - "loss": 0.0445, + "epoch": 0.56, + "learning_rate": 0.0002158399865751886, + "loss": 0.0525, "step": 86930 }, { - "epoch": 0.94, - "learning_rate": 0.0001589460704782919, - "loss": 0.0472, + "epoch": 0.56, + "learning_rate": 0.00021583030522083168, + "loss": 0.0494, "step": 86940 }, { - "epoch": 0.94, - "learning_rate": 0.00015892984619378283, - "loss": 0.0401, + "epoch": 0.56, + "learning_rate": 0.00021582062386647473, + "loss": 0.049, "step": 86950 }, { - "epoch": 0.94, - "learning_rate": 0.0001589136219092738, - "loss": 0.0474, + "epoch": 0.56, + "learning_rate": 0.0002158109425121178, + "loss": 0.048, "step": 86960 }, { - "epoch": 0.94, - "learning_rate": 0.00015889739762476473, - "loss": 0.045, + "epoch": 0.56, + "learning_rate": 0.0002158012611577609, + "loss": 0.0422, "step": 86970 }, { - "epoch": 0.94, - "learning_rate": 0.0001588811733402557, - "loss": 0.0465, + "epoch": 0.56, + "learning_rate": 0.00021579157980340395, + "loss": 0.051, "step": 86980 }, { - "epoch": 0.94, - "learning_rate": 0.00015886494905574663, - "loss": 0.0388, + "epoch": 0.56, + "learning_rate": 0.000215781898449047, + "loss": 0.051, "step": 86990 }, { - "epoch": 0.94, - "learning_rate": 0.00015884872477123758, - "loss": 0.052, + "epoch": 0.56, + "learning_rate": 0.00021577221709469008, + "loss": 0.0473, "step": 87000 }, { - "epoch": 0.94, - "eval_cer": 0.9212479746121945, - "eval_loss": 0.030459340661764145, - "eval_runtime": 118.9439, - "eval_samples_per_second": 16.815, - "eval_steps_per_second": 4.204, + "epoch": 0.56, + "eval_cer": 0.9200949045305615, + "eval_loss": 0.033820219337940216, + "eval_runtime": 119.8564, + "eval_samples_per_second": 16.687, + "eval_steps_per_second": 4.172, "step": 87000 }, { - "epoch": 0.94, - "learning_rate": 0.00015883250048672853, - "loss": 0.0433, + "epoch": 0.56, + "learning_rate": 0.00021576253574033313, + "loss": 0.0527, "step": 87010 }, { - "epoch": 0.94, - "learning_rate": 0.00015881627620221948, - "loss": 0.0428, + "epoch": 0.56, + "learning_rate": 0.0002157528543859762, + "loss": 0.0451, "step": 87020 }, { - "epoch": 0.94, - "learning_rate": 0.0001588000519177104, - "loss": 0.0387, + "epoch": 0.56, + "learning_rate": 0.0002157431730316193, + "loss": 0.0548, "step": 87030 }, { - "epoch": 0.94, - "learning_rate": 0.00015878382763320138, - "loss": 0.0426, + "epoch": 0.56, + "learning_rate": 0.00021573349167726237, + "loss": 0.0487, "step": 87040 }, { - "epoch": 0.94, - "learning_rate": 0.0001587676033486923, - "loss": 0.0426, + "epoch": 0.56, + "learning_rate": 0.00021572381032290542, + "loss": 0.0535, "step": 87050 }, { - "epoch": 0.94, - "learning_rate": 0.00015875137906418328, - "loss": 0.0441, + "epoch": 0.56, + "learning_rate": 0.00021571412896854848, + "loss": 0.0517, "step": 87060 }, { - "epoch": 0.94, - "learning_rate": 0.0001587351547796742, - "loss": 0.0448, + "epoch": 0.56, + "learning_rate": 0.00021570444761419156, + "loss": 0.0513, "step": 87070 }, { - "epoch": 0.94, - "learning_rate": 0.00015871893049516515, - "loss": 0.0362, + "epoch": 0.56, + "learning_rate": 0.0002156947662598346, + "loss": 0.056, "step": 87080 }, { - "epoch": 0.94, - "learning_rate": 0.0001587027062106561, - "loss": 0.0395, + "epoch": 0.56, + "learning_rate": 0.0002156850849054777, + "loss": 0.0534, "step": 87090 }, { - "epoch": 0.94, - "learning_rate": 0.00015868648192614705, - "loss": 0.0561, + "epoch": 0.56, + "learning_rate": 0.00021567540355112077, + "loss": 0.0483, "step": 87100 }, { - "epoch": 0.94, - "learning_rate": 0.00015867025764163797, - "loss": 0.0473, + "epoch": 0.56, + "learning_rate": 0.00021566572219676385, + "loss": 0.0455, "step": 87110 }, { - "epoch": 0.94, - "learning_rate": 0.00015865403335712895, - "loss": 0.0526, + "epoch": 0.56, + "learning_rate": 0.0002156560408424069, + "loss": 0.0572, "step": 87120 }, { - "epoch": 0.94, - "learning_rate": 0.00015863780907261987, - "loss": 0.0415, + "epoch": 0.56, + "learning_rate": 0.00021564635948804995, + "loss": 0.0582, "step": 87130 }, { - "epoch": 0.94, - "learning_rate": 0.00015862158478811085, - "loss": 0.0418, + "epoch": 0.56, + "learning_rate": 0.00021563667813369303, + "loss": 0.0464, "step": 87140 }, { - "epoch": 0.94, - "learning_rate": 0.00015860536050360177, - "loss": 0.0368, + "epoch": 0.56, + "learning_rate": 0.00021562699677933609, + "loss": 0.054, "step": 87150 }, { - "epoch": 0.94, - "learning_rate": 0.00015858913621909275, - "loss": 0.0413, + "epoch": 0.56, + "learning_rate": 0.00021561731542497916, + "loss": 0.0445, "step": 87160 }, { - "epoch": 0.94, - "learning_rate": 0.00015857291193458367, - "loss": 0.0448, + "epoch": 0.56, + "learning_rate": 0.00021560763407062224, + "loss": 0.0489, "step": 87170 }, { - "epoch": 0.94, - "learning_rate": 0.00015855668765007462, - "loss": 0.0412, + "epoch": 0.56, + "learning_rate": 0.0002155979527162653, + "loss": 0.0592, "step": 87180 }, { - "epoch": 0.94, - "learning_rate": 0.00015854046336556557, - "loss": 0.0354, + "epoch": 0.56, + "learning_rate": 0.00021558827136190838, + "loss": 0.0507, "step": 87190 }, { - "epoch": 0.94, - "learning_rate": 0.00015852423908105652, - "loss": 0.0369, - "step": 87200 + "epoch": 0.56, + "learning_rate": 0.00021557859000755143, + "loss": 0.0487, + "step": 87200 }, { - "epoch": 0.94, - "learning_rate": 0.00015850801479654745, - "loss": 0.0465, + "epoch": 0.56, + "learning_rate": 0.00021556890865319448, + "loss": 0.0508, "step": 87210 }, { - "epoch": 0.94, - "learning_rate": 0.00015849179051203842, - "loss": 0.0396, + "epoch": 0.56, + "learning_rate": 0.00021555922729883756, + "loss": 0.0437, "step": 87220 }, { - "epoch": 0.94, - "learning_rate": 0.00015847556622752934, - "loss": 0.0383, + "epoch": 0.56, + "learning_rate": 0.00021554954594448064, + "loss": 0.0557, "step": 87230 }, { - "epoch": 0.94, - "learning_rate": 0.00015845934194302032, - "loss": 0.0476, + "epoch": 0.56, + "learning_rate": 0.00021553986459012372, + "loss": 0.0448, "step": 87240 }, { - "epoch": 0.94, - "learning_rate": 0.00015844311765851124, - "loss": 0.0397, + "epoch": 0.56, + "learning_rate": 0.00021553018323576677, + "loss": 0.0466, "step": 87250 }, { - "epoch": 0.94, - "learning_rate": 0.0001584268933740022, - "loss": 0.0432, + "epoch": 0.56, + "learning_rate": 0.00021552050188140985, + "loss": 0.0442, "step": 87260 }, { - "epoch": 0.94, - "learning_rate": 0.00015841066908949314, - "loss": 0.038, + "epoch": 0.56, + "learning_rate": 0.0002155108205270529, + "loss": 0.0493, "step": 87270 }, { - "epoch": 0.94, - "learning_rate": 0.0001583944448049841, - "loss": 0.0404, + "epoch": 0.56, + "learning_rate": 0.00021550113917269596, + "loss": 0.0443, "step": 87280 }, { - "epoch": 0.94, - "learning_rate": 0.00015837822052047504, - "loss": 0.0418, + "epoch": 0.56, + "learning_rate": 0.00021549145781833904, + "loss": 0.0517, "step": 87290 }, { - "epoch": 0.94, - "learning_rate": 0.000158361996235966, - "loss": 0.0399, + "epoch": 0.56, + "learning_rate": 0.00021548177646398212, + "loss": 0.0503, "step": 87300 }, { - "epoch": 0.94, - "learning_rate": 0.00015834577195145692, - "loss": 0.0509, + "epoch": 0.56, + "learning_rate": 0.0002154720951096252, + "loss": 0.0582, "step": 87310 }, { - "epoch": 0.94, - "learning_rate": 0.0001583295476669479, - "loss": 0.043, + "epoch": 0.56, + "learning_rate": 0.00021546241375526825, + "loss": 0.0552, "step": 87320 }, { - "epoch": 0.94, - "learning_rate": 0.00015831332338243882, - "loss": 0.0435, + "epoch": 0.56, + "learning_rate": 0.00021545273240091133, + "loss": 0.0592, "step": 87330 }, { - "epoch": 0.94, - "learning_rate": 0.0001582970990979298, - "loss": 0.0372, + "epoch": 0.56, + "learning_rate": 0.00021544305104655438, + "loss": 0.0571, "step": 87340 }, { - "epoch": 0.94, - "learning_rate": 0.00015828087481342071, - "loss": 0.0429, + "epoch": 0.56, + "learning_rate": 0.00021543336969219744, + "loss": 0.051, "step": 87350 }, { - "epoch": 0.94, - "learning_rate": 0.00015826465052891166, - "loss": 0.04, + "epoch": 0.56, + "learning_rate": 0.00021542368833784052, + "loss": 0.0594, "step": 87360 }, { - "epoch": 0.95, - "learning_rate": 0.00015824842624440261, - "loss": 0.0467, + "epoch": 0.56, + "learning_rate": 0.0002154140069834836, + "loss": 0.0453, "step": 87370 }, { - "epoch": 0.95, - "learning_rate": 0.00015823220195989356, - "loss": 0.0389, + "epoch": 0.56, + "learning_rate": 0.00021540432562912665, + "loss": 0.0583, "step": 87380 }, { - "epoch": 0.95, - "learning_rate": 0.0001582159776753845, - "loss": 0.0374, + "epoch": 0.56, + "learning_rate": 0.00021539464427476973, + "loss": 0.0571, "step": 87390 }, { - "epoch": 0.95, - "learning_rate": 0.00015819975339087546, - "loss": 0.0385, + "epoch": 0.56, + "learning_rate": 0.0002153849629204128, + "loss": 0.0474, "step": 87400 }, { - "epoch": 0.95, - "learning_rate": 0.00015818352910636639, - "loss": 0.0442, + "epoch": 0.56, + "learning_rate": 0.00021537528156605583, + "loss": 0.053, "step": 87410 }, { - "epoch": 0.95, - "learning_rate": 0.00015816730482185736, - "loss": 0.0441, + "epoch": 0.56, + "learning_rate": 0.00021536560021169891, + "loss": 0.0545, "step": 87420 }, { - "epoch": 0.95, - "learning_rate": 0.00015815108053734829, - "loss": 0.0379, + "epoch": 0.56, + "learning_rate": 0.000215355918857342, + "loss": 0.0521, "step": 87430 }, { - "epoch": 0.95, - "learning_rate": 0.00015813485625283924, - "loss": 0.039, + "epoch": 0.56, + "learning_rate": 0.00021534623750298507, + "loss": 0.0503, "step": 87440 }, { - "epoch": 0.95, - "learning_rate": 0.00015811863196833019, - "loss": 0.0416, + "epoch": 0.56, + "learning_rate": 0.00021533655614862813, + "loss": 0.0504, "step": 87450 }, { - "epoch": 0.95, - "learning_rate": 0.00015810240768382114, - "loss": 0.0397, + "epoch": 0.56, + "learning_rate": 0.0002153268747942712, + "loss": 0.0535, "step": 87460 }, { - "epoch": 0.95, - "learning_rate": 0.00015808618339931208, - "loss": 0.0462, + "epoch": 0.56, + "learning_rate": 0.00021531719343991429, + "loss": 0.0488, "step": 87470 }, { - "epoch": 0.95, - "learning_rate": 0.00015806995911480303, - "loss": 0.0419, + "epoch": 0.56, + "learning_rate": 0.0002153075120855573, + "loss": 0.0514, "step": 87480 }, { - "epoch": 0.95, - "learning_rate": 0.00015805373483029396, - "loss": 0.0431, + "epoch": 0.56, + "learning_rate": 0.0002152978307312004, + "loss": 0.0463, "step": 87490 }, { - "epoch": 0.95, - "learning_rate": 0.00015803751054578493, - "loss": 0.0383, + "epoch": 0.56, + "learning_rate": 0.00021528814937684347, + "loss": 0.0473, "step": 87500 }, { - "epoch": 0.95, - "learning_rate": 0.00015802128626127586, - "loss": 0.0388, + "epoch": 0.56, + "learning_rate": 0.00021527846802248655, + "loss": 0.0452, "step": 87510 }, { - "epoch": 0.95, - "learning_rate": 0.00015800506197676683, - "loss": 0.0391, + "epoch": 0.56, + "learning_rate": 0.0002152687866681296, + "loss": 0.0492, "step": 87520 }, { - "epoch": 0.95, - "learning_rate": 0.00015798883769225776, - "loss": 0.0347, + "epoch": 0.56, + "learning_rate": 0.00021525910531377268, + "loss": 0.0656, "step": 87530 }, { - "epoch": 0.95, - "learning_rate": 0.0001579726134077487, - "loss": 0.0406, + "epoch": 0.57, + "learning_rate": 0.00021524942395941576, + "loss": 0.0516, "step": 87540 }, { - "epoch": 0.95, - "learning_rate": 0.00015795638912323966, - "loss": 0.0428, + "epoch": 0.57, + "learning_rate": 0.0002152397426050588, + "loss": 0.0464, "step": 87550 }, { - "epoch": 0.95, - "learning_rate": 0.0001579401648387306, - "loss": 0.039, + "epoch": 0.57, + "learning_rate": 0.00021523006125070187, + "loss": 0.0437, "step": 87560 }, { - "epoch": 0.95, - "learning_rate": 0.00015792394055422153, - "loss": 0.0359, + "epoch": 0.57, + "learning_rate": 0.00021522037989634495, + "loss": 0.0487, "step": 87570 }, { - "epoch": 0.95, - "learning_rate": 0.0001579077162697125, - "loss": 0.0439, + "epoch": 0.57, + "learning_rate": 0.000215210698541988, + "loss": 0.0499, "step": 87580 }, { - "epoch": 0.95, - "learning_rate": 0.00015789149198520343, - "loss": 0.036, + "epoch": 0.57, + "learning_rate": 0.00021520101718763108, + "loss": 0.0465, "step": 87590 }, { - "epoch": 0.95, - "learning_rate": 0.0001578752677006944, - "loss": 0.0448, + "epoch": 0.57, + "learning_rate": 0.00021519133583327416, + "loss": 0.0503, "step": 87600 }, { - "epoch": 0.95, - "learning_rate": 0.00015785904341618533, - "loss": 0.042, + "epoch": 0.57, + "learning_rate": 0.00021518165447891724, + "loss": 0.0468, "step": 87610 }, { - "epoch": 0.95, - "learning_rate": 0.00015784281913167628, - "loss": 0.0466, + "epoch": 0.57, + "learning_rate": 0.00021517197312456027, + "loss": 0.0546, "step": 87620 }, { - "epoch": 0.95, - "learning_rate": 0.00015782659484716723, - "loss": 0.0426, + "epoch": 0.57, + "learning_rate": 0.00021516229177020335, + "loss": 0.052, "step": 87630 }, { - "epoch": 0.95, - "learning_rate": 0.00015781037056265818, - "loss": 0.0479, + "epoch": 0.57, + "learning_rate": 0.00021515261041584643, + "loss": 0.0444, "step": 87640 }, { - "epoch": 0.95, - "learning_rate": 0.00015779414627814913, - "loss": 0.0444, + "epoch": 0.57, + "learning_rate": 0.00021514292906148948, + "loss": 0.052, "step": 87650 }, { - "epoch": 0.95, - "learning_rate": 0.00015777792199364008, - "loss": 0.0371, + "epoch": 0.57, + "learning_rate": 0.00021513324770713256, + "loss": 0.0528, "step": 87660 }, { - "epoch": 0.95, - "learning_rate": 0.000157761697709131, - "loss": 0.0433, + "epoch": 0.57, + "learning_rate": 0.00021512356635277564, + "loss": 0.046, "step": 87670 }, { - "epoch": 0.95, - "learning_rate": 0.00015774547342462198, - "loss": 0.0423, + "epoch": 0.57, + "learning_rate": 0.00021511388499841872, + "loss": 0.0544, "step": 87680 }, { - "epoch": 0.95, - "learning_rate": 0.0001577292491401129, - "loss": 0.0572, + "epoch": 0.57, + "learning_rate": 0.00021510420364406174, + "loss": 0.0505, "step": 87690 }, { - "epoch": 0.95, - "learning_rate": 0.00015771302485560388, - "loss": 0.0376, + "epoch": 0.57, + "learning_rate": 0.00021509452228970482, + "loss": 0.0638, "step": 87700 }, { - "epoch": 0.95, - "learning_rate": 0.0001576968005710948, - "loss": 0.0491, + "epoch": 0.57, + "learning_rate": 0.0002150848409353479, + "loss": 0.0509, "step": 87710 }, { - "epoch": 0.95, - "learning_rate": 0.00015768057628658575, - "loss": 0.0408, + "epoch": 0.57, + "learning_rate": 0.00021507515958099096, + "loss": 0.0538, "step": 87720 }, { - "epoch": 0.95, - "learning_rate": 0.0001576643520020767, - "loss": 0.0354, + "epoch": 0.57, + "learning_rate": 0.00021506547822663404, + "loss": 0.0516, "step": 87730 }, { - "epoch": 0.95, - "learning_rate": 0.00015764812771756765, - "loss": 0.0382, + "epoch": 0.57, + "learning_rate": 0.00021505579687227712, + "loss": 0.0458, "step": 87740 }, { - "epoch": 0.95, - "learning_rate": 0.00015763190343305857, - "loss": 0.0405, + "epoch": 0.57, + "learning_rate": 0.00021504611551792017, + "loss": 0.0484, "step": 87750 }, { - "epoch": 0.95, - "learning_rate": 0.00015761567914854955, - "loss": 0.0465, + "epoch": 0.57, + "learning_rate": 0.00021503643416356322, + "loss": 0.0486, "step": 87760 }, { - "epoch": 0.95, - "learning_rate": 0.00015759945486404047, - "loss": 0.0359, + "epoch": 0.57, + "learning_rate": 0.0002150267528092063, + "loss": 0.0514, "step": 87770 }, { - "epoch": 0.95, - "learning_rate": 0.00015758323057953145, - "loss": 0.0384, + "epoch": 0.57, + "learning_rate": 0.00021501707145484935, + "loss": 0.0505, "step": 87780 }, { - "epoch": 0.95, - "learning_rate": 0.00015756700629502237, - "loss": 0.0366, + "epoch": 0.57, + "learning_rate": 0.00021500739010049243, + "loss": 0.0664, "step": 87790 }, { - "epoch": 0.95, - "learning_rate": 0.00015755078201051332, - "loss": 0.0338, + "epoch": 0.57, + "learning_rate": 0.0002149977087461355, + "loss": 0.0526, "step": 87800 }, { - "epoch": 0.95, - "learning_rate": 0.00015753455772600427, - "loss": 0.0478, + "epoch": 0.57, + "learning_rate": 0.0002149880273917786, + "loss": 0.0528, "step": 87810 }, { - "epoch": 0.95, - "learning_rate": 0.00015751833344149522, - "loss": 0.0419, + "epoch": 0.57, + "learning_rate": 0.00021497834603742165, + "loss": 0.0495, "step": 87820 }, { - "epoch": 0.95, - "learning_rate": 0.00015750210915698617, - "loss": 0.0439, + "epoch": 0.57, + "learning_rate": 0.0002149686646830647, + "loss": 0.0544, "step": 87830 }, { - "epoch": 0.95, - "learning_rate": 0.00015748588487247712, - "loss": 0.0351, + "epoch": 0.57, + "learning_rate": 0.00021495898332870778, + "loss": 0.0529, "step": 87840 }, { - "epoch": 0.95, - "learning_rate": 0.00015746966058796804, - "loss": 0.038, + "epoch": 0.57, + "learning_rate": 0.00021494930197435083, + "loss": 0.0443, "step": 87850 }, { - "epoch": 0.95, - "learning_rate": 0.00015745343630345902, - "loss": 0.0436, + "epoch": 0.57, + "learning_rate": 0.0002149396206199939, + "loss": 0.054, "step": 87860 }, { - "epoch": 0.95, - "learning_rate": 0.00015743721201894994, - "loss": 0.0412, + "epoch": 0.57, + "learning_rate": 0.000214929939265637, + "loss": 0.054, "step": 87870 }, { - "epoch": 0.95, - "learning_rate": 0.00015742098773444092, - "loss": 0.0483, + "epoch": 0.57, + "learning_rate": 0.00021492025791128007, + "loss": 0.0426, "step": 87880 }, { - "epoch": 0.95, - "learning_rate": 0.00015740476344993184, - "loss": 0.0497, + "epoch": 0.57, + "learning_rate": 0.00021491057655692312, + "loss": 0.0438, "step": 87890 }, { - "epoch": 0.95, - "learning_rate": 0.0001573885391654228, - "loss": 0.0437, + "epoch": 0.57, + "learning_rate": 0.00021490089520256617, + "loss": 0.0519, "step": 87900 }, { - "epoch": 0.95, - "learning_rate": 0.00015737231488091374, - "loss": 0.0365, + "epoch": 0.57, + "learning_rate": 0.00021489121384820925, + "loss": 0.0497, "step": 87910 }, { - "epoch": 0.95, - "learning_rate": 0.0001573560905964047, - "loss": 0.0392, + "epoch": 0.57, + "learning_rate": 0.0002148815324938523, + "loss": 0.05, "step": 87920 }, { - "epoch": 0.95, - "learning_rate": 0.0001573398663118956, - "loss": 0.0349, + "epoch": 0.57, + "learning_rate": 0.0002148718511394954, + "loss": 0.0486, "step": 87930 }, { - "epoch": 0.95, - "learning_rate": 0.0001573236420273866, - "loss": 0.0485, + "epoch": 0.57, + "learning_rate": 0.00021486216978513847, + "loss": 0.0567, "step": 87940 }, { - "epoch": 0.95, - "learning_rate": 0.0001573074177428775, - "loss": 0.0523, + "epoch": 0.57, + "learning_rate": 0.00021485248843078152, + "loss": 0.0535, "step": 87950 }, { - "epoch": 0.95, - "learning_rate": 0.0001572911934583685, - "loss": 0.0425, + "epoch": 0.57, + "learning_rate": 0.0002148428070764246, + "loss": 0.0468, "step": 87960 }, { - "epoch": 0.95, - "learning_rate": 0.0001572749691738594, - "loss": 0.0472, + "epoch": 0.57, + "learning_rate": 0.00021483312572206765, + "loss": 0.0447, "step": 87970 }, { - "epoch": 0.95, - "learning_rate": 0.0001572587448893504, - "loss": 0.0452, + "epoch": 0.57, + "learning_rate": 0.0002148234443677107, + "loss": 0.0585, "step": 87980 }, { - "epoch": 0.95, - "learning_rate": 0.0001572425206048413, - "loss": 0.0433, + "epoch": 0.57, + "learning_rate": 0.00021481376301335378, + "loss": 0.0522, "step": 87990 }, { - "epoch": 0.95, - "learning_rate": 0.00015722629632033226, - "loss": 0.0353, + "epoch": 0.57, + "learning_rate": 0.00021480408165899686, + "loss": 0.0449, "step": 88000 }, { - "epoch": 0.95, - "eval_cer": 0.9211366555877732, - "eval_loss": 0.03045099787414074, - "eval_runtime": 119.0513, - "eval_samples_per_second": 16.799, - "eval_steps_per_second": 4.2, + "epoch": 0.57, + "eval_cer": 0.9198897299740142, + "eval_loss": 0.033422499895095825, + "eval_runtime": 119.8447, + "eval_samples_per_second": 16.688, + "eval_steps_per_second": 4.172, "step": 88000 }, { - "epoch": 0.95, - "learning_rate": 0.0001572100720358232, - "loss": 0.0392, + "epoch": 0.57, + "learning_rate": 0.00021479440030463994, + "loss": 0.0464, "step": 88010 }, { - "epoch": 0.95, - "learning_rate": 0.00015719384775131416, - "loss": 0.0386, + "epoch": 0.57, + "learning_rate": 0.000214784718950283, + "loss": 0.0526, "step": 88020 }, { - "epoch": 0.95, - "learning_rate": 0.00015717762346680508, - "loss": 0.043, + "epoch": 0.57, + "learning_rate": 0.00021477503759592608, + "loss": 0.0547, "step": 88030 }, { - "epoch": 0.95, - "learning_rate": 0.00015716139918229606, - "loss": 0.037, + "epoch": 0.57, + "learning_rate": 0.00021476535624156913, + "loss": 0.0522, "step": 88040 }, { - "epoch": 0.95, - "learning_rate": 0.00015714517489778698, - "loss": 0.0383, + "epoch": 0.57, + "learning_rate": 0.00021475567488721218, + "loss": 0.0485, "step": 88050 }, { - "epoch": 0.95, - "learning_rate": 0.00015712895061327796, - "loss": 0.0433, + "epoch": 0.57, + "learning_rate": 0.00021474599353285526, + "loss": 0.047, "step": 88060 }, { - "epoch": 0.95, - "learning_rate": 0.00015711272632876888, - "loss": 0.0435, + "epoch": 0.57, + "learning_rate": 0.00021473631217849834, + "loss": 0.05, "step": 88070 }, { - "epoch": 0.95, - "learning_rate": 0.00015709650204425983, - "loss": 0.0456, + "epoch": 0.57, + "learning_rate": 0.00021472663082414142, + "loss": 0.05, "step": 88080 }, { - "epoch": 0.95, - "learning_rate": 0.00015708027775975078, - "loss": 0.0404, + "epoch": 0.57, + "learning_rate": 0.00021471694946978447, + "loss": 0.052, "step": 88090 }, { - "epoch": 0.95, - "learning_rate": 0.00015706405347524173, - "loss": 0.0402, + "epoch": 0.57, + "learning_rate": 0.00021470726811542755, + "loss": 0.0432, "step": 88100 }, { - "epoch": 0.95, - "learning_rate": 0.00015704782919073265, - "loss": 0.0404, + "epoch": 0.57, + "learning_rate": 0.0002146975867610706, + "loss": 0.0523, "step": 88110 }, { - "epoch": 0.95, - "learning_rate": 0.00015703160490622363, - "loss": 0.0589, + "epoch": 0.57, + "learning_rate": 0.00021468790540671366, + "loss": 0.0449, "step": 88120 }, { - "epoch": 0.95, - "learning_rate": 0.00015701538062171455, - "loss": 0.0407, + "epoch": 0.57, + "learning_rate": 0.00021467822405235674, + "loss": 0.0498, "step": 88130 }, { - "epoch": 0.95, - "learning_rate": 0.00015699915633720553, - "loss": 0.0481, + "epoch": 0.57, + "learning_rate": 0.00021466854269799982, + "loss": 0.0489, "step": 88140 }, { - "epoch": 0.95, - "learning_rate": 0.00015698293205269645, - "loss": 0.0404, + "epoch": 0.57, + "learning_rate": 0.00021465886134364287, + "loss": 0.0532, "step": 88150 }, { - "epoch": 0.95, - "learning_rate": 0.00015696670776818743, - "loss": 0.0507, + "epoch": 0.57, + "learning_rate": 0.00021464917998928595, + "loss": 0.0495, "step": 88160 }, { - "epoch": 0.95, - "learning_rate": 0.00015695048348367835, - "loss": 0.0387, + "epoch": 0.57, + "learning_rate": 0.00021463949863492903, + "loss": 0.0549, "step": 88170 }, { - "epoch": 0.95, - "learning_rate": 0.0001569342591991693, - "loss": 0.0485, + "epoch": 0.57, + "learning_rate": 0.00021462981728057206, + "loss": 0.0512, "step": 88180 }, { - "epoch": 0.95, - "learning_rate": 0.00015691803491466025, - "loss": 0.0452, + "epoch": 0.57, + "learning_rate": 0.00021462013592621514, + "loss": 0.0484, "step": 88190 }, { - "epoch": 0.95, - "learning_rate": 0.0001569018106301512, - "loss": 0.0426, + "epoch": 0.57, + "learning_rate": 0.00021461045457185822, + "loss": 0.0504, "step": 88200 }, { - "epoch": 0.95, - "learning_rate": 0.00015688558634564212, - "loss": 0.0456, + "epoch": 0.57, + "learning_rate": 0.0002146007732175013, + "loss": 0.0471, "step": 88210 }, { - "epoch": 0.95, - "learning_rate": 0.0001568693620611331, - "loss": 0.038, + "epoch": 0.57, + "learning_rate": 0.00021459109186314435, + "loss": 0.055, "step": 88220 }, { - "epoch": 0.95, - "learning_rate": 0.00015685313777662402, - "loss": 0.0479, + "epoch": 0.57, + "learning_rate": 0.00021458141050878743, + "loss": 0.0478, "step": 88230 }, { - "epoch": 0.95, - "learning_rate": 0.000156836913492115, - "loss": 0.0468, + "epoch": 0.57, + "learning_rate": 0.0002145717291544305, + "loss": 0.0471, "step": 88240 }, { - "epoch": 0.95, - "learning_rate": 0.00015682068920760592, - "loss": 0.0455, + "epoch": 0.57, + "learning_rate": 0.00021456204780007353, + "loss": 0.0532, "step": 88250 }, { - "epoch": 0.95, - "learning_rate": 0.00015680446492309687, - "loss": 0.0461, + "epoch": 0.57, + "learning_rate": 0.00021455236644571661, + "loss": 0.0517, "step": 88260 }, { - "epoch": 0.95, - "learning_rate": 0.00015678824063858782, - "loss": 0.0464, + "epoch": 0.57, + "learning_rate": 0.0002145426850913597, + "loss": 0.0551, "step": 88270 }, { - "epoch": 0.95, - "learning_rate": 0.00015677201635407877, - "loss": 0.0399, + "epoch": 0.57, + "learning_rate": 0.00021453300373700277, + "loss": 0.0498, "step": 88280 }, { - "epoch": 0.95, - "learning_rate": 0.0001567557920695697, - "loss": 0.0405, + "epoch": 0.57, + "learning_rate": 0.00021452332238264583, + "loss": 0.0456, "step": 88290 }, { - "epoch": 0.96, - "learning_rate": 0.00015673956778506067, - "loss": 0.0437, + "epoch": 0.57, + "learning_rate": 0.0002145136410282889, + "loss": 0.0592, "step": 88300 }, { - "epoch": 0.96, - "learning_rate": 0.0001567233435005516, - "loss": 0.0353, + "epoch": 0.57, + "learning_rate": 0.00021450395967393199, + "loss": 0.0457, "step": 88310 }, { - "epoch": 0.96, - "learning_rate": 0.00015670711921604257, - "loss": 0.045, + "epoch": 0.57, + "learning_rate": 0.000214494278319575, + "loss": 0.049, "step": 88320 }, { - "epoch": 0.96, - "learning_rate": 0.0001566908949315335, - "loss": 0.0494, + "epoch": 0.57, + "learning_rate": 0.0002144845969652181, + "loss": 0.0446, "step": 88330 }, { - "epoch": 0.96, - "learning_rate": 0.00015667467064702447, - "loss": 0.0456, + "epoch": 0.57, + "learning_rate": 0.00021447491561086117, + "loss": 0.0556, "step": 88340 }, { - "epoch": 0.96, - "learning_rate": 0.0001566584463625154, - "loss": 0.0501, + "epoch": 0.57, + "learning_rate": 0.00021446523425650422, + "loss": 0.0535, "step": 88350 }, { - "epoch": 0.96, - "learning_rate": 0.00015664222207800634, - "loss": 0.0393, + "epoch": 0.57, + "learning_rate": 0.0002144555529021473, + "loss": 0.0484, "step": 88360 }, { - "epoch": 0.96, - "learning_rate": 0.0001566259977934973, - "loss": 0.0375, + "epoch": 0.57, + "learning_rate": 0.00021444587154779038, + "loss": 0.0448, "step": 88370 }, { - "epoch": 0.96, - "learning_rate": 0.00015660977350898824, - "loss": 0.0431, + "epoch": 0.57, + "learning_rate": 0.00021443619019343346, + "loss": 0.0528, "step": 88380 }, { - "epoch": 0.96, - "learning_rate": 0.00015659354922447917, - "loss": 0.0424, + "epoch": 0.57, + "learning_rate": 0.0002144265088390765, + "loss": 0.0482, "step": 88390 }, { - "epoch": 0.96, - "learning_rate": 0.00015657732493997014, - "loss": 0.0382, + "epoch": 0.57, + "learning_rate": 0.00021441682748471957, + "loss": 0.0558, "step": 88400 }, { - "epoch": 0.96, - "learning_rate": 0.00015656110065546107, - "loss": 0.0452, + "epoch": 0.57, + "learning_rate": 0.00021440714613036265, + "loss": 0.0587, "step": 88410 }, { - "epoch": 0.96, - "learning_rate": 0.00015654487637095204, - "loss": 0.0446, + "epoch": 0.57, + "learning_rate": 0.0002143974647760057, + "loss": 0.0577, "step": 88420 }, { - "epoch": 0.96, - "learning_rate": 0.00015652865208644296, - "loss": 0.0476, + "epoch": 0.57, + "learning_rate": 0.00021438778342164878, + "loss": 0.0505, "step": 88430 }, { - "epoch": 0.96, - "learning_rate": 0.00015651242780193391, - "loss": 0.0437, + "epoch": 0.57, + "learning_rate": 0.00021437810206729186, + "loss": 0.0469, "step": 88440 }, { - "epoch": 0.96, - "learning_rate": 0.00015649620351742486, - "loss": 0.0412, + "epoch": 0.57, + "learning_rate": 0.00021436842071293494, + "loss": 0.0503, "step": 88450 }, { - "epoch": 0.96, - "learning_rate": 0.00015647997923291581, - "loss": 0.0363, + "epoch": 0.57, + "learning_rate": 0.00021435873935857797, + "loss": 0.0448, "step": 88460 }, { - "epoch": 0.96, - "learning_rate": 0.00015646375494840674, - "loss": 0.0472, + "epoch": 0.57, + "learning_rate": 0.00021434905800422105, + "loss": 0.0559, "step": 88470 }, { - "epoch": 0.96, - "learning_rate": 0.0001564475306638977, - "loss": 0.0426, + "epoch": 0.57, + "learning_rate": 0.00021433937664986413, + "loss": 0.0517, "step": 88480 }, { - "epoch": 0.96, - "learning_rate": 0.00015643130637938864, - "loss": 0.0408, + "epoch": 0.57, + "learning_rate": 0.00021432969529550718, + "loss": 0.1163, "step": 88490 }, { - "epoch": 0.96, - "learning_rate": 0.0001564150820948796, - "loss": 0.0423, + "epoch": 0.57, + "learning_rate": 0.00021432001394115026, + "loss": 0.0504, "step": 88500 }, { - "epoch": 0.96, - "learning_rate": 0.00015639885781037054, - "loss": 0.038, + "epoch": 0.57, + "learning_rate": 0.00021431033258679334, + "loss": 0.0451, "step": 88510 }, { - "epoch": 0.96, - "learning_rate": 0.0001563826335258615, - "loss": 0.0398, + "epoch": 0.57, + "learning_rate": 0.00021430065123243642, + "loss": 0.0537, "step": 88520 }, { - "epoch": 0.96, - "learning_rate": 0.00015636640924135244, - "loss": 0.0359, + "epoch": 0.57, + "learning_rate": 0.00021429096987807944, + "loss": 0.049, "step": 88530 }, { - "epoch": 0.96, - "learning_rate": 0.00015635018495684339, - "loss": 0.0409, + "epoch": 0.57, + "learning_rate": 0.00021428128852372252, + "loss": 0.0489, "step": 88540 }, { - "epoch": 0.96, - "learning_rate": 0.00015633396067233433, - "loss": 0.0419, + "epoch": 0.57, + "learning_rate": 0.00021427160716936558, + "loss": 0.0418, "step": 88550 }, { - "epoch": 0.96, - "learning_rate": 0.00015631773638782528, - "loss": 0.044, + "epoch": 0.57, + "learning_rate": 0.00021426192581500866, + "loss": 0.0468, "step": 88560 }, { - "epoch": 0.96, - "learning_rate": 0.0001563015121033162, - "loss": 0.0415, + "epoch": 0.57, + "learning_rate": 0.00021425224446065173, + "loss": 0.0465, "step": 88570 }, { - "epoch": 0.96, - "learning_rate": 0.00015628528781880718, - "loss": 0.0441, + "epoch": 0.57, + "learning_rate": 0.00021424256310629481, + "loss": 0.0432, "step": 88580 }, { - "epoch": 0.96, - "learning_rate": 0.0001562690635342981, - "loss": 0.0354, + "epoch": 0.57, + "learning_rate": 0.00021423288175193787, + "loss": 0.0567, "step": 88590 }, { - "epoch": 0.96, - "learning_rate": 0.00015625283924978908, - "loss": 0.0424, + "epoch": 0.57, + "learning_rate": 0.00021422320039758092, + "loss": 0.0526, "step": 88600 }, { - "epoch": 0.96, - "learning_rate": 0.00015623661496528, - "loss": 0.0412, + "epoch": 0.57, + "learning_rate": 0.000214213519043224, + "loss": 0.0483, "step": 88610 }, { - "epoch": 0.96, - "learning_rate": 0.00015622039068077096, - "loss": 0.0377, + "epoch": 0.57, + "learning_rate": 0.00021420383768886705, + "loss": 0.0448, "step": 88620 }, { - "epoch": 0.96, - "learning_rate": 0.0001562041663962619, - "loss": 0.0409, + "epoch": 0.57, + "learning_rate": 0.00021419415633451013, + "loss": 0.0469, "step": 88630 }, { - "epoch": 0.96, - "learning_rate": 0.00015618794211175286, - "loss": 0.0493, + "epoch": 0.57, + "learning_rate": 0.0002141844749801532, + "loss": 0.0476, "step": 88640 }, { - "epoch": 0.96, - "learning_rate": 0.0001561717178272438, - "loss": 0.0418, + "epoch": 0.57, + "learning_rate": 0.0002141747936257963, + "loss": 0.0408, "step": 88650 }, { - "epoch": 0.96, - "learning_rate": 0.00015615549354273476, - "loss": 0.0447, + "epoch": 0.57, + "learning_rate": 0.00021416511227143934, + "loss": 0.0503, "step": 88660 }, { - "epoch": 0.96, - "learning_rate": 0.00015613926925822568, - "loss": 0.0426, + "epoch": 0.57, + "learning_rate": 0.0002141554309170824, + "loss": 0.0593, "step": 88670 }, { - "epoch": 0.96, - "learning_rate": 0.00015612304497371665, - "loss": 0.0484, + "epoch": 0.57, + "learning_rate": 0.00021414574956272548, + "loss": 0.0624, "step": 88680 }, { - "epoch": 0.96, - "learning_rate": 0.00015610682068920758, - "loss": 0.0416, + "epoch": 0.57, + "learning_rate": 0.00021413606820836853, + "loss": 0.0556, "step": 88690 }, { - "epoch": 0.96, - "learning_rate": 0.00015609059640469855, - "loss": 0.0492, + "epoch": 0.57, + "learning_rate": 0.0002141263868540116, + "loss": 0.044, "step": 88700 }, { - "epoch": 0.96, - "learning_rate": 0.00015607437212018948, - "loss": 0.0398, + "epoch": 0.57, + "learning_rate": 0.0002141167054996547, + "loss": 0.05, "step": 88710 }, { - "epoch": 0.96, - "learning_rate": 0.00015605814783568043, - "loss": 0.0371, + "epoch": 0.57, + "learning_rate": 0.00021410702414529777, + "loss": 0.0497, "step": 88720 }, { - "epoch": 0.96, - "learning_rate": 0.00015604192355117138, - "loss": 0.0455, + "epoch": 0.57, + "learning_rate": 0.00021409734279094082, + "loss": 0.0502, "step": 88730 }, { - "epoch": 0.96, - "learning_rate": 0.00015602569926666233, - "loss": 0.043, + "epoch": 0.57, + "learning_rate": 0.00021408766143658387, + "loss": 0.0459, "step": 88740 }, { - "epoch": 0.96, - "learning_rate": 0.00015600947498215325, - "loss": 0.0391, + "epoch": 0.57, + "learning_rate": 0.00021407798008222695, + "loss": 0.0549, "step": 88750 }, { - "epoch": 0.96, - "learning_rate": 0.00015599325069764423, - "loss": 0.0508, + "epoch": 0.57, + "learning_rate": 0.00021406829872787, + "loss": 0.0516, "step": 88760 }, { - "epoch": 0.96, - "learning_rate": 0.00015597702641313515, - "loss": 0.0405, + "epoch": 0.57, + "learning_rate": 0.0002140586173735131, + "loss": 0.0519, "step": 88770 }, { - "epoch": 0.96, - "learning_rate": 0.00015596080212862613, - "loss": 0.0411, + "epoch": 0.57, + "learning_rate": 0.00021404893601915617, + "loss": 0.0472, "step": 88780 }, { - "epoch": 0.96, - "learning_rate": 0.00015594457784411705, - "loss": 0.0391, + "epoch": 0.57, + "learning_rate": 0.00021403925466479922, + "loss": 0.0476, "step": 88790 }, { - "epoch": 0.96, - "learning_rate": 0.000155928353559608, - "loss": 0.046, + "epoch": 0.57, + "learning_rate": 0.0002140295733104423, + "loss": 0.0503, "step": 88800 }, { - "epoch": 0.96, - "learning_rate": 0.00015591212927509895, - "loss": 0.0389, + "epoch": 0.57, + "learning_rate": 0.00021401989195608535, + "loss": 0.0544, "step": 88810 }, { - "epoch": 0.96, - "learning_rate": 0.0001558959049905899, - "loss": 0.0465, + "epoch": 0.57, + "learning_rate": 0.0002140102106017284, + "loss": 0.0512, "step": 88820 }, { - "epoch": 0.96, - "learning_rate": 0.00015587968070608085, - "loss": 0.0421, + "epoch": 0.57, + "learning_rate": 0.00021400052924737148, + "loss": 0.0436, "step": 88830 }, { - "epoch": 0.96, - "learning_rate": 0.0001558634564215718, - "loss": 0.0425, + "epoch": 0.57, + "learning_rate": 0.00021399084789301456, + "loss": 0.0572, "step": 88840 }, { - "epoch": 0.96, - "learning_rate": 0.00015584723213706272, - "loss": 0.0424, + "epoch": 0.57, + "learning_rate": 0.00021398116653865764, + "loss": 0.0486, "step": 88850 }, { - "epoch": 0.96, - "learning_rate": 0.0001558310078525537, - "loss": 0.041, + "epoch": 0.57, + "learning_rate": 0.0002139714851843007, + "loss": 0.0566, "step": 88860 }, { - "epoch": 0.96, - "learning_rate": 0.00015581478356804462, - "loss": 0.0495, + "epoch": 0.57, + "learning_rate": 0.00021396180382994378, + "loss": 0.057, "step": 88870 }, { - "epoch": 0.96, - "learning_rate": 0.0001557985592835356, - "loss": 0.0368, + "epoch": 0.57, + "learning_rate": 0.00021395212247558683, + "loss": 0.05, "step": 88880 }, { - "epoch": 0.96, - "learning_rate": 0.00015578233499902652, - "loss": 0.0462, + "epoch": 0.57, + "learning_rate": 0.00021394244112122988, + "loss": 0.048, "step": 88890 }, { - "epoch": 0.96, - "learning_rate": 0.00015576611071451747, - "loss": 0.0389, + "epoch": 0.57, + "learning_rate": 0.00021393275976687296, + "loss": 0.0551, "step": 88900 }, { - "epoch": 0.96, - "learning_rate": 0.00015574988643000842, - "loss": 0.0414, + "epoch": 0.57, + "learning_rate": 0.00021392307841251604, + "loss": 0.0545, "step": 88910 }, { - "epoch": 0.96, - "learning_rate": 0.00015573366214549937, - "loss": 0.0466, + "epoch": 0.57, + "learning_rate": 0.00021391339705815912, + "loss": 0.0476, "step": 88920 }, { - "epoch": 0.96, - "learning_rate": 0.0001557174378609903, - "loss": 0.0394, + "epoch": 0.57, + "learning_rate": 0.00021390371570380217, + "loss": 0.0507, "step": 88930 }, { - "epoch": 0.96, - "learning_rate": 0.00015570121357648127, - "loss": 0.0358, + "epoch": 0.57, + "learning_rate": 0.00021389403434944525, + "loss": 0.061, "step": 88940 }, { - "epoch": 0.96, - "learning_rate": 0.0001556849892919722, - "loss": 0.0465, + "epoch": 0.57, + "learning_rate": 0.0002138843529950883, + "loss": 0.0531, "step": 88950 }, { - "epoch": 0.96, - "learning_rate": 0.00015566876500746317, - "loss": 0.0385, + "epoch": 0.57, + "learning_rate": 0.00021387467164073136, + "loss": 0.0464, "step": 88960 }, { - "epoch": 0.96, - "learning_rate": 0.0001556525407229541, - "loss": 0.048, + "epoch": 0.57, + "learning_rate": 0.00021386499028637444, + "loss": 0.0531, "step": 88970 }, { - "epoch": 0.96, - "learning_rate": 0.00015563631643844504, - "loss": 0.0417, + "epoch": 0.57, + "learning_rate": 0.00021385530893201752, + "loss": 0.0444, "step": 88980 }, { - "epoch": 0.96, - "learning_rate": 0.000155620092153936, - "loss": 0.0391, + "epoch": 0.57, + "learning_rate": 0.00021384562757766057, + "loss": 0.0478, "step": 88990 }, { - "epoch": 0.96, - "learning_rate": 0.00015560386786942694, - "loss": 0.0469, + "epoch": 0.57, + "learning_rate": 0.00021383594622330365, + "loss": 0.0516, "step": 89000 }, { - "epoch": 0.96, - "eval_cer": 0.921160509664435, - "eval_loss": 0.030413759872317314, - "eval_runtime": 119.151, - "eval_samples_per_second": 16.785, - "eval_steps_per_second": 4.196, + "epoch": 0.57, + "eval_cer": 0.919940345723647, + "eval_loss": 0.0331486351788044, + "eval_runtime": 120.3849, + "eval_samples_per_second": 16.613, + "eval_steps_per_second": 4.153, "step": 89000 }, { - "epoch": 0.96, - "learning_rate": 0.0001555876435849179, - "loss": 0.0408, + "epoch": 0.57, + "learning_rate": 0.00021382626486894673, + "loss": 0.0438, "step": 89010 }, { - "epoch": 0.96, - "learning_rate": 0.00015557141930040884, - "loss": 0.0435, + "epoch": 0.57, + "learning_rate": 0.00021381658351458976, + "loss": 0.0481, "step": 89020 }, { - "epoch": 0.96, - "learning_rate": 0.00015555519501589976, - "loss": 0.0546, + "epoch": 0.57, + "learning_rate": 0.00021380690216023284, + "loss": 0.042, "step": 89030 }, { - "epoch": 0.96, - "learning_rate": 0.00015553897073139074, - "loss": 0.037, + "epoch": 0.57, + "learning_rate": 0.00021379722080587592, + "loss": 0.0482, "step": 89040 }, { - "epoch": 0.96, - "learning_rate": 0.00015552274644688166, - "loss": 0.0431, + "epoch": 0.57, + "learning_rate": 0.000213787539451519, + "loss": 0.0517, "step": 89050 }, { - "epoch": 0.96, - "learning_rate": 0.00015550652216237264, - "loss": 0.051, + "epoch": 0.57, + "learning_rate": 0.00021377785809716205, + "loss": 0.0447, "step": 89060 }, { - "epoch": 0.96, - "learning_rate": 0.00015549029787786356, - "loss": 0.0416, + "epoch": 0.57, + "learning_rate": 0.00021376817674280513, + "loss": 0.0501, "step": 89070 }, { - "epoch": 0.96, - "learning_rate": 0.0001554740735933545, - "loss": 0.0461, + "epoch": 0.57, + "learning_rate": 0.0002137584953884482, + "loss": 0.0514, "step": 89080 }, { - "epoch": 0.96, - "learning_rate": 0.00015545784930884546, - "loss": 0.0393, + "epoch": 0.58, + "learning_rate": 0.00021374881403409123, + "loss": 0.0523, "step": 89090 }, { - "epoch": 0.96, - "learning_rate": 0.0001554416250243364, - "loss": 0.0478, + "epoch": 0.58, + "learning_rate": 0.0002137391326797343, + "loss": 0.0483, "step": 89100 }, { - "epoch": 0.96, - "learning_rate": 0.00015542540073982733, - "loss": 0.0355, + "epoch": 0.58, + "learning_rate": 0.0002137294513253774, + "loss": 0.0572, "step": 89110 }, { - "epoch": 0.96, - "learning_rate": 0.0001554091764553183, - "loss": 0.0439, + "epoch": 0.58, + "learning_rate": 0.00021371976997102047, + "loss": 0.0533, "step": 89120 }, { - "epoch": 0.96, - "learning_rate": 0.00015539295217080923, - "loss": 0.0349, + "epoch": 0.58, + "learning_rate": 0.00021371008861666353, + "loss": 0.0492, "step": 89130 }, { - "epoch": 0.96, - "learning_rate": 0.0001553767278863002, - "loss": 0.0392, + "epoch": 0.58, + "learning_rate": 0.0002137004072623066, + "loss": 0.0538, "step": 89140 }, { - "epoch": 0.96, - "learning_rate": 0.00015536050360179113, - "loss": 0.0471, + "epoch": 0.58, + "learning_rate": 0.00021369072590794969, + "loss": 0.057, "step": 89150 }, { - "epoch": 0.96, - "learning_rate": 0.00015534427931728208, - "loss": 0.0415, + "epoch": 0.58, + "learning_rate": 0.0002136810445535927, + "loss": 0.0537, "step": 89160 }, { - "epoch": 0.96, - "learning_rate": 0.00015532805503277306, - "loss": 0.0368, + "epoch": 0.58, + "learning_rate": 0.0002136713631992358, + "loss": 0.0451, "step": 89170 }, { - "epoch": 0.96, - "learning_rate": 0.00015531183074826398, - "loss": 0.0402, + "epoch": 0.58, + "learning_rate": 0.00021366168184487887, + "loss": 0.0501, "step": 89180 }, { - "epoch": 0.96, - "learning_rate": 0.00015529560646375496, - "loss": 0.0423, + "epoch": 0.58, + "learning_rate": 0.00021365200049052192, + "loss": 0.0439, "step": 89190 }, { - "epoch": 0.96, - "learning_rate": 0.00015527938217924588, - "loss": 0.0359, + "epoch": 0.58, + "learning_rate": 0.000213642319136165, + "loss": 0.0529, "step": 89200 }, { - "epoch": 0.96, - "learning_rate": 0.00015526315789473686, - "loss": 0.0467, + "epoch": 0.58, + "learning_rate": 0.00021363263778180808, + "loss": 0.044, "step": 89210 }, { - "epoch": 0.97, - "learning_rate": 0.00015524693361022778, - "loss": 0.0391, + "epoch": 0.58, + "learning_rate": 0.00021362295642745116, + "loss": 0.0455, "step": 89220 }, { - "epoch": 0.97, - "learning_rate": 0.00015523070932571873, - "loss": 0.0419, + "epoch": 0.58, + "learning_rate": 0.0002136132750730942, + "loss": 0.0539, "step": 89230 }, { - "epoch": 0.97, - "learning_rate": 0.00015521448504120968, - "loss": 0.0379, + "epoch": 0.58, + "learning_rate": 0.00021360359371873727, + "loss": 0.0425, "step": 89240 }, { - "epoch": 0.97, - "learning_rate": 0.00015519826075670063, - "loss": 0.0345, + "epoch": 0.58, + "learning_rate": 0.00021359391236438035, + "loss": 0.0447, "step": 89250 }, { - "epoch": 0.97, - "learning_rate": 0.00015518203647219155, - "loss": 0.0355, + "epoch": 0.58, + "learning_rate": 0.0002135842310100234, + "loss": 0.049, "step": 89260 }, { - "epoch": 0.97, - "learning_rate": 0.00015516581218768253, - "loss": 0.0382, + "epoch": 0.58, + "learning_rate": 0.00021357454965566648, + "loss": 0.05, "step": 89270 }, { - "epoch": 0.97, - "learning_rate": 0.00015514958790317345, - "loss": 0.0475, + "epoch": 0.58, + "learning_rate": 0.00021356486830130956, + "loss": 0.0505, "step": 89280 }, { - "epoch": 0.97, - "learning_rate": 0.00015513336361866443, - "loss": 0.0466, + "epoch": 0.58, + "learning_rate": 0.00021355518694695264, + "loss": 0.0449, "step": 89290 }, { - "epoch": 0.97, - "learning_rate": 0.00015511713933415535, - "loss": 0.0384, + "epoch": 0.58, + "learning_rate": 0.00021354550559259567, + "loss": 0.0501, "step": 89300 }, { - "epoch": 0.97, - "learning_rate": 0.0001551009150496463, - "loss": 0.0376, + "epoch": 0.58, + "learning_rate": 0.00021353582423823875, + "loss": 0.0443, "step": 89310 }, { - "epoch": 0.97, - "learning_rate": 0.00015508469076513725, - "loss": 0.0496, + "epoch": 0.58, + "learning_rate": 0.00021352614288388182, + "loss": 0.0478, "step": 89320 }, { - "epoch": 0.97, - "learning_rate": 0.0001550684664806282, - "loss": 0.0403, + "epoch": 0.58, + "learning_rate": 0.00021351646152952488, + "loss": 0.0536, "step": 89330 }, { - "epoch": 0.97, - "learning_rate": 0.00015505224219611915, - "loss": 0.0489, + "epoch": 0.58, + "learning_rate": 0.00021350678017516796, + "loss": 0.0638, "step": 89340 }, { - "epoch": 0.97, - "learning_rate": 0.0001550360179116101, - "loss": 0.0368, + "epoch": 0.58, + "learning_rate": 0.00021349709882081104, + "loss": 0.0515, "step": 89350 }, { - "epoch": 0.97, - "learning_rate": 0.00015501979362710102, - "loss": 0.0484, + "epoch": 0.58, + "learning_rate": 0.0002134874174664541, + "loss": 0.0458, "step": 89360 }, { - "epoch": 0.97, - "learning_rate": 0.000155003569342592, - "loss": 0.0371, + "epoch": 0.58, + "learning_rate": 0.00021347773611209714, + "loss": 0.0497, "step": 89370 }, { - "epoch": 0.97, - "learning_rate": 0.00015498734505808292, - "loss": 0.0424, + "epoch": 0.58, + "learning_rate": 0.00021346805475774022, + "loss": 0.0471, "step": 89380 }, { - "epoch": 0.97, - "learning_rate": 0.0001549711207735739, - "loss": 0.0426, + "epoch": 0.58, + "learning_rate": 0.00021345837340338327, + "loss": 0.0479, "step": 89390 }, { - "epoch": 0.97, - "learning_rate": 0.00015495489648906482, - "loss": 0.0384, + "epoch": 0.58, + "learning_rate": 0.00021344869204902635, + "loss": 0.0452, "step": 89400 }, { - "epoch": 0.97, - "learning_rate": 0.00015493867220455577, - "loss": 0.0365, + "epoch": 0.58, + "learning_rate": 0.00021343901069466943, + "loss": 0.04, "step": 89410 }, { - "epoch": 0.97, - "learning_rate": 0.00015492244792004672, - "loss": 0.0434, + "epoch": 0.58, + "learning_rate": 0.00021342932934031251, + "loss": 0.0482, "step": 89420 }, { - "epoch": 0.97, - "learning_rate": 0.00015490622363553767, - "loss": 0.0434, + "epoch": 0.58, + "learning_rate": 0.00021341964798595557, + "loss": 0.0575, "step": 89430 }, { - "epoch": 0.97, - "learning_rate": 0.0001548899993510286, - "loss": 0.0475, + "epoch": 0.58, + "learning_rate": 0.00021340996663159862, + "loss": 0.048, "step": 89440 }, { - "epoch": 0.97, - "learning_rate": 0.00015487377506651957, - "loss": 0.0428, + "epoch": 0.58, + "learning_rate": 0.0002134002852772417, + "loss": 0.0497, "step": 89450 }, { - "epoch": 0.97, - "learning_rate": 0.0001548575507820105, - "loss": 0.0445, + "epoch": 0.58, + "learning_rate": 0.00021339060392288475, + "loss": 0.0513, "step": 89460 }, { - "epoch": 0.97, - "learning_rate": 0.00015484132649750147, - "loss": 0.0391, + "epoch": 0.58, + "learning_rate": 0.00021338092256852783, + "loss": 0.0529, "step": 89470 }, { - "epoch": 0.97, - "learning_rate": 0.0001548251022129924, - "loss": 0.0427, + "epoch": 0.58, + "learning_rate": 0.0002133712412141709, + "loss": 0.0537, "step": 89480 }, { - "epoch": 0.97, - "learning_rate": 0.00015480887792848334, - "loss": 0.0397, + "epoch": 0.58, + "learning_rate": 0.000213361559859814, + "loss": 0.0507, "step": 89490 }, { - "epoch": 0.97, - "learning_rate": 0.0001547926536439743, - "loss": 0.0403, + "epoch": 0.58, + "learning_rate": 0.00021335187850545704, + "loss": 0.0535, "step": 89500 }, { - "epoch": 0.97, - "learning_rate": 0.00015477642935946524, - "loss": 0.0471, + "epoch": 0.58, + "learning_rate": 0.0002133421971511001, + "loss": 0.0499, "step": 89510 }, { - "epoch": 0.97, - "learning_rate": 0.0001547602050749562, - "loss": 0.0513, + "epoch": 0.58, + "learning_rate": 0.00021333251579674318, + "loss": 0.0537, "step": 89520 }, { - "epoch": 0.97, - "learning_rate": 0.00015474398079044714, - "loss": 0.0386, + "epoch": 0.58, + "learning_rate": 0.00021332283444238623, + "loss": 0.0521, "step": 89530 }, { - "epoch": 0.97, - "learning_rate": 0.00015472775650593806, - "loss": 0.0442, + "epoch": 0.58, + "learning_rate": 0.0002133131530880293, + "loss": 0.0481, "step": 89540 }, { - "epoch": 0.97, - "learning_rate": 0.00015471153222142904, - "loss": 0.0505, + "epoch": 0.58, + "learning_rate": 0.0002133034717336724, + "loss": 0.0475, "step": 89550 }, { - "epoch": 0.97, - "learning_rate": 0.00015469530793691996, - "loss": 0.042, + "epoch": 0.58, + "learning_rate": 0.00021329379037931544, + "loss": 0.0481, "step": 89560 }, { - "epoch": 0.97, - "learning_rate": 0.00015467908365241094, - "loss": 0.0356, + "epoch": 0.58, + "learning_rate": 0.00021328410902495852, + "loss": 0.0476, "step": 89570 }, { - "epoch": 0.97, - "learning_rate": 0.00015466285936790186, - "loss": 0.045, + "epoch": 0.58, + "learning_rate": 0.00021327442767060157, + "loss": 0.059, "step": 89580 }, { - "epoch": 0.97, - "learning_rate": 0.0001546466350833928, - "loss": 0.0446, + "epoch": 0.58, + "learning_rate": 0.00021326474631624463, + "loss": 0.0473, "step": 89590 }, { - "epoch": 0.97, - "learning_rate": 0.00015463041079888376, - "loss": 0.037, + "epoch": 0.58, + "learning_rate": 0.0002132550649618877, + "loss": 0.0578, "step": 89600 }, { - "epoch": 0.97, - "learning_rate": 0.0001546141865143747, - "loss": 0.0388, + "epoch": 0.58, + "learning_rate": 0.0002132453836075308, + "loss": 0.0483, "step": 89610 }, { - "epoch": 0.97, - "learning_rate": 0.00015459796222986564, - "loss": 0.0358, + "epoch": 0.58, + "learning_rate": 0.00021323570225317387, + "loss": 0.0484, "step": 89620 }, { - "epoch": 0.97, - "learning_rate": 0.0001545817379453566, - "loss": 0.0384, + "epoch": 0.58, + "learning_rate": 0.00021322602089881692, + "loss": 0.06, "step": 89630 }, { - "epoch": 0.97, - "learning_rate": 0.00015456551366084753, - "loss": 0.0436, + "epoch": 0.58, + "learning_rate": 0.00021321633954446, + "loss": 0.0464, "step": 89640 }, { - "epoch": 0.97, - "learning_rate": 0.0001545492893763385, - "loss": 0.0438, + "epoch": 0.58, + "learning_rate": 0.00021320665819010305, + "loss": 0.0454, "step": 89650 }, { - "epoch": 0.97, - "learning_rate": 0.00015453306509182943, - "loss": 0.0433, + "epoch": 0.58, + "learning_rate": 0.0002131969768357461, + "loss": 0.0541, "step": 89660 }, { - "epoch": 0.97, - "learning_rate": 0.00015451684080732038, - "loss": 0.0424, + "epoch": 0.58, + "learning_rate": 0.00021318729548138918, + "loss": 0.0554, "step": 89670 }, { - "epoch": 0.97, - "learning_rate": 0.00015450061652281133, - "loss": 0.047, + "epoch": 0.58, + "learning_rate": 0.00021317761412703226, + "loss": 0.0464, "step": 89680 }, { - "epoch": 0.97, - "learning_rate": 0.00015448439223830228, - "loss": 0.0403, + "epoch": 0.58, + "learning_rate": 0.00021316793277267534, + "loss": 0.0485, "step": 89690 }, { - "epoch": 0.97, - "learning_rate": 0.00015446816795379323, - "loss": 0.0405, + "epoch": 0.58, + "learning_rate": 0.0002131582514183184, + "loss": 0.0474, "step": 89700 }, { - "epoch": 0.97, - "learning_rate": 0.00015445194366928418, - "loss": 0.04, + "epoch": 0.58, + "learning_rate": 0.00021314857006396148, + "loss": 0.0523, "step": 89710 }, { - "epoch": 0.97, - "learning_rate": 0.0001544357193847751, - "loss": 0.0417, + "epoch": 0.58, + "learning_rate": 0.00021313888870960453, + "loss": 0.0531, "step": 89720 }, { - "epoch": 0.97, - "learning_rate": 0.00015441949510026608, - "loss": 0.0461, + "epoch": 0.58, + "learning_rate": 0.00021312920735524758, + "loss": 0.0479, "step": 89730 }, { - "epoch": 0.97, - "learning_rate": 0.000154403270815757, - "loss": 0.0401, - "step": 89740 + "epoch": 0.58, + "learning_rate": 0.00021311952600089066, + "loss": 0.045, + "step": 89740 }, { - "epoch": 0.97, - "learning_rate": 0.00015438704653124798, - "loss": 0.0412, + "epoch": 0.58, + "learning_rate": 0.00021310984464653374, + "loss": 0.0457, "step": 89750 }, { - "epoch": 0.97, - "learning_rate": 0.0001543708222467389, - "loss": 0.0364, + "epoch": 0.58, + "learning_rate": 0.0002131001632921768, + "loss": 0.0488, "step": 89760 }, { - "epoch": 0.97, - "learning_rate": 0.00015435459796222985, - "loss": 0.0388, + "epoch": 0.58, + "learning_rate": 0.00021309048193781987, + "loss": 0.0575, "step": 89770 }, { - "epoch": 0.97, - "learning_rate": 0.0001543383736777208, - "loss": 0.0443, + "epoch": 0.58, + "learning_rate": 0.00021308080058346295, + "loss": 0.0511, "step": 89780 }, { - "epoch": 0.97, - "learning_rate": 0.00015432214939321175, - "loss": 0.0399, + "epoch": 0.58, + "learning_rate": 0.00021307111922910598, + "loss": 0.0524, "step": 89790 }, { - "epoch": 0.97, - "learning_rate": 0.00015430592510870268, - "loss": 0.0413, + "epoch": 0.58, + "learning_rate": 0.00021306143787474906, + "loss": 0.0504, "step": 89800 }, { - "epoch": 0.97, - "learning_rate": 0.00015428970082419365, - "loss": 0.0439, + "epoch": 0.58, + "learning_rate": 0.00021305175652039214, + "loss": 0.0492, "step": 89810 }, { - "epoch": 0.97, - "learning_rate": 0.00015427347653968458, - "loss": 0.0403, + "epoch": 0.58, + "learning_rate": 0.00021304207516603522, + "loss": 0.0521, "step": 89820 }, { - "epoch": 0.97, - "learning_rate": 0.00015425725225517555, - "loss": 0.0352, + "epoch": 0.58, + "learning_rate": 0.00021303239381167827, + "loss": 0.0517, "step": 89830 }, { - "epoch": 0.97, - "learning_rate": 0.00015424102797066648, - "loss": 0.0392, + "epoch": 0.58, + "learning_rate": 0.00021302271245732135, + "loss": 0.0474, "step": 89840 }, { - "epoch": 0.97, - "learning_rate": 0.00015422480368615743, - "loss": 0.0383, + "epoch": 0.58, + "learning_rate": 0.00021301303110296443, + "loss": 0.0559, "step": 89850 }, { - "epoch": 0.97, - "learning_rate": 0.00015420857940164838, - "loss": 0.0413, + "epoch": 0.58, + "learning_rate": 0.00021300334974860746, + "loss": 0.0526, "step": 89860 }, { - "epoch": 0.97, - "learning_rate": 0.00015419235511713933, - "loss": 0.042, + "epoch": 0.58, + "learning_rate": 0.00021299366839425054, + "loss": 0.054, "step": 89870 }, { - "epoch": 0.97, - "learning_rate": 0.00015417613083263027, - "loss": 0.0418, + "epoch": 0.58, + "learning_rate": 0.00021298398703989362, + "loss": 0.0497, "step": 89880 }, { - "epoch": 0.97, - "learning_rate": 0.00015415990654812122, - "loss": 0.0392, + "epoch": 0.58, + "learning_rate": 0.0002129743056855367, + "loss": 0.0537, "step": 89890 }, { - "epoch": 0.97, - "learning_rate": 0.00015414368226361215, - "loss": 0.04, + "epoch": 0.58, + "learning_rate": 0.00021296462433117975, + "loss": 0.0481, "step": 89900 }, { - "epoch": 0.97, - "learning_rate": 0.00015412745797910312, - "loss": 0.0409, + "epoch": 0.58, + "learning_rate": 0.00021295494297682283, + "loss": 0.0457, "step": 89910 }, { - "epoch": 0.97, - "learning_rate": 0.00015411123369459405, - "loss": 0.0465, + "epoch": 0.58, + "learning_rate": 0.0002129452616224659, + "loss": 0.0505, "step": 89920 }, { - "epoch": 0.97, - "learning_rate": 0.00015409500941008502, - "loss": 0.0425, + "epoch": 0.58, + "learning_rate": 0.00021293558026810893, + "loss": 0.0466, "step": 89930 }, { - "epoch": 0.97, - "learning_rate": 0.00015407878512557595, - "loss": 0.0481, + "epoch": 0.58, + "learning_rate": 0.000212925898913752, + "loss": 0.0525, "step": 89940 }, { - "epoch": 0.97, - "learning_rate": 0.0001540625608410669, - "loss": 0.039, + "epoch": 0.58, + "learning_rate": 0.0002129162175593951, + "loss": 0.0482, "step": 89950 }, { - "epoch": 0.97, - "learning_rate": 0.00015404633655655785, - "loss": 0.0404, + "epoch": 0.58, + "learning_rate": 0.00021290653620503815, + "loss": 0.068, "step": 89960 }, { - "epoch": 0.97, - "learning_rate": 0.0001540301122720488, - "loss": 0.0409, + "epoch": 0.58, + "learning_rate": 0.00021289685485068123, + "loss": 0.0501, "step": 89970 }, { - "epoch": 0.97, - "learning_rate": 0.00015401388798753972, - "loss": 0.039, + "epoch": 0.58, + "learning_rate": 0.0002128871734963243, + "loss": 0.0417, "step": 89980 }, { - "epoch": 0.97, - "learning_rate": 0.0001539976637030307, - "loss": 0.039, + "epoch": 0.58, + "learning_rate": 0.00021287749214196738, + "loss": 0.0546, "step": 89990 }, { - "epoch": 0.97, - "learning_rate": 0.00015398143941852162, - "loss": 0.0387, + "epoch": 0.58, + "learning_rate": 0.0002128678107876104, + "loss": 0.0537, "step": 90000 }, { - "epoch": 0.97, - "eval_cer": 0.9212179361452872, - "eval_loss": 0.03033587709069252, - "eval_runtime": 118.8044, - "eval_samples_per_second": 16.834, - "eval_steps_per_second": 4.209, + "epoch": 0.58, + "eval_cer": 0.9199249802282228, + "eval_loss": 0.03311315178871155, + "eval_runtime": 119.7145, + "eval_samples_per_second": 16.706, + "eval_steps_per_second": 4.177, "step": 90000 }, { - "epoch": 0.97, - "learning_rate": 0.0001539652151340126, - "loss": 0.0447, + "epoch": 0.58, + "learning_rate": 0.0002128581294332535, + "loss": 0.0477, "step": 90010 }, { - "epoch": 0.97, - "learning_rate": 0.00015394899084950352, - "loss": 0.0417, + "epoch": 0.58, + "learning_rate": 0.00021284844807889657, + "loss": 0.057, "step": 90020 }, { - "epoch": 0.97, - "learning_rate": 0.0001539327665649945, - "loss": 0.0423, + "epoch": 0.58, + "learning_rate": 0.00021283876672453962, + "loss": 0.0535, "step": 90030 }, { - "epoch": 0.97, - "learning_rate": 0.00015391654228048542, - "loss": 0.0488, + "epoch": 0.58, + "learning_rate": 0.0002128290853701827, + "loss": 0.0485, "step": 90040 }, { - "epoch": 0.97, - "learning_rate": 0.00015390031799597637, - "loss": 0.044, + "epoch": 0.58, + "learning_rate": 0.00021281940401582578, + "loss": 0.0517, "step": 90050 }, { - "epoch": 0.97, - "learning_rate": 0.00015388409371146732, - "loss": 0.0488, + "epoch": 0.58, + "learning_rate": 0.00021280972266146886, + "loss": 0.0503, "step": 90060 }, { - "epoch": 0.97, - "learning_rate": 0.00015386786942695827, - "loss": 0.0359, + "epoch": 0.58, + "learning_rate": 0.0002128000413071119, + "loss": 0.0543, "step": 90070 }, { - "epoch": 0.97, - "learning_rate": 0.0001538516451424492, - "loss": 0.0393, + "epoch": 0.58, + "learning_rate": 0.00021279035995275497, + "loss": 0.0519, "step": 90080 }, { - "epoch": 0.97, - "learning_rate": 0.00015383542085794017, - "loss": 0.0361, + "epoch": 0.58, + "learning_rate": 0.00021278067859839805, + "loss": 0.0541, "step": 90090 }, { - "epoch": 0.97, - "learning_rate": 0.0001538191965734311, - "loss": 0.0519, + "epoch": 0.58, + "learning_rate": 0.0002127709972440411, + "loss": 0.0505, "step": 90100 }, { - "epoch": 0.97, - "learning_rate": 0.00015380297228892207, - "loss": 0.0473, + "epoch": 0.58, + "learning_rate": 0.00021276131588968418, + "loss": 0.048, "step": 90110 }, { - "epoch": 0.97, - "learning_rate": 0.000153786748004413, - "loss": 0.0403, + "epoch": 0.58, + "learning_rate": 0.00021275163453532726, + "loss": 0.0522, "step": 90120 }, { - "epoch": 0.97, - "learning_rate": 0.00015377052371990394, - "loss": 0.0438, + "epoch": 0.58, + "learning_rate": 0.00021274195318097034, + "loss": 0.0512, "step": 90130 }, { - "epoch": 0.97, - "learning_rate": 0.0001537542994353949, - "loss": 0.0463, + "epoch": 0.58, + "learning_rate": 0.00021273227182661336, + "loss": 0.0437, "step": 90140 }, { - "epoch": 0.98, - "learning_rate": 0.00015373807515088584, - "loss": 0.0447, + "epoch": 0.58, + "learning_rate": 0.00021272259047225644, + "loss": 0.0542, "step": 90150 }, { - "epoch": 0.98, - "learning_rate": 0.00015372185086637676, - "loss": 0.0543, + "epoch": 0.58, + "learning_rate": 0.0002127129091178995, + "loss": 0.0521, "step": 90160 }, { - "epoch": 0.98, - "learning_rate": 0.00015370562658186774, - "loss": 0.0398, + "epoch": 0.58, + "learning_rate": 0.00021270322776354258, + "loss": 0.0516, "step": 90170 }, { - "epoch": 0.98, - "learning_rate": 0.00015368940229735866, - "loss": 0.039, + "epoch": 0.58, + "learning_rate": 0.00021269354640918566, + "loss": 0.0454, "step": 90180 }, { - "epoch": 0.98, - "learning_rate": 0.00015367317801284964, - "loss": 0.0524, + "epoch": 0.58, + "learning_rate": 0.00021268386505482874, + "loss": 0.0542, "step": 90190 }, { - "epoch": 0.98, - "learning_rate": 0.00015365695372834056, - "loss": 0.0406, + "epoch": 0.58, + "learning_rate": 0.0002126741837004718, + "loss": 0.0483, "step": 90200 }, { - "epoch": 0.98, - "learning_rate": 0.00015364072944383154, - "loss": 0.0465, + "epoch": 0.58, + "learning_rate": 0.00021266450234611484, + "loss": 0.0497, "step": 90210 }, { - "epoch": 0.98, - "learning_rate": 0.00015362450515932246, - "loss": 0.042, + "epoch": 0.58, + "learning_rate": 0.00021265482099175792, + "loss": 0.0517, "step": 90220 }, { - "epoch": 0.98, - "learning_rate": 0.0001536082808748134, - "loss": 0.0397, + "epoch": 0.58, + "learning_rate": 0.00021264513963740097, + "loss": 0.0515, "step": 90230 }, { - "epoch": 0.98, - "learning_rate": 0.00015359205659030436, - "loss": 0.0372, + "epoch": 0.58, + "learning_rate": 0.00021263545828304405, + "loss": 0.0488, "step": 90240 }, { - "epoch": 0.98, - "learning_rate": 0.0001535758323057953, - "loss": 0.0418, + "epoch": 0.58, + "learning_rate": 0.00021262577692868713, + "loss": 0.0493, "step": 90250 }, { - "epoch": 0.98, - "learning_rate": 0.00015355960802128623, - "loss": 0.0511, + "epoch": 0.58, + "learning_rate": 0.00021261609557433021, + "loss": 0.0463, "step": 90260 }, { - "epoch": 0.98, - "learning_rate": 0.0001535433837367772, - "loss": 0.0372, + "epoch": 0.58, + "learning_rate": 0.00021260641421997327, + "loss": 0.0461, "step": 90270 }, { - "epoch": 0.98, - "learning_rate": 0.00015352715945226813, - "loss": 0.0398, + "epoch": 0.58, + "learning_rate": 0.00021259673286561632, + "loss": 0.0532, "step": 90280 }, { - "epoch": 0.98, - "learning_rate": 0.0001535109351677591, - "loss": 0.0457, + "epoch": 0.58, + "learning_rate": 0.0002125870515112594, + "loss": 0.0472, "step": 90290 }, { - "epoch": 0.98, - "learning_rate": 0.00015349471088325003, - "loss": 0.0473, + "epoch": 0.58, + "learning_rate": 0.00021257737015690245, + "loss": 0.0452, "step": 90300 }, { - "epoch": 0.98, - "learning_rate": 0.00015347848659874098, - "loss": 0.043, + "epoch": 0.58, + "learning_rate": 0.00021256768880254553, + "loss": 0.0578, "step": 90310 }, { - "epoch": 0.98, - "learning_rate": 0.00015346226231423193, - "loss": 0.0486, + "epoch": 0.58, + "learning_rate": 0.0002125580074481886, + "loss": 0.0577, "step": 90320 }, { - "epoch": 0.98, - "learning_rate": 0.00015344603802972288, - "loss": 0.0504, + "epoch": 0.58, + "learning_rate": 0.0002125483260938317, + "loss": 0.0534, "step": 90330 }, { - "epoch": 0.98, - "learning_rate": 0.0001534298137452138, - "loss": 0.0423, + "epoch": 0.58, + "learning_rate": 0.00021253864473947474, + "loss": 0.0518, "step": 90340 }, { - "epoch": 0.98, - "learning_rate": 0.00015341358946070478, - "loss": 0.044, + "epoch": 0.58, + "learning_rate": 0.0002125289633851178, + "loss": 0.0528, "step": 90350 }, { - "epoch": 0.98, - "learning_rate": 0.0001533973651761957, - "loss": 0.0424, + "epoch": 0.58, + "learning_rate": 0.00021251928203076085, + "loss": 0.0554, "step": 90360 }, { - "epoch": 0.98, - "learning_rate": 0.00015338114089168668, - "loss": 0.0459, + "epoch": 0.58, + "learning_rate": 0.00021250960067640393, + "loss": 0.0505, "step": 90370 }, { - "epoch": 0.98, - "learning_rate": 0.0001533649166071776, - "loss": 0.0468, + "epoch": 0.58, + "learning_rate": 0.000212499919322047, + "loss": 0.0485, "step": 90380 }, { - "epoch": 0.98, - "learning_rate": 0.00015334869232266858, - "loss": 0.0427, + "epoch": 0.58, + "learning_rate": 0.0002124902379676901, + "loss": 0.0504, "step": 90390 }, { - "epoch": 0.98, - "learning_rate": 0.0001533324680381595, - "loss": 0.042, + "epoch": 0.58, + "learning_rate": 0.00021248055661333314, + "loss": 0.0462, "step": 90400 }, { - "epoch": 0.98, - "learning_rate": 0.00015331624375365045, - "loss": 0.0407, + "epoch": 0.58, + "learning_rate": 0.00021247087525897622, + "loss": 0.0508, "step": 90410 }, { - "epoch": 0.98, - "learning_rate": 0.0001533000194691414, - "loss": 0.0439, + "epoch": 0.58, + "learning_rate": 0.00021246119390461927, + "loss": 0.0552, "step": 90420 }, { - "epoch": 0.98, - "learning_rate": 0.00015328379518463235, - "loss": 0.0466, + "epoch": 0.58, + "learning_rate": 0.00021245151255026233, + "loss": 0.0415, "step": 90430 }, { - "epoch": 0.98, - "learning_rate": 0.00015326757090012327, - "loss": 0.0415, + "epoch": 0.58, + "learning_rate": 0.0002124418311959054, + "loss": 0.0486, "step": 90440 }, { - "epoch": 0.98, - "learning_rate": 0.00015325134661561425, - "loss": 0.0359, + "epoch": 0.58, + "learning_rate": 0.00021243214984154849, + "loss": 0.052, "step": 90450 }, { - "epoch": 0.98, - "learning_rate": 0.00015323512233110517, - "loss": 0.0378, + "epoch": 0.58, + "learning_rate": 0.00021242246848719157, + "loss": 0.0517, "step": 90460 }, { - "epoch": 0.98, - "learning_rate": 0.00015321889804659615, - "loss": 0.046, + "epoch": 0.58, + "learning_rate": 0.00021241278713283462, + "loss": 0.0559, "step": 90470 }, { - "epoch": 0.98, - "learning_rate": 0.00015320267376208707, - "loss": 0.0376, + "epoch": 0.58, + "learning_rate": 0.0002124031057784777, + "loss": 0.05, "step": 90480 }, { - "epoch": 0.98, - "learning_rate": 0.00015318644947757802, - "loss": 0.0377, + "epoch": 0.58, + "learning_rate": 0.00021239342442412075, + "loss": 0.0508, "step": 90490 }, { - "epoch": 0.98, - "learning_rate": 0.00015317022519306897, - "loss": 0.0457, + "epoch": 0.58, + "learning_rate": 0.0002123837430697638, + "loss": 0.0454, "step": 90500 }, { - "epoch": 0.98, - "learning_rate": 0.00015315400090855992, - "loss": 0.0398, + "epoch": 0.58, + "learning_rate": 0.00021237406171540688, + "loss": 0.0501, "step": 90510 }, { - "epoch": 0.98, - "learning_rate": 0.00015313777662405084, - "loss": 0.0374, + "epoch": 0.58, + "learning_rate": 0.00021236438036104996, + "loss": 0.0474, "step": 90520 }, { - "epoch": 0.98, - "learning_rate": 0.00015312155233954182, - "loss": 0.0353, + "epoch": 0.58, + "learning_rate": 0.00021235469900669304, + "loss": 0.0457, "step": 90530 }, { - "epoch": 0.98, - "learning_rate": 0.00015310532805503274, - "loss": 0.0385, + "epoch": 0.58, + "learning_rate": 0.0002123450176523361, + "loss": 0.049, "step": 90540 }, { - "epoch": 0.98, - "learning_rate": 0.00015308910377052372, - "loss": 0.0365, + "epoch": 0.58, + "learning_rate": 0.00021233533629797918, + "loss": 0.0512, "step": 90550 }, { - "epoch": 0.98, - "learning_rate": 0.00015307287948601464, - "loss": 0.043, + "epoch": 0.58, + "learning_rate": 0.0002123256549436222, + "loss": 0.0469, "step": 90560 }, { - "epoch": 0.98, - "learning_rate": 0.00015305665520150562, - "loss": 0.0395, + "epoch": 0.58, + "learning_rate": 0.00021231597358926528, + "loss": 0.0553, "step": 90570 }, { - "epoch": 0.98, - "learning_rate": 0.00015304043091699654, - "loss": 0.0416, + "epoch": 0.58, + "learning_rate": 0.00021230629223490836, + "loss": 0.0468, "step": 90580 }, { - "epoch": 0.98, - "learning_rate": 0.0001530242066324875, - "loss": 0.0384, + "epoch": 0.58, + "learning_rate": 0.00021229661088055144, + "loss": 0.0458, "step": 90590 }, { - "epoch": 0.98, - "learning_rate": 0.00015300798234797844, - "loss": 0.0344, + "epoch": 0.58, + "learning_rate": 0.0002122869295261945, + "loss": 0.0467, "step": 90600 }, { - "epoch": 0.98, - "learning_rate": 0.0001529917580634694, - "loss": 0.0461, + "epoch": 0.58, + "learning_rate": 0.00021227724817183757, + "loss": 0.0498, "step": 90610 }, { - "epoch": 0.98, - "learning_rate": 0.00015297553377896031, - "loss": 0.0429, + "epoch": 0.58, + "learning_rate": 0.00021226756681748065, + "loss": 0.0591, "step": 90620 }, { - "epoch": 0.98, - "learning_rate": 0.0001529593094944513, - "loss": 0.0418, + "epoch": 0.58, + "learning_rate": 0.00021225788546312368, + "loss": 0.0484, "step": 90630 }, { - "epoch": 0.98, - "learning_rate": 0.0001529430852099422, - "loss": 0.0403, + "epoch": 0.59, + "learning_rate": 0.00021224820410876676, + "loss": 0.0445, "step": 90640 }, { - "epoch": 0.98, - "learning_rate": 0.0001529268609254332, - "loss": 0.0366, + "epoch": 0.59, + "learning_rate": 0.00021223852275440984, + "loss": 0.0564, "step": 90650 }, { - "epoch": 0.98, - "learning_rate": 0.0001529106366409241, - "loss": 0.0376, + "epoch": 0.59, + "learning_rate": 0.00021222884140005292, + "loss": 0.0522, "step": 90660 }, { - "epoch": 0.98, - "learning_rate": 0.00015289441235641506, - "loss": 0.0364, + "epoch": 0.59, + "learning_rate": 0.00021221916004569597, + "loss": 0.0515, "step": 90670 }, { - "epoch": 0.98, - "learning_rate": 0.000152878188071906, - "loss": 0.0468, + "epoch": 0.59, + "learning_rate": 0.00021220947869133905, + "loss": 0.0505, "step": 90680 }, { - "epoch": 0.98, - "learning_rate": 0.00015286196378739696, - "loss": 0.0401, + "epoch": 0.59, + "learning_rate": 0.00021219979733698213, + "loss": 0.0424, "step": 90690 }, { - "epoch": 0.98, - "learning_rate": 0.00015284573950288788, - "loss": 0.0346, + "epoch": 0.59, + "learning_rate": 0.00021219011598262516, + "loss": 0.0464, "step": 90700 }, { - "epoch": 0.98, - "learning_rate": 0.00015282951521837886, - "loss": 0.0367, + "epoch": 0.59, + "learning_rate": 0.00021218043462826824, + "loss": 0.0443, "step": 90710 }, { - "epoch": 0.98, - "learning_rate": 0.00015281329093386978, - "loss": 0.0348, + "epoch": 0.59, + "learning_rate": 0.00021217075327391132, + "loss": 0.0468, "step": 90720 }, { - "epoch": 0.98, - "learning_rate": 0.00015279706664936076, - "loss": 0.0472, + "epoch": 0.59, + "learning_rate": 0.0002121610719195544, + "loss": 0.0441, "step": 90730 }, { - "epoch": 0.98, - "learning_rate": 0.00015278084236485168, - "loss": 0.0411, + "epoch": 0.59, + "learning_rate": 0.00021215139056519745, + "loss": 0.0515, "step": 90740 }, { - "epoch": 0.98, - "learning_rate": 0.00015276461808034266, - "loss": 0.0358, + "epoch": 0.59, + "learning_rate": 0.00021214170921084053, + "loss": 0.0489, "step": 90750 }, { - "epoch": 0.98, - "learning_rate": 0.00015274839379583358, - "loss": 0.0412, + "epoch": 0.59, + "learning_rate": 0.0002121320278564836, + "loss": 0.0552, "step": 90760 }, { - "epoch": 0.98, - "learning_rate": 0.00015273216951132453, - "loss": 0.0401, + "epoch": 0.59, + "learning_rate": 0.00021212234650212663, + "loss": 0.0487, "step": 90770 }, { - "epoch": 0.98, - "learning_rate": 0.00015271594522681548, - "loss": 0.0389, + "epoch": 0.59, + "learning_rate": 0.0002121126651477697, + "loss": 0.0467, "step": 90780 }, { - "epoch": 0.98, - "learning_rate": 0.00015269972094230643, - "loss": 0.0451, + "epoch": 0.59, + "learning_rate": 0.0002121029837934128, + "loss": 0.0475, "step": 90790 }, { - "epoch": 0.98, - "learning_rate": 0.00015268349665779736, - "loss": 0.0447, + "epoch": 0.59, + "learning_rate": 0.00021209330243905585, + "loss": 0.0526, "step": 90800 }, { - "epoch": 0.98, - "learning_rate": 0.00015266727237328833, - "loss": 0.0419, + "epoch": 0.59, + "learning_rate": 0.00021208362108469892, + "loss": 0.0482, "step": 90810 }, { - "epoch": 0.98, - "learning_rate": 0.00015265104808877926, - "loss": 0.0363, + "epoch": 0.59, + "learning_rate": 0.000212073939730342, + "loss": 0.0457, "step": 90820 }, { - "epoch": 0.98, - "learning_rate": 0.00015263482380427023, - "loss": 0.0381, + "epoch": 0.59, + "learning_rate": 0.00021206425837598508, + "loss": 0.0469, "step": 90830 }, { - "epoch": 0.98, - "learning_rate": 0.00015261859951976115, - "loss": 0.0401, + "epoch": 0.59, + "learning_rate": 0.0002120545770216281, + "loss": 0.0524, "step": 90840 }, { - "epoch": 0.98, - "learning_rate": 0.0001526023752352521, - "loss": 0.0399, + "epoch": 0.59, + "learning_rate": 0.0002120448956672712, + "loss": 0.0576, "step": 90850 }, { - "epoch": 0.98, - "learning_rate": 0.00015258615095074305, - "loss": 0.047, + "epoch": 0.59, + "learning_rate": 0.00021203521431291427, + "loss": 0.0503, "step": 90860 }, { - "epoch": 0.98, - "learning_rate": 0.000152569926666234, - "loss": 0.0464, + "epoch": 0.59, + "learning_rate": 0.00021202553295855732, + "loss": 0.0461, "step": 90870 }, { - "epoch": 0.98, - "learning_rate": 0.00015255370238172495, - "loss": 0.0474, + "epoch": 0.59, + "learning_rate": 0.0002120158516042004, + "loss": 0.0451, "step": 90880 }, { - "epoch": 0.98, - "learning_rate": 0.0001525374780972159, - "loss": 0.0393, + "epoch": 0.59, + "learning_rate": 0.00021200617024984348, + "loss": 0.0511, "step": 90890 }, { - "epoch": 0.98, - "learning_rate": 0.00015252125381270683, - "loss": 0.0479, + "epoch": 0.59, + "learning_rate": 0.00021199648889548656, + "loss": 0.0453, "step": 90900 }, { - "epoch": 0.98, - "learning_rate": 0.0001525050295281978, - "loss": 0.0396, + "epoch": 0.59, + "learning_rate": 0.0002119868075411296, + "loss": 0.047, "step": 90910 }, { - "epoch": 0.98, - "learning_rate": 0.00015248880524368873, - "loss": 0.043, + "epoch": 0.59, + "learning_rate": 0.00021197712618677267, + "loss": 0.0459, "step": 90920 }, { - "epoch": 0.98, - "learning_rate": 0.0001524725809591797, - "loss": 0.0418, + "epoch": 0.59, + "learning_rate": 0.00021196744483241575, + "loss": 0.0481, "step": 90930 }, { - "epoch": 0.98, - "learning_rate": 0.00015245635667467063, - "loss": 0.0488, + "epoch": 0.59, + "learning_rate": 0.0002119577634780588, + "loss": 0.0467, "step": 90940 }, { - "epoch": 0.98, - "learning_rate": 0.00015244013239016158, - "loss": 0.0364, + "epoch": 0.59, + "learning_rate": 0.00021194808212370188, + "loss": 0.0501, "step": 90950 }, { - "epoch": 0.98, - "learning_rate": 0.00015242390810565252, - "loss": 0.0416, + "epoch": 0.59, + "learning_rate": 0.00021193840076934496, + "loss": 0.0442, "step": 90960 }, { - "epoch": 0.98, - "learning_rate": 0.00015240768382114347, - "loss": 0.0484, + "epoch": 0.59, + "learning_rate": 0.000211928719414988, + "loss": 0.0472, "step": 90970 }, { - "epoch": 0.98, - "learning_rate": 0.0001523914595366344, - "loss": 0.0459, + "epoch": 0.59, + "learning_rate": 0.00021191903806063106, + "loss": 0.0452, "step": 90980 }, { - "epoch": 0.98, - "learning_rate": 0.00015237523525212537, - "loss": 0.0465, + "epoch": 0.59, + "learning_rate": 0.00021190935670627414, + "loss": 0.0497, "step": 90990 }, { - "epoch": 0.98, - "learning_rate": 0.0001523590109676163, - "loss": 0.0478, + "epoch": 0.59, + "learning_rate": 0.0002118996753519172, + "loss": 0.0477, "step": 91000 }, { - "epoch": 0.98, - "eval_cer": 0.9211993829745504, - "eval_loss": 0.030189067125320435, - "eval_runtime": 118.9859, - "eval_samples_per_second": 16.809, - "eval_steps_per_second": 4.202, + "epoch": 0.59, + "eval_cer": 0.9199819229465597, + "eval_loss": 0.03264106065034866, + "eval_runtime": 119.6718, + "eval_samples_per_second": 16.712, + "eval_steps_per_second": 4.178, "step": 91000 }, { - "epoch": 0.98, - "learning_rate": 0.00015234278668310727, - "loss": 0.0403, + "epoch": 0.59, + "learning_rate": 0.00021188999399756028, + "loss": 0.056, "step": 91010 }, { - "epoch": 0.98, - "learning_rate": 0.0001523265623985982, - "loss": 0.0437, + "epoch": 0.59, + "learning_rate": 0.00021188031264320336, + "loss": 0.0529, "step": 91020 }, { - "epoch": 0.98, - "learning_rate": 0.00015231033811408915, - "loss": 0.0475, + "epoch": 0.59, + "learning_rate": 0.00021187063128884644, + "loss": 0.0468, "step": 91030 }, { - "epoch": 0.98, - "learning_rate": 0.0001522941138295801, - "loss": 0.0368, + "epoch": 0.59, + "learning_rate": 0.0002118609499344895, + "loss": 0.0472, "step": 91040 }, { - "epoch": 0.98, - "learning_rate": 0.00015227788954507105, - "loss": 0.0416, + "epoch": 0.59, + "learning_rate": 0.00021185126858013254, + "loss": 0.0527, "step": 91050 }, { - "epoch": 0.98, - "learning_rate": 0.000152261665260562, - "loss": 0.0379, + "epoch": 0.59, + "learning_rate": 0.00021184158722577562, + "loss": 0.0541, "step": 91060 }, { - "epoch": 0.99, - "learning_rate": 0.00015224544097605295, - "loss": 0.0397, + "epoch": 0.59, + "learning_rate": 0.00021183190587141867, + "loss": 0.0429, "step": 91070 }, { - "epoch": 0.99, - "learning_rate": 0.00015222921669154387, - "loss": 0.0434, + "epoch": 0.59, + "learning_rate": 0.00021182222451706175, + "loss": 0.0446, "step": 91080 }, { - "epoch": 0.99, - "learning_rate": 0.00015221299240703484, - "loss": 0.0452, + "epoch": 0.59, + "learning_rate": 0.00021181254316270483, + "loss": 0.0524, "step": 91090 }, { - "epoch": 0.99, - "learning_rate": 0.00015219676812252577, - "loss": 0.0409, + "epoch": 0.59, + "learning_rate": 0.00021180286180834791, + "loss": 0.0433, "step": 91100 }, { - "epoch": 0.99, - "learning_rate": 0.00015218054383801674, - "loss": 0.04, + "epoch": 0.59, + "learning_rate": 0.00021179318045399097, + "loss": 0.0505, "step": 91110 }, { - "epoch": 0.99, - "learning_rate": 0.00015216431955350767, - "loss": 0.0539, + "epoch": 0.59, + "learning_rate": 0.00021178349909963402, + "loss": 0.054, "step": 91120 }, { - "epoch": 0.99, - "learning_rate": 0.00015214809526899862, - "loss": 0.0589, + "epoch": 0.59, + "learning_rate": 0.0002117738177452771, + "loss": 0.0486, "step": 91130 }, { - "epoch": 0.99, - "learning_rate": 0.00015213187098448957, - "loss": 0.0458, + "epoch": 0.59, + "learning_rate": 0.00021176413639092015, + "loss": 0.0462, "step": 91140 }, { - "epoch": 0.99, - "learning_rate": 0.00015211564669998052, - "loss": 0.0388, + "epoch": 0.59, + "learning_rate": 0.00021175445503656323, + "loss": 0.0481, "step": 91150 }, { - "epoch": 0.99, - "learning_rate": 0.00015209942241547144, - "loss": 0.0366, + "epoch": 0.59, + "learning_rate": 0.0002117447736822063, + "loss": 0.0505, "step": 91160 }, { - "epoch": 0.99, - "learning_rate": 0.00015208319813096242, - "loss": 0.0403, + "epoch": 0.59, + "learning_rate": 0.00021173509232784936, + "loss": 0.0531, "step": 91170 }, { - "epoch": 0.99, - "learning_rate": 0.00015206697384645334, - "loss": 0.0496, + "epoch": 0.59, + "learning_rate": 0.00021172541097349244, + "loss": 0.0476, "step": 91180 }, { - "epoch": 0.99, - "learning_rate": 0.00015205074956194432, - "loss": 0.0358, + "epoch": 0.59, + "learning_rate": 0.0002117157296191355, + "loss": 0.0498, "step": 91190 }, { - "epoch": 0.99, - "learning_rate": 0.00015203452527743524, - "loss": 0.0407, + "epoch": 0.59, + "learning_rate": 0.00021170604826477855, + "loss": 0.0485, "step": 91200 }, { - "epoch": 0.99, - "learning_rate": 0.0001520183009929262, - "loss": 0.0398, + "epoch": 0.59, + "learning_rate": 0.00021169636691042163, + "loss": 0.0466, "step": 91210 }, { - "epoch": 0.99, - "learning_rate": 0.00015200207670841714, - "loss": 0.0392, + "epoch": 0.59, + "learning_rate": 0.0002116866855560647, + "loss": 0.0466, "step": 91220 }, { - "epoch": 0.99, - "learning_rate": 0.0001519858524239081, - "loss": 0.0423, + "epoch": 0.59, + "learning_rate": 0.0002116770042017078, + "loss": 0.0501, "step": 91230 }, { - "epoch": 0.99, - "learning_rate": 0.00015196962813939904, - "loss": 0.0438, + "epoch": 0.59, + "learning_rate": 0.00021166732284735084, + "loss": 0.0461, "step": 91240 }, { - "epoch": 0.99, - "learning_rate": 0.00015195340385489, - "loss": 0.0384, + "epoch": 0.59, + "learning_rate": 0.00021165764149299392, + "loss": 0.0438, "step": 91250 }, { - "epoch": 0.99, - "learning_rate": 0.0001519371795703809, - "loss": 0.0429, + "epoch": 0.59, + "learning_rate": 0.00021164796013863697, + "loss": 0.0458, "step": 91260 }, { - "epoch": 0.99, - "learning_rate": 0.00015192095528587189, - "loss": 0.0372, + "epoch": 0.59, + "learning_rate": 0.00021163827878428003, + "loss": 0.0465, "step": 91270 }, { - "epoch": 0.99, - "learning_rate": 0.0001519047310013628, - "loss": 0.0425, + "epoch": 0.59, + "learning_rate": 0.0002116285974299231, + "loss": 0.0528, "step": 91280 }, { - "epoch": 0.99, - "learning_rate": 0.00015188850671685379, - "loss": 0.0421, + "epoch": 0.59, + "learning_rate": 0.00021161891607556619, + "loss": 0.0629, "step": 91290 }, { - "epoch": 0.99, - "learning_rate": 0.0001518722824323447, - "loss": 0.041, + "epoch": 0.59, + "learning_rate": 0.00021160923472120927, + "loss": 0.0443, "step": 91300 }, { - "epoch": 0.99, - "learning_rate": 0.00015185605814783566, - "loss": 0.0404, + "epoch": 0.59, + "learning_rate": 0.00021159955336685232, + "loss": 0.0418, "step": 91310 }, { - "epoch": 0.99, - "learning_rate": 0.0001518398338633266, - "loss": 0.0407, + "epoch": 0.59, + "learning_rate": 0.0002115898720124954, + "loss": 0.051, "step": 91320 }, { - "epoch": 0.99, - "learning_rate": 0.00015182360957881756, - "loss": 0.04, + "epoch": 0.59, + "learning_rate": 0.00021158019065813845, + "loss": 0.0489, "step": 91330 }, { - "epoch": 0.99, - "learning_rate": 0.00015180738529430848, - "loss": 0.0435, + "epoch": 0.59, + "learning_rate": 0.0002115705093037815, + "loss": 0.0514, "step": 91340 }, { - "epoch": 0.99, - "learning_rate": 0.00015179116100979946, - "loss": 0.0447, + "epoch": 0.59, + "learning_rate": 0.00021156082794942458, + "loss": 0.0498, "step": 91350 }, { - "epoch": 0.99, - "learning_rate": 0.00015177493672529038, - "loss": 0.0376, + "epoch": 0.59, + "learning_rate": 0.00021155114659506766, + "loss": 0.0522, "step": 91360 }, { - "epoch": 0.99, - "learning_rate": 0.00015175871244078136, - "loss": 0.0418, + "epoch": 0.59, + "learning_rate": 0.00021154146524071072, + "loss": 0.0533, "step": 91370 }, { - "epoch": 0.99, - "learning_rate": 0.00015174248815627228, - "loss": 0.0437, + "epoch": 0.59, + "learning_rate": 0.0002115317838863538, + "loss": 0.0489, "step": 91380 }, { - "epoch": 0.99, - "learning_rate": 0.00015172626387176323, - "loss": 0.0404, + "epoch": 0.59, + "learning_rate": 0.00021152210253199688, + "loss": 0.0494, "step": 91390 }, { - "epoch": 0.99, - "learning_rate": 0.00015171003958725418, - "loss": 0.0433, + "epoch": 0.59, + "learning_rate": 0.0002115124211776399, + "loss": 0.0494, "step": 91400 }, { - "epoch": 0.99, - "learning_rate": 0.00015169381530274513, - "loss": 0.044, + "epoch": 0.59, + "learning_rate": 0.00021150273982328298, + "loss": 0.0682, "step": 91410 }, { - "epoch": 0.99, - "learning_rate": 0.00015167759101823608, - "loss": 0.0447, + "epoch": 0.59, + "learning_rate": 0.00021149305846892606, + "loss": 0.0581, "step": 91420 }, { - "epoch": 0.99, - "learning_rate": 0.00015166136673372703, - "loss": 0.0389, + "epoch": 0.59, + "learning_rate": 0.00021148337711456914, + "loss": 0.0529, "step": 91430 }, { - "epoch": 0.99, - "learning_rate": 0.00015164514244921795, - "loss": 0.034, + "epoch": 0.59, + "learning_rate": 0.0002114736957602122, + "loss": 0.0519, "step": 91440 }, { - "epoch": 0.99, - "learning_rate": 0.00015162891816470893, - "loss": 0.0411, + "epoch": 0.59, + "learning_rate": 0.00021146401440585527, + "loss": 0.048, "step": 91450 }, { - "epoch": 0.99, - "learning_rate": 0.00015161269388019985, - "loss": 0.0421, + "epoch": 0.59, + "learning_rate": 0.00021145433305149835, + "loss": 0.0517, "step": 91460 }, { - "epoch": 0.99, - "learning_rate": 0.00015159646959569083, - "loss": 0.0464, + "epoch": 0.59, + "learning_rate": 0.00021144465169714138, + "loss": 0.0518, "step": 91470 }, { - "epoch": 0.99, - "learning_rate": 0.00015158024531118175, - "loss": 0.043, + "epoch": 0.59, + "learning_rate": 0.00021143497034278446, + "loss": 0.0509, "step": 91480 }, { - "epoch": 0.99, - "learning_rate": 0.0001515640210266727, - "loss": 0.0459, + "epoch": 0.59, + "learning_rate": 0.00021142528898842754, + "loss": 0.054, "step": 91490 }, { - "epoch": 0.99, - "learning_rate": 0.00015154779674216365, - "loss": 0.0477, + "epoch": 0.59, + "learning_rate": 0.00021141560763407062, + "loss": 0.0419, "step": 91500 }, { - "epoch": 0.99, - "learning_rate": 0.0001515315724576546, - "loss": 0.0544, + "epoch": 0.59, + "learning_rate": 0.00021140592627971367, + "loss": 0.049, "step": 91510 }, { - "epoch": 0.99, - "learning_rate": 0.00015151534817314558, - "loss": 0.0393, + "epoch": 0.59, + "learning_rate": 0.00021139624492535675, + "loss": 0.048, "step": 91520 }, { - "epoch": 0.99, - "learning_rate": 0.0001514991238886365, - "loss": 0.0397, + "epoch": 0.59, + "learning_rate": 0.00021138656357099983, + "loss": 0.0517, "step": 91530 }, { - "epoch": 0.99, - "learning_rate": 0.00015148289960412745, - "loss": 0.0466, + "epoch": 0.59, + "learning_rate": 0.00021137688221664286, + "loss": 0.0512, "step": 91540 }, { - "epoch": 0.99, - "learning_rate": 0.0001514666753196184, - "loss": 0.0394, + "epoch": 0.59, + "learning_rate": 0.00021136720086228594, + "loss": 0.0492, "step": 91550 }, { - "epoch": 0.99, - "learning_rate": 0.00015145045103510935, - "loss": 0.0377, + "epoch": 0.59, + "learning_rate": 0.00021135751950792901, + "loss": 0.0592, "step": 91560 }, { - "epoch": 0.99, - "learning_rate": 0.0001514342267506003, - "loss": 0.0436, + "epoch": 0.59, + "learning_rate": 0.00021134783815357207, + "loss": 0.0502, "step": 91570 }, { - "epoch": 0.99, - "learning_rate": 0.00015141800246609125, - "loss": 0.0367, + "epoch": 0.59, + "learning_rate": 0.00021133815679921515, + "loss": 0.0492, "step": 91580 }, { - "epoch": 0.99, - "learning_rate": 0.00015140177818158217, - "loss": 0.0412, + "epoch": 0.59, + "learning_rate": 0.00021132847544485823, + "loss": 0.0541, "step": 91590 }, { - "epoch": 0.99, - "learning_rate": 0.00015138555389707315, - "loss": 0.0361, + "epoch": 0.59, + "learning_rate": 0.0002113187940905013, + "loss": 0.0474, "step": 91600 }, { - "epoch": 0.99, - "learning_rate": 0.00015136932961256407, - "loss": 0.0395, + "epoch": 0.59, + "learning_rate": 0.00021130911273614433, + "loss": 0.0472, "step": 91610 }, { - "epoch": 0.99, - "learning_rate": 0.00015135310532805505, - "loss": 0.0409, + "epoch": 0.59, + "learning_rate": 0.0002112994313817874, + "loss": 0.0542, "step": 91620 }, { - "epoch": 0.99, - "learning_rate": 0.00015133688104354597, - "loss": 0.0397, + "epoch": 0.59, + "learning_rate": 0.0002112897500274305, + "loss": 0.0559, "step": 91630 }, { - "epoch": 0.99, - "learning_rate": 0.00015132065675903692, - "loss": 0.0459, + "epoch": 0.59, + "learning_rate": 0.00021128006867307354, + "loss": 0.0537, "step": 91640 }, { - "epoch": 0.99, - "learning_rate": 0.00015130443247452787, - "loss": 0.0421, + "epoch": 0.59, + "learning_rate": 0.00021127038731871662, + "loss": 0.0525, "step": 91650 }, { - "epoch": 0.99, - "learning_rate": 0.00015128820819001882, - "loss": 0.0474, + "epoch": 0.59, + "learning_rate": 0.0002112607059643597, + "loss": 0.0582, "step": 91660 }, { - "epoch": 0.99, - "learning_rate": 0.00015127198390550974, - "loss": 0.0357, + "epoch": 0.59, + "learning_rate": 0.00021125102461000278, + "loss": 0.0511, "step": 91670 }, { - "epoch": 0.99, - "learning_rate": 0.00015125575962100072, - "loss": 0.042, + "epoch": 0.59, + "learning_rate": 0.0002112413432556458, + "loss": 0.0542, "step": 91680 }, { - "epoch": 0.99, - "learning_rate": 0.00015123953533649164, - "loss": 0.0387, + "epoch": 0.59, + "learning_rate": 0.0002112316619012889, + "loss": 0.052, "step": 91690 }, { - "epoch": 0.99, - "learning_rate": 0.00015122331105198262, - "loss": 0.044, + "epoch": 0.59, + "learning_rate": 0.00021122198054693197, + "loss": 0.046, "step": 91700 }, { - "epoch": 0.99, - "learning_rate": 0.00015120708676747354, - "loss": 0.038, + "epoch": 0.59, + "learning_rate": 0.00021121229919257502, + "loss": 0.0452, "step": 91710 }, { - "epoch": 0.99, - "learning_rate": 0.0001511908624829645, - "loss": 0.0381, + "epoch": 0.59, + "learning_rate": 0.0002112026178382181, + "loss": 0.0485, "step": 91720 }, { - "epoch": 0.99, - "learning_rate": 0.00015117463819845544, - "loss": 0.0435, + "epoch": 0.59, + "learning_rate": 0.00021119293648386118, + "loss": 0.046, "step": 91730 }, { - "epoch": 0.99, - "learning_rate": 0.0001511584139139464, - "loss": 0.0372, + "epoch": 0.59, + "learning_rate": 0.00021118325512950423, + "loss": 0.0452, "step": 91740 }, { - "epoch": 0.99, - "learning_rate": 0.00015114218962943734, - "loss": 0.0465, + "epoch": 0.59, + "learning_rate": 0.0002111735737751473, + "loss": 0.0517, "step": 91750 }, { - "epoch": 0.99, - "learning_rate": 0.0001511259653449283, - "loss": 0.0396, + "epoch": 0.59, + "learning_rate": 0.00021116389242079037, + "loss": 0.0489, "step": 91760 }, { - "epoch": 0.99, - "learning_rate": 0.0001511097410604192, - "loss": 0.0469, + "epoch": 0.59, + "learning_rate": 0.00021115421106643342, + "loss": 0.0497, "step": 91770 }, { - "epoch": 0.99, - "learning_rate": 0.0001510935167759102, - "loss": 0.0466, + "epoch": 0.59, + "learning_rate": 0.0002111445297120765, + "loss": 0.0536, "step": 91780 }, { - "epoch": 0.99, - "learning_rate": 0.0001510772924914011, - "loss": 0.0431, + "epoch": 0.59, + "learning_rate": 0.00021113484835771958, + "loss": 0.0472, "step": 91790 }, { - "epoch": 0.99, - "learning_rate": 0.0001510610682068921, - "loss": 0.0462, + "epoch": 0.59, + "learning_rate": 0.00021112516700336266, + "loss": 0.0498, "step": 91800 }, { - "epoch": 0.99, - "learning_rate": 0.000151044843922383, - "loss": 0.0417, + "epoch": 0.59, + "learning_rate": 0.0002111154856490057, + "loss": 0.0537, "step": 91810 }, { - "epoch": 0.99, - "learning_rate": 0.00015102861963787396, - "loss": 0.0422, + "epoch": 0.59, + "learning_rate": 0.00021110580429464876, + "loss": 0.0404, "step": 91820 }, { - "epoch": 0.99, - "learning_rate": 0.0001510123953533649, - "loss": 0.0434, + "epoch": 0.59, + "learning_rate": 0.00021109612294029184, + "loss": 0.0606, "step": 91830 }, { - "epoch": 0.99, - "learning_rate": 0.00015099617106885586, - "loss": 0.0409, + "epoch": 0.59, + "learning_rate": 0.0002110864415859349, + "loss": 0.0515, "step": 91840 }, { - "epoch": 0.99, - "learning_rate": 0.00015097994678434678, - "loss": 0.039, + "epoch": 0.59, + "learning_rate": 0.00021107676023157798, + "loss": 0.0516, "step": 91850 }, { - "epoch": 0.99, - "learning_rate": 0.00015096372249983776, - "loss": 0.0434, + "epoch": 0.59, + "learning_rate": 0.00021106707887722106, + "loss": 0.0461, "step": 91860 }, { - "epoch": 0.99, - "learning_rate": 0.00015094749821532868, - "loss": 0.0399, + "epoch": 0.59, + "learning_rate": 0.00021105739752286414, + "loss": 0.0633, "step": 91870 }, { - "epoch": 0.99, - "learning_rate": 0.00015093127393081966, - "loss": 0.0422, + "epoch": 0.59, + "learning_rate": 0.0002110477161685072, + "loss": 0.0486, "step": 91880 }, { - "epoch": 0.99, - "learning_rate": 0.00015091504964631058, - "loss": 0.037, + "epoch": 0.59, + "learning_rate": 0.00021103803481415024, + "loss": 0.048, "step": 91890 }, { - "epoch": 0.99, - "learning_rate": 0.00015089882536180153, - "loss": 0.0471, + "epoch": 0.59, + "learning_rate": 0.00021102835345979332, + "loss": 0.0479, "step": 91900 }, { - "epoch": 0.99, - "learning_rate": 0.00015088260107729248, - "loss": 0.0438, + "epoch": 0.59, + "learning_rate": 0.00021101867210543637, + "loss": 0.0496, "step": 91910 }, { - "epoch": 0.99, - "learning_rate": 0.00015086637679278343, - "loss": 0.0448, + "epoch": 0.59, + "learning_rate": 0.00021100899075107945, + "loss": 0.0539, "step": 91920 }, { - "epoch": 0.99, - "learning_rate": 0.00015085015250827438, - "loss": 0.0351, + "epoch": 0.59, + "learning_rate": 0.00021099930939672253, + "loss": 0.049, "step": 91930 }, { - "epoch": 0.99, - "learning_rate": 0.00015083392822376533, - "loss": 0.041, + "epoch": 0.59, + "learning_rate": 0.00021098962804236559, + "loss": 0.0505, "step": 91940 }, { - "epoch": 0.99, - "learning_rate": 0.00015081770393925625, - "loss": 0.041, + "epoch": 0.59, + "learning_rate": 0.00021097994668800867, + "loss": 0.0507, "step": 91950 }, { - "epoch": 0.99, - "learning_rate": 0.00015080147965474723, - "loss": 0.0399, + "epoch": 0.59, + "learning_rate": 0.00021097026533365172, + "loss": 0.0503, "step": 91960 }, { - "epoch": 0.99, - "learning_rate": 0.00015078525537023815, - "loss": 0.036, + "epoch": 0.59, + "learning_rate": 0.00021096058397929477, + "loss": 0.0507, "step": 91970 }, { - "epoch": 0.99, - "learning_rate": 0.00015076903108572913, - "loss": 0.0467, + "epoch": 0.59, + "learning_rate": 0.00021095090262493785, + "loss": 0.0574, "step": 91980 }, { - "epoch": 0.99, - "learning_rate": 0.00015075280680122005, - "loss": 0.0479, + "epoch": 0.59, + "learning_rate": 0.00021094122127058093, + "loss": 0.0533, "step": 91990 }, { - "epoch": 1.0, - "learning_rate": 0.000150736582516711, - "loss": 0.0395, + "epoch": 0.59, + "learning_rate": 0.000210931539916224, + "loss": 0.046, "step": 92000 }, { - "epoch": 1.0, - "eval_cer": 0.921151674821227, - "eval_loss": 0.029919525608420372, - "eval_runtime": 118.8521, - "eval_samples_per_second": 16.828, - "eval_steps_per_second": 4.207, + "epoch": 0.59, + "eval_cer": 0.9200949045305615, + "eval_loss": 0.03254178166389465, + "eval_runtime": 119.8756, + "eval_samples_per_second": 16.684, + "eval_steps_per_second": 4.171, "step": 92000 }, { - "epoch": 1.0, - "learning_rate": 0.00015072035823220195, - "loss": 0.0406, + "epoch": 0.59, + "learning_rate": 0.00021092185856186706, + "loss": 0.0445, "step": 92010 }, { - "epoch": 1.0, - "learning_rate": 0.0001507041339476929, - "loss": 0.0406, + "epoch": 0.59, + "learning_rate": 0.00021091217720751014, + "loss": 0.0458, "step": 92020 }, { - "epoch": 1.0, - "learning_rate": 0.00015068790966318383, - "loss": 0.0381, + "epoch": 0.59, + "learning_rate": 0.0002109024958531532, + "loss": 0.0502, "step": 92030 }, { - "epoch": 1.0, - "learning_rate": 0.0001506716853786748, - "loss": 0.038, + "epoch": 0.59, + "learning_rate": 0.00021089281449879625, + "loss": 0.0528, "step": 92040 }, { - "epoch": 1.0, - "learning_rate": 0.00015065546109416572, - "loss": 0.0378, + "epoch": 0.59, + "learning_rate": 0.00021088313314443933, + "loss": 0.0521, "step": 92050 }, { - "epoch": 1.0, - "learning_rate": 0.0001506392368096567, - "loss": 0.0377, + "epoch": 0.59, + "learning_rate": 0.0002108734517900824, + "loss": 0.0571, "step": 92060 }, { - "epoch": 1.0, - "learning_rate": 0.00015062301252514762, - "loss": 0.0409, + "epoch": 0.59, + "learning_rate": 0.0002108637704357255, + "loss": 0.0488, "step": 92070 }, { - "epoch": 1.0, - "learning_rate": 0.00015060678824063857, - "loss": 0.0451, + "epoch": 0.59, + "learning_rate": 0.00021085408908136854, + "loss": 0.0457, "step": 92080 }, { - "epoch": 1.0, - "learning_rate": 0.00015059056395612952, - "loss": 0.038, + "epoch": 0.59, + "learning_rate": 0.00021084440772701162, + "loss": 0.0514, "step": 92090 }, { - "epoch": 1.0, - "learning_rate": 0.00015057433967162047, - "loss": 0.0411, + "epoch": 0.59, + "learning_rate": 0.00021083472637265467, + "loss": 0.0479, "step": 92100 }, { - "epoch": 1.0, - "learning_rate": 0.00015055811538711142, - "loss": 0.0399, + "epoch": 0.59, + "learning_rate": 0.00021082504501829773, + "loss": 0.0509, "step": 92110 }, { - "epoch": 1.0, - "learning_rate": 0.00015054189110260237, - "loss": 0.0467, + "epoch": 0.59, + "learning_rate": 0.0002108153636639408, + "loss": 0.0438, "step": 92120 }, { - "epoch": 1.0, - "learning_rate": 0.0001505256668180933, - "loss": 0.0451, + "epoch": 0.59, + "learning_rate": 0.00021080568230958389, + "loss": 0.0483, "step": 92130 }, { - "epoch": 1.0, - "learning_rate": 0.00015050944253358427, - "loss": 0.0342, + "epoch": 0.59, + "learning_rate": 0.00021079600095522694, + "loss": 0.0515, "step": 92140 }, { - "epoch": 1.0, - "learning_rate": 0.0001504932182490752, - "loss": 0.0437, + "epoch": 0.59, + "learning_rate": 0.00021078631960087002, + "loss": 0.0504, "step": 92150 }, { - "epoch": 1.0, - "learning_rate": 0.00015047699396456617, - "loss": 0.0427, + "epoch": 0.59, + "learning_rate": 0.0002107766382465131, + "loss": 0.0476, "step": 92160 }, { - "epoch": 1.0, - "learning_rate": 0.0001504607696800571, - "loss": 0.0364, + "epoch": 0.59, + "learning_rate": 0.00021076695689215612, + "loss": 0.0458, "step": 92170 }, { - "epoch": 1.0, - "learning_rate": 0.00015044454539554804, - "loss": 0.0453, + "epoch": 0.59, + "learning_rate": 0.0002107572755377992, + "loss": 0.049, "step": 92180 }, { - "epoch": 1.0, - "learning_rate": 0.000150428321111039, - "loss": 0.0421, + "epoch": 0.6, + "learning_rate": 0.00021074759418344228, + "loss": 0.0449, "step": 92190 }, { - "epoch": 1.0, - "learning_rate": 0.00015041209682652994, - "loss": 0.0417, + "epoch": 0.6, + "learning_rate": 0.00021073791282908536, + "loss": 0.0426, "step": 92200 }, { - "epoch": 1.0, - "learning_rate": 0.00015039587254202087, - "loss": 0.0422, + "epoch": 0.6, + "learning_rate": 0.00021072823147472842, + "loss": 0.0565, "step": 92210 }, { - "epoch": 1.0, - "learning_rate": 0.00015037964825751184, - "loss": 0.04, + "epoch": 0.6, + "learning_rate": 0.0002107185501203715, + "loss": 0.0472, "step": 92220 }, { - "epoch": 1.0, - "learning_rate": 0.00015036342397300277, - "loss": 0.0452, + "epoch": 0.6, + "learning_rate": 0.00021070886876601457, + "loss": 0.0489, "step": 92230 }, { - "epoch": 1.0, - "learning_rate": 0.00015034719968849374, - "loss": 0.0385, + "epoch": 0.6, + "learning_rate": 0.0002106991874116576, + "loss": 0.0495, "step": 92240 }, { - "epoch": 1.0, - "learning_rate": 0.00015033097540398467, - "loss": 0.0459, + "epoch": 0.6, + "learning_rate": 0.00021068950605730068, + "loss": 0.049, "step": 92250 }, { - "epoch": 1.0, - "learning_rate": 0.00015031475111947564, - "loss": 0.0421, + "epoch": 0.6, + "learning_rate": 0.00021067982470294376, + "loss": 0.0475, "step": 92260 }, { - "epoch": 1.0, - "learning_rate": 0.00015029852683496657, - "loss": 0.0383, + "epoch": 0.6, + "learning_rate": 0.00021067014334858684, + "loss": 0.043, "step": 92270 }, { - "epoch": 1.0, - "learning_rate": 0.00015028230255045752, - "loss": 0.0396, + "epoch": 0.6, + "learning_rate": 0.0002106604619942299, + "loss": 0.0543, "step": 92280 }, { - "epoch": 1.0, - "learning_rate": 0.00015026607826594846, - "loss": 0.0372, + "epoch": 0.6, + "learning_rate": 0.00021065078063987297, + "loss": 0.0463, "step": 92290 }, { - "epoch": 1.0, - "learning_rate": 0.00015024985398143941, - "loss": 0.0403, + "epoch": 0.6, + "learning_rate": 0.00021064109928551605, + "loss": 0.0455, "step": 92300 }, { - "epoch": 1.0, - "learning_rate": 0.00015023362969693034, - "loss": 0.0505, + "epoch": 0.6, + "learning_rate": 0.00021063141793115908, + "loss": 0.0449, "step": 92310 }, { - "epoch": 1.0, - "learning_rate": 0.00015021740541242131, - "loss": 0.0388, + "epoch": 0.6, + "learning_rate": 0.00021062173657680216, + "loss": 0.0604, "step": 92320 }, { - "epoch": 1.0, - "learning_rate": 0.00015020118112791224, - "loss": 0.0485, + "epoch": 0.6, + "learning_rate": 0.00021061205522244524, + "loss": 0.0475, "step": 92330 }, { - "epoch": 1.0, - "learning_rate": 0.00015018495684340321, - "loss": 0.0504, + "epoch": 0.6, + "learning_rate": 0.0002106023738680883, + "loss": 0.0466, "step": 92340 }, { - "epoch": 1.0, - "learning_rate": 0.00015016873255889414, - "loss": 0.043, + "epoch": 0.6, + "learning_rate": 0.00021059269251373137, + "loss": 0.0513, "step": 92350 }, { - "epoch": 1.0, - "learning_rate": 0.00015015250827438509, - "loss": 0.047, + "epoch": 0.6, + "learning_rate": 0.00021058301115937445, + "loss": 0.0567, "step": 92360 }, { - "epoch": 1.0, - "learning_rate": 0.00015013628398987604, - "loss": 0.0402, + "epoch": 0.6, + "learning_rate": 0.00021057332980501753, + "loss": 0.0552, "step": 92370 }, { - "epoch": 1.0, - "learning_rate": 0.00015012005970536699, - "loss": 0.0406, + "epoch": 0.6, + "learning_rate": 0.00021056364845066055, + "loss": 0.0534, "step": 92380 }, { - "epoch": 1.0, - "learning_rate": 0.0001501038354208579, - "loss": 0.0348, + "epoch": 0.6, + "learning_rate": 0.00021055396709630363, + "loss": 0.0448, "step": 92390 }, { - "epoch": 1.0, - "learning_rate": 0.00015008761113634889, - "loss": 0.047, + "epoch": 0.6, + "learning_rate": 0.00021054428574194671, + "loss": 0.0477, "step": 92400 }, { - "epoch": 1.0, - "learning_rate": 0.0001500713868518398, - "loss": 0.0407, + "epoch": 0.6, + "learning_rate": 0.00021053460438758977, + "loss": 0.0485, "step": 92410 }, { - "epoch": 1.0, - "learning_rate": 0.00015005516256733078, - "loss": 0.0406, + "epoch": 0.6, + "learning_rate": 0.00021052492303323285, + "loss": 0.0528, "step": 92420 }, { - "epoch": 1.0, - "learning_rate": 0.0001500389382828217, - "loss": 0.0392, + "epoch": 0.6, + "learning_rate": 0.00021051524167887593, + "loss": 0.0484, "step": 92430 }, { - "epoch": 1.0, - "learning_rate": 0.00015002271399831268, - "loss": 0.0443, + "epoch": 0.6, + "learning_rate": 0.000210505560324519, + "loss": 0.049, "step": 92440 }, { - "epoch": 1.0, - "learning_rate": 0.0001500064897138036, - "loss": 0.0405, + "epoch": 0.6, + "learning_rate": 0.00021049587897016203, + "loss": 0.0463, "step": 92450 }, { - "epoch": 1.0, - "learning_rate": 0.00014999026542929456, - "loss": 0.0349, + "epoch": 0.6, + "learning_rate": 0.0002104861976158051, + "loss": 0.0531, "step": 92460 }, { - "epoch": 1.0, - "learning_rate": 0.0001499740411447855, - "loss": 0.0372, + "epoch": 0.6, + "learning_rate": 0.0002104765162614482, + "loss": 0.0471, "step": 92470 }, { - "epoch": 1.0, - "learning_rate": 0.00014995781686027643, - "loss": 0.0385, + "epoch": 0.6, + "learning_rate": 0.00021046683490709124, + "loss": 0.0473, "step": 92480 }, { - "epoch": 1.0, - "learning_rate": 0.00014994159257576738, - "loss": 0.0407, + "epoch": 0.6, + "learning_rate": 0.00021045715355273432, + "loss": 0.0518, "step": 92490 }, { - "epoch": 1.0, - "learning_rate": 0.00014992536829125833, - "loss": 0.0359, + "epoch": 0.6, + "learning_rate": 0.0002104474721983774, + "loss": 0.053, "step": 92500 }, { - "epoch": 1.0, - "learning_rate": 0.00014990914400674928, - "loss": 0.0387, + "epoch": 0.6, + "learning_rate": 0.00021043779084402048, + "loss": 0.0507, "step": 92510 }, { - "epoch": 1.0, - "learning_rate": 0.00014989291972224023, - "loss": 0.0396, + "epoch": 0.6, + "learning_rate": 0.0002104281094896635, + "loss": 0.0484, "step": 92520 }, { - "epoch": 1.0, - "learning_rate": 0.00014987669543773118, - "loss": 0.0364, + "epoch": 0.6, + "learning_rate": 0.0002104184281353066, + "loss": 0.0447, "step": 92530 }, { - "epoch": 1.0, - "learning_rate": 0.00014986047115322213, - "loss": 0.0364, + "epoch": 0.6, + "learning_rate": 0.00021040874678094964, + "loss": 0.0584, "step": 92540 }, { - "epoch": 1.0, - "learning_rate": 0.00014984424686871308, - "loss": 0.03, + "epoch": 0.6, + "learning_rate": 0.00021039906542659272, + "loss": 0.0502, "step": 92550 }, { - "epoch": 1.0, - "learning_rate": 0.00014982802258420403, - "loss": 0.0371, + "epoch": 0.6, + "learning_rate": 0.0002103893840722358, + "loss": 0.0454, "step": 92560 }, { - "epoch": 1.0, - "learning_rate": 0.00014981179829969495, - "loss": 0.0387, + "epoch": 0.6, + "learning_rate": 0.00021037970271787888, + "loss": 0.0462, "step": 92570 }, { - "epoch": 1.0, - "learning_rate": 0.0001497955740151859, - "loss": 0.0382, + "epoch": 0.6, + "learning_rate": 0.00021037002136352193, + "loss": 0.0464, "step": 92580 }, { - "epoch": 1.0, - "learning_rate": 0.00014977934973067685, - "loss": 0.0429, + "epoch": 0.6, + "learning_rate": 0.000210360340009165, + "loss": 0.045, "step": 92590 }, { - "epoch": 1.0, - "learning_rate": 0.0001497631254461678, - "loss": 0.0345, + "epoch": 0.6, + "learning_rate": 0.00021035065865480807, + "loss": 0.0529, "step": 92600 }, { - "epoch": 1.0, - "learning_rate": 0.00014974690116165875, - "loss": 0.0373, + "epoch": 0.6, + "learning_rate": 0.00021034097730045112, + "loss": 0.0531, "step": 92610 }, { - "epoch": 1.0, - "learning_rate": 0.0001497306768771497, - "loss": 0.0391, + "epoch": 0.6, + "learning_rate": 0.0002103312959460942, + "loss": 0.0426, "step": 92620 }, { - "epoch": 1.0, - "learning_rate": 0.00014971445259264065, - "loss": 0.0388, + "epoch": 0.6, + "learning_rate": 0.00021032161459173728, + "loss": 0.0457, "step": 92630 }, { - "epoch": 1.0, - "learning_rate": 0.0001496982283081316, - "loss": 0.0339, + "epoch": 0.6, + "learning_rate": 0.00021031193323738036, + "loss": 0.0523, "step": 92640 }, { - "epoch": 1.0, - "learning_rate": 0.00014968200402362255, - "loss": 0.0383, + "epoch": 0.6, + "learning_rate": 0.0002103022518830234, + "loss": 0.0678, "step": 92650 }, { - "epoch": 1.0, - "learning_rate": 0.00014966577973911347, - "loss": 0.0407, + "epoch": 0.6, + "learning_rate": 0.00021029257052866646, + "loss": 0.0532, "step": 92660 }, { - "epoch": 1.0, - "learning_rate": 0.00014964955545460442, - "loss": 0.0384, + "epoch": 0.6, + "learning_rate": 0.00021028288917430954, + "loss": 0.0492, "step": 92670 }, { - "epoch": 1.0, - "learning_rate": 0.00014963333117009537, - "loss": 0.0363, + "epoch": 0.6, + "learning_rate": 0.0002102732078199526, + "loss": 0.0506, "step": 92680 }, { - "epoch": 1.0, - "learning_rate": 0.00014961710688558635, - "loss": 0.0425, + "epoch": 0.6, + "learning_rate": 0.00021026352646559568, + "loss": 0.0488, "step": 92690 }, { - "epoch": 1.0, - "learning_rate": 0.0001496008826010773, - "loss": 0.0383, + "epoch": 0.6, + "learning_rate": 0.00021025384511123876, + "loss": 0.0459, "step": 92700 }, { - "epoch": 1.0, - "learning_rate": 0.00014958465831656825, - "loss": 0.0354, + "epoch": 0.6, + "learning_rate": 0.00021024416375688184, + "loss": 0.0559, "step": 92710 }, { - "epoch": 1.0, - "learning_rate": 0.00014956843403205917, - "loss": 0.0425, + "epoch": 0.6, + "learning_rate": 0.0002102344824025249, + "loss": 0.0514, "step": 92720 }, { - "epoch": 1.0, - "learning_rate": 0.00014955220974755012, - "loss": 0.0332, + "epoch": 0.6, + "learning_rate": 0.00021022480104816794, + "loss": 0.0515, "step": 92730 }, { - "epoch": 1.0, - "learning_rate": 0.00014953598546304107, - "loss": 0.0333, + "epoch": 0.6, + "learning_rate": 0.000210215119693811, + "loss": 0.0467, "step": 92740 }, { - "epoch": 1.0, - "learning_rate": 0.00014951976117853202, - "loss": 0.0413, + "epoch": 0.6, + "learning_rate": 0.00021020543833945407, + "loss": 0.043, "step": 92750 }, { - "epoch": 1.0, - "learning_rate": 0.00014950353689402297, - "loss": 0.0366, + "epoch": 0.6, + "learning_rate": 0.00021019575698509715, + "loss": 0.0517, "step": 92760 }, { - "epoch": 1.0, - "learning_rate": 0.00014948731260951392, - "loss": 0.0399, + "epoch": 0.6, + "learning_rate": 0.00021018607563074023, + "loss": 0.052, "step": 92770 }, { - "epoch": 1.0, - "learning_rate": 0.00014947108832500487, - "loss": 0.0359, + "epoch": 0.6, + "learning_rate": 0.00021017639427638329, + "loss": 0.0475, "step": 92780 }, { - "epoch": 1.0, - "learning_rate": 0.00014945486404049582, - "loss": 0.0334, + "epoch": 0.6, + "learning_rate": 0.00021016671292202637, + "loss": 0.0493, "step": 92790 }, { - "epoch": 1.0, - "learning_rate": 0.00014943863975598677, - "loss": 0.0329, + "epoch": 0.6, + "learning_rate": 0.00021015703156766942, + "loss": 0.0417, "step": 92800 }, { - "epoch": 1.0, - "learning_rate": 0.0001494224154714777, - "loss": 0.0393, + "epoch": 0.6, + "learning_rate": 0.00021014735021331247, + "loss": 0.046, "step": 92810 }, { - "epoch": 1.0, - "learning_rate": 0.00014940619118696864, - "loss": 0.0377, + "epoch": 0.6, + "learning_rate": 0.00021013766885895555, + "loss": 0.0434, "step": 92820 }, { - "epoch": 1.0, - "learning_rate": 0.0001493899669024596, - "loss": 0.0456, + "epoch": 0.6, + "learning_rate": 0.00021012798750459863, + "loss": 0.045, "step": 92830 }, { - "epoch": 1.0, - "learning_rate": 0.00014937374261795054, - "loss": 0.0388, + "epoch": 0.6, + "learning_rate": 0.0002101183061502417, + "loss": 0.0453, "step": 92840 }, { - "epoch": 1.0, - "learning_rate": 0.0001493575183334415, - "loss": 0.0436, + "epoch": 0.6, + "learning_rate": 0.00021010862479588476, + "loss": 0.0497, "step": 92850 }, { - "epoch": 1.0, - "learning_rate": 0.00014934129404893244, - "loss": 0.0396, + "epoch": 0.6, + "learning_rate": 0.00021009894344152784, + "loss": 0.0501, "step": 92860 }, { - "epoch": 1.0, - "learning_rate": 0.0001493250697644234, - "loss": 0.0381, + "epoch": 0.6, + "learning_rate": 0.0002100892620871709, + "loss": 0.0499, "step": 92870 }, { - "epoch": 1.0, - "learning_rate": 0.00014930884547991434, - "loss": 0.0426, + "epoch": 0.6, + "learning_rate": 0.00021007958073281395, + "loss": 0.0563, "step": 92880 }, { - "epoch": 1.0, - "learning_rate": 0.0001492926211954053, - "loss": 0.0452, + "epoch": 0.6, + "learning_rate": 0.00021006989937845703, + "loss": 0.0472, "step": 92890 }, { - "epoch": 1.0, - "learning_rate": 0.0001492763969108962, - "loss": 0.0421, + "epoch": 0.6, + "learning_rate": 0.0002100602180241001, + "loss": 0.0569, "step": 92900 }, { - "epoch": 1.0, - "learning_rate": 0.00014926017262638716, - "loss": 0.0396, + "epoch": 0.6, + "learning_rate": 0.0002100505366697432, + "loss": 0.0529, "step": 92910 }, { - "epoch": 1.01, - "learning_rate": 0.0001492439483418781, - "loss": 0.0334, + "epoch": 0.6, + "learning_rate": 0.00021004085531538624, + "loss": 0.0555, "step": 92920 }, { - "epoch": 1.01, - "learning_rate": 0.00014922772405736906, - "loss": 0.0373, + "epoch": 0.6, + "learning_rate": 0.00021003117396102932, + "loss": 0.0436, "step": 92930 }, { - "epoch": 1.01, - "learning_rate": 0.00014921149977286, - "loss": 0.0395, + "epoch": 0.6, + "learning_rate": 0.00021002149260667237, + "loss": 0.0453, "step": 92940 }, { - "epoch": 1.01, - "learning_rate": 0.00014919527548835096, - "loss": 0.0402, + "epoch": 0.6, + "learning_rate": 0.00021001181125231543, + "loss": 0.0428, "step": 92950 }, { - "epoch": 1.01, - "learning_rate": 0.0001491790512038419, - "loss": 0.0405, + "epoch": 0.6, + "learning_rate": 0.0002100021298979585, + "loss": 0.0493, "step": 92960 }, { - "epoch": 1.01, - "learning_rate": 0.00014916282691933286, - "loss": 0.0368, + "epoch": 0.6, + "learning_rate": 0.00020999244854360158, + "loss": 0.0481, "step": 92970 }, { - "epoch": 1.01, - "learning_rate": 0.0001491466026348238, - "loss": 0.0379, + "epoch": 0.6, + "learning_rate": 0.00020998276718924464, + "loss": 0.0458, "step": 92980 }, { - "epoch": 1.01, - "learning_rate": 0.00014913037835031473, - "loss": 0.0344, + "epoch": 0.6, + "learning_rate": 0.00020997308583488772, + "loss": 0.0525, "step": 92990 }, { - "epoch": 1.01, - "learning_rate": 0.00014911415406580568, - "loss": 0.0387, + "epoch": 0.6, + "learning_rate": 0.00020996340448053077, + "loss": 0.0545, "step": 93000 }, { - "epoch": 1.01, - "eval_cer": 0.9212311884100993, - "eval_loss": 0.029003417119383812, - "eval_runtime": 119.5319, - "eval_samples_per_second": 16.732, - "eval_steps_per_second": 4.183, + "epoch": 0.6, + "eval_cer": 0.9199846345045758, + "eval_loss": 0.032582107931375504, + "eval_runtime": 120.1286, + "eval_samples_per_second": 16.649, + "eval_steps_per_second": 4.162, "step": 93000 }, { - "epoch": 1.01, - "learning_rate": 0.00014909792978129663, - "loss": 0.0347, + "epoch": 0.6, + "learning_rate": 0.00020995372312617382, + "loss": 0.0485, "step": 93010 }, { - "epoch": 1.01, - "learning_rate": 0.00014908170549678758, - "loss": 0.0397, + "epoch": 0.6, + "learning_rate": 0.0002099440417718169, + "loss": 0.0466, "step": 93020 }, { - "epoch": 1.01, - "learning_rate": 0.00014906548121227853, - "loss": 0.0401, + "epoch": 0.6, + "learning_rate": 0.00020993436041745998, + "loss": 0.0516, "step": 93030 }, { - "epoch": 1.01, - "learning_rate": 0.00014904925692776948, - "loss": 0.0373, + "epoch": 0.6, + "learning_rate": 0.00020992467906310306, + "loss": 0.0437, "step": 93040 }, { - "epoch": 1.01, - "learning_rate": 0.00014903303264326043, - "loss": 0.036, + "epoch": 0.6, + "learning_rate": 0.00020991499770874611, + "loss": 0.0578, "step": 93050 }, { - "epoch": 1.01, - "learning_rate": 0.00014901680835875138, - "loss": 0.0376, + "epoch": 0.6, + "learning_rate": 0.0002099053163543892, + "loss": 0.0552, "step": 93060 }, { - "epoch": 1.01, - "learning_rate": 0.00014900058407424233, - "loss": 0.0355, + "epoch": 0.6, + "learning_rate": 0.00020989563500003225, + "loss": 0.0467, "step": 93070 }, { - "epoch": 1.01, - "learning_rate": 0.00014898435978973325, - "loss": 0.0381, + "epoch": 0.6, + "learning_rate": 0.0002098859536456753, + "loss": 0.0512, "step": 93080 }, { - "epoch": 1.01, - "learning_rate": 0.0001489681355052242, - "loss": 0.0364, + "epoch": 0.6, + "learning_rate": 0.00020987627229131838, + "loss": 0.0482, "step": 93090 }, { - "epoch": 1.01, - "learning_rate": 0.00014895191122071515, - "loss": 0.0376, + "epoch": 0.6, + "learning_rate": 0.00020986659093696146, + "loss": 0.0494, "step": 93100 }, { - "epoch": 1.01, - "learning_rate": 0.0001489356869362061, - "loss": 0.0342, + "epoch": 0.6, + "learning_rate": 0.00020985690958260454, + "loss": 0.0499, "step": 93110 }, { - "epoch": 1.01, - "learning_rate": 0.00014891946265169705, - "loss": 0.0351, + "epoch": 0.6, + "learning_rate": 0.0002098472282282476, + "loss": 0.0539, "step": 93120 }, { - "epoch": 1.01, - "learning_rate": 0.000148903238367188, - "loss": 0.0425, + "epoch": 0.6, + "learning_rate": 0.00020983754687389067, + "loss": 0.0462, "step": 93130 }, { - "epoch": 1.01, - "learning_rate": 0.00014888701408267895, - "loss": 0.0373, + "epoch": 0.6, + "learning_rate": 0.00020982786551953372, + "loss": 0.0451, "step": 93140 }, { - "epoch": 1.01, - "learning_rate": 0.0001488707897981699, - "loss": 0.0395, + "epoch": 0.6, + "learning_rate": 0.00020981818416517678, + "loss": 0.0465, "step": 93150 }, { - "epoch": 1.01, - "learning_rate": 0.00014885456551366085, - "loss": 0.0357, + "epoch": 0.6, + "learning_rate": 0.00020980850281081986, + "loss": 0.0497, "step": 93160 }, { - "epoch": 1.01, - "learning_rate": 0.00014883834122915177, - "loss": 0.0404, + "epoch": 0.6, + "learning_rate": 0.00020979882145646294, + "loss": 0.0473, "step": 93170 }, { - "epoch": 1.01, - "learning_rate": 0.00014882211694464272, - "loss": 0.0382, + "epoch": 0.6, + "learning_rate": 0.000209789140102106, + "loss": 0.0426, "step": 93180 }, { - "epoch": 1.01, - "learning_rate": 0.00014880589266013367, - "loss": 0.0442, + "epoch": 0.6, + "learning_rate": 0.00020977945874774907, + "loss": 0.0486, "step": 93190 }, { - "epoch": 1.01, - "learning_rate": 0.00014878966837562462, - "loss": 0.032, + "epoch": 0.6, + "learning_rate": 0.00020976977739339215, + "loss": 0.0478, "step": 93200 }, { - "epoch": 1.01, - "learning_rate": 0.00014877344409111557, - "loss": 0.0403, + "epoch": 0.6, + "learning_rate": 0.00020976009603903517, + "loss": 0.0504, "step": 93210 }, { - "epoch": 1.01, - "learning_rate": 0.00014875721980660652, - "loss": 0.0399, + "epoch": 0.6, + "learning_rate": 0.00020975041468467825, + "loss": 0.0478, "step": 93220 }, { - "epoch": 1.01, - "learning_rate": 0.00014874099552209747, - "loss": 0.031, + "epoch": 0.6, + "learning_rate": 0.00020974073333032133, + "loss": 0.0476, "step": 93230 }, { - "epoch": 1.01, - "learning_rate": 0.00014872477123758842, - "loss": 0.0404, + "epoch": 0.6, + "learning_rate": 0.00020973105197596441, + "loss": 0.0446, "step": 93240 }, { - "epoch": 1.01, - "learning_rate": 0.00014870854695307937, - "loss": 0.0366, + "epoch": 0.6, + "learning_rate": 0.00020972137062160747, + "loss": 0.0489, "step": 93250 }, { - "epoch": 1.01, - "learning_rate": 0.0001486923226685703, - "loss": 0.0371, + "epoch": 0.6, + "learning_rate": 0.00020971168926725055, + "loss": 0.0434, "step": 93260 }, { - "epoch": 1.01, - "learning_rate": 0.00014867609838406124, - "loss": 0.0451, + "epoch": 0.6, + "learning_rate": 0.00020970200791289363, + "loss": 0.0527, "step": 93270 }, { - "epoch": 1.01, - "learning_rate": 0.0001486598740995522, - "loss": 0.0381, + "epoch": 0.6, + "learning_rate": 0.00020969232655853665, + "loss": 0.0471, "step": 93280 }, { - "epoch": 1.01, - "learning_rate": 0.00014864364981504314, - "loss": 0.0393, + "epoch": 0.6, + "learning_rate": 0.00020968264520417973, + "loss": 0.0532, "step": 93290 }, { - "epoch": 1.01, - "learning_rate": 0.0001486274255305341, - "loss": 0.0392, + "epoch": 0.6, + "learning_rate": 0.0002096729638498228, + "loss": 0.0472, "step": 93300 }, { - "epoch": 1.01, - "learning_rate": 0.00014861120124602504, - "loss": 0.0393, + "epoch": 0.6, + "learning_rate": 0.0002096632824954659, + "loss": 0.0506, "step": 93310 }, { - "epoch": 1.01, - "learning_rate": 0.000148594976961516, - "loss": 0.041, + "epoch": 0.6, + "learning_rate": 0.00020965360114110894, + "loss": 0.0429, "step": 93320 }, { - "epoch": 1.01, - "learning_rate": 0.00014857875267700694, - "loss": 0.0435, + "epoch": 0.6, + "learning_rate": 0.00020964391978675202, + "loss": 0.0497, "step": 93330 }, { - "epoch": 1.01, - "learning_rate": 0.0001485625283924979, - "loss": 0.0405, + "epoch": 0.6, + "learning_rate": 0.0002096342384323951, + "loss": 0.0468, "step": 93340 }, { - "epoch": 1.01, - "learning_rate": 0.00014854630410798882, - "loss": 0.0362, + "epoch": 0.6, + "learning_rate": 0.00020962455707803813, + "loss": 0.0456, "step": 93350 }, { - "epoch": 1.01, - "learning_rate": 0.00014853007982347977, - "loss": 0.0332, + "epoch": 0.6, + "learning_rate": 0.0002096148757236812, + "loss": 0.0515, "step": 93360 }, { - "epoch": 1.01, - "learning_rate": 0.00014851385553897071, - "loss": 0.0459, + "epoch": 0.6, + "learning_rate": 0.0002096051943693243, + "loss": 0.0552, "step": 93370 }, { - "epoch": 1.01, - "learning_rate": 0.00014849763125446166, - "loss": 0.0357, + "epoch": 0.6, + "learning_rate": 0.00020959551301496734, + "loss": 0.0444, "step": 93380 }, { - "epoch": 1.01, - "learning_rate": 0.00014848140696995261, - "loss": 0.0376, + "epoch": 0.6, + "learning_rate": 0.00020958583166061042, + "loss": 0.0413, "step": 93390 }, { - "epoch": 1.01, - "learning_rate": 0.00014846518268544356, - "loss": 0.0438, + "epoch": 0.6, + "learning_rate": 0.0002095761503062535, + "loss": 0.0435, "step": 93400 }, { - "epoch": 1.01, - "learning_rate": 0.00014844895840093451, - "loss": 0.0393, + "epoch": 0.6, + "learning_rate": 0.00020956646895189658, + "loss": 0.0472, "step": 93410 }, { - "epoch": 1.01, - "learning_rate": 0.00014843273411642546, - "loss": 0.0405, + "epoch": 0.6, + "learning_rate": 0.0002095567875975396, + "loss": 0.0498, "step": 93420 }, { - "epoch": 1.01, - "learning_rate": 0.0001484165098319164, - "loss": 0.0343, + "epoch": 0.6, + "learning_rate": 0.00020954710624318269, + "loss": 0.044, "step": 93430 }, { - "epoch": 1.01, - "learning_rate": 0.00014840028554740734, - "loss": 0.0409, + "epoch": 0.6, + "learning_rate": 0.00020953742488882577, + "loss": 0.0432, "step": 93440 }, { - "epoch": 1.01, - "learning_rate": 0.00014838406126289829, - "loss": 0.0376, + "epoch": 0.6, + "learning_rate": 0.00020952774353446882, + "loss": 0.05, "step": 93450 }, { - "epoch": 1.01, - "learning_rate": 0.00014836783697838924, - "loss": 0.0417, + "epoch": 0.6, + "learning_rate": 0.0002095180621801119, + "loss": 0.0461, "step": 93460 }, { - "epoch": 1.01, - "learning_rate": 0.00014835161269388019, - "loss": 0.0389, + "epoch": 0.6, + "learning_rate": 0.00020950838082575498, + "loss": 0.0469, "step": 93470 }, { - "epoch": 1.01, - "learning_rate": 0.00014833538840937114, - "loss": 0.0393, + "epoch": 0.6, + "learning_rate": 0.00020949869947139806, + "loss": 0.0506, "step": 93480 }, { - "epoch": 1.01, - "learning_rate": 0.00014831916412486208, - "loss": 0.0396, + "epoch": 0.6, + "learning_rate": 0.00020948901811704108, + "loss": 0.0404, "step": 93490 }, { - "epoch": 1.01, - "learning_rate": 0.00014830293984035303, - "loss": 0.0412, + "epoch": 0.6, + "learning_rate": 0.00020947933676268416, + "loss": 0.0529, "step": 93500 }, { - "epoch": 1.01, - "learning_rate": 0.00014828671555584398, - "loss": 0.0356, + "epoch": 0.6, + "learning_rate": 0.00020946965540832724, + "loss": 0.0501, "step": 93510 }, { - "epoch": 1.01, - "learning_rate": 0.00014827049127133493, - "loss": 0.0369, + "epoch": 0.6, + "learning_rate": 0.0002094599740539703, + "loss": 0.0453, "step": 93520 }, { - "epoch": 1.01, - "learning_rate": 0.00014825426698682586, - "loss": 0.0355, + "epoch": 0.6, + "learning_rate": 0.00020945029269961338, + "loss": 0.0504, "step": 93530 }, { - "epoch": 1.01, - "learning_rate": 0.0001482380427023168, - "loss": 0.0322, + "epoch": 0.6, + "learning_rate": 0.00020944061134525646, + "loss": 0.0497, "step": 93540 }, { - "epoch": 1.01, - "learning_rate": 0.00014822181841780776, - "loss": 0.041, + "epoch": 0.6, + "learning_rate": 0.0002094309299908995, + "loss": 0.0523, "step": 93550 }, { - "epoch": 1.01, - "learning_rate": 0.0001482055941332987, - "loss": 0.0381, + "epoch": 0.6, + "learning_rate": 0.00020942124863654256, + "loss": 0.0538, "step": 93560 }, { - "epoch": 1.01, - "learning_rate": 0.00014818936984878966, - "loss": 0.0321, + "epoch": 0.6, + "learning_rate": 0.00020941156728218564, + "loss": 0.0496, "step": 93570 }, { - "epoch": 1.01, - "learning_rate": 0.0001481731455642806, - "loss": 0.0381, + "epoch": 0.6, + "learning_rate": 0.0002094018859278287, + "loss": 0.045, "step": 93580 }, { - "epoch": 1.01, - "learning_rate": 0.00014815692127977156, - "loss": 0.0366, + "epoch": 0.6, + "learning_rate": 0.00020939220457347177, + "loss": 0.0509, "step": 93590 }, { - "epoch": 1.01, - "learning_rate": 0.0001481406969952625, - "loss": 0.036, + "epoch": 0.6, + "learning_rate": 0.00020938252321911485, + "loss": 0.0492, "step": 93600 }, { - "epoch": 1.01, - "learning_rate": 0.00014812447271075346, - "loss": 0.0322, + "epoch": 0.6, + "learning_rate": 0.00020937284186475793, + "loss": 0.0528, "step": 93610 }, { - "epoch": 1.01, - "learning_rate": 0.0001481082484262444, - "loss": 0.0387, + "epoch": 0.6, + "learning_rate": 0.00020936316051040099, + "loss": 0.0524, "step": 93620 }, { - "epoch": 1.01, - "learning_rate": 0.00014809202414173533, - "loss": 0.0351, + "epoch": 0.6, + "learning_rate": 0.00020935347915604404, + "loss": 0.0452, "step": 93630 }, { - "epoch": 1.01, - "learning_rate": 0.00014807579985722628, - "loss": 0.0384, + "epoch": 0.6, + "learning_rate": 0.00020934379780168712, + "loss": 0.0497, "step": 93640 }, { - "epoch": 1.01, - "learning_rate": 0.00014805957557271723, - "loss": 0.0363, + "epoch": 0.6, + "learning_rate": 0.00020933411644733017, + "loss": 0.0479, "step": 93650 }, { - "epoch": 1.01, - "learning_rate": 0.00014804335128820818, - "loss": 0.0335, + "epoch": 0.6, + "learning_rate": 0.00020932443509297325, + "loss": 0.0486, "step": 93660 }, { - "epoch": 1.01, - "learning_rate": 0.00014802712700369913, - "loss": 0.0386, + "epoch": 0.6, + "learning_rate": 0.00020931475373861633, + "loss": 0.0582, "step": 93670 }, { - "epoch": 1.01, - "learning_rate": 0.00014801090271919008, - "loss": 0.0341, + "epoch": 0.6, + "learning_rate": 0.0002093050723842594, + "loss": 0.0484, "step": 93680 }, { - "epoch": 1.01, - "learning_rate": 0.00014799467843468103, - "loss": 0.0331, + "epoch": 0.6, + "learning_rate": 0.00020929539102990246, + "loss": 0.0523, "step": 93690 }, { - "epoch": 1.01, - "learning_rate": 0.00014797845415017198, - "loss": 0.0371, + "epoch": 0.6, + "learning_rate": 0.00020928570967554552, + "loss": 0.0514, "step": 93700 }, { - "epoch": 1.01, - "learning_rate": 0.00014796222986566293, - "loss": 0.041, + "epoch": 0.6, + "learning_rate": 0.0002092760283211886, + "loss": 0.0475, "step": 93710 }, { - "epoch": 1.01, - "learning_rate": 0.00014794600558115385, - "loss": 0.0354, + "epoch": 0.6, + "learning_rate": 0.00020926634696683165, + "loss": 0.0447, "step": 93720 }, { - "epoch": 1.01, - "learning_rate": 0.0001479297812966448, - "loss": 0.0305, + "epoch": 0.6, + "learning_rate": 0.00020925666561247473, + "loss": 0.0442, "step": 93730 }, { - "epoch": 1.01, - "learning_rate": 0.00014791355701213575, - "loss": 0.0381, + "epoch": 0.61, + "learning_rate": 0.0002092469842581178, + "loss": 0.0457, "step": 93740 }, { - "epoch": 1.01, - "learning_rate": 0.0001478973327276267, - "loss": 0.0319, + "epoch": 0.61, + "learning_rate": 0.00020923730290376086, + "loss": 0.0476, "step": 93750 }, { - "epoch": 1.01, - "learning_rate": 0.00014788110844311765, - "loss": 0.0352, + "epoch": 0.61, + "learning_rate": 0.00020922762154940394, + "loss": 0.0557, "step": 93760 }, { - "epoch": 1.01, - "learning_rate": 0.0001478648841586086, - "loss": 0.0402, + "epoch": 0.61, + "learning_rate": 0.000209217940195047, + "loss": 0.0442, "step": 93770 }, { - "epoch": 1.01, - "learning_rate": 0.00014784865987409955, - "loss": 0.0404, + "epoch": 0.61, + "learning_rate": 0.00020920825884069005, + "loss": 0.0426, "step": 93780 }, { - "epoch": 1.01, - "learning_rate": 0.0001478324355895905, - "loss": 0.0349, + "epoch": 0.61, + "learning_rate": 0.00020919857748633312, + "loss": 0.0437, "step": 93790 }, { - "epoch": 1.01, - "learning_rate": 0.00014781621130508145, - "loss": 0.0361, + "epoch": 0.61, + "learning_rate": 0.0002091888961319762, + "loss": 0.0464, "step": 93800 }, { - "epoch": 1.01, - "learning_rate": 0.00014779998702057237, - "loss": 0.0352, + "epoch": 0.61, + "learning_rate": 0.00020917921477761928, + "loss": 0.0566, "step": 93810 }, { - "epoch": 1.01, - "learning_rate": 0.00014778376273606332, - "loss": 0.0342, + "epoch": 0.61, + "learning_rate": 0.00020916953342326234, + "loss": 0.0411, "step": 93820 }, { - "epoch": 1.01, - "learning_rate": 0.00014776753845155427, - "loss": 0.0379, + "epoch": 0.61, + "learning_rate": 0.00020915985206890542, + "loss": 0.0572, "step": 93830 }, { - "epoch": 1.01, - "learning_rate": 0.00014775131416704522, - "loss": 0.0365, + "epoch": 0.61, + "learning_rate": 0.00020915017071454847, + "loss": 0.0462, "step": 93840 }, { - "epoch": 1.02, - "learning_rate": 0.00014773508988253617, - "loss": 0.0392, + "epoch": 0.61, + "learning_rate": 0.00020914048936019152, + "loss": 0.0505, "step": 93850 }, { - "epoch": 1.02, - "learning_rate": 0.00014771886559802712, - "loss": 0.0376, + "epoch": 0.61, + "learning_rate": 0.0002091308080058346, + "loss": 0.0532, "step": 93860 }, { - "epoch": 1.02, - "learning_rate": 0.00014770264131351807, - "loss": 0.0336, + "epoch": 0.61, + "learning_rate": 0.00020912112665147768, + "loss": 0.0642, "step": 93870 }, { - "epoch": 1.02, - "learning_rate": 0.00014768641702900902, - "loss": 0.037, + "epoch": 0.61, + "learning_rate": 0.00020911144529712076, + "loss": 0.0502, "step": 93880 }, { - "epoch": 1.02, - "learning_rate": 0.00014767019274449997, - "loss": 0.0381, + "epoch": 0.61, + "learning_rate": 0.00020910176394276381, + "loss": 0.0464, "step": 93890 }, { - "epoch": 1.02, - "learning_rate": 0.0001476539684599909, - "loss": 0.0378, + "epoch": 0.61, + "learning_rate": 0.0002090920825884069, + "loss": 0.0494, "step": 93900 }, { - "epoch": 1.02, - "learning_rate": 0.00014763774417548184, - "loss": 0.0431, + "epoch": 0.61, + "learning_rate": 0.00020908240123404995, + "loss": 0.053, "step": 93910 }, { - "epoch": 1.02, - "learning_rate": 0.0001476215198909728, - "loss": 0.036, + "epoch": 0.61, + "learning_rate": 0.000209072719879693, + "loss": 0.0442, "step": 93920 }, { - "epoch": 1.02, - "learning_rate": 0.00014760529560646374, - "loss": 0.0316, + "epoch": 0.61, + "learning_rate": 0.00020906303852533608, + "loss": 0.0465, "step": 93930 }, { - "epoch": 1.02, - "learning_rate": 0.0001475890713219547, - "loss": 0.0349, + "epoch": 0.61, + "learning_rate": 0.00020905335717097916, + "loss": 0.0621, "step": 93940 }, { - "epoch": 1.02, - "learning_rate": 0.00014757284703744564, - "loss": 0.0369, + "epoch": 0.61, + "learning_rate": 0.0002090436758166222, + "loss": 0.0483, "step": 93950 }, { - "epoch": 1.02, - "learning_rate": 0.0001475566227529366, - "loss": 0.0366, + "epoch": 0.61, + "learning_rate": 0.0002090339944622653, + "loss": 0.0527, "step": 93960 }, { - "epoch": 1.02, - "learning_rate": 0.00014754039846842754, - "loss": 0.039, + "epoch": 0.61, + "learning_rate": 0.00020902431310790837, + "loss": 0.0465, "step": 93970 }, { - "epoch": 1.02, - "learning_rate": 0.0001475241741839185, - "loss": 0.0353, + "epoch": 0.61, + "learning_rate": 0.0002090146317535514, + "loss": 0.0564, "step": 93980 }, { - "epoch": 1.02, - "learning_rate": 0.0001475079498994094, - "loss": 0.0307, + "epoch": 0.61, + "learning_rate": 0.00020900495039919448, + "loss": 0.0523, "step": 93990 }, { - "epoch": 1.02, - "learning_rate": 0.00014749172561490036, - "loss": 0.0356, + "epoch": 0.61, + "learning_rate": 0.00020899526904483756, + "loss": 0.0473, "step": 94000 }, { - "epoch": 1.02, - "eval_cer": 0.9211940820686255, - "eval_loss": 0.028705304488539696, - "eval_runtime": 119.4713, - "eval_samples_per_second": 16.74, - "eval_steps_per_second": 4.185, + "epoch": 0.61, + "eval_cer": 0.920060558129025, + "eval_loss": 0.03265640139579773, + "eval_runtime": 119.8353, + "eval_samples_per_second": 16.69, + "eval_steps_per_second": 4.172, "step": 94000 }, { - "epoch": 1.02, - "learning_rate": 0.0001474755013303913, - "loss": 0.0327, + "epoch": 0.61, + "learning_rate": 0.00020898558769048064, + "loss": 0.052, "step": 94010 }, { - "epoch": 1.02, - "learning_rate": 0.00014745927704588226, - "loss": 0.0376, + "epoch": 0.61, + "learning_rate": 0.0002089759063361237, + "loss": 0.0431, "step": 94020 }, { - "epoch": 1.02, - "learning_rate": 0.0001474430527613732, - "loss": 0.0333, + "epoch": 0.61, + "learning_rate": 0.00020896622498176677, + "loss": 0.0509, "step": 94030 }, { - "epoch": 1.02, - "learning_rate": 0.00014742682847686416, - "loss": 0.0332, + "epoch": 0.61, + "learning_rate": 0.00020895654362740985, + "loss": 0.05, "step": 94040 }, { - "epoch": 1.02, - "learning_rate": 0.0001474106041923551, - "loss": 0.04, + "epoch": 0.61, + "learning_rate": 0.00020894686227305287, + "loss": 0.0506, "step": 94050 }, { - "epoch": 1.02, - "learning_rate": 0.00014739437990784606, - "loss": 0.0349, + "epoch": 0.61, + "learning_rate": 0.00020893718091869595, + "loss": 0.0515, "step": 94060 }, { - "epoch": 1.02, - "learning_rate": 0.000147378155623337, - "loss": 0.0331, + "epoch": 0.61, + "learning_rate": 0.00020892749956433903, + "loss": 0.05, "step": 94070 }, { - "epoch": 1.02, - "learning_rate": 0.00014736193133882793, - "loss": 0.0378, + "epoch": 0.61, + "learning_rate": 0.00020891781820998211, + "loss": 0.0521, "step": 94080 }, { - "epoch": 1.02, - "learning_rate": 0.00014734570705431888, - "loss": 0.0404, + "epoch": 0.61, + "learning_rate": 0.00020890813685562517, + "loss": 0.0495, "step": 94090 }, { - "epoch": 1.02, - "learning_rate": 0.00014732948276980983, - "loss": 0.0361, + "epoch": 0.61, + "learning_rate": 0.00020889845550126825, + "loss": 0.0478, "step": 94100 }, { - "epoch": 1.02, - "learning_rate": 0.00014731325848530078, - "loss": 0.0406, + "epoch": 0.61, + "learning_rate": 0.00020888877414691133, + "loss": 0.0556, "step": 94110 }, { - "epoch": 1.02, - "learning_rate": 0.00014729703420079173, - "loss": 0.0385, + "epoch": 0.61, + "learning_rate": 0.00020887909279255435, + "loss": 0.0469, "step": 94120 }, { - "epoch": 1.02, - "learning_rate": 0.00014728080991628268, - "loss": 0.0338, + "epoch": 0.61, + "learning_rate": 0.00020886941143819743, + "loss": 0.0485, "step": 94130 }, { - "epoch": 1.02, - "learning_rate": 0.00014726458563177363, - "loss": 0.0386, + "epoch": 0.61, + "learning_rate": 0.0002088597300838405, + "loss": 0.0493, "step": 94140 }, { - "epoch": 1.02, - "learning_rate": 0.00014724836134726458, - "loss": 0.0337, + "epoch": 0.61, + "learning_rate": 0.00020885004872948356, + "loss": 0.0518, "step": 94150 }, { - "epoch": 1.02, - "learning_rate": 0.00014723213706275553, - "loss": 0.0371, + "epoch": 0.61, + "learning_rate": 0.00020884036737512664, + "loss": 0.0532, "step": 94160 }, { - "epoch": 1.02, - "learning_rate": 0.00014721591277824645, - "loss": 0.0372, + "epoch": 0.61, + "learning_rate": 0.00020883068602076972, + "loss": 0.0538, "step": 94170 }, { - "epoch": 1.02, - "learning_rate": 0.0001471996884937374, - "loss": 0.0354, + "epoch": 0.61, + "learning_rate": 0.0002088210046664128, + "loss": 0.0549, "step": 94180 }, { - "epoch": 1.02, - "learning_rate": 0.00014718346420922835, - "loss": 0.0362, + "epoch": 0.61, + "learning_rate": 0.00020881132331205583, + "loss": 0.0483, "step": 94190 }, { - "epoch": 1.02, - "learning_rate": 0.0001471672399247193, - "loss": 0.0401, + "epoch": 0.61, + "learning_rate": 0.0002088016419576989, + "loss": 0.0467, "step": 94200 }, { - "epoch": 1.02, - "learning_rate": 0.00014715101564021025, - "loss": 0.0403, + "epoch": 0.61, + "learning_rate": 0.000208791960603342, + "loss": 0.0541, "step": 94210 }, { - "epoch": 1.02, - "learning_rate": 0.0001471347913557012, - "loss": 0.0413, + "epoch": 0.61, + "learning_rate": 0.00020878227924898504, + "loss": 0.0426, "step": 94220 }, { - "epoch": 1.02, - "learning_rate": 0.00014711856707119215, - "loss": 0.0422, + "epoch": 0.61, + "learning_rate": 0.00020877259789462812, + "loss": 0.0496, "step": 94230 }, { - "epoch": 1.02, - "learning_rate": 0.0001471023427866831, - "loss": 0.0527, + "epoch": 0.61, + "learning_rate": 0.0002087629165402712, + "loss": 0.0547, "step": 94240 }, { - "epoch": 1.02, - "learning_rate": 0.00014708611850217405, - "loss": 0.049, + "epoch": 0.61, + "learning_rate": 0.00020875323518591428, + "loss": 0.048, "step": 94250 }, { - "epoch": 1.02, - "learning_rate": 0.00014706989421766497, - "loss": 0.0366, + "epoch": 0.61, + "learning_rate": 0.0002087435538315573, + "loss": 0.0454, "step": 94260 }, { - "epoch": 1.02, - "learning_rate": 0.00014705366993315592, - "loss": 0.037, + "epoch": 0.61, + "learning_rate": 0.00020873387247720039, + "loss": 0.0496, "step": 94270 }, { - "epoch": 1.02, - "learning_rate": 0.00014703744564864687, - "loss": 0.0428, + "epoch": 0.61, + "learning_rate": 0.00020872419112284347, + "loss": 0.0596, "step": 94280 }, { - "epoch": 1.02, - "learning_rate": 0.00014702122136413782, - "loss": 0.0396, + "epoch": 0.61, + "learning_rate": 0.00020871450976848652, + "loss": 0.0453, "step": 94290 }, { - "epoch": 1.02, - "learning_rate": 0.00014700499707962877, - "loss": 0.0366, + "epoch": 0.61, + "learning_rate": 0.0002087048284141296, + "loss": 0.0519, "step": 94300 }, { - "epoch": 1.02, - "learning_rate": 0.00014698877279511972, - "loss": 0.0397, + "epoch": 0.61, + "learning_rate": 0.00020869514705977268, + "loss": 0.0484, "step": 94310 }, { - "epoch": 1.02, - "learning_rate": 0.00014697254851061067, - "loss": 0.0441, + "epoch": 0.61, + "learning_rate": 0.00020868546570541576, + "loss": 0.0497, "step": 94320 }, { - "epoch": 1.02, - "learning_rate": 0.00014695632422610162, - "loss": 0.0364, + "epoch": 0.61, + "learning_rate": 0.00020867578435105878, + "loss": 0.0439, "step": 94330 }, { - "epoch": 1.02, - "learning_rate": 0.00014694009994159257, - "loss": 0.0353, + "epoch": 0.61, + "learning_rate": 0.00020866610299670186, + "loss": 0.0548, "step": 94340 }, { - "epoch": 1.02, - "learning_rate": 0.0001469238756570835, - "loss": 0.038, + "epoch": 0.61, + "learning_rate": 0.00020865642164234492, + "loss": 0.0517, "step": 94350 }, { - "epoch": 1.02, - "learning_rate": 0.00014690765137257444, - "loss": 0.0329, + "epoch": 0.61, + "learning_rate": 0.000208646740287988, + "loss": 0.0487, "step": 94360 }, { - "epoch": 1.02, - "learning_rate": 0.0001468914270880654, - "loss": 0.0345, + "epoch": 0.61, + "learning_rate": 0.00020863705893363108, + "loss": 0.0433, "step": 94370 }, { - "epoch": 1.02, - "learning_rate": 0.00014687520280355634, - "loss": 0.0396, + "epoch": 0.61, + "learning_rate": 0.00020862737757927416, + "loss": 0.0566, "step": 94380 }, { - "epoch": 1.02, - "learning_rate": 0.0001468589785190473, - "loss": 0.0382, + "epoch": 0.61, + "learning_rate": 0.0002086176962249172, + "loss": 0.0479, "step": 94390 }, { - "epoch": 1.02, - "learning_rate": 0.00014684275423453824, - "loss": 0.0385, + "epoch": 0.61, + "learning_rate": 0.00020860801487056026, + "loss": 0.05, "step": 94400 }, { - "epoch": 1.02, - "learning_rate": 0.0001468265299500292, - "loss": 0.0362, + "epoch": 0.61, + "learning_rate": 0.00020859833351620334, + "loss": 0.0505, "step": 94410 }, { - "epoch": 1.02, - "learning_rate": 0.00014681030566552014, - "loss": 0.0451, + "epoch": 0.61, + "learning_rate": 0.0002085886521618464, + "loss": 0.0516, "step": 94420 }, { - "epoch": 1.02, - "learning_rate": 0.0001467940813810111, - "loss": 0.0364, + "epoch": 0.61, + "learning_rate": 0.00020857897080748947, + "loss": 0.0455, "step": 94430 }, { - "epoch": 1.02, - "learning_rate": 0.00014677785709650202, - "loss": 0.0388, + "epoch": 0.61, + "learning_rate": 0.00020856928945313255, + "loss": 0.0502, "step": 94440 }, { - "epoch": 1.02, - "learning_rate": 0.00014676163281199296, - "loss": 0.0387, + "epoch": 0.61, + "learning_rate": 0.00020855960809877563, + "loss": 0.0543, "step": 94450 }, { - "epoch": 1.02, - "learning_rate": 0.00014674540852748391, - "loss": 0.0358, + "epoch": 0.61, + "learning_rate": 0.00020854992674441868, + "loss": 0.0518, "step": 94460 }, { - "epoch": 1.02, - "learning_rate": 0.00014672918424297486, - "loss": 0.0344, + "epoch": 0.61, + "learning_rate": 0.00020854024539006174, + "loss": 0.0477, "step": 94470 }, { - "epoch": 1.02, - "learning_rate": 0.00014671295995846581, - "loss": 0.035, + "epoch": 0.61, + "learning_rate": 0.00020853056403570482, + "loss": 0.0445, "step": 94480 }, { - "epoch": 1.02, - "learning_rate": 0.00014669673567395676, - "loss": 0.0367, + "epoch": 0.61, + "learning_rate": 0.00020852088268134787, + "loss": 0.0496, "step": 94490 }, { - "epoch": 1.02, - "learning_rate": 0.00014668051138944771, - "loss": 0.0401, + "epoch": 0.61, + "learning_rate": 0.00020851120132699095, + "loss": 0.0489, "step": 94500 }, { - "epoch": 1.02, - "learning_rate": 0.00014666428710493866, - "loss": 0.0338, + "epoch": 0.61, + "learning_rate": 0.00020850151997263403, + "loss": 0.0438, "step": 94510 }, { - "epoch": 1.02, - "learning_rate": 0.0001466480628204296, - "loss": 0.0434, + "epoch": 0.61, + "learning_rate": 0.0002084918386182771, + "loss": 0.0533, "step": 94520 }, { - "epoch": 1.02, - "learning_rate": 0.00014663183853592054, - "loss": 0.039, + "epoch": 0.61, + "learning_rate": 0.00020848215726392016, + "loss": 0.0485, "step": 94530 }, { - "epoch": 1.02, - "learning_rate": 0.00014661561425141149, - "loss": 0.0413, + "epoch": 0.61, + "learning_rate": 0.00020847247590956321, + "loss": 0.055, "step": 94540 }, { - "epoch": 1.02, - "learning_rate": 0.00014659938996690244, - "loss": 0.0388, + "epoch": 0.61, + "learning_rate": 0.00020846279455520627, + "loss": 0.0498, "step": 94550 }, { - "epoch": 1.02, - "learning_rate": 0.00014658316568239339, - "loss": 0.0345, + "epoch": 0.61, + "learning_rate": 0.00020845311320084935, + "loss": 0.0512, "step": 94560 }, { - "epoch": 1.02, - "learning_rate": 0.00014656694139788433, - "loss": 0.0428, + "epoch": 0.61, + "learning_rate": 0.00020844343184649243, + "loss": 0.052, "step": 94570 }, { - "epoch": 1.02, - "learning_rate": 0.00014655071711337528, - "loss": 0.04, + "epoch": 0.61, + "learning_rate": 0.0002084337504921355, + "loss": 0.0493, "step": 94580 }, { - "epoch": 1.02, - "learning_rate": 0.00014653449282886623, - "loss": 0.0442, + "epoch": 0.61, + "learning_rate": 0.00020842406913777856, + "loss": 0.0571, "step": 94590 }, { - "epoch": 1.02, - "learning_rate": 0.00014651826854435718, - "loss": 0.0367, + "epoch": 0.61, + "learning_rate": 0.00020841438778342164, + "loss": 0.0525, "step": 94600 }, { - "epoch": 1.02, - "learning_rate": 0.00014650204425984813, - "loss": 0.0403, + "epoch": 0.61, + "learning_rate": 0.0002084047064290647, + "loss": 0.0498, "step": 94610 }, { - "epoch": 1.02, - "learning_rate": 0.00014648581997533906, - "loss": 0.0459, + "epoch": 0.61, + "learning_rate": 0.00020839502507470774, + "loss": 0.0529, "step": 94620 }, { - "epoch": 1.02, - "learning_rate": 0.00014646959569083, - "loss": 0.0377, + "epoch": 0.61, + "learning_rate": 0.00020838534372035082, + "loss": 0.0473, "step": 94630 }, { - "epoch": 1.02, - "learning_rate": 0.00014645337140632096, - "loss": 0.0363, + "epoch": 0.61, + "learning_rate": 0.0002083756623659939, + "loss": 0.0476, "step": 94640 }, { - "epoch": 1.02, - "learning_rate": 0.0001464371471218119, - "loss": 0.0382, + "epoch": 0.61, + "learning_rate": 0.00020836598101163698, + "loss": 0.0433, "step": 94650 }, { - "epoch": 1.02, - "learning_rate": 0.00014642092283730286, - "loss": 0.0366, + "epoch": 0.61, + "learning_rate": 0.00020835629965728004, + "loss": 0.0443, "step": 94660 }, { - "epoch": 1.02, - "learning_rate": 0.0001464046985527938, - "loss": 0.0432, + "epoch": 0.61, + "learning_rate": 0.00020834661830292312, + "loss": 0.0473, "step": 94670 }, { - "epoch": 1.02, - "learning_rate": 0.00014638847426828476, - "loss": 0.0363, + "epoch": 0.61, + "learning_rate": 0.00020833693694856617, + "loss": 0.049, "step": 94680 }, { - "epoch": 1.02, - "learning_rate": 0.0001463722499837757, - "loss": 0.0369, + "epoch": 0.61, + "learning_rate": 0.00020832725559420922, + "loss": 0.0505, "step": 94690 }, { - "epoch": 1.02, - "learning_rate": 0.00014635602569926665, - "loss": 0.0413, + "epoch": 0.61, + "learning_rate": 0.0002083175742398523, + "loss": 0.0535, "step": 94700 }, { - "epoch": 1.02, - "learning_rate": 0.00014633980141475758, - "loss": 0.0294, + "epoch": 0.61, + "learning_rate": 0.00020830789288549538, + "loss": 0.0577, "step": 94710 }, { - "epoch": 1.02, - "learning_rate": 0.00014632357713024853, - "loss": 0.0478, + "epoch": 0.61, + "learning_rate": 0.00020829821153113846, + "loss": 0.0528, "step": 94720 }, { - "epoch": 1.02, - "learning_rate": 0.00014630735284573948, - "loss": 0.036, + "epoch": 0.61, + "learning_rate": 0.00020828853017678151, + "loss": 0.0523, "step": 94730 }, { - "epoch": 1.02, - "learning_rate": 0.00014629112856123043, - "loss": 0.035, + "epoch": 0.61, + "learning_rate": 0.0002082788488224246, + "loss": 0.0452, "step": 94740 }, { - "epoch": 1.02, - "learning_rate": 0.00014627490427672138, - "loss": 0.0344, + "epoch": 0.61, + "learning_rate": 0.00020826916746806762, + "loss": 0.0472, "step": 94750 }, { - "epoch": 1.02, - "learning_rate": 0.00014625867999221233, - "loss": 0.0348, + "epoch": 0.61, + "learning_rate": 0.0002082594861137107, + "loss": 0.0548, "step": 94760 }, { - "epoch": 1.03, - "learning_rate": 0.00014624245570770328, - "loss": 0.0418, + "epoch": 0.61, + "learning_rate": 0.00020824980475935378, + "loss": 0.0472, "step": 94770 }, { - "epoch": 1.03, - "learning_rate": 0.00014622623142319423, - "loss": 0.0344, + "epoch": 0.61, + "learning_rate": 0.00020824012340499686, + "loss": 0.0466, "step": 94780 }, { - "epoch": 1.03, - "learning_rate": 0.00014621000713868518, - "loss": 0.0326, + "epoch": 0.61, + "learning_rate": 0.0002082304420506399, + "loss": 0.0472, "step": 94790 }, { - "epoch": 1.03, - "learning_rate": 0.0001461937828541761, - "loss": 0.0398, + "epoch": 0.61, + "learning_rate": 0.000208220760696283, + "loss": 0.0534, "step": 94800 }, { - "epoch": 1.03, - "learning_rate": 0.00014617755856966705, - "loss": 0.037, + "epoch": 0.61, + "learning_rate": 0.00020821107934192607, + "loss": 0.0546, "step": 94810 }, { - "epoch": 1.03, - "learning_rate": 0.000146161334285158, - "loss": 0.039, + "epoch": 0.61, + "learning_rate": 0.0002082013979875691, + "loss": 0.0452, "step": 94820 }, { - "epoch": 1.03, - "learning_rate": 0.00014614511000064895, - "loss": 0.0335, + "epoch": 0.61, + "learning_rate": 0.00020819171663321218, + "loss": 0.0442, "step": 94830 }, { - "epoch": 1.03, - "learning_rate": 0.0001461288857161399, - "loss": 0.0388, + "epoch": 0.61, + "learning_rate": 0.00020818203527885526, + "loss": 0.0509, "step": 94840 }, { - "epoch": 1.03, - "learning_rate": 0.00014611266143163085, - "loss": 0.0337, + "epoch": 0.61, + "learning_rate": 0.00020817235392449834, + "loss": 0.0488, "step": 94850 }, { - "epoch": 1.03, - "learning_rate": 0.0001460964371471218, - "loss": 0.0352, + "epoch": 0.61, + "learning_rate": 0.0002081626725701414, + "loss": 0.0504, "step": 94860 }, { - "epoch": 1.03, - "learning_rate": 0.00014608021286261275, - "loss": 0.0383, + "epoch": 0.61, + "learning_rate": 0.00020815299121578447, + "loss": 0.0469, "step": 94870 }, { - "epoch": 1.03, - "learning_rate": 0.0001460639885781037, - "loss": 0.0371, + "epoch": 0.61, + "learning_rate": 0.00020814330986142755, + "loss": 0.0565, "step": 94880 }, { - "epoch": 1.03, - "learning_rate": 0.00014604776429359462, - "loss": 0.0367, + "epoch": 0.61, + "learning_rate": 0.00020813362850707057, + "loss": 0.0489, "step": 94890 }, { - "epoch": 1.03, - "learning_rate": 0.00014603154000908557, - "loss": 0.0376, + "epoch": 0.61, + "learning_rate": 0.00020812394715271365, + "loss": 0.0584, "step": 94900 }, { - "epoch": 1.03, - "learning_rate": 0.00014601531572457652, - "loss": 0.0357, + "epoch": 0.61, + "learning_rate": 0.00020811426579835673, + "loss": 0.0402, "step": 94910 }, { - "epoch": 1.03, - "learning_rate": 0.00014599909144006747, - "loss": 0.0383, + "epoch": 0.61, + "learning_rate": 0.0002081045844439998, + "loss": 0.0478, "step": 94920 }, { - "epoch": 1.03, - "learning_rate": 0.00014598286715555842, - "loss": 0.0376, + "epoch": 0.61, + "learning_rate": 0.00020809490308964287, + "loss": 0.048, "step": 94930 }, { - "epoch": 1.03, - "learning_rate": 0.00014596664287104937, - "loss": 0.039, + "epoch": 0.61, + "learning_rate": 0.00020808522173528595, + "loss": 0.0471, "step": 94940 }, { - "epoch": 1.03, - "learning_rate": 0.00014595041858654032, - "loss": 0.0376, + "epoch": 0.61, + "learning_rate": 0.00020807554038092903, + "loss": 0.0402, "step": 94950 }, { - "epoch": 1.03, - "learning_rate": 0.00014593419430203127, - "loss": 0.0408, + "epoch": 0.61, + "learning_rate": 0.00020806585902657205, + "loss": 0.0445, "step": 94960 }, { - "epoch": 1.03, - "learning_rate": 0.00014591797001752222, - "loss": 0.0377, + "epoch": 0.61, + "learning_rate": 0.00020805617767221513, + "loss": 0.0478, "step": 94970 }, { - "epoch": 1.03, - "learning_rate": 0.00014590174573301314, - "loss": 0.0407, + "epoch": 0.61, + "learning_rate": 0.0002080464963178582, + "loss": 0.0475, "step": 94980 }, { - "epoch": 1.03, - "learning_rate": 0.0001458855214485041, - "loss": 0.0372, + "epoch": 0.61, + "learning_rate": 0.00020803681496350126, + "loss": 0.0556, "step": 94990 }, { - "epoch": 1.03, - "learning_rate": 0.00014586929716399504, - "loss": 0.0381, + "epoch": 0.61, + "learning_rate": 0.00020802713360914434, + "loss": 0.0558, "step": 95000 }, { - "epoch": 1.03, - "eval_cer": 0.9211666940546807, - "eval_loss": 0.02949533425271511, - "eval_runtime": 119.3031, - "eval_samples_per_second": 16.764, - "eval_steps_per_second": 4.191, + "epoch": 0.61, + "eval_cer": 0.9198942492373743, + "eval_loss": 0.032361067831516266, + "eval_runtime": 119.7802, + "eval_samples_per_second": 16.697, + "eval_steps_per_second": 4.174, "step": 95000 }, { - "epoch": 1.03, - "learning_rate": 0.000145853072879486, - "loss": 0.0365, + "epoch": 0.61, + "learning_rate": 0.00020801745225478742, + "loss": 0.0497, "step": 95010 }, { - "epoch": 1.03, - "learning_rate": 0.00014583684859497694, - "loss": 0.034, + "epoch": 0.61, + "learning_rate": 0.0002080077709004305, + "loss": 0.0482, "step": 95020 }, { - "epoch": 1.03, - "learning_rate": 0.0001458206243104679, - "loss": 0.034, + "epoch": 0.61, + "learning_rate": 0.00020799808954607353, + "loss": 0.0471, "step": 95030 }, { - "epoch": 1.03, - "learning_rate": 0.00014580440002595884, - "loss": 0.038, + "epoch": 0.61, + "learning_rate": 0.0002079884081917166, + "loss": 0.051, "step": 95040 }, { - "epoch": 1.03, - "learning_rate": 0.0001457881757414498, - "loss": 0.0428, + "epoch": 0.61, + "learning_rate": 0.0002079787268373597, + "loss": 0.0508, "step": 95050 }, { - "epoch": 1.03, - "learning_rate": 0.00014577195145694074, - "loss": 0.0399, + "epoch": 0.61, + "learning_rate": 0.00020796904548300274, + "loss": 0.0464, "step": 95060 }, { - "epoch": 1.03, - "learning_rate": 0.0001457557271724317, - "loss": 0.0337, + "epoch": 0.61, + "learning_rate": 0.00020795936412864582, + "loss": 0.0461, "step": 95070 }, { - "epoch": 1.03, - "learning_rate": 0.00014573950288792264, - "loss": 0.0501, + "epoch": 0.61, + "learning_rate": 0.0002079496827742889, + "loss": 0.054, "step": 95080 }, { - "epoch": 1.03, - "learning_rate": 0.0001457232786034136, - "loss": 0.0367, + "epoch": 0.61, + "learning_rate": 0.00020794000141993198, + "loss": 0.0533, "step": 95090 }, { - "epoch": 1.03, - "learning_rate": 0.00014570705431890454, - "loss": 0.0416, + "epoch": 0.61, + "learning_rate": 0.000207930320065575, + "loss": 0.049, "step": 95100 }, { - "epoch": 1.03, - "learning_rate": 0.0001456908300343955, - "loss": 0.035, + "epoch": 0.61, + "learning_rate": 0.00020792063871121809, + "loss": 0.0538, "step": 95110 }, { - "epoch": 1.03, - "learning_rate": 0.00014567460574988644, - "loss": 0.0434, + "epoch": 0.61, + "learning_rate": 0.00020791095735686117, + "loss": 0.0467, "step": 95120 }, { - "epoch": 1.03, - "learning_rate": 0.00014565838146537736, - "loss": 0.0331, + "epoch": 0.61, + "learning_rate": 0.00020790127600250422, + "loss": 0.0458, "step": 95130 }, { - "epoch": 1.03, - "learning_rate": 0.0001456421571808683, - "loss": 0.0379, + "epoch": 0.61, + "learning_rate": 0.0002078915946481473, + "loss": 0.0494, "step": 95140 }, { - "epoch": 1.03, - "learning_rate": 0.00014562593289635926, - "loss": 0.0373, + "epoch": 0.61, + "learning_rate": 0.00020788191329379038, + "loss": 0.0464, "step": 95150 }, { - "epoch": 1.03, - "learning_rate": 0.0001456097086118502, - "loss": 0.0374, + "epoch": 0.61, + "learning_rate": 0.00020787223193943343, + "loss": 0.0524, "step": 95160 }, { - "epoch": 1.03, - "learning_rate": 0.00014559348432734116, - "loss": 0.0364, + "epoch": 0.61, + "learning_rate": 0.00020786255058507648, + "loss": 0.0468, "step": 95170 }, { - "epoch": 1.03, - "learning_rate": 0.0001455772600428321, - "loss": 0.0319, + "epoch": 0.61, + "learning_rate": 0.00020785286923071956, + "loss": 0.0474, "step": 95180 }, { - "epoch": 1.03, - "learning_rate": 0.00014556103575832306, - "loss": 0.039, + "epoch": 0.61, + "learning_rate": 0.00020784318787636262, + "loss": 0.0433, "step": 95190 }, { - "epoch": 1.03, - "learning_rate": 0.000145544811473814, - "loss": 0.0408, + "epoch": 0.61, + "learning_rate": 0.0002078335065220057, + "loss": 0.0484, "step": 95200 }, { - "epoch": 1.03, - "learning_rate": 0.00014552858718930496, - "loss": 0.0345, + "epoch": 0.61, + "learning_rate": 0.00020782382516764877, + "loss": 0.0421, "step": 95210 }, { - "epoch": 1.03, - "learning_rate": 0.00014551236290479588, - "loss": 0.0365, + "epoch": 0.61, + "learning_rate": 0.00020781414381329185, + "loss": 0.0593, "step": 95220 }, { - "epoch": 1.03, - "learning_rate": 0.00014549613862028683, - "loss": 0.0369, + "epoch": 0.61, + "learning_rate": 0.0002078044624589349, + "loss": 0.0488, "step": 95230 }, { - "epoch": 1.03, - "learning_rate": 0.00014547991433577778, - "loss": 0.0371, + "epoch": 0.61, + "learning_rate": 0.00020779478110457796, + "loss": 0.0494, "step": 95240 }, { - "epoch": 1.03, - "learning_rate": 0.00014546369005126873, - "loss": 0.0345, + "epoch": 0.61, + "learning_rate": 0.00020778509975022104, + "loss": 0.0425, "step": 95250 }, { - "epoch": 1.03, - "learning_rate": 0.00014544746576675968, - "loss": 0.0343, + "epoch": 0.61, + "learning_rate": 0.0002077754183958641, + "loss": 0.0542, "step": 95260 }, { - "epoch": 1.03, - "learning_rate": 0.00014543124148225063, - "loss": 0.0349, + "epoch": 0.61, + "learning_rate": 0.00020776573704150717, + "loss": 0.0502, "step": 95270 }, { - "epoch": 1.03, - "learning_rate": 0.00014541501719774158, - "loss": 0.0365, + "epoch": 0.61, + "learning_rate": 0.00020775605568715025, + "loss": 0.0414, "step": 95280 }, { - "epoch": 1.03, - "learning_rate": 0.00014539879291323253, - "loss": 0.0389, + "epoch": 0.62, + "learning_rate": 0.00020774637433279333, + "loss": 0.0474, "step": 95290 }, { - "epoch": 1.03, - "learning_rate": 0.00014538256862872348, - "loss": 0.036, + "epoch": 0.62, + "learning_rate": 0.00020773669297843638, + "loss": 0.0454, "step": 95300 }, { - "epoch": 1.03, - "learning_rate": 0.0001453663443442144, - "loss": 0.0367, + "epoch": 0.62, + "learning_rate": 0.00020772701162407944, + "loss": 0.047, "step": 95310 }, { - "epoch": 1.03, - "learning_rate": 0.00014535012005970535, - "loss": 0.0414, + "epoch": 0.62, + "learning_rate": 0.00020771733026972252, + "loss": 0.0514, "step": 95320 }, { - "epoch": 1.03, - "learning_rate": 0.0001453338957751963, - "loss": 0.0371, + "epoch": 0.62, + "learning_rate": 0.00020770764891536557, + "loss": 0.0447, "step": 95330 }, { - "epoch": 1.03, - "learning_rate": 0.00014531767149068725, - "loss": 0.042, + "epoch": 0.62, + "learning_rate": 0.00020769796756100865, + "loss": 0.0501, "step": 95340 }, { - "epoch": 1.03, - "learning_rate": 0.0001453014472061782, - "loss": 0.0354, + "epoch": 0.62, + "learning_rate": 0.00020768828620665173, + "loss": 0.0457, "step": 95350 }, { - "epoch": 1.03, - "learning_rate": 0.00014528522292166915, - "loss": 0.0369, + "epoch": 0.62, + "learning_rate": 0.00020767860485229478, + "loss": 0.0497, "step": 95360 }, { - "epoch": 1.03, - "learning_rate": 0.0001452689986371601, - "loss": 0.0353, + "epoch": 0.62, + "learning_rate": 0.00020766892349793786, + "loss": 0.0437, "step": 95370 }, { - "epoch": 1.03, - "learning_rate": 0.00014525277435265105, - "loss": 0.0355, + "epoch": 0.62, + "learning_rate": 0.00020765924214358091, + "loss": 0.0487, "step": 95380 }, { - "epoch": 1.03, - "learning_rate": 0.000145236550068142, - "loss": 0.0387, + "epoch": 0.62, + "learning_rate": 0.00020764956078922397, + "loss": 0.0509, "step": 95390 }, { - "epoch": 1.03, - "learning_rate": 0.00014522032578363292, - "loss": 0.0374, + "epoch": 0.62, + "learning_rate": 0.00020763987943486705, + "loss": 0.0455, "step": 95400 }, { - "epoch": 1.03, - "learning_rate": 0.00014520410149912387, - "loss": 0.0409, + "epoch": 0.62, + "learning_rate": 0.00020763019808051013, + "loss": 0.0466, "step": 95410 }, { - "epoch": 1.03, - "learning_rate": 0.00014518787721461482, - "loss": 0.039, + "epoch": 0.62, + "learning_rate": 0.0002076205167261532, + "loss": 0.0484, "step": 95420 }, { - "epoch": 1.03, - "learning_rate": 0.00014517165293010577, - "loss": 0.0353, + "epoch": 0.62, + "learning_rate": 0.00020761083537179626, + "loss": 0.0387, "step": 95430 }, { - "epoch": 1.03, - "learning_rate": 0.00014515542864559672, - "loss": 0.0347, + "epoch": 0.62, + "learning_rate": 0.00020760115401743934, + "loss": 0.048, "step": 95440 }, { - "epoch": 1.03, - "learning_rate": 0.00014513920436108767, - "loss": 0.0383, + "epoch": 0.62, + "learning_rate": 0.0002075914726630824, + "loss": 0.0443, "step": 95450 }, { - "epoch": 1.03, - "learning_rate": 0.00014512298007657862, - "loss": 0.0354, + "epoch": 0.62, + "learning_rate": 0.00020758179130872544, + "loss": 0.0458, "step": 95460 }, { - "epoch": 1.03, - "learning_rate": 0.00014510675579206957, - "loss": 0.038, + "epoch": 0.62, + "learning_rate": 0.00020757210995436852, + "loss": 0.0438, "step": 95470 }, { - "epoch": 1.03, - "learning_rate": 0.00014509053150756052, - "loss": 0.0455, + "epoch": 0.62, + "learning_rate": 0.0002075624286000116, + "loss": 0.0489, "step": 95480 }, { - "epoch": 1.03, - "learning_rate": 0.00014507430722305144, - "loss": 0.0419, + "epoch": 0.62, + "learning_rate": 0.00020755274724565468, + "loss": 0.0486, "step": 95490 }, { - "epoch": 1.03, - "learning_rate": 0.0001450580829385424, - "loss": 0.0401, + "epoch": 0.62, + "learning_rate": 0.00020754306589129774, + "loss": 0.0404, "step": 95500 }, { - "epoch": 1.03, - "learning_rate": 0.00014504185865403334, - "loss": 0.0369, + "epoch": 0.62, + "learning_rate": 0.00020753338453694082, + "loss": 0.0457, "step": 95510 }, { - "epoch": 1.03, - "learning_rate": 0.0001450256343695243, - "loss": 0.0383, + "epoch": 0.62, + "learning_rate": 0.00020752370318258387, + "loss": 0.0515, "step": 95520 }, { - "epoch": 1.03, - "learning_rate": 0.00014500941008501524, - "loss": 0.0328, + "epoch": 0.62, + "learning_rate": 0.00020751402182822692, + "loss": 0.0484, "step": 95530 }, { - "epoch": 1.03, - "learning_rate": 0.0001449931858005062, - "loss": 0.0361, + "epoch": 0.62, + "learning_rate": 0.00020750434047387, + "loss": 0.0443, "step": 95540 }, { - "epoch": 1.03, - "learning_rate": 0.00014497696151599714, - "loss": 0.0349, + "epoch": 0.62, + "learning_rate": 0.00020749465911951308, + "loss": 0.0426, "step": 95550 }, { - "epoch": 1.03, - "learning_rate": 0.0001449607372314881, - "loss": 0.0411, + "epoch": 0.62, + "learning_rate": 0.00020748497776515613, + "loss": 0.049, "step": 95560 }, { - "epoch": 1.03, - "learning_rate": 0.00014494451294697904, - "loss": 0.0374, + "epoch": 0.62, + "learning_rate": 0.00020747529641079921, + "loss": 0.047, "step": 95570 }, { - "epoch": 1.03, - "learning_rate": 0.00014492828866246996, - "loss": 0.0316, + "epoch": 0.62, + "learning_rate": 0.0002074656150564423, + "loss": 0.0508, "step": 95580 }, { - "epoch": 1.03, - "learning_rate": 0.0001449120643779609, - "loss": 0.0417, + "epoch": 0.62, + "learning_rate": 0.00020745593370208532, + "loss": 0.0471, "step": 95590 }, { - "epoch": 1.03, - "learning_rate": 0.00014489584009345186, - "loss": 0.0368, + "epoch": 0.62, + "learning_rate": 0.0002074462523477284, + "loss": 0.0467, "step": 95600 }, { - "epoch": 1.03, - "learning_rate": 0.0001448796158089428, - "loss": 0.0387, + "epoch": 0.62, + "learning_rate": 0.00020743657099337148, + "loss": 0.0468, "step": 95610 }, { - "epoch": 1.03, - "learning_rate": 0.00014486339152443376, - "loss": 0.0349, + "epoch": 0.62, + "learning_rate": 0.00020742688963901456, + "loss": 0.0495, "step": 95620 }, { - "epoch": 1.03, - "learning_rate": 0.0001448471672399247, - "loss": 0.0353, + "epoch": 0.62, + "learning_rate": 0.0002074172082846576, + "loss": 0.0488, "step": 95630 }, { - "epoch": 1.03, - "learning_rate": 0.00014483094295541566, - "loss": 0.0331, + "epoch": 0.62, + "learning_rate": 0.0002074075269303007, + "loss": 0.0444, "step": 95640 }, { - "epoch": 1.03, - "learning_rate": 0.0001448147186709066, - "loss": 0.0317, + "epoch": 0.62, + "learning_rate": 0.00020739784557594377, + "loss": 0.0443, "step": 95650 }, { - "epoch": 1.03, - "learning_rate": 0.00014479849438639756, - "loss": 0.0391, + "epoch": 0.62, + "learning_rate": 0.0002073881642215868, + "loss": 0.0481, "step": 95660 }, { - "epoch": 1.03, - "learning_rate": 0.00014478227010188848, - "loss": 0.0392, + "epoch": 0.62, + "learning_rate": 0.00020737848286722988, + "loss": 0.0543, "step": 95670 }, { - "epoch": 1.03, - "learning_rate": 0.00014476604581737943, - "loss": 0.0323, + "epoch": 0.62, + "learning_rate": 0.00020736880151287296, + "loss": 0.0462, "step": 95680 }, { - "epoch": 1.03, - "learning_rate": 0.00014474982153287038, - "loss": 0.0382, + "epoch": 0.62, + "learning_rate": 0.00020735912015851604, + "loss": 0.0464, "step": 95690 }, { - "epoch": 1.04, - "learning_rate": 0.00014473359724836133, - "loss": 0.0417, + "epoch": 0.62, + "learning_rate": 0.0002073494388041591, + "loss": 0.0509, "step": 95700 }, { - "epoch": 1.04, - "learning_rate": 0.00014471737296385228, - "loss": 0.0389, + "epoch": 0.62, + "learning_rate": 0.00020733975744980217, + "loss": 0.0508, "step": 95710 }, { - "epoch": 1.04, - "learning_rate": 0.00014470114867934323, - "loss": 0.0304, + "epoch": 0.62, + "learning_rate": 0.00020733007609544525, + "loss": 0.0503, "step": 95720 }, { - "epoch": 1.04, - "learning_rate": 0.00014468492439483418, - "loss": 0.0362, + "epoch": 0.62, + "learning_rate": 0.00020732039474108827, + "loss": 0.0507, "step": 95730 }, { - "epoch": 1.04, - "learning_rate": 0.00014466870011032513, - "loss": 0.0421, + "epoch": 0.62, + "learning_rate": 0.00020731071338673135, + "loss": 0.0464, "step": 95740 }, { - "epoch": 1.04, - "learning_rate": 0.00014465247582581608, - "loss": 0.0413, + "epoch": 0.62, + "learning_rate": 0.00020730103203237443, + "loss": 0.0449, "step": 95750 }, { - "epoch": 1.04, - "learning_rate": 0.00014463625154130703, - "loss": 0.036, + "epoch": 0.62, + "learning_rate": 0.00020729135067801749, + "loss": 0.0467, "step": 95760 }, { - "epoch": 1.04, - "learning_rate": 0.00014462002725679796, - "loss": 0.039, + "epoch": 0.62, + "learning_rate": 0.00020728166932366057, + "loss": 0.0469, "step": 95770 }, { - "epoch": 1.04, - "learning_rate": 0.0001446038029722889, - "loss": 0.0428, + "epoch": 0.62, + "learning_rate": 0.00020727198796930365, + "loss": 0.0466, "step": 95780 }, { - "epoch": 1.04, - "learning_rate": 0.00014458757868777985, - "loss": 0.0298, + "epoch": 0.62, + "learning_rate": 0.00020726230661494673, + "loss": 0.06, "step": 95790 }, { - "epoch": 1.04, - "learning_rate": 0.0001445713544032708, - "loss": 0.0455, + "epoch": 0.62, + "learning_rate": 0.00020725262526058975, + "loss": 0.0534, "step": 95800 }, { - "epoch": 1.04, - "learning_rate": 0.00014455513011876175, - "loss": 0.0418, + "epoch": 0.62, + "learning_rate": 0.00020724294390623283, + "loss": 0.0512, "step": 95810 }, { - "epoch": 1.04, - "learning_rate": 0.0001445389058342527, - "loss": 0.0448, + "epoch": 0.62, + "learning_rate": 0.0002072332625518759, + "loss": 0.0521, "step": 95820 }, { - "epoch": 1.04, - "learning_rate": 0.00014452268154974365, - "loss": 0.04, + "epoch": 0.62, + "learning_rate": 0.00020722358119751896, + "loss": 0.0515, "step": 95830 }, { - "epoch": 1.04, - "learning_rate": 0.0001445064572652346, - "loss": 0.0454, + "epoch": 0.62, + "learning_rate": 0.00020721389984316204, + "loss": 0.051, "step": 95840 }, { - "epoch": 1.04, - "learning_rate": 0.00014449023298072555, - "loss": 0.0365, + "epoch": 0.62, + "learning_rate": 0.00020720421848880512, + "loss": 0.059, "step": 95850 }, { - "epoch": 1.04, - "learning_rate": 0.00014447400869621648, - "loss": 0.0316, + "epoch": 0.62, + "learning_rate": 0.0002071945371344482, + "loss": 0.0495, "step": 95860 }, { - "epoch": 1.04, - "learning_rate": 0.00014445778441170743, - "loss": 0.0369, + "epoch": 0.62, + "learning_rate": 0.00020718485578009123, + "loss": 0.0516, "step": 95870 }, { - "epoch": 1.04, - "learning_rate": 0.00014444156012719838, - "loss": 0.033, + "epoch": 0.62, + "learning_rate": 0.0002071751744257343, + "loss": 0.0564, "step": 95880 }, { - "epoch": 1.04, - "learning_rate": 0.00014442533584268933, - "loss": 0.0334, + "epoch": 0.62, + "learning_rate": 0.0002071654930713774, + "loss": 0.0491, "step": 95890 }, { - "epoch": 1.04, - "learning_rate": 0.00014440911155818027, - "loss": 0.0339, + "epoch": 0.62, + "learning_rate": 0.00020715581171702044, + "loss": 0.0542, "step": 95900 }, { - "epoch": 1.04, - "learning_rate": 0.00014439288727367122, - "loss": 0.0333, + "epoch": 0.62, + "learning_rate": 0.00020714613036266352, + "loss": 0.0465, "step": 95910 }, { - "epoch": 1.04, - "learning_rate": 0.00014437666298916217, - "loss": 0.0408, + "epoch": 0.62, + "learning_rate": 0.0002071364490083066, + "loss": 0.044, "step": 95920 }, { - "epoch": 1.04, - "learning_rate": 0.00014436043870465312, - "loss": 0.0341, + "epoch": 0.62, + "learning_rate": 0.00020712676765394965, + "loss": 0.0424, "step": 95930 }, { - "epoch": 1.04, - "learning_rate": 0.00014434421442014407, - "loss": 0.0375, + "epoch": 0.62, + "learning_rate": 0.0002071170862995927, + "loss": 0.0548, "step": 95940 }, { - "epoch": 1.04, - "learning_rate": 0.000144327990135635, - "loss": 0.039, + "epoch": 0.62, + "learning_rate": 0.00020710740494523578, + "loss": 0.0477, "step": 95950 }, { - "epoch": 1.04, - "learning_rate": 0.00014431176585112595, - "loss": 0.0422, + "epoch": 0.62, + "learning_rate": 0.00020709772359087884, + "loss": 0.05, "step": 95960 }, { - "epoch": 1.04, - "learning_rate": 0.0001442955415666169, - "loss": 0.0347, + "epoch": 0.62, + "learning_rate": 0.00020708804223652192, + "loss": 0.0559, "step": 95970 }, { - "epoch": 1.04, - "learning_rate": 0.00014427931728210785, - "loss": 0.0368, + "epoch": 0.62, + "learning_rate": 0.000207078360882165, + "loss": 0.0466, "step": 95980 }, { - "epoch": 1.04, - "learning_rate": 0.0001442630929975988, - "loss": 0.0385, + "epoch": 0.62, + "learning_rate": 0.00020706867952780808, + "loss": 0.046, "step": 95990 }, { - "epoch": 1.04, - "learning_rate": 0.00014424686871308975, - "loss": 0.0386, + "epoch": 0.62, + "learning_rate": 0.00020705899817345113, + "loss": 0.0428, "step": 96000 }, { - "epoch": 1.04, - "eval_cer": 0.9212532755181194, - "eval_loss": 0.028391998261213303, - "eval_runtime": 119.0955, - "eval_samples_per_second": 16.793, - "eval_steps_per_second": 4.198, + "epoch": 0.62, + "eval_cer": 0.9199810190938877, + "eval_loss": 0.03174648433923721, + "eval_runtime": 120.4054, + "eval_samples_per_second": 16.611, + "eval_steps_per_second": 4.153, "step": 96000 }, { - "epoch": 1.04, - "learning_rate": 0.0001442306444285807, - "loss": 0.0421, + "epoch": 0.62, + "learning_rate": 0.00020704931681909418, + "loss": 0.051, "step": 96010 }, { - "epoch": 1.04, - "learning_rate": 0.00014421442014407165, - "loss": 0.0403, + "epoch": 0.62, + "learning_rate": 0.00020703963546473726, + "loss": 0.0442, "step": 96020 }, { - "epoch": 1.04, - "learning_rate": 0.0001441981958595626, - "loss": 0.034, + "epoch": 0.62, + "learning_rate": 0.00020702995411038031, + "loss": 0.0422, "step": 96030 }, { - "epoch": 1.04, - "learning_rate": 0.00014418197157505352, - "loss": 0.0321, + "epoch": 0.62, + "learning_rate": 0.0002070202727560234, + "loss": 0.0429, "step": 96040 }, { - "epoch": 1.04, - "learning_rate": 0.00014416574729054447, - "loss": 0.0401, + "epoch": 0.62, + "learning_rate": 0.00020701059140166647, + "loss": 0.056, "step": 96050 }, { - "epoch": 1.04, - "learning_rate": 0.00014414952300603542, - "loss": 0.0385, + "epoch": 0.62, + "learning_rate": 0.00020700091004730955, + "loss": 0.0473, "step": 96060 }, { - "epoch": 1.04, - "learning_rate": 0.00014413329872152637, - "loss": 0.0353, + "epoch": 0.62, + "learning_rate": 0.0002069912286929526, + "loss": 0.0483, "step": 96070 }, { - "epoch": 1.04, - "learning_rate": 0.00014411707443701732, - "loss": 0.0481, + "epoch": 0.62, + "learning_rate": 0.00020698154733859566, + "loss": 0.0554, "step": 96080 }, { - "epoch": 1.04, - "learning_rate": 0.00014410085015250827, - "loss": 0.0344, + "epoch": 0.62, + "learning_rate": 0.00020697186598423874, + "loss": 0.0527, "step": 96090 }, { - "epoch": 1.04, - "learning_rate": 0.00014408462586799922, - "loss": 0.0358, + "epoch": 0.62, + "learning_rate": 0.0002069621846298818, + "loss": 0.0518, "step": 96100 }, { - "epoch": 1.04, - "learning_rate": 0.00014406840158349017, - "loss": 0.0368, + "epoch": 0.62, + "learning_rate": 0.00020695250327552487, + "loss": 0.0602, "step": 96110 }, { - "epoch": 1.04, - "learning_rate": 0.00014405217729898112, - "loss": 0.0445, + "epoch": 0.62, + "learning_rate": 0.00020694282192116795, + "loss": 0.0469, "step": 96120 }, { - "epoch": 1.04, - "learning_rate": 0.00014403595301447204, - "loss": 0.0361, + "epoch": 0.62, + "learning_rate": 0.000206933140566811, + "loss": 0.0523, "step": 96130 }, { - "epoch": 1.04, - "learning_rate": 0.000144019728729963, - "loss": 0.038, + "epoch": 0.62, + "learning_rate": 0.00020692345921245408, + "loss": 0.0508, "step": 96140 }, { - "epoch": 1.04, - "learning_rate": 0.00014400350444545394, - "loss": 0.0415, + "epoch": 0.62, + "learning_rate": 0.00020691377785809714, + "loss": 0.0484, "step": 96150 }, { - "epoch": 1.04, - "learning_rate": 0.0001439872801609449, - "loss": 0.0378, + "epoch": 0.62, + "learning_rate": 0.0002069040965037402, + "loss": 0.0551, "step": 96160 }, { - "epoch": 1.04, - "learning_rate": 0.00014397105587643584, - "loss": 0.0385, + "epoch": 0.62, + "learning_rate": 0.00020689441514938327, + "loss": 0.0461, "step": 96170 }, { - "epoch": 1.04, - "learning_rate": 0.0001439548315919268, - "loss": 0.0383, + "epoch": 0.62, + "learning_rate": 0.00020688473379502635, + "loss": 0.0524, "step": 96180 }, { - "epoch": 1.04, - "learning_rate": 0.00014393860730741774, - "loss": 0.0293, + "epoch": 0.62, + "learning_rate": 0.00020687505244066943, + "loss": 0.0503, "step": 96190 }, { - "epoch": 1.04, - "learning_rate": 0.0001439223830229087, - "loss": 0.04, + "epoch": 0.62, + "learning_rate": 0.00020686537108631248, + "loss": 0.0449, "step": 96200 }, { - "epoch": 1.04, - "learning_rate": 0.00014390615873839964, - "loss": 0.0386, + "epoch": 0.62, + "learning_rate": 0.00020685568973195556, + "loss": 0.0493, "step": 96210 }, { - "epoch": 1.04, - "learning_rate": 0.00014388993445389056, - "loss": 0.0364, + "epoch": 0.62, + "learning_rate": 0.00020684600837759861, + "loss": 0.0451, "step": 96220 }, { - "epoch": 1.04, - "learning_rate": 0.0001438737101693815, - "loss": 0.0328, + "epoch": 0.62, + "learning_rate": 0.00020683632702324167, + "loss": 0.0518, "step": 96230 }, { - "epoch": 1.04, - "learning_rate": 0.00014385748588487246, - "loss": 0.0351, + "epoch": 0.62, + "learning_rate": 0.00020682664566888475, + "loss": 0.0516, "step": 96240 }, { - "epoch": 1.04, - "learning_rate": 0.0001438412616003634, - "loss": 0.0373, + "epoch": 0.62, + "learning_rate": 0.00020681696431452783, + "loss": 0.0592, "step": 96250 }, { - "epoch": 1.04, - "learning_rate": 0.00014382503731585436, - "loss": 0.0351, + "epoch": 0.62, + "learning_rate": 0.0002068072829601709, + "loss": 0.0432, "step": 96260 }, { - "epoch": 1.04, - "learning_rate": 0.0001438088130313453, - "loss": 0.0351, + "epoch": 0.62, + "learning_rate": 0.00020679760160581396, + "loss": 0.0436, "step": 96270 }, { - "epoch": 1.04, - "learning_rate": 0.00014379258874683626, - "loss": 0.0339, + "epoch": 0.62, + "learning_rate": 0.00020678792025145704, + "loss": 0.0475, "step": 96280 }, { - "epoch": 1.04, - "learning_rate": 0.0001437763644623272, - "loss": 0.0393, + "epoch": 0.62, + "learning_rate": 0.0002067782388971001, + "loss": 0.0489, "step": 96290 }, { - "epoch": 1.04, - "learning_rate": 0.00014376014017781816, - "loss": 0.0373, + "epoch": 0.62, + "learning_rate": 0.00020676855754274314, + "loss": 0.0475, "step": 96300 }, { - "epoch": 1.04, - "learning_rate": 0.00014374391589330908, - "loss": 0.0411, + "epoch": 0.62, + "learning_rate": 0.00020675887618838622, + "loss": 0.0427, "step": 96310 }, { - "epoch": 1.04, - "learning_rate": 0.00014372769160880003, - "loss": 0.0415, + "epoch": 0.62, + "learning_rate": 0.0002067491948340293, + "loss": 0.0445, "step": 96320 }, { - "epoch": 1.04, - "learning_rate": 0.00014371146732429098, - "loss": 0.0355, + "epoch": 0.62, + "learning_rate": 0.00020673951347967236, + "loss": 0.0449, "step": 96330 }, { - "epoch": 1.04, - "learning_rate": 0.00014369524303978193, - "loss": 0.04, + "epoch": 0.62, + "learning_rate": 0.00020672983212531544, + "loss": 0.0467, "step": 96340 }, { - "epoch": 1.04, - "learning_rate": 0.00014367901875527288, - "loss": 0.0402, + "epoch": 0.62, + "learning_rate": 0.00020672015077095852, + "loss": 0.0558, "step": 96350 }, { - "epoch": 1.04, - "learning_rate": 0.00014366279447076383, - "loss": 0.0443, + "epoch": 0.62, + "learning_rate": 0.00020671046941660154, + "loss": 0.0419, "step": 96360 }, { - "epoch": 1.04, - "learning_rate": 0.00014364657018625478, - "loss": 0.0374, + "epoch": 0.62, + "learning_rate": 0.00020670078806224462, + "loss": 0.0509, "step": 96370 }, { - "epoch": 1.04, - "learning_rate": 0.00014363034590174573, - "loss": 0.0382, + "epoch": 0.62, + "learning_rate": 0.0002066911067078877, + "loss": 0.0469, "step": 96380 }, { - "epoch": 1.04, - "learning_rate": 0.00014361412161723668, - "loss": 0.0394, + "epoch": 0.62, + "learning_rate": 0.00020668142535353078, + "loss": 0.0533, "step": 96390 }, { - "epoch": 1.04, - "learning_rate": 0.0001435978973327276, - "loss": 0.0334, + "epoch": 0.62, + "learning_rate": 0.00020667174399917383, + "loss": 0.0451, "step": 96400 }, { - "epoch": 1.04, - "learning_rate": 0.00014358167304821855, - "loss": 0.0363, + "epoch": 0.62, + "learning_rate": 0.0002066620626448169, + "loss": 0.0465, "step": 96410 }, { - "epoch": 1.04, - "learning_rate": 0.0001435654487637095, - "loss": 0.0419, + "epoch": 0.62, + "learning_rate": 0.00020665238129046, + "loss": 0.048, "step": 96420 }, { - "epoch": 1.04, - "learning_rate": 0.00014354922447920045, - "loss": 0.0415, + "epoch": 0.62, + "learning_rate": 0.00020664269993610302, + "loss": 0.059, "step": 96430 }, { - "epoch": 1.04, - "learning_rate": 0.0001435330001946914, - "loss": 0.0423, + "epoch": 0.62, + "learning_rate": 0.0002066330185817461, + "loss": 0.045, "step": 96440 }, { - "epoch": 1.04, - "learning_rate": 0.00014351677591018235, - "loss": 0.0351, + "epoch": 0.62, + "learning_rate": 0.00020662333722738918, + "loss": 0.0479, "step": 96450 }, { - "epoch": 1.04, - "learning_rate": 0.0001435005516256733, - "loss": 0.0423, + "epoch": 0.62, + "learning_rate": 0.00020661365587303226, + "loss": 0.0484, "step": 96460 }, { - "epoch": 1.04, - "learning_rate": 0.00014348432734116425, - "loss": 0.0407, + "epoch": 0.62, + "learning_rate": 0.0002066039745186753, + "loss": 0.0527, "step": 96470 }, { - "epoch": 1.04, - "learning_rate": 0.0001434681030566552, - "loss": 0.0397, + "epoch": 0.62, + "learning_rate": 0.0002065942931643184, + "loss": 0.0511, "step": 96480 }, { - "epoch": 1.04, - "learning_rate": 0.00014345187877214612, - "loss": 0.041, + "epoch": 0.62, + "learning_rate": 0.00020658461180996147, + "loss": 0.0463, "step": 96490 }, { - "epoch": 1.04, - "learning_rate": 0.00014343565448763707, - "loss": 0.0418, + "epoch": 0.62, + "learning_rate": 0.0002065749304556045, + "loss": 0.0482, "step": 96500 }, { - "epoch": 1.04, - "learning_rate": 0.00014341943020312802, - "loss": 0.0361, + "epoch": 0.62, + "learning_rate": 0.00020656524910124758, + "loss": 0.0566, "step": 96510 }, { - "epoch": 1.04, - "learning_rate": 0.00014340320591861897, - "loss": 0.0329, + "epoch": 0.62, + "learning_rate": 0.00020655556774689066, + "loss": 0.0579, "step": 96520 }, { - "epoch": 1.04, - "learning_rate": 0.00014338698163410992, - "loss": 0.0406, + "epoch": 0.62, + "learning_rate": 0.0002065458863925337, + "loss": 0.0491, "step": 96530 }, { - "epoch": 1.04, - "learning_rate": 0.00014337075734960087, - "loss": 0.0393, + "epoch": 0.62, + "learning_rate": 0.0002065362050381768, + "loss": 0.0432, "step": 96540 }, { - "epoch": 1.04, - "learning_rate": 0.00014335453306509182, - "loss": 0.0378, + "epoch": 0.62, + "learning_rate": 0.00020652652368381987, + "loss": 0.0444, "step": 96550 }, { - "epoch": 1.04, - "learning_rate": 0.00014333830878058277, - "loss": 0.0324, + "epoch": 0.62, + "learning_rate": 0.00020651684232946295, + "loss": 0.0471, "step": 96560 }, { - "epoch": 1.04, - "learning_rate": 0.00014332208449607372, - "loss": 0.0366, + "epoch": 0.62, + "learning_rate": 0.00020650716097510597, + "loss": 0.0486, "step": 96570 }, { - "epoch": 1.04, - "learning_rate": 0.00014330586021156464, - "loss": 0.0354, + "epoch": 0.62, + "learning_rate": 0.00020649747962074905, + "loss": 0.0491, "step": 96580 }, { - "epoch": 1.04, - "learning_rate": 0.0001432896359270556, - "loss": 0.0318, + "epoch": 0.62, + "learning_rate": 0.00020648779826639213, + "loss": 0.0573, "step": 96590 }, { - "epoch": 1.04, - "learning_rate": 0.00014327341164254654, - "loss": 0.0369, + "epoch": 0.62, + "learning_rate": 0.00020647811691203519, + "loss": 0.0497, "step": 96600 }, { - "epoch": 1.04, - "learning_rate": 0.0001432571873580375, - "loss": 0.0398, + "epoch": 0.62, + "learning_rate": 0.00020646843555767827, + "loss": 0.0475, "step": 96610 }, { - "epoch": 1.05, - "learning_rate": 0.00014324096307352844, - "loss": 0.0333, + "epoch": 0.62, + "learning_rate": 0.00020645875420332134, + "loss": 0.0442, "step": 96620 }, { - "epoch": 1.05, - "learning_rate": 0.0001432247387890194, - "loss": 0.035, + "epoch": 0.62, + "learning_rate": 0.00020644907284896442, + "loss": 0.053, "step": 96630 }, { - "epoch": 1.05, - "learning_rate": 0.00014320851450451034, - "loss": 0.0353, + "epoch": 0.62, + "learning_rate": 0.00020643939149460745, + "loss": 0.056, "step": 96640 }, { - "epoch": 1.05, - "learning_rate": 0.0001431922902200013, - "loss": 0.0475, + "epoch": 0.62, + "learning_rate": 0.00020642971014025053, + "loss": 0.053, "step": 96650 }, { - "epoch": 1.05, - "learning_rate": 0.00014317606593549224, - "loss": 0.034, + "epoch": 0.62, + "learning_rate": 0.0002064200287858936, + "loss": 0.0436, "step": 96660 }, { - "epoch": 1.05, - "learning_rate": 0.00014315984165098316, - "loss": 0.033, + "epoch": 0.62, + "learning_rate": 0.00020641034743153666, + "loss": 0.0444, "step": 96670 }, { - "epoch": 1.05, - "learning_rate": 0.0001431436173664741, - "loss": 0.0402, + "epoch": 0.62, + "learning_rate": 0.00020640066607717974, + "loss": 0.0504, "step": 96680 }, { - "epoch": 1.05, - "learning_rate": 0.00014312739308196506, - "loss": 0.0449, + "epoch": 0.62, + "learning_rate": 0.00020639098472282282, + "loss": 0.0569, "step": 96690 }, { - "epoch": 1.05, - "learning_rate": 0.000143111168797456, - "loss": 0.0415, + "epoch": 0.62, + "learning_rate": 0.0002063813033684659, + "loss": 0.0485, "step": 96700 }, { - "epoch": 1.05, - "learning_rate": 0.00014309494451294696, - "loss": 0.0334, + "epoch": 0.62, + "learning_rate": 0.00020637162201410893, + "loss": 0.0472, "step": 96710 }, { - "epoch": 1.05, - "learning_rate": 0.0001430787202284379, - "loss": 0.0328, + "epoch": 0.62, + "learning_rate": 0.000206361940659752, + "loss": 0.0508, "step": 96720 }, { - "epoch": 1.05, - "learning_rate": 0.00014306249594392886, - "loss": 0.0408, + "epoch": 0.62, + "learning_rate": 0.00020635225930539506, + "loss": 0.0497, "step": 96730 }, { - "epoch": 1.05, - "learning_rate": 0.0001430462716594198, - "loss": 0.0413, + "epoch": 0.62, + "learning_rate": 0.00020634257795103814, + "loss": 0.0491, "step": 96740 }, { - "epoch": 1.05, - "learning_rate": 0.00014303004737491076, - "loss": 0.0509, + "epoch": 0.62, + "learning_rate": 0.00020633289659668122, + "loss": 0.0435, "step": 96750 }, { - "epoch": 1.05, - "learning_rate": 0.00014301382309040168, - "loss": 0.0379, + "epoch": 0.62, + "learning_rate": 0.0002063232152423243, + "loss": 0.0487, "step": 96760 }, { - "epoch": 1.05, - "learning_rate": 0.00014299759880589263, - "loss": 0.0381, + "epoch": 0.62, + "learning_rate": 0.00020631353388796735, + "loss": 0.0544, "step": 96770 }, { - "epoch": 1.05, - "learning_rate": 0.00014298137452138358, - "loss": 0.0371, + "epoch": 0.62, + "learning_rate": 0.0002063038525336104, + "loss": 0.0504, "step": 96780 }, { - "epoch": 1.05, - "learning_rate": 0.00014296515023687453, - "loss": 0.0395, + "epoch": 0.62, + "learning_rate": 0.00020629417117925348, + "loss": 0.0352, "step": 96790 }, { - "epoch": 1.05, - "learning_rate": 0.00014294892595236548, - "loss": 0.0411, + "epoch": 0.62, + "learning_rate": 0.00020628448982489654, + "loss": 0.0436, "step": 96800 }, { - "epoch": 1.05, - "learning_rate": 0.00014293270166785643, - "loss": 0.0428, + "epoch": 0.62, + "learning_rate": 0.00020627480847053962, + "loss": 0.0494, "step": 96810 }, { - "epoch": 1.05, - "learning_rate": 0.00014291647738334738, - "loss": 0.0441, + "epoch": 0.62, + "learning_rate": 0.0002062651271161827, + "loss": 0.0509, "step": 96820 }, { - "epoch": 1.05, - "learning_rate": 0.00014290025309883833, - "loss": 0.0351, + "epoch": 0.62, + "learning_rate": 0.00020625544576182578, + "loss": 0.0494, "step": 96830 }, { - "epoch": 1.05, - "learning_rate": 0.00014288402881432928, - "loss": 0.0365, + "epoch": 0.63, + "learning_rate": 0.00020624576440746883, + "loss": 0.0428, "step": 96840 }, { - "epoch": 1.05, - "learning_rate": 0.0001428678045298202, - "loss": 0.0369, + "epoch": 0.63, + "learning_rate": 0.00020623608305311188, + "loss": 0.0541, "step": 96850 }, { - "epoch": 1.05, - "learning_rate": 0.00014285158024531115, - "loss": 0.0419, + "epoch": 0.63, + "learning_rate": 0.00020622640169875496, + "loss": 0.0451, "step": 96860 }, { - "epoch": 1.05, - "learning_rate": 0.0001428353559608021, - "loss": 0.0334, + "epoch": 0.63, + "learning_rate": 0.00020621672034439801, + "loss": 0.05, "step": 96870 }, { - "epoch": 1.05, - "learning_rate": 0.00014281913167629305, - "loss": 0.0354, + "epoch": 0.63, + "learning_rate": 0.0002062070389900411, + "loss": 0.0437, "step": 96880 }, { - "epoch": 1.05, - "learning_rate": 0.000142802907391784, - "loss": 0.0352, + "epoch": 0.63, + "learning_rate": 0.00020619735763568417, + "loss": 0.0576, "step": 96890 }, { - "epoch": 1.05, - "learning_rate": 0.00014278668310727495, - "loss": 0.033, + "epoch": 0.63, + "learning_rate": 0.00020618767628132725, + "loss": 0.0505, "step": 96900 }, { - "epoch": 1.05, - "learning_rate": 0.0001427704588227659, - "loss": 0.0402, + "epoch": 0.63, + "learning_rate": 0.0002061779949269703, + "loss": 0.0491, "step": 96910 }, { - "epoch": 1.05, - "learning_rate": 0.00014275423453825685, - "loss": 0.0381, + "epoch": 0.63, + "learning_rate": 0.00020616831357261336, + "loss": 0.0487, "step": 96920 }, { - "epoch": 1.05, - "learning_rate": 0.0001427380102537478, - "loss": 0.0429, + "epoch": 0.63, + "learning_rate": 0.0002061586322182564, + "loss": 0.0514, "step": 96930 }, { - "epoch": 1.05, - "learning_rate": 0.00014272178596923873, - "loss": 0.0353, + "epoch": 0.63, + "learning_rate": 0.0002061489508638995, + "loss": 0.0471, "step": 96940 }, { - "epoch": 1.05, - "learning_rate": 0.00014270556168472968, - "loss": 0.0374, + "epoch": 0.63, + "learning_rate": 0.00020613926950954257, + "loss": 0.0534, "step": 96950 }, { - "epoch": 1.05, - "learning_rate": 0.00014268933740022063, - "loss": 0.0347, + "epoch": 0.63, + "learning_rate": 0.00020612958815518565, + "loss": 0.0542, "step": 96960 }, { - "epoch": 1.05, - "learning_rate": 0.00014267311311571158, - "loss": 0.0382, + "epoch": 0.63, + "learning_rate": 0.0002061199068008287, + "loss": 0.0501, "step": 96970 }, { - "epoch": 1.05, - "learning_rate": 0.00014265688883120252, - "loss": 0.0405, + "epoch": 0.63, + "learning_rate": 0.00020611022544647178, + "loss": 0.0416, "step": 96980 }, { - "epoch": 1.05, - "learning_rate": 0.00014264066454669347, - "loss": 0.0392, + "epoch": 0.63, + "learning_rate": 0.00020610054409211484, + "loss": 0.0542, "step": 96990 }, { - "epoch": 1.05, - "learning_rate": 0.00014262444026218442, - "loss": 0.038, + "epoch": 0.63, + "learning_rate": 0.0002060908627377579, + "loss": 0.0596, "step": 97000 }, { - "epoch": 1.05, - "eval_cer": 0.9212002664588712, - "eval_loss": 0.029298238456249237, - "eval_runtime": 119.3023, - "eval_samples_per_second": 16.764, - "eval_steps_per_second": 4.191, + "epoch": 0.63, + "eval_cer": 0.9199656535984635, + "eval_loss": 0.03143526241183281, + "eval_runtime": 119.7543, + "eval_samples_per_second": 16.701, + "eval_steps_per_second": 4.175, "step": 97000 }, { - "epoch": 1.05, - "learning_rate": 0.00014260821597767537, - "loss": 0.0346, + "epoch": 0.63, + "learning_rate": 0.00020608118138340097, + "loss": 0.0548, "step": 97010 }, { - "epoch": 1.05, - "learning_rate": 0.00014259199169316632, - "loss": 0.0412, + "epoch": 0.63, + "learning_rate": 0.00020607150002904405, + "loss": 0.0474, "step": 97020 }, { - "epoch": 1.05, - "learning_rate": 0.00014257576740865725, - "loss": 0.0432, + "epoch": 0.63, + "learning_rate": 0.00020606181867468713, + "loss": 0.0456, "step": 97030 }, { - "epoch": 1.05, - "learning_rate": 0.0001425595431241482, - "loss": 0.0361, + "epoch": 0.63, + "learning_rate": 0.00020605213732033018, + "loss": 0.0412, "step": 97040 }, { - "epoch": 1.05, - "learning_rate": 0.00014254331883963915, - "loss": 0.0342, + "epoch": 0.63, + "learning_rate": 0.00020604245596597326, + "loss": 0.052, "step": 97050 }, { - "epoch": 1.05, - "learning_rate": 0.0001425270945551301, - "loss": 0.0422, + "epoch": 0.63, + "learning_rate": 0.00020603277461161631, + "loss": 0.0492, "step": 97060 }, { - "epoch": 1.05, - "learning_rate": 0.00014251087027062105, - "loss": 0.0346, + "epoch": 0.63, + "learning_rate": 0.00020602309325725937, + "loss": 0.0521, "step": 97070 }, { - "epoch": 1.05, - "learning_rate": 0.000142494645986112, - "loss": 0.0383, + "epoch": 0.63, + "learning_rate": 0.00020601341190290245, + "loss": 0.0481, "step": 97080 }, { - "epoch": 1.05, - "learning_rate": 0.00014247842170160295, - "loss": 0.0404, + "epoch": 0.63, + "learning_rate": 0.00020600373054854553, + "loss": 0.05, "step": 97090 }, { - "epoch": 1.05, - "learning_rate": 0.0001424621974170939, - "loss": 0.0429, + "epoch": 0.63, + "learning_rate": 0.0002059940491941886, + "loss": 0.0501, "step": 97100 }, { - "epoch": 1.05, - "learning_rate": 0.00014244597313258484, - "loss": 0.035, + "epoch": 0.63, + "learning_rate": 0.00020598436783983166, + "loss": 0.0458, "step": 97110 }, { - "epoch": 1.05, - "learning_rate": 0.00014242974884807577, - "loss": 0.0437, + "epoch": 0.63, + "learning_rate": 0.00020597468648547474, + "loss": 0.0567, "step": 97120 }, { - "epoch": 1.05, - "learning_rate": 0.00014241352456356672, - "loss": 0.039, + "epoch": 0.63, + "learning_rate": 0.00020596500513111776, + "loss": 0.0485, "step": 97130 }, { - "epoch": 1.05, - "learning_rate": 0.00014239730027905767, - "loss": 0.0383, + "epoch": 0.63, + "learning_rate": 0.00020595532377676084, + "loss": 0.0453, "step": 97140 }, { - "epoch": 1.05, - "learning_rate": 0.00014238107599454862, - "loss": 0.0385, + "epoch": 0.63, + "learning_rate": 0.00020594564242240392, + "loss": 0.0426, "step": 97150 }, { - "epoch": 1.05, - "learning_rate": 0.00014236485171003957, - "loss": 0.037, + "epoch": 0.63, + "learning_rate": 0.000205935961068047, + "loss": 0.0449, "step": 97160 }, { - "epoch": 1.05, - "learning_rate": 0.00014234862742553052, - "loss": 0.0363, + "epoch": 0.63, + "learning_rate": 0.00020592627971369006, + "loss": 0.0394, "step": 97170 }, { - "epoch": 1.05, - "learning_rate": 0.00014233240314102147, - "loss": 0.0379, + "epoch": 0.63, + "learning_rate": 0.00020591659835933314, + "loss": 0.0435, "step": 97180 }, { - "epoch": 1.05, - "learning_rate": 0.00014231617885651242, - "loss": 0.0422, + "epoch": 0.63, + "learning_rate": 0.00020590691700497622, + "loss": 0.0556, "step": 97190 }, { - "epoch": 1.05, - "learning_rate": 0.00014229995457200337, - "loss": 0.0426, + "epoch": 0.63, + "learning_rate": 0.00020589723565061924, + "loss": 0.0482, "step": 97200 }, { - "epoch": 1.05, - "learning_rate": 0.00014228373028749432, - "loss": 0.0346, + "epoch": 0.63, + "learning_rate": 0.00020588755429626232, + "loss": 0.0484, "step": 97210 }, { - "epoch": 1.05, - "learning_rate": 0.00014226750600298524, - "loss": 0.0431, + "epoch": 0.63, + "learning_rate": 0.0002058778729419054, + "loss": 0.055, "step": 97220 }, { - "epoch": 1.05, - "learning_rate": 0.0001422512817184762, - "loss": 0.0347, + "epoch": 0.63, + "learning_rate": 0.00020586819158754848, + "loss": 0.0455, "step": 97230 }, { - "epoch": 1.05, - "learning_rate": 0.00014223505743396714, - "loss": 0.0421, + "epoch": 0.63, + "learning_rate": 0.00020585851023319153, + "loss": 0.0533, "step": 97240 }, { - "epoch": 1.05, - "learning_rate": 0.0001422188331494581, - "loss": 0.0454, + "epoch": 0.63, + "learning_rate": 0.0002058488288788346, + "loss": 0.0487, "step": 97250 }, { - "epoch": 1.05, - "learning_rate": 0.00014220260886494904, - "loss": 0.0382, + "epoch": 0.63, + "learning_rate": 0.0002058391475244777, + "loss": 0.051, "step": 97260 }, { - "epoch": 1.05, - "learning_rate": 0.00014218638458044, - "loss": 0.0382, + "epoch": 0.63, + "learning_rate": 0.00020582946617012072, + "loss": 0.0416, "step": 97270 }, { - "epoch": 1.05, - "learning_rate": 0.00014217016029593094, - "loss": 0.0364, + "epoch": 0.63, + "learning_rate": 0.0002058197848157638, + "loss": 0.0572, "step": 97280 }, { - "epoch": 1.05, - "learning_rate": 0.0001421539360114219, - "loss": 0.0413, + "epoch": 0.63, + "learning_rate": 0.00020581010346140688, + "loss": 0.05, "step": 97290 }, { - "epoch": 1.05, - "learning_rate": 0.00014213771172691284, - "loss": 0.0406, + "epoch": 0.63, + "learning_rate": 0.00020580042210704996, + "loss": 0.0443, "step": 97300 }, { - "epoch": 1.05, - "learning_rate": 0.00014212148744240376, - "loss": 0.0344, + "epoch": 0.63, + "learning_rate": 0.000205790740752693, + "loss": 0.0472, "step": 97310 }, { - "epoch": 1.05, - "learning_rate": 0.0001421052631578947, - "loss": 0.0371, + "epoch": 0.63, + "learning_rate": 0.0002057810593983361, + "loss": 0.0498, "step": 97320 }, { - "epoch": 1.05, - "learning_rate": 0.00014208903887338566, - "loss": 0.0369, + "epoch": 0.63, + "learning_rate": 0.00020577137804397917, + "loss": 0.0465, "step": 97330 }, { - "epoch": 1.05, - "learning_rate": 0.0001420728145888766, - "loss": 0.0299, + "epoch": 0.63, + "learning_rate": 0.0002057616966896222, + "loss": 0.0519, "step": 97340 }, { - "epoch": 1.05, - "learning_rate": 0.00014205659030436756, - "loss": 0.0392, + "epoch": 0.63, + "learning_rate": 0.00020575201533526528, + "loss": 0.0467, "step": 97350 }, { - "epoch": 1.05, - "learning_rate": 0.0001420403660198585, - "loss": 0.0363, + "epoch": 0.63, + "learning_rate": 0.00020574233398090836, + "loss": 0.0531, "step": 97360 }, { - "epoch": 1.05, - "learning_rate": 0.00014202414173534946, - "loss": 0.0387, + "epoch": 0.63, + "learning_rate": 0.0002057326526265514, + "loss": 0.052, "step": 97370 }, { - "epoch": 1.05, - "learning_rate": 0.0001420079174508404, - "loss": 0.0373, + "epoch": 0.63, + "learning_rate": 0.0002057229712721945, + "loss": 0.0476, "step": 97380 }, { - "epoch": 1.05, - "learning_rate": 0.00014199169316633136, - "loss": 0.0398, + "epoch": 0.63, + "learning_rate": 0.00020571328991783757, + "loss": 0.0519, "step": 97390 }, { - "epoch": 1.05, - "learning_rate": 0.0001419754688818223, - "loss": 0.0348, + "epoch": 0.63, + "learning_rate": 0.00020570360856348065, + "loss": 0.0399, "step": 97400 }, { - "epoch": 1.05, - "learning_rate": 0.00014195924459731326, - "loss": 0.0407, + "epoch": 0.63, + "learning_rate": 0.00020569392720912367, + "loss": 0.0501, "step": 97410 }, { - "epoch": 1.05, - "learning_rate": 0.0001419430203128042, - "loss": 0.0351, + "epoch": 0.63, + "learning_rate": 0.00020568424585476675, + "loss": 0.0435, "step": 97420 }, { - "epoch": 1.05, - "learning_rate": 0.00014192679602829516, - "loss": 0.0331, + "epoch": 0.63, + "learning_rate": 0.00020567456450040983, + "loss": 0.0456, "step": 97430 }, { - "epoch": 1.05, - "learning_rate": 0.0001419105717437861, - "loss": 0.0338, + "epoch": 0.63, + "learning_rate": 0.00020566488314605289, + "loss": 0.0445, "step": 97440 }, { - "epoch": 1.05, - "learning_rate": 0.00014189434745927703, - "loss": 0.0402, + "epoch": 0.63, + "learning_rate": 0.00020565520179169596, + "loss": 0.0452, "step": 97450 }, { - "epoch": 1.05, - "learning_rate": 0.00014187812317476798, - "loss": 0.0389, + "epoch": 0.63, + "learning_rate": 0.00020564552043733904, + "loss": 0.0524, "step": 97460 }, { - "epoch": 1.05, - "learning_rate": 0.00014186189889025893, - "loss": 0.0335, + "epoch": 0.63, + "learning_rate": 0.00020563583908298212, + "loss": 0.0454, "step": 97470 }, { - "epoch": 1.05, - "learning_rate": 0.00014184567460574988, - "loss": 0.0296, + "epoch": 0.63, + "learning_rate": 0.00020562615772862515, + "loss": 0.0461, "step": 97480 }, { - "epoch": 1.05, - "learning_rate": 0.00014182945032124083, - "loss": 0.0423, + "epoch": 0.63, + "learning_rate": 0.00020561647637426823, + "loss": 0.0425, "step": 97490 }, { - "epoch": 1.05, - "learning_rate": 0.00014181322603673178, - "loss": 0.0347, + "epoch": 0.63, + "learning_rate": 0.0002056067950199113, + "loss": 0.047, "step": 97500 }, { - "epoch": 1.05, - "learning_rate": 0.00014179700175222273, - "loss": 0.035, + "epoch": 0.63, + "learning_rate": 0.00020559711366555436, + "loss": 0.0455, "step": 97510 }, { - "epoch": 1.05, - "learning_rate": 0.00014178077746771368, - "loss": 0.0336, + "epoch": 0.63, + "learning_rate": 0.00020558743231119744, + "loss": 0.0613, "step": 97520 }, { - "epoch": 1.05, - "learning_rate": 0.00014176455318320463, - "loss": 0.0322, + "epoch": 0.63, + "learning_rate": 0.00020557775095684052, + "loss": 0.0464, "step": 97530 }, { - "epoch": 1.06, - "learning_rate": 0.00014174832889869555, - "loss": 0.0363, + "epoch": 0.63, + "learning_rate": 0.00020556806960248357, + "loss": 0.0572, "step": 97540 }, { - "epoch": 1.06, - "learning_rate": 0.0001417321046141865, - "loss": 0.0353, + "epoch": 0.63, + "learning_rate": 0.00020555838824812663, + "loss": 0.0429, "step": 97550 }, { - "epoch": 1.06, - "learning_rate": 0.00014171588032967745, - "loss": 0.0359, + "epoch": 0.63, + "learning_rate": 0.0002055487068937697, + "loss": 0.0461, "step": 97560 }, { - "epoch": 1.06, - "learning_rate": 0.0001416996560451684, - "loss": 0.0344, + "epoch": 0.63, + "learning_rate": 0.00020553902553941276, + "loss": 0.0505, "step": 97570 }, { - "epoch": 1.06, - "learning_rate": 0.00014168343176065935, - "loss": 0.0404, + "epoch": 0.63, + "learning_rate": 0.00020552934418505584, + "loss": 0.0502, "step": 97580 }, { - "epoch": 1.06, - "learning_rate": 0.0001416672074761503, - "loss": 0.033, + "epoch": 0.63, + "learning_rate": 0.00020551966283069892, + "loss": 0.0458, "step": 97590 }, { - "epoch": 1.06, - "learning_rate": 0.00014165098319164125, - "loss": 0.0369, + "epoch": 0.63, + "learning_rate": 0.000205509981476342, + "loss": 0.0481, "step": 97600 }, { - "epoch": 1.06, - "learning_rate": 0.0001416347589071322, - "loss": 0.0399, + "epoch": 0.63, + "learning_rate": 0.00020550030012198505, + "loss": 0.0472, "step": 97610 }, { - "epoch": 1.06, - "learning_rate": 0.00014161853462262315, - "loss": 0.0444, + "epoch": 0.63, + "learning_rate": 0.0002054906187676281, + "loss": 0.0531, "step": 97620 }, { - "epoch": 1.06, - "learning_rate": 0.00014160231033811407, - "loss": 0.0364, + "epoch": 0.63, + "learning_rate": 0.00020548093741327118, + "loss": 0.0597, "step": 97630 }, { - "epoch": 1.06, - "learning_rate": 0.00014158608605360502, - "loss": 0.0389, + "epoch": 0.63, + "learning_rate": 0.00020547125605891424, + "loss": 0.045, "step": 97640 }, { - "epoch": 1.06, - "learning_rate": 0.00014156986176909597, - "loss": 0.0392, + "epoch": 0.63, + "learning_rate": 0.00020546157470455732, + "loss": 0.0601, "step": 97650 }, { - "epoch": 1.06, - "learning_rate": 0.00014155363748458692, - "loss": 0.0401, + "epoch": 0.63, + "learning_rate": 0.0002054518933502004, + "loss": 0.0496, "step": 97660 }, { - "epoch": 1.06, - "learning_rate": 0.00014153741320007787, - "loss": 0.0342, + "epoch": 0.63, + "learning_rate": 0.00020544221199584348, + "loss": 0.0511, "step": 97670 }, { - "epoch": 1.06, - "learning_rate": 0.00014152118891556882, - "loss": 0.0319, + "epoch": 0.63, + "learning_rate": 0.00020543253064148653, + "loss": 0.049, "step": 97680 }, { - "epoch": 1.06, - "learning_rate": 0.00014150496463105977, - "loss": 0.0332, + "epoch": 0.63, + "learning_rate": 0.00020542284928712958, + "loss": 0.0469, "step": 97690 }, { - "epoch": 1.06, - "learning_rate": 0.00014148874034655072, - "loss": 0.0447, + "epoch": 0.63, + "learning_rate": 0.00020541316793277266, + "loss": 0.0496, "step": 97700 }, { - "epoch": 1.06, - "learning_rate": 0.00014147251606204167, - "loss": 0.0425, + "epoch": 0.63, + "learning_rate": 0.00020540348657841571, + "loss": 0.0507, "step": 97710 }, { - "epoch": 1.06, - "learning_rate": 0.0001414562917775326, - "loss": 0.0378, + "epoch": 0.63, + "learning_rate": 0.0002053938052240588, + "loss": 0.0453, "step": 97720 }, { - "epoch": 1.06, - "learning_rate": 0.00014144006749302354, - "loss": 0.0366, + "epoch": 0.63, + "learning_rate": 0.00020538412386970187, + "loss": 0.0446, "step": 97730 }, { - "epoch": 1.06, - "learning_rate": 0.0001414238432085145, - "loss": 0.0311, + "epoch": 0.63, + "learning_rate": 0.00020537444251534493, + "loss": 0.0486, "step": 97740 }, { - "epoch": 1.06, - "learning_rate": 0.00014140761892400544, - "loss": 0.0371, + "epoch": 0.63, + "learning_rate": 0.000205364761160988, + "loss": 0.0488, "step": 97750 }, { - "epoch": 1.06, - "learning_rate": 0.0001413913946394964, - "loss": 0.0353, + "epoch": 0.63, + "learning_rate": 0.00020535507980663106, + "loss": 0.0445, "step": 97760 }, { - "epoch": 1.06, - "learning_rate": 0.00014137517035498734, - "loss": 0.036, + "epoch": 0.63, + "learning_rate": 0.0002053453984522741, + "loss": 0.0518, "step": 97770 }, { - "epoch": 1.06, - "learning_rate": 0.0001413589460704783, - "loss": 0.0334, + "epoch": 0.63, + "learning_rate": 0.0002053357170979172, + "loss": 0.0543, "step": 97780 }, { - "epoch": 1.06, - "learning_rate": 0.00014134272178596924, - "loss": 0.0359, + "epoch": 0.63, + "learning_rate": 0.00020532603574356027, + "loss": 0.0393, "step": 97790 }, { - "epoch": 1.06, - "learning_rate": 0.0001413264975014602, - "loss": 0.0342, + "epoch": 0.63, + "learning_rate": 0.00020531635438920335, + "loss": 0.0579, "step": 97800 }, { - "epoch": 1.06, - "learning_rate": 0.0001413102732169511, - "loss": 0.0381, + "epoch": 0.63, + "learning_rate": 0.0002053066730348464, + "loss": 0.0514, "step": 97810 }, { - "epoch": 1.06, - "learning_rate": 0.00014129404893244206, - "loss": 0.0391, + "epoch": 0.63, + "learning_rate": 0.00020529699168048948, + "loss": 0.0494, "step": 97820 }, { - "epoch": 1.06, - "learning_rate": 0.000141277824647933, - "loss": 0.0367, + "epoch": 0.63, + "learning_rate": 0.00020528731032613254, + "loss": 0.0472, "step": 97830 }, { - "epoch": 1.06, - "learning_rate": 0.00014126160036342396, - "loss": 0.0308, + "epoch": 0.63, + "learning_rate": 0.0002052776289717756, + "loss": 0.0454, "step": 97840 }, { - "epoch": 1.06, - "learning_rate": 0.0001412453760789149, - "loss": 0.0334, + "epoch": 0.63, + "learning_rate": 0.00020526794761741867, + "loss": 0.0432, "step": 97850 }, { - "epoch": 1.06, - "learning_rate": 0.00014122915179440586, - "loss": 0.0341, + "epoch": 0.63, + "learning_rate": 0.00020525826626306175, + "loss": 0.0518, "step": 97860 }, { - "epoch": 1.06, - "learning_rate": 0.0001412129275098968, - "loss": 0.0331, + "epoch": 0.63, + "learning_rate": 0.00020524858490870483, + "loss": 0.0429, "step": 97870 }, { - "epoch": 1.06, - "learning_rate": 0.00014119670322538776, - "loss": 0.0358, + "epoch": 0.63, + "learning_rate": 0.00020523890355434788, + "loss": 0.0499, "step": 97880 }, { - "epoch": 1.06, - "learning_rate": 0.0001411804789408787, - "loss": 0.0428, + "epoch": 0.63, + "learning_rate": 0.00020522922219999096, + "loss": 0.0494, "step": 97890 }, { - "epoch": 1.06, - "learning_rate": 0.00014116425465636966, - "loss": 0.0365, + "epoch": 0.63, + "learning_rate": 0.000205219540845634, + "loss": 0.0502, "step": 97900 }, { - "epoch": 1.06, - "learning_rate": 0.00014114803037186058, - "loss": 0.0373, + "epoch": 0.63, + "learning_rate": 0.00020520985949127707, + "loss": 0.0528, "step": 97910 }, { - "epoch": 1.06, - "learning_rate": 0.00014113180608735153, - "loss": 0.0369, + "epoch": 0.63, + "learning_rate": 0.00020520017813692015, + "loss": 0.0549, "step": 97920 }, { - "epoch": 1.06, - "learning_rate": 0.00014111558180284248, - "loss": 0.0381, + "epoch": 0.63, + "learning_rate": 0.00020519049678256323, + "loss": 0.0453, "step": 97930 }, { - "epoch": 1.06, - "learning_rate": 0.00014109935751833343, - "loss": 0.0293, + "epoch": 0.63, + "learning_rate": 0.00020518081542820628, + "loss": 0.0441, "step": 97940 }, { - "epoch": 1.06, - "learning_rate": 0.00014108313323382438, - "loss": 0.0349, + "epoch": 0.63, + "learning_rate": 0.00020517113407384936, + "loss": 0.043, "step": 97950 }, { - "epoch": 1.06, - "learning_rate": 0.00014106690894931533, - "loss": 0.0337, + "epoch": 0.63, + "learning_rate": 0.00020516145271949244, + "loss": 0.0487, "step": 97960 }, { - "epoch": 1.06, - "learning_rate": 0.00014105068466480628, - "loss": 0.0366, + "epoch": 0.63, + "learning_rate": 0.00020515177136513546, + "loss": 0.0453, "step": 97970 }, { - "epoch": 1.06, - "learning_rate": 0.00014103446038029723, - "loss": 0.0348, + "epoch": 0.63, + "learning_rate": 0.00020514209001077854, + "loss": 0.0484, "step": 97980 }, { - "epoch": 1.06, - "learning_rate": 0.00014101823609578818, - "loss": 0.0365, + "epoch": 0.63, + "learning_rate": 0.00020513240865642162, + "loss": 0.0405, "step": 97990 }, { - "epoch": 1.06, - "learning_rate": 0.0001410020118112791, - "loss": 0.0346, + "epoch": 0.63, + "learning_rate": 0.0002051227273020647, + "loss": 0.0449, "step": 98000 }, { - "epoch": 1.06, - "eval_cer": 0.9211843637410967, - "eval_loss": 0.028429720550775528, - "eval_runtime": 118.8211, - "eval_samples_per_second": 16.832, - "eval_steps_per_second": 4.208, + "epoch": 0.63, + "eval_cer": 0.920000903852672, + "eval_loss": 0.03220009431242943, + "eval_runtime": 120.0197, + "eval_samples_per_second": 16.664, + "eval_steps_per_second": 4.166, "step": 98000 }, { - "epoch": 1.06, - "learning_rate": 0.00014098578752677005, - "loss": 0.0411, + "epoch": 0.63, + "learning_rate": 0.00020511304594770776, + "loss": 0.043, "step": 98010 }, { - "epoch": 1.06, - "learning_rate": 0.000140969563242261, - "loss": 0.0418, + "epoch": 0.63, + "learning_rate": 0.00020510336459335084, + "loss": 0.0485, "step": 98020 }, { - "epoch": 1.06, - "learning_rate": 0.00014095333895775195, - "loss": 0.0347, + "epoch": 0.63, + "learning_rate": 0.00020509368323899392, + "loss": 0.0456, "step": 98030 }, { - "epoch": 1.06, - "learning_rate": 0.0001409371146732429, - "loss": 0.0379, + "epoch": 0.63, + "learning_rate": 0.00020508400188463694, + "loss": 0.0481, "step": 98040 }, { - "epoch": 1.06, - "learning_rate": 0.00014092089038873385, - "loss": 0.0351, + "epoch": 0.63, + "learning_rate": 0.00020507432053028002, + "loss": 0.0455, "step": 98050 }, { - "epoch": 1.06, - "learning_rate": 0.0001409046661042248, - "loss": 0.0406, + "epoch": 0.63, + "learning_rate": 0.0002050646391759231, + "loss": 0.0482, "step": 98060 }, { - "epoch": 1.06, - "learning_rate": 0.00014088844181971575, - "loss": 0.0392, + "epoch": 0.63, + "learning_rate": 0.00020505495782156618, + "loss": 0.0381, "step": 98070 }, { - "epoch": 1.06, - "learning_rate": 0.0001408722175352067, - "loss": 0.0393, + "epoch": 0.63, + "learning_rate": 0.00020504527646720923, + "loss": 0.0417, "step": 98080 }, { - "epoch": 1.06, - "learning_rate": 0.00014085599325069762, - "loss": 0.0356, + "epoch": 0.63, + "learning_rate": 0.0002050355951128523, + "loss": 0.0404, "step": 98090 }, { - "epoch": 1.06, - "learning_rate": 0.00014083976896618857, - "loss": 0.0362, + "epoch": 0.63, + "learning_rate": 0.0002050259137584954, + "loss": 0.0457, "step": 98100 }, { - "epoch": 1.06, - "learning_rate": 0.00014082354468167952, - "loss": 0.0365, + "epoch": 0.63, + "learning_rate": 0.00020501623240413842, + "loss": 0.0467, "step": 98110 }, { - "epoch": 1.06, - "learning_rate": 0.00014080732039717047, - "loss": 0.0394, + "epoch": 0.63, + "learning_rate": 0.0002050065510497815, + "loss": 0.052, "step": 98120 }, { - "epoch": 1.06, - "learning_rate": 0.00014079109611266142, - "loss": 0.0373, + "epoch": 0.63, + "learning_rate": 0.00020499686969542458, + "loss": 0.0446, "step": 98130 }, { - "epoch": 1.06, - "learning_rate": 0.00014077487182815237, - "loss": 0.0355, + "epoch": 0.63, + "learning_rate": 0.00020498718834106763, + "loss": 0.0449, "step": 98140 }, { - "epoch": 1.06, - "learning_rate": 0.00014075864754364332, - "loss": 0.0327, + "epoch": 0.63, + "learning_rate": 0.0002049775069867107, + "loss": 0.0481, "step": 98150 }, { - "epoch": 1.06, - "learning_rate": 0.00014074242325913427, - "loss": 0.0402, + "epoch": 0.63, + "learning_rate": 0.0002049678256323538, + "loss": 0.0447, "step": 98160 }, { - "epoch": 1.06, - "learning_rate": 0.00014072619897462522, - "loss": 0.037, + "epoch": 0.63, + "learning_rate": 0.00020495814427799687, + "loss": 0.0543, "step": 98170 }, { - "epoch": 1.06, - "learning_rate": 0.00014070997469011615, - "loss": 0.0321, + "epoch": 0.63, + "learning_rate": 0.0002049484629236399, + "loss": 0.0556, "step": 98180 }, { - "epoch": 1.06, - "learning_rate": 0.0001406937504056071, - "loss": 0.0399, + "epoch": 0.63, + "learning_rate": 0.00020493878156928297, + "loss": 0.0458, "step": 98190 }, { - "epoch": 1.06, - "learning_rate": 0.00014067752612109804, - "loss": 0.0304, + "epoch": 0.63, + "learning_rate": 0.00020492910021492605, + "loss": 0.0418, "step": 98200 }, { - "epoch": 1.06, - "learning_rate": 0.000140661301836589, - "loss": 0.0343, + "epoch": 0.63, + "learning_rate": 0.0002049194188605691, + "loss": 0.049, "step": 98210 }, { - "epoch": 1.06, - "learning_rate": 0.00014064507755207994, - "loss": 0.04, + "epoch": 0.63, + "learning_rate": 0.0002049097375062122, + "loss": 0.0488, "step": 98220 }, { - "epoch": 1.06, - "learning_rate": 0.0001406288532675709, - "loss": 0.0367, + "epoch": 0.63, + "learning_rate": 0.00020490005615185527, + "loss": 0.0489, "step": 98230 }, { - "epoch": 1.06, - "learning_rate": 0.00014061262898306184, - "loss": 0.0396, + "epoch": 0.63, + "learning_rate": 0.00020489037479749835, + "loss": 0.0493, "step": 98240 }, { - "epoch": 1.06, - "learning_rate": 0.0001405964046985528, - "loss": 0.0451, + "epoch": 0.63, + "learning_rate": 0.00020488069344314137, + "loss": 0.0485, "step": 98250 }, { - "epoch": 1.06, - "learning_rate": 0.00014058018041404374, - "loss": 0.0408, + "epoch": 0.63, + "learning_rate": 0.00020487101208878445, + "loss": 0.0517, "step": 98260 }, { - "epoch": 1.06, - "learning_rate": 0.00014056395612953467, - "loss": 0.0354, + "epoch": 0.63, + "learning_rate": 0.00020486133073442753, + "loss": 0.0428, "step": 98270 }, { - "epoch": 1.06, - "learning_rate": 0.00014054773184502562, - "loss": 0.0357, + "epoch": 0.63, + "learning_rate": 0.00020485164938007058, + "loss": 0.0493, "step": 98280 }, { - "epoch": 1.06, - "learning_rate": 0.00014053150756051657, - "loss": 0.0409, + "epoch": 0.63, + "learning_rate": 0.00020484196802571366, + "loss": 0.0418, "step": 98290 }, { - "epoch": 1.06, - "learning_rate": 0.00014051528327600752, - "loss": 0.0334, + "epoch": 0.63, + "learning_rate": 0.00020483228667135674, + "loss": 0.0514, "step": 98300 }, { - "epoch": 1.06, - "learning_rate": 0.00014049905899149846, - "loss": 0.0388, + "epoch": 0.63, + "learning_rate": 0.00020482260531699982, + "loss": 0.0442, "step": 98310 }, { - "epoch": 1.06, - "learning_rate": 0.00014048283470698941, - "loss": 0.0396, + "epoch": 0.63, + "learning_rate": 0.00020481292396264285, + "loss": 0.05, "step": 98320 }, { - "epoch": 1.06, - "learning_rate": 0.00014046661042248036, - "loss": 0.0385, + "epoch": 0.63, + "learning_rate": 0.00020480324260828593, + "loss": 0.0453, "step": 98330 }, { - "epoch": 1.06, - "learning_rate": 0.00014045038613797131, - "loss": 0.0417, + "epoch": 0.63, + "learning_rate": 0.00020479356125392898, + "loss": 0.0429, "step": 98340 }, { - "epoch": 1.06, - "learning_rate": 0.00014043416185346226, - "loss": 0.0444, + "epoch": 0.63, + "learning_rate": 0.00020478387989957206, + "loss": 0.0461, "step": 98350 }, { - "epoch": 1.06, - "learning_rate": 0.0001404179375689532, - "loss": 0.0425, + "epoch": 0.63, + "learning_rate": 0.00020477419854521514, + "loss": 0.0458, "step": 98360 }, { - "epoch": 1.06, - "learning_rate": 0.00014040171328444414, - "loss": 0.0364, + "epoch": 0.63, + "learning_rate": 0.00020476451719085822, + "loss": 0.045, "step": 98370 }, { - "epoch": 1.06, - "learning_rate": 0.00014038548899993509, - "loss": 0.0328, + "epoch": 0.63, + "learning_rate": 0.00020475483583650127, + "loss": 0.0465, "step": 98380 }, { - "epoch": 1.06, - "learning_rate": 0.00014036926471542604, - "loss": 0.0329, + "epoch": 0.64, + "learning_rate": 0.00020474515448214433, + "loss": 0.0466, "step": 98390 }, { - "epoch": 1.06, - "learning_rate": 0.00014035304043091699, - "loss": 0.0346, + "epoch": 0.64, + "learning_rate": 0.0002047354731277874, + "loss": 0.0434, "step": 98400 }, { - "epoch": 1.06, - "learning_rate": 0.00014033681614640794, - "loss": 0.036, + "epoch": 0.64, + "learning_rate": 0.00020472579177343046, + "loss": 0.0447, "step": 98410 }, { - "epoch": 1.06, - "learning_rate": 0.00014032059186189889, - "loss": 0.0434, + "epoch": 0.64, + "learning_rate": 0.00020471611041907354, + "loss": 0.0483, "step": 98420 }, { - "epoch": 1.06, - "learning_rate": 0.00014030436757738984, - "loss": 0.0417, + "epoch": 0.64, + "learning_rate": 0.00020470642906471662, + "loss": 0.0509, "step": 98430 }, { - "epoch": 1.06, - "learning_rate": 0.00014028814329288078, - "loss": 0.0281, + "epoch": 0.64, + "learning_rate": 0.0002046967477103597, + "loss": 0.0433, "step": 98440 }, { - "epoch": 1.06, - "learning_rate": 0.0001402719190083717, - "loss": 0.0338, + "epoch": 0.64, + "learning_rate": 0.00020468706635600275, + "loss": 0.0487, "step": 98450 }, { - "epoch": 1.06, - "learning_rate": 0.00014025569472386266, - "loss": 0.0399, + "epoch": 0.64, + "learning_rate": 0.0002046773850016458, + "loss": 0.0474, "step": 98460 }, { - "epoch": 1.07, - "learning_rate": 0.0001402394704393536, - "loss": 0.037, + "epoch": 0.64, + "learning_rate": 0.00020466770364728888, + "loss": 0.0533, "step": 98470 }, { - "epoch": 1.07, - "learning_rate": 0.00014022324615484456, - "loss": 0.0419, + "epoch": 0.64, + "learning_rate": 0.00020465802229293194, + "loss": 0.0476, "step": 98480 }, { - "epoch": 1.07, - "learning_rate": 0.0001402070218703355, - "loss": 0.0361, + "epoch": 0.64, + "learning_rate": 0.00020464834093857502, + "loss": 0.0491, "step": 98490 }, { - "epoch": 1.07, - "learning_rate": 0.00014019079758582646, - "loss": 0.0341, + "epoch": 0.64, + "learning_rate": 0.0002046386595842181, + "loss": 0.0455, "step": 98500 }, { - "epoch": 1.07, - "learning_rate": 0.0001401745733013174, - "loss": 0.0357, + "epoch": 0.64, + "learning_rate": 0.00020462897822986118, + "loss": 0.0526, "step": 98510 }, { - "epoch": 1.07, - "learning_rate": 0.00014015834901680836, - "loss": 0.0282, + "epoch": 0.64, + "learning_rate": 0.00020461929687550423, + "loss": 0.0479, "step": 98520 }, { - "epoch": 1.07, - "learning_rate": 0.0001401421247322993, - "loss": 0.0454, + "epoch": 0.64, + "learning_rate": 0.00020460961552114728, + "loss": 0.0476, "step": 98530 }, { - "epoch": 1.07, - "learning_rate": 0.00014012590044779023, - "loss": 0.0366, + "epoch": 0.64, + "learning_rate": 0.00020459993416679033, + "loss": 0.0516, "step": 98540 }, { - "epoch": 1.07, - "learning_rate": 0.00014010967616328118, - "loss": 0.0389, + "epoch": 0.64, + "learning_rate": 0.00020459025281243341, + "loss": 0.0484, "step": 98550 }, { - "epoch": 1.07, - "learning_rate": 0.00014009345187877213, - "loss": 0.036, + "epoch": 0.64, + "learning_rate": 0.0002045805714580765, + "loss": 0.0525, "step": 98560 }, { - "epoch": 1.07, - "learning_rate": 0.00014007722759426308, - "loss": 0.0401, + "epoch": 0.64, + "learning_rate": 0.00020457089010371957, + "loss": 0.0496, "step": 98570 }, { - "epoch": 1.07, - "learning_rate": 0.00014006100330975403, - "loss": 0.0384, + "epoch": 0.64, + "learning_rate": 0.00020456120874936263, + "loss": 0.0442, "step": 98580 }, { - "epoch": 1.07, - "learning_rate": 0.00014004477902524498, - "loss": 0.0377, + "epoch": 0.64, + "learning_rate": 0.0002045515273950057, + "loss": 0.0482, "step": 98590 }, { - "epoch": 1.07, - "learning_rate": 0.00014002855474073593, - "loss": 0.0446, + "epoch": 0.64, + "learning_rate": 0.00020454184604064876, + "loss": 0.0488, "step": 98600 }, { - "epoch": 1.07, - "learning_rate": 0.00014001233045622688, - "loss": 0.0337, + "epoch": 0.64, + "learning_rate": 0.0002045321646862918, + "loss": 0.0519, "step": 98610 }, { - "epoch": 1.07, - "learning_rate": 0.00013999610617171783, - "loss": 0.0309, + "epoch": 0.64, + "learning_rate": 0.0002045224833319349, + "loss": 0.05, "step": 98620 }, { - "epoch": 1.07, - "learning_rate": 0.00013997988188720875, - "loss": 0.0383, + "epoch": 0.64, + "learning_rate": 0.00020451280197757797, + "loss": 0.0433, "step": 98630 }, { - "epoch": 1.07, - "learning_rate": 0.0001399636576026997, - "loss": 0.0344, - "step": 98640 + "epoch": 0.64, + "learning_rate": 0.00020450312062322105, + "loss": 0.0445, + "step": 98640 }, { - "epoch": 1.07, - "learning_rate": 0.00013994743331819065, - "loss": 0.0438, + "epoch": 0.64, + "learning_rate": 0.0002044934392688641, + "loss": 0.048, "step": 98650 }, { - "epoch": 1.07, - "learning_rate": 0.0001399312090336816, - "loss": 0.0382, + "epoch": 0.64, + "learning_rate": 0.00020448375791450718, + "loss": 0.0476, "step": 98660 }, { - "epoch": 1.07, - "learning_rate": 0.00013991498474917255, - "loss": 0.0384, + "epoch": 0.64, + "learning_rate": 0.00020447407656015024, + "loss": 0.0441, "step": 98670 }, { - "epoch": 1.07, - "learning_rate": 0.0001398987604646635, - "loss": 0.0397, + "epoch": 0.64, + "learning_rate": 0.0002044643952057933, + "loss": 0.0441, "step": 98680 }, { - "epoch": 1.07, - "learning_rate": 0.00013988253618015445, - "loss": 0.0355, + "epoch": 0.64, + "learning_rate": 0.00020445471385143637, + "loss": 0.0404, "step": 98690 }, { - "epoch": 1.07, - "learning_rate": 0.0001398663118956454, - "loss": 0.0323, + "epoch": 0.64, + "learning_rate": 0.00020444503249707945, + "loss": 0.0442, "step": 98700 }, { - "epoch": 1.07, - "learning_rate": 0.00013985008761113635, - "loss": 0.0388, + "epoch": 0.64, + "learning_rate": 0.00020443535114272253, + "loss": 0.0461, "step": 98710 }, { - "epoch": 1.07, - "learning_rate": 0.00013983386332662727, - "loss": 0.0417, + "epoch": 0.64, + "learning_rate": 0.00020442566978836558, + "loss": 0.0492, "step": 98720 }, { - "epoch": 1.07, - "learning_rate": 0.00013981763904211822, - "loss": 0.0403, + "epoch": 0.64, + "learning_rate": 0.00020441598843400866, + "loss": 0.0456, "step": 98730 }, { - "epoch": 1.07, - "learning_rate": 0.00013980141475760917, - "loss": 0.0355, + "epoch": 0.64, + "learning_rate": 0.00020440630707965169, + "loss": 0.0501, "step": 98740 }, { - "epoch": 1.07, - "learning_rate": 0.00013978519047310012, - "loss": 0.0384, + "epoch": 0.64, + "learning_rate": 0.00020439662572529477, + "loss": 0.0418, "step": 98750 }, { - "epoch": 1.07, - "learning_rate": 0.00013976896618859107, - "loss": 0.0335, + "epoch": 0.64, + "learning_rate": 0.00020438694437093785, + "loss": 0.0413, "step": 98760 }, { - "epoch": 1.07, - "learning_rate": 0.00013975274190408202, - "loss": 0.0402, + "epoch": 0.64, + "learning_rate": 0.00020437726301658093, + "loss": 0.0482, "step": 98770 }, { - "epoch": 1.07, - "learning_rate": 0.00013973651761957297, - "loss": 0.0432, + "epoch": 0.64, + "learning_rate": 0.00020436758166222398, + "loss": 0.0524, "step": 98780 }, { - "epoch": 1.07, - "learning_rate": 0.00013972029333506392, - "loss": 0.0309, + "epoch": 0.64, + "learning_rate": 0.00020435790030786706, + "loss": 0.0442, "step": 98790 }, { - "epoch": 1.07, - "learning_rate": 0.00013970406905055487, - "loss": 0.0371, + "epoch": 0.64, + "learning_rate": 0.00020434821895351014, + "loss": 0.051, "step": 98800 }, { - "epoch": 1.07, - "learning_rate": 0.0001396878447660458, - "loss": 0.0425, + "epoch": 0.64, + "learning_rate": 0.00020433853759915316, + "loss": 0.0427, "step": 98810 }, { - "epoch": 1.07, - "learning_rate": 0.00013967162048153674, - "loss": 0.0408, + "epoch": 0.64, + "learning_rate": 0.00020432885624479624, + "loss": 0.0445, "step": 98820 }, { - "epoch": 1.07, - "learning_rate": 0.0001396553961970277, - "loss": 0.0362, + "epoch": 0.64, + "learning_rate": 0.00020431917489043932, + "loss": 0.0493, "step": 98830 }, { - "epoch": 1.07, - "learning_rate": 0.00013963917191251864, - "loss": 0.0442, + "epoch": 0.64, + "learning_rate": 0.0002043094935360824, + "loss": 0.0458, "step": 98840 }, { - "epoch": 1.07, - "learning_rate": 0.0001396229476280096, - "loss": 0.0324, + "epoch": 0.64, + "learning_rate": 0.00020429981218172546, + "loss": 0.0565, "step": 98850 }, { - "epoch": 1.07, - "learning_rate": 0.00013960672334350054, - "loss": 0.0384, + "epoch": 0.64, + "learning_rate": 0.00020429013082736853, + "loss": 0.054, "step": 98860 }, { - "epoch": 1.07, - "learning_rate": 0.0001395904990589915, - "loss": 0.0349, + "epoch": 0.64, + "learning_rate": 0.00020428044947301161, + "loss": 0.046, "step": 98870 }, { - "epoch": 1.07, - "learning_rate": 0.00013957427477448244, - "loss": 0.0316, + "epoch": 0.64, + "learning_rate": 0.00020427076811865464, + "loss": 0.0451, "step": 98880 }, { - "epoch": 1.07, - "learning_rate": 0.0001395580504899734, - "loss": 0.0372, + "epoch": 0.64, + "learning_rate": 0.00020426108676429772, + "loss": 0.0492, "step": 98890 }, { - "epoch": 1.07, - "learning_rate": 0.0001395418262054643, - "loss": 0.0318, + "epoch": 0.64, + "learning_rate": 0.0002042514054099408, + "loss": 0.0461, "step": 98900 }, { - "epoch": 1.07, - "learning_rate": 0.00013952560192095526, - "loss": 0.0351, + "epoch": 0.64, + "learning_rate": 0.00020424172405558388, + "loss": 0.047, "step": 98910 }, { - "epoch": 1.07, - "learning_rate": 0.0001395093776364462, - "loss": 0.0344, + "epoch": 0.64, + "learning_rate": 0.00020423204270122693, + "loss": 0.0456, "step": 98920 }, { - "epoch": 1.07, - "learning_rate": 0.00013949315335193716, - "loss": 0.0386, + "epoch": 0.64, + "learning_rate": 0.00020422236134687, + "loss": 0.0457, "step": 98930 }, { - "epoch": 1.07, - "learning_rate": 0.0001394769290674281, - "loss": 0.0408, + "epoch": 0.64, + "learning_rate": 0.0002042126799925131, + "loss": 0.0439, "step": 98940 }, { - "epoch": 1.07, - "learning_rate": 0.00013946070478291906, - "loss": 0.037, + "epoch": 0.64, + "learning_rate": 0.00020420299863815612, + "loss": 0.0442, "step": 98950 }, { - "epoch": 1.07, - "learning_rate": 0.00013944448049841, - "loss": 0.0386, + "epoch": 0.64, + "learning_rate": 0.0002041933172837992, + "loss": 0.0476, "step": 98960 }, { - "epoch": 1.07, - "learning_rate": 0.00013942825621390096, - "loss": 0.0311, + "epoch": 0.64, + "learning_rate": 0.00020418363592944228, + "loss": 0.0525, "step": 98970 }, { - "epoch": 1.07, - "learning_rate": 0.0001394120319293919, - "loss": 0.0309, + "epoch": 0.64, + "learning_rate": 0.00020417395457508533, + "loss": 0.0444, "step": 98980 }, { - "epoch": 1.07, - "learning_rate": 0.00013939580764488283, - "loss": 0.0393, + "epoch": 0.64, + "learning_rate": 0.0002041642732207284, + "loss": 0.0536, "step": 98990 }, { - "epoch": 1.07, - "learning_rate": 0.00013937958336037378, - "loss": 0.0357, + "epoch": 0.64, + "learning_rate": 0.0002041545918663715, + "loss": 0.041, "step": 99000 }, { - "epoch": 1.07, - "eval_cer": 0.9211622766330766, - "eval_loss": 0.028519801795482635, - "eval_runtime": 118.9736, - "eval_samples_per_second": 16.81, - "eval_steps_per_second": 4.203, + "epoch": 0.64, + "eval_cer": 0.9199168455541746, + "eval_loss": 0.031374961137771606, + "eval_runtime": 119.7911, + "eval_samples_per_second": 16.696, + "eval_steps_per_second": 4.174, "step": 99000 }, { - "epoch": 1.07, - "learning_rate": 0.00013936335907586473, - "loss": 0.0341, + "epoch": 0.64, + "learning_rate": 0.00020414491051201457, + "loss": 0.0421, "step": 99010 }, { - "epoch": 1.07, - "learning_rate": 0.00013934713479135568, - "loss": 0.0381, + "epoch": 0.64, + "learning_rate": 0.0002041352291576576, + "loss": 0.052, "step": 99020 }, { - "epoch": 1.07, - "learning_rate": 0.00013933091050684663, - "loss": 0.0327, + "epoch": 0.64, + "learning_rate": 0.00020412554780330067, + "loss": 0.055, "step": 99030 }, { - "epoch": 1.07, - "learning_rate": 0.00013931468622233758, - "loss": 0.0333, + "epoch": 0.64, + "learning_rate": 0.00020411586644894375, + "loss": 0.0496, "step": 99040 }, { - "epoch": 1.07, - "learning_rate": 0.00013929846193782853, - "loss": 0.0371, + "epoch": 0.64, + "learning_rate": 0.0002041061850945868, + "loss": 0.0434, "step": 99050 }, { - "epoch": 1.07, - "learning_rate": 0.00013928223765331948, - "loss": 0.0382, + "epoch": 0.64, + "learning_rate": 0.0002040965037402299, + "loss": 0.0449, "step": 99060 }, { - "epoch": 1.07, - "learning_rate": 0.00013926601336881043, - "loss": 0.0417, + "epoch": 0.64, + "learning_rate": 0.00020408682238587297, + "loss": 0.0464, "step": 99070 }, { - "epoch": 1.07, - "learning_rate": 0.00013924978908430135, - "loss": 0.0359, + "epoch": 0.64, + "learning_rate": 0.00020407714103151605, + "loss": 0.05, "step": 99080 }, { - "epoch": 1.07, - "learning_rate": 0.0001392335647997923, - "loss": 0.0366, + "epoch": 0.64, + "learning_rate": 0.00020406745967715907, + "loss": 0.0438, "step": 99090 }, { - "epoch": 1.07, - "learning_rate": 0.00013921734051528325, - "loss": 0.0383, + "epoch": 0.64, + "learning_rate": 0.00020405777832280215, + "loss": 0.052, "step": 99100 }, { - "epoch": 1.07, - "learning_rate": 0.0001392011162307742, - "loss": 0.0359, + "epoch": 0.64, + "learning_rate": 0.00020404809696844523, + "loss": 0.043, "step": 99110 }, { - "epoch": 1.07, - "learning_rate": 0.00013918489194626515, - "loss": 0.0354, + "epoch": 0.64, + "learning_rate": 0.00020403841561408828, + "loss": 0.0469, "step": 99120 }, { - "epoch": 1.07, - "learning_rate": 0.0001391686676617561, - "loss": 0.0359, + "epoch": 0.64, + "learning_rate": 0.00020402873425973136, + "loss": 0.0458, "step": 99130 }, { - "epoch": 1.07, - "learning_rate": 0.00013915244337724705, - "loss": 0.0383, + "epoch": 0.64, + "learning_rate": 0.00020401905290537444, + "loss": 0.0505, "step": 99140 }, { - "epoch": 1.07, - "learning_rate": 0.000139136219092738, - "loss": 0.036, + "epoch": 0.64, + "learning_rate": 0.0002040093715510175, + "loss": 0.0452, "step": 99150 }, { - "epoch": 1.07, - "learning_rate": 0.00013911999480822895, - "loss": 0.0356, + "epoch": 0.64, + "learning_rate": 0.00020399969019666055, + "loss": 0.044, "step": 99160 }, { - "epoch": 1.07, - "learning_rate": 0.00013910377052371987, - "loss": 0.0394, + "epoch": 0.64, + "learning_rate": 0.00020399000884230363, + "loss": 0.0562, "step": 99170 }, { - "epoch": 1.07, - "learning_rate": 0.00013908754623921082, - "loss": 0.0382, + "epoch": 0.64, + "learning_rate": 0.00020398032748794668, + "loss": 0.0437, "step": 99180 }, { - "epoch": 1.07, - "learning_rate": 0.00013907132195470177, - "loss": 0.0348, + "epoch": 0.64, + "learning_rate": 0.00020397064613358976, + "loss": 0.0437, "step": 99190 }, { - "epoch": 1.07, - "learning_rate": 0.00013905509767019272, - "loss": 0.0381, + "epoch": 0.64, + "learning_rate": 0.00020396096477923284, + "loss": 0.0531, "step": 99200 }, { - "epoch": 1.07, - "learning_rate": 0.00013903887338568367, - "loss": 0.0367, + "epoch": 0.64, + "learning_rate": 0.00020395128342487592, + "loss": 0.0487, "step": 99210 }, { - "epoch": 1.07, - "learning_rate": 0.00013902264910117462, - "loss": 0.04, + "epoch": 0.64, + "learning_rate": 0.00020394160207051897, + "loss": 0.0442, "step": 99220 }, { - "epoch": 1.07, - "learning_rate": 0.00013900642481666557, - "loss": 0.0351, + "epoch": 0.64, + "learning_rate": 0.00020393192071616203, + "loss": 0.0418, "step": 99230 }, { - "epoch": 1.07, - "learning_rate": 0.00013899020053215652, - "loss": 0.0381, + "epoch": 0.64, + "learning_rate": 0.0002039222393618051, + "loss": 0.0455, "step": 99240 }, { - "epoch": 1.07, - "learning_rate": 0.00013897397624764747, - "loss": 0.0349, + "epoch": 0.64, + "learning_rate": 0.00020391255800744816, + "loss": 0.0404, "step": 99250 }, { - "epoch": 1.07, - "learning_rate": 0.0001389577519631384, - "loss": 0.0388, + "epoch": 0.64, + "learning_rate": 0.00020390287665309124, + "loss": 0.0446, "step": 99260 }, { - "epoch": 1.07, - "learning_rate": 0.00013894152767862934, - "loss": 0.0401, + "epoch": 0.64, + "learning_rate": 0.00020389319529873432, + "loss": 0.0501, "step": 99270 }, { - "epoch": 1.07, - "learning_rate": 0.0001389253033941203, - "loss": 0.0387, + "epoch": 0.64, + "learning_rate": 0.0002038835139443774, + "loss": 0.0462, "step": 99280 }, { - "epoch": 1.07, - "learning_rate": 0.00013890907910961124, - "loss": 0.0352, + "epoch": 0.64, + "learning_rate": 0.00020387383259002045, + "loss": 0.0435, "step": 99290 }, { - "epoch": 1.07, - "learning_rate": 0.0001388928548251022, - "loss": 0.0331, + "epoch": 0.64, + "learning_rate": 0.0002038641512356635, + "loss": 0.0411, "step": 99300 }, { - "epoch": 1.07, - "learning_rate": 0.00013887663054059314, - "loss": 0.0383, + "epoch": 0.64, + "learning_rate": 0.00020385446988130658, + "loss": 0.0448, "step": 99310 }, { - "epoch": 1.07, - "learning_rate": 0.0001388604062560841, - "loss": 0.0404, + "epoch": 0.64, + "learning_rate": 0.00020384478852694964, + "loss": 0.0513, "step": 99320 }, { - "epoch": 1.07, - "learning_rate": 0.00013884418197157504, - "loss": 0.0441, + "epoch": 0.64, + "learning_rate": 0.00020383510717259272, + "loss": 0.0451, "step": 99330 }, { - "epoch": 1.07, - "learning_rate": 0.000138827957687066, - "loss": 0.0452, + "epoch": 0.64, + "learning_rate": 0.0002038254258182358, + "loss": 0.0423, "step": 99340 }, { - "epoch": 1.07, - "learning_rate": 0.00013881173340255694, - "loss": 0.0353, + "epoch": 0.64, + "learning_rate": 0.00020381574446387885, + "loss": 0.0548, "step": 99350 }, { - "epoch": 1.07, - "learning_rate": 0.00013879550911804787, - "loss": 0.0398, + "epoch": 0.64, + "learning_rate": 0.00020380606310952193, + "loss": 0.0534, "step": 99360 }, { - "epoch": 1.07, - "learning_rate": 0.00013877928483353882, - "loss": 0.044, + "epoch": 0.64, + "learning_rate": 0.00020379638175516498, + "loss": 0.0445, "step": 99370 }, { - "epoch": 1.07, - "learning_rate": 0.00013876306054902977, - "loss": 0.0375, + "epoch": 0.64, + "learning_rate": 0.00020378670040080803, + "loss": 0.0425, "step": 99380 }, { - "epoch": 1.08, - "learning_rate": 0.00013874683626452071, - "loss": 0.0433, + "epoch": 0.64, + "learning_rate": 0.0002037770190464511, + "loss": 0.044, "step": 99390 }, { - "epoch": 1.08, - "learning_rate": 0.00013873061198001166, - "loss": 0.0397, + "epoch": 0.64, + "learning_rate": 0.0002037673376920942, + "loss": 0.0484, "step": 99400 }, { - "epoch": 1.08, - "learning_rate": 0.00013871438769550261, - "loss": 0.0385, + "epoch": 0.64, + "learning_rate": 0.00020375765633773727, + "loss": 0.0431, "step": 99410 }, { - "epoch": 1.08, - "learning_rate": 0.00013869816341099356, - "loss": 0.0346, + "epoch": 0.64, + "learning_rate": 0.00020374797498338033, + "loss": 0.0464, "step": 99420 }, { - "epoch": 1.08, - "learning_rate": 0.00013868193912648451, - "loss": 0.0339, + "epoch": 0.64, + "learning_rate": 0.0002037382936290234, + "loss": 0.0525, "step": 99430 }, { - "epoch": 1.08, - "learning_rate": 0.00013866571484197546, - "loss": 0.0363, + "epoch": 0.64, + "learning_rate": 0.00020372861227466646, + "loss": 0.0483, "step": 99440 }, { - "epoch": 1.08, - "learning_rate": 0.00013864949055746639, - "loss": 0.0372, + "epoch": 0.64, + "learning_rate": 0.0002037189309203095, + "loss": 0.0471, "step": 99450 }, { - "epoch": 1.08, - "learning_rate": 0.00013863326627295734, - "loss": 0.0375, + "epoch": 0.64, + "learning_rate": 0.0002037092495659526, + "loss": 0.0454, "step": 99460 }, { - "epoch": 1.08, - "learning_rate": 0.00013861704198844829, - "loss": 0.0413, + "epoch": 0.64, + "learning_rate": 0.00020369956821159567, + "loss": 0.0464, "step": 99470 }, { - "epoch": 1.08, - "learning_rate": 0.00013860081770393924, - "loss": 0.0412, + "epoch": 0.64, + "learning_rate": 0.00020368988685723875, + "loss": 0.0515, "step": 99480 }, { - "epoch": 1.08, - "learning_rate": 0.00013858459341943019, - "loss": 0.0387, + "epoch": 0.64, + "learning_rate": 0.0002036802055028818, + "loss": 0.0463, "step": 99490 }, { - "epoch": 1.08, - "learning_rate": 0.00013856836913492114, - "loss": 0.0419, + "epoch": 0.64, + "learning_rate": 0.00020367052414852488, + "loss": 0.0513, "step": 99500 }, { - "epoch": 1.08, - "learning_rate": 0.00013855214485041209, - "loss": 0.0352, + "epoch": 0.64, + "learning_rate": 0.00020366084279416794, + "loss": 0.0452, "step": 99510 }, { - "epoch": 1.08, - "learning_rate": 0.00013853592056590303, - "loss": 0.0371, + "epoch": 0.64, + "learning_rate": 0.000203651161439811, + "loss": 0.0462, "step": 99520 }, { - "epoch": 1.08, - "learning_rate": 0.00013851969628139398, - "loss": 0.0404, + "epoch": 0.64, + "learning_rate": 0.00020364148008545407, + "loss": 0.0465, "step": 99530 }, { - "epoch": 1.08, - "learning_rate": 0.0001385034719968849, - "loss": 0.0367, + "epoch": 0.64, + "learning_rate": 0.00020363179873109715, + "loss": 0.0484, "step": 99540 }, { - "epoch": 1.08, - "learning_rate": 0.00013848724771237586, - "loss": 0.0367, + "epoch": 0.64, + "learning_rate": 0.0002036221173767402, + "loss": 0.0482, "step": 99550 }, { - "epoch": 1.08, - "learning_rate": 0.0001384710234278668, - "loss": 0.0313, + "epoch": 0.64, + "learning_rate": 0.00020361243602238328, + "loss": 0.0533, "step": 99560 }, { - "epoch": 1.08, - "learning_rate": 0.00013845479914335776, - "loss": 0.0348, + "epoch": 0.64, + "learning_rate": 0.00020360275466802636, + "loss": 0.049, "step": 99570 }, { - "epoch": 1.08, - "learning_rate": 0.0001384385748588487, - "loss": 0.0377, + "epoch": 0.64, + "learning_rate": 0.00020359307331366939, + "loss": 0.052, "step": 99580 }, { - "epoch": 1.08, - "learning_rate": 0.00013842235057433966, - "loss": 0.0378, + "epoch": 0.64, + "learning_rate": 0.00020358339195931247, + "loss": 0.046, "step": 99590 }, { - "epoch": 1.08, - "learning_rate": 0.0001384061262898306, - "loss": 0.032, + "epoch": 0.64, + "learning_rate": 0.00020357371060495555, + "loss": 0.0468, "step": 99600 }, { - "epoch": 1.08, - "learning_rate": 0.00013838990200532156, - "loss": 0.0385, + "epoch": 0.64, + "learning_rate": 0.00020356402925059862, + "loss": 0.0473, "step": 99610 }, { - "epoch": 1.08, - "learning_rate": 0.0001383736777208125, - "loss": 0.0392, + "epoch": 0.64, + "learning_rate": 0.00020355434789624168, + "loss": 0.0488, "step": 99620 }, { - "epoch": 1.08, - "learning_rate": 0.00013835745343630343, - "loss": 0.0356, + "epoch": 0.64, + "learning_rate": 0.00020354466654188476, + "loss": 0.0472, "step": 99630 }, { - "epoch": 1.08, - "learning_rate": 0.00013834122915179438, - "loss": 0.0382, + "epoch": 0.64, + "learning_rate": 0.00020353498518752784, + "loss": 0.0508, "step": 99640 }, { - "epoch": 1.08, - "learning_rate": 0.00013832500486728533, - "loss": 0.0372, + "epoch": 0.64, + "learning_rate": 0.00020352530383317086, + "loss": 0.0458, "step": 99650 }, { - "epoch": 1.08, - "learning_rate": 0.00013830878058277628, - "loss": 0.037, + "epoch": 0.64, + "learning_rate": 0.00020351562247881394, + "loss": 0.0429, "step": 99660 }, { - "epoch": 1.08, - "learning_rate": 0.00013829255629826723, - "loss": 0.0345, + "epoch": 0.64, + "learning_rate": 0.00020350594112445702, + "loss": 0.053, "step": 99670 }, { - "epoch": 1.08, - "learning_rate": 0.00013827633201375818, - "loss": 0.0374, + "epoch": 0.64, + "learning_rate": 0.0002034962597701001, + "loss": 0.0543, "step": 99680 }, { - "epoch": 1.08, - "learning_rate": 0.00013826010772924913, - "loss": 0.034, + "epoch": 0.64, + "learning_rate": 0.00020348657841574315, + "loss": 0.0457, "step": 99690 }, { - "epoch": 1.08, - "learning_rate": 0.00013824388344474008, - "loss": 0.0317, + "epoch": 0.64, + "learning_rate": 0.00020347689706138623, + "loss": 0.0441, "step": 99700 }, { - "epoch": 1.08, - "learning_rate": 0.00013822765916023103, - "loss": 0.0405, + "epoch": 0.64, + "learning_rate": 0.00020346721570702931, + "loss": 0.0499, "step": 99710 }, { - "epoch": 1.08, - "learning_rate": 0.00013821143487572195, - "loss": 0.0355, + "epoch": 0.64, + "learning_rate": 0.00020345753435267234, + "loss": 0.0405, "step": 99720 }, { - "epoch": 1.08, - "learning_rate": 0.00013819521059121293, - "loss": 0.0337, + "epoch": 0.64, + "learning_rate": 0.00020344785299831542, + "loss": 0.0452, "step": 99730 }, { - "epoch": 1.08, - "learning_rate": 0.00013817898630670388, - "loss": 0.0322, + "epoch": 0.64, + "learning_rate": 0.0002034381716439585, + "loss": 0.0442, "step": 99740 }, { - "epoch": 1.08, - "learning_rate": 0.00013816276202219483, - "loss": 0.0378, + "epoch": 0.64, + "learning_rate": 0.00020342849028960155, + "loss": 0.0453, "step": 99750 }, { - "epoch": 1.08, - "learning_rate": 0.00013814653773768578, - "loss": 0.0353, + "epoch": 0.64, + "learning_rate": 0.00020341880893524463, + "loss": 0.046, "step": 99760 }, { - "epoch": 1.08, - "learning_rate": 0.0001381303134531767, - "loss": 0.0373, + "epoch": 0.64, + "learning_rate": 0.0002034091275808877, + "loss": 0.047, "step": 99770 }, { - "epoch": 1.08, - "learning_rate": 0.00013811408916866765, - "loss": 0.0369, + "epoch": 0.64, + "learning_rate": 0.0002033994462265308, + "loss": 0.0488, "step": 99780 }, { - "epoch": 1.08, - "learning_rate": 0.0001380978648841586, - "loss": 0.0417, + "epoch": 0.64, + "learning_rate": 0.00020338976487217382, + "loss": 0.0508, "step": 99790 }, { - "epoch": 1.08, - "learning_rate": 0.00013808164059964955, - "loss": 0.0396, + "epoch": 0.64, + "learning_rate": 0.0002033800835178169, + "loss": 0.0525, "step": 99800 }, { - "epoch": 1.08, - "learning_rate": 0.0001380654163151405, - "loss": 0.033, + "epoch": 0.64, + "learning_rate": 0.00020337040216345998, + "loss": 0.0474, "step": 99810 }, { - "epoch": 1.08, - "learning_rate": 0.00013804919203063145, - "loss": 0.0368, + "epoch": 0.64, + "learning_rate": 0.00020336072080910303, + "loss": 0.05, "step": 99820 }, { - "epoch": 1.08, - "learning_rate": 0.0001380329677461224, - "loss": 0.0451, + "epoch": 0.64, + "learning_rate": 0.0002033510394547461, + "loss": 0.0409, "step": 99830 }, { - "epoch": 1.08, - "learning_rate": 0.00013801674346161335, - "loss": 0.0338, + "epoch": 0.64, + "learning_rate": 0.0002033413581003892, + "loss": 0.0426, "step": 99840 }, { - "epoch": 1.08, - "learning_rate": 0.0001380005191771043, - "loss": 0.0373, + "epoch": 0.64, + "learning_rate": 0.00020333167674603221, + "loss": 0.0485, "step": 99850 }, { - "epoch": 1.08, - "learning_rate": 0.00013798429489259522, - "loss": 0.0357, + "epoch": 0.64, + "learning_rate": 0.0002033219953916753, + "loss": 0.0488, "step": 99860 }, { - "epoch": 1.08, - "learning_rate": 0.00013796807060808617, - "loss": 0.0366, + "epoch": 0.64, + "learning_rate": 0.00020331231403731837, + "loss": 0.048, "step": 99870 }, { - "epoch": 1.08, - "learning_rate": 0.00013795184632357712, - "loss": 0.0372, + "epoch": 0.64, + "learning_rate": 0.00020330263268296145, + "loss": 0.0496, "step": 99880 }, { - "epoch": 1.08, - "learning_rate": 0.00013793562203906807, - "loss": 0.0344, + "epoch": 0.64, + "learning_rate": 0.0002032929513286045, + "loss": 0.045, "step": 99890 }, { - "epoch": 1.08, - "learning_rate": 0.00013791939775455902, - "loss": 0.0429, + "epoch": 0.64, + "learning_rate": 0.00020328326997424759, + "loss": 0.0524, "step": 99900 }, { - "epoch": 1.08, - "learning_rate": 0.00013790317347004997, - "loss": 0.0376, - "step": 99910 + "epoch": 0.64, + "learning_rate": 0.00020327358861989067, + "loss": 0.049, + "step": 99910 }, { - "epoch": 1.08, - "learning_rate": 0.00013788694918554092, - "loss": 0.0401, + "epoch": 0.64, + "learning_rate": 0.0002032639072655337, + "loss": 0.0527, "step": 99920 }, { - "epoch": 1.08, - "learning_rate": 0.00013787072490103187, - "loss": 0.0434, + "epoch": 0.64, + "learning_rate": 0.00020325422591117677, + "loss": 0.0494, "step": 99930 }, { - "epoch": 1.08, - "learning_rate": 0.00013785450061652282, - "loss": 0.0362, + "epoch": 0.65, + "learning_rate": 0.00020324454455681985, + "loss": 0.0595, "step": 99940 }, { - "epoch": 1.08, - "learning_rate": 0.00013783827633201374, - "loss": 0.0321, + "epoch": 0.65, + "learning_rate": 0.0002032348632024629, + "loss": 0.0497, "step": 99950 }, { - "epoch": 1.08, - "learning_rate": 0.0001378220520475047, - "loss": 0.0327, + "epoch": 0.65, + "learning_rate": 0.00020322518184810598, + "loss": 0.0456, "step": 99960 }, { - "epoch": 1.08, - "learning_rate": 0.00013780582776299564, - "loss": 0.0352, + "epoch": 0.65, + "learning_rate": 0.00020321550049374906, + "loss": 0.049, "step": 99970 }, { - "epoch": 1.08, - "learning_rate": 0.0001377896034784866, - "loss": 0.0369, + "epoch": 0.65, + "learning_rate": 0.00020320581913939214, + "loss": 0.0575, "step": 99980 }, { - "epoch": 1.08, - "learning_rate": 0.00013777337919397754, - "loss": 0.0371, + "epoch": 0.65, + "learning_rate": 0.00020319613778503517, + "loss": 0.0502, "step": 99990 }, { - "epoch": 1.08, - "learning_rate": 0.0001377571549094685, - "loss": 0.0446, + "epoch": 0.65, + "learning_rate": 0.00020318645643067825, + "loss": 0.0464, "step": 100000 }, { - "epoch": 1.08, - "eval_cer": 0.92111103454247, - "eval_loss": 0.028674758970737457, - "eval_runtime": 119.2599, - "eval_samples_per_second": 16.77, - "eval_steps_per_second": 4.193, + "epoch": 0.65, + "eval_cer": 0.9199602304824314, + "eval_loss": 0.031852345913648605, + "eval_runtime": 119.8085, + "eval_samples_per_second": 16.693, + "eval_steps_per_second": 4.173, "step": 100000 }, { - "epoch": 1.08, - "learning_rate": 0.00013774093062495944, - "loss": 0.0349, + "epoch": 0.65, + "learning_rate": 0.00020317677507632133, + "loss": 0.0428, "step": 100010 }, { - "epoch": 1.08, - "learning_rate": 0.0001377247063404504, - "loss": 0.0337, + "epoch": 0.65, + "learning_rate": 0.00020316709372196438, + "loss": 0.0554, "step": 100020 }, { - "epoch": 1.08, - "learning_rate": 0.00013770848205594134, - "loss": 0.0334, + "epoch": 0.65, + "learning_rate": 0.00020315741236760746, + "loss": 0.0511, "step": 100030 }, { - "epoch": 1.08, - "learning_rate": 0.0001376922577714323, - "loss": 0.0391, + "epoch": 0.65, + "learning_rate": 0.00020314773101325054, + "loss": 0.0443, "step": 100040 }, { - "epoch": 1.08, - "learning_rate": 0.0001376760334869232, - "loss": 0.0341, + "epoch": 0.65, + "learning_rate": 0.00020313804965889362, + "loss": 0.0414, "step": 100050 }, { - "epoch": 1.08, - "learning_rate": 0.00013765980920241416, - "loss": 0.0305, + "epoch": 0.65, + "learning_rate": 0.00020312836830453665, + "loss": 0.0453, "step": 100060 }, { - "epoch": 1.08, - "learning_rate": 0.0001376435849179051, - "loss": 0.0389, + "epoch": 0.65, + "learning_rate": 0.00020311868695017973, + "loss": 0.0445, "step": 100070 }, { - "epoch": 1.08, - "learning_rate": 0.00013762736063339606, - "loss": 0.0373, + "epoch": 0.65, + "learning_rate": 0.0002031090055958228, + "loss": 0.0548, "step": 100080 }, { - "epoch": 1.08, - "learning_rate": 0.000137611136348887, - "loss": 0.0379, + "epoch": 0.65, + "learning_rate": 0.00020309932424146586, + "loss": 0.0541, "step": 100090 }, { - "epoch": 1.08, - "learning_rate": 0.00013759491206437796, - "loss": 0.0363, + "epoch": 0.65, + "learning_rate": 0.00020308964288710894, + "loss": 0.0486, "step": 100100 }, { - "epoch": 1.08, - "learning_rate": 0.0001375786877798689, - "loss": 0.0371, + "epoch": 0.65, + "learning_rate": 0.00020307996153275202, + "loss": 0.0559, "step": 100110 }, { - "epoch": 1.08, - "learning_rate": 0.00013756246349535986, - "loss": 0.0377, + "epoch": 0.65, + "learning_rate": 0.00020307028017839507, + "loss": 0.052, "step": 100120 }, { - "epoch": 1.08, - "learning_rate": 0.0001375462392108508, - "loss": 0.0339, + "epoch": 0.65, + "learning_rate": 0.00020306059882403812, + "loss": 0.0437, "step": 100130 }, { - "epoch": 1.08, - "learning_rate": 0.00013753001492634173, - "loss": 0.0418, + "epoch": 0.65, + "learning_rate": 0.0002030509174696812, + "loss": 0.047, "step": 100140 }, { - "epoch": 1.08, - "learning_rate": 0.00013751379064183268, - "loss": 0.0332, + "epoch": 0.65, + "learning_rate": 0.00020304123611532426, + "loss": 0.0514, "step": 100150 }, { - "epoch": 1.08, - "learning_rate": 0.00013749756635732363, - "loss": 0.0353, + "epoch": 0.65, + "learning_rate": 0.00020303155476096734, + "loss": 0.0514, "step": 100160 }, { - "epoch": 1.08, - "learning_rate": 0.00013748134207281458, - "loss": 0.0358, + "epoch": 0.65, + "learning_rate": 0.00020302187340661042, + "loss": 0.0455, "step": 100170 }, { - "epoch": 1.08, - "learning_rate": 0.00013746511778830553, - "loss": 0.0341, + "epoch": 0.65, + "learning_rate": 0.0002030121920522535, + "loss": 0.0497, "step": 100180 }, { - "epoch": 1.08, - "learning_rate": 0.00013744889350379648, - "loss": 0.0336, + "epoch": 0.65, + "learning_rate": 0.00020300251069789655, + "loss": 0.0497, "step": 100190 }, { - "epoch": 1.08, - "learning_rate": 0.00013743266921928743, - "loss": 0.0406, + "epoch": 0.65, + "learning_rate": 0.0002029928293435396, + "loss": 0.0506, "step": 100200 }, { - "epoch": 1.08, - "learning_rate": 0.00013741644493477838, - "loss": 0.0358, + "epoch": 0.65, + "learning_rate": 0.00020298314798918268, + "loss": 0.045, "step": 100210 }, { - "epoch": 1.08, - "learning_rate": 0.00013740022065026933, - "loss": 0.0444, + "epoch": 0.65, + "learning_rate": 0.00020297346663482573, + "loss": 0.0523, "step": 100220 }, { - "epoch": 1.08, - "learning_rate": 0.00013738399636576025, - "loss": 0.0356, + "epoch": 0.65, + "learning_rate": 0.0002029637852804688, + "loss": 0.0544, "step": 100230 }, { - "epoch": 1.08, - "learning_rate": 0.0001373677720812512, - "loss": 0.038, + "epoch": 0.65, + "learning_rate": 0.0002029541039261119, + "loss": 0.0438, "step": 100240 }, { - "epoch": 1.08, - "learning_rate": 0.00013735154779674215, - "loss": 0.0331, + "epoch": 0.65, + "learning_rate": 0.00020294442257175497, + "loss": 0.0459, "step": 100250 }, { - "epoch": 1.08, - "learning_rate": 0.0001373353235122331, - "loss": 0.0352, + "epoch": 0.65, + "learning_rate": 0.00020293474121739803, + "loss": 0.0476, "step": 100260 }, { - "epoch": 1.08, - "learning_rate": 0.00013731909922772405, - "loss": 0.0424, + "epoch": 0.65, + "learning_rate": 0.00020292505986304108, + "loss": 0.0431, "step": 100270 }, { - "epoch": 1.08, - "learning_rate": 0.000137302874943215, - "loss": 0.0379, + "epoch": 0.65, + "learning_rate": 0.00020291537850868416, + "loss": 0.0439, "step": 100280 }, { - "epoch": 1.08, - "learning_rate": 0.00013728665065870595, - "loss": 0.0328, + "epoch": 0.65, + "learning_rate": 0.0002029056971543272, + "loss": 0.045, "step": 100290 }, { - "epoch": 1.08, - "learning_rate": 0.0001372704263741969, - "loss": 0.0366, + "epoch": 0.65, + "learning_rate": 0.0002028960157999703, + "loss": 0.0543, "step": 100300 }, { - "epoch": 1.08, - "learning_rate": 0.00013725420208968785, - "loss": 0.0365, + "epoch": 0.65, + "learning_rate": 0.00020288633444561337, + "loss": 0.048, "step": 100310 }, { - "epoch": 1.09, - "learning_rate": 0.00013723797780517877, - "loss": 0.0394, + "epoch": 0.65, + "learning_rate": 0.00020287665309125642, + "loss": 0.0411, "step": 100320 }, { - "epoch": 1.09, - "learning_rate": 0.00013722175352066972, - "loss": 0.0328, + "epoch": 0.65, + "learning_rate": 0.0002028669717368995, + "loss": 0.044, "step": 100330 }, { - "epoch": 1.09, - "learning_rate": 0.00013720552923616067, - "loss": 0.0407, + "epoch": 0.65, + "learning_rate": 0.00020285729038254256, + "loss": 0.0529, "step": 100340 }, { - "epoch": 1.09, - "learning_rate": 0.00013718930495165162, - "loss": 0.0359, + "epoch": 0.65, + "learning_rate": 0.0002028476090281856, + "loss": 0.045, "step": 100350 }, { - "epoch": 1.09, - "learning_rate": 0.00013717308066714257, - "loss": 0.036, + "epoch": 0.65, + "learning_rate": 0.0002028379276738287, + "loss": 0.0443, "step": 100360 }, { - "epoch": 1.09, - "learning_rate": 0.00013715685638263352, - "loss": 0.029, + "epoch": 0.65, + "learning_rate": 0.00020282824631947177, + "loss": 0.0456, "step": 100370 }, { - "epoch": 1.09, - "learning_rate": 0.00013714063209812447, - "loss": 0.0374, + "epoch": 0.65, + "learning_rate": 0.00020281856496511485, + "loss": 0.0499, "step": 100380 }, { - "epoch": 1.09, - "learning_rate": 0.00013712440781361542, - "loss": 0.0433, + "epoch": 0.65, + "learning_rate": 0.0002028088836107579, + "loss": 0.0487, "step": 100390 }, { - "epoch": 1.09, - "learning_rate": 0.00013710818352910637, - "loss": 0.0337, + "epoch": 0.65, + "learning_rate": 0.00020279920225640098, + "loss": 0.0576, "step": 100400 }, { - "epoch": 1.09, - "learning_rate": 0.0001370919592445973, - "loss": 0.0363, + "epoch": 0.65, + "learning_rate": 0.00020278952090204403, + "loss": 0.0486, "step": 100410 }, { - "epoch": 1.09, - "learning_rate": 0.00013707573496008824, - "loss": 0.0372, + "epoch": 0.65, + "learning_rate": 0.00020277983954768709, + "loss": 0.0443, "step": 100420 }, { - "epoch": 1.09, - "learning_rate": 0.0001370595106755792, - "loss": 0.0374, + "epoch": 0.65, + "learning_rate": 0.00020277015819333016, + "loss": 0.0468, "step": 100430 }, { - "epoch": 1.09, - "learning_rate": 0.00013704328639107014, - "loss": 0.0394, + "epoch": 0.65, + "learning_rate": 0.00020276047683897324, + "loss": 0.0493, "step": 100440 }, { - "epoch": 1.09, - "learning_rate": 0.0001370270621065611, - "loss": 0.04, + "epoch": 0.65, + "learning_rate": 0.00020275079548461632, + "loss": 0.0523, "step": 100450 }, { - "epoch": 1.09, - "learning_rate": 0.00013701083782205204, - "loss": 0.0357, + "epoch": 0.65, + "learning_rate": 0.00020274111413025938, + "loss": 0.0506, "step": 100460 }, { - "epoch": 1.09, - "learning_rate": 0.000136994613537543, - "loss": 0.0334, + "epoch": 0.65, + "learning_rate": 0.00020273143277590246, + "loss": 0.0417, "step": 100470 }, { - "epoch": 1.09, - "learning_rate": 0.00013697838925303394, - "loss": 0.0326, + "epoch": 0.65, + "learning_rate": 0.0002027217514215455, + "loss": 0.0403, "step": 100480 }, { - "epoch": 1.09, - "learning_rate": 0.0001369621649685249, - "loss": 0.0323, + "epoch": 0.65, + "learning_rate": 0.00020271207006718856, + "loss": 0.0601, "step": 100490 }, { - "epoch": 1.09, - "learning_rate": 0.00013694594068401581, - "loss": 0.0402, + "epoch": 0.65, + "learning_rate": 0.00020270238871283164, + "loss": 0.0448, "step": 100500 }, { - "epoch": 1.09, - "learning_rate": 0.00013692971639950676, - "loss": 0.0355, + "epoch": 0.65, + "learning_rate": 0.00020269270735847472, + "loss": 0.0474, "step": 100510 }, { - "epoch": 1.09, - "learning_rate": 0.00013691349211499771, - "loss": 0.0334, + "epoch": 0.65, + "learning_rate": 0.00020268302600411777, + "loss": 0.0451, "step": 100520 }, { - "epoch": 1.09, - "learning_rate": 0.00013689726783048866, - "loss": 0.0325, + "epoch": 0.65, + "learning_rate": 0.00020267334464976085, + "loss": 0.0433, "step": 100530 }, { - "epoch": 1.09, - "learning_rate": 0.0001368810435459796, - "loss": 0.0315, + "epoch": 0.65, + "learning_rate": 0.00020266366329540393, + "loss": 0.0482, "step": 100540 }, { - "epoch": 1.09, - "learning_rate": 0.00013686481926147056, - "loss": 0.0356, + "epoch": 0.65, + "learning_rate": 0.00020265398194104696, + "loss": 0.0442, "step": 100550 }, { - "epoch": 1.09, - "learning_rate": 0.0001368485949769615, - "loss": 0.0368, + "epoch": 0.65, + "learning_rate": 0.00020264430058669004, + "loss": 0.0504, "step": 100560 }, { - "epoch": 1.09, - "learning_rate": 0.00013683237069245246, - "loss": 0.0367, + "epoch": 0.65, + "learning_rate": 0.00020263461923233312, + "loss": 0.0479, "step": 100570 }, { - "epoch": 1.09, - "learning_rate": 0.0001368161464079434, - "loss": 0.0384, + "epoch": 0.65, + "learning_rate": 0.0002026249378779762, + "loss": 0.0538, "step": 100580 }, { - "epoch": 1.09, - "learning_rate": 0.00013679992212343434, - "loss": 0.0353, + "epoch": 0.65, + "learning_rate": 0.00020261525652361925, + "loss": 0.0466, "step": 100590 }, { - "epoch": 1.09, - "learning_rate": 0.00013678369783892528, - "loss": 0.0343, + "epoch": 0.65, + "learning_rate": 0.00020260557516926233, + "loss": 0.0458, "step": 100600 }, { - "epoch": 1.09, - "learning_rate": 0.00013676747355441623, - "loss": 0.0363, + "epoch": 0.65, + "learning_rate": 0.0002025958938149054, + "loss": 0.0468, "step": 100610 }, { - "epoch": 1.09, - "learning_rate": 0.00013675124926990718, - "loss": 0.033, + "epoch": 0.65, + "learning_rate": 0.00020258621246054844, + "loss": 0.0568, "step": 100620 }, { - "epoch": 1.09, - "learning_rate": 0.00013673502498539813, - "loss": 0.0349, + "epoch": 0.65, + "learning_rate": 0.00020257653110619152, + "loss": 0.0486, "step": 100630 }, { - "epoch": 1.09, - "learning_rate": 0.00013671880070088908, - "loss": 0.0381, + "epoch": 0.65, + "learning_rate": 0.0002025668497518346, + "loss": 0.0468, "step": 100640 }, { - "epoch": 1.09, - "learning_rate": 0.00013670257641638003, - "loss": 0.0375, + "epoch": 0.65, + "learning_rate": 0.00020255716839747768, + "loss": 0.0455, "step": 100650 }, { - "epoch": 1.09, - "learning_rate": 0.00013668635213187098, - "loss": 0.033, + "epoch": 0.65, + "learning_rate": 0.00020254748704312073, + "loss": 0.0515, "step": 100660 }, { - "epoch": 1.09, - "learning_rate": 0.00013667012784736193, - "loss": 0.0376, + "epoch": 0.65, + "learning_rate": 0.0002025378056887638, + "loss": 0.0435, "step": 100670 }, { - "epoch": 1.09, - "learning_rate": 0.00013665390356285286, - "loss": 0.0378, + "epoch": 0.65, + "learning_rate": 0.0002025281243344069, + "loss": 0.0456, "step": 100680 }, { - "epoch": 1.09, - "learning_rate": 0.0001366376792783438, - "loss": 0.0447, + "epoch": 0.65, + "learning_rate": 0.00020251844298004991, + "loss": 0.0408, "step": 100690 }, { - "epoch": 1.09, - "learning_rate": 0.00013662145499383476, - "loss": 0.0389, + "epoch": 0.65, + "learning_rate": 0.000202508761625693, + "loss": 0.0528, "step": 100700 }, { - "epoch": 1.09, - "learning_rate": 0.0001366052307093257, - "loss": 0.0405, + "epoch": 0.65, + "learning_rate": 0.00020249908027133607, + "loss": 0.0402, "step": 100710 }, { - "epoch": 1.09, - "learning_rate": 0.00013658900642481665, - "loss": 0.0439, + "epoch": 0.65, + "learning_rate": 0.00020248939891697913, + "loss": 0.0497, "step": 100720 }, { - "epoch": 1.09, - "learning_rate": 0.0001365727821403076, - "loss": 0.0383, + "epoch": 0.65, + "learning_rate": 0.0002024797175626222, + "loss": 0.0427, "step": 100730 }, { - "epoch": 1.09, - "learning_rate": 0.00013655655785579855, - "loss": 0.0399, + "epoch": 0.65, + "learning_rate": 0.00020247003620826529, + "loss": 0.0526, "step": 100740 }, { - "epoch": 1.09, - "learning_rate": 0.0001365403335712895, - "loss": 0.0391, + "epoch": 0.65, + "learning_rate": 0.00020246035485390837, + "loss": 0.041, "step": 100750 }, { - "epoch": 1.09, - "learning_rate": 0.00013652410928678045, - "loss": 0.0328, + "epoch": 0.65, + "learning_rate": 0.0002024506734995514, + "loss": 0.0444, "step": 100760 }, { - "epoch": 1.09, - "learning_rate": 0.00013650788500227138, - "loss": 0.0367, + "epoch": 0.65, + "learning_rate": 0.00020244099214519447, + "loss": 0.0448, "step": 100770 }, { - "epoch": 1.09, - "learning_rate": 0.00013649166071776233, - "loss": 0.0368, + "epoch": 0.65, + "learning_rate": 0.00020243131079083755, + "loss": 0.0482, "step": 100780 }, { - "epoch": 1.09, - "learning_rate": 0.00013647543643325328, - "loss": 0.0371, + "epoch": 0.65, + "learning_rate": 0.0002024216294364806, + "loss": 0.0457, "step": 100790 }, { - "epoch": 1.09, - "learning_rate": 0.00013645921214874423, - "loss": 0.0358, + "epoch": 0.65, + "learning_rate": 0.00020241194808212368, + "loss": 0.0468, "step": 100800 }, { - "epoch": 1.09, - "learning_rate": 0.00013644298786423518, - "loss": 0.0478, + "epoch": 0.65, + "learning_rate": 0.00020240226672776676, + "loss": 0.0431, "step": 100810 }, { - "epoch": 1.09, - "learning_rate": 0.00013642676357972613, - "loss": 0.0372, + "epoch": 0.65, + "learning_rate": 0.00020239258537340984, + "loss": 0.0416, "step": 100820 }, { - "epoch": 1.09, - "learning_rate": 0.00013641053929521708, - "loss": 0.0402, + "epoch": 0.65, + "learning_rate": 0.00020238290401905287, + "loss": 0.0398, "step": 100830 }, { - "epoch": 1.09, - "learning_rate": 0.00013639431501070803, - "loss": 0.0326, + "epoch": 0.65, + "learning_rate": 0.00020237322266469595, + "loss": 0.0487, "step": 100840 }, { - "epoch": 1.09, - "learning_rate": 0.00013637809072619897, - "loss": 0.0295, + "epoch": 0.65, + "learning_rate": 0.00020236354131033903, + "loss": 0.0479, "step": 100850 }, { - "epoch": 1.09, - "learning_rate": 0.0001363618664416899, - "loss": 0.0446, + "epoch": 0.65, + "learning_rate": 0.00020235385995598208, + "loss": 0.0425, "step": 100860 }, { - "epoch": 1.09, - "learning_rate": 0.00013634564215718085, - "loss": 0.0356, + "epoch": 0.65, + "learning_rate": 0.00020234417860162516, + "loss": 0.0442, "step": 100870 }, { - "epoch": 1.09, - "learning_rate": 0.0001363294178726718, - "loss": 0.0408, + "epoch": 0.65, + "learning_rate": 0.00020233449724726824, + "loss": 0.0416, "step": 100880 }, { - "epoch": 1.09, - "learning_rate": 0.00013631319358816275, - "loss": 0.035, + "epoch": 0.65, + "learning_rate": 0.00020232481589291132, + "loss": 0.048, "step": 100890 }, { - "epoch": 1.09, - "learning_rate": 0.0001362969693036537, - "loss": 0.0275, + "epoch": 0.65, + "learning_rate": 0.00020231513453855435, + "loss": 0.0416, "step": 100900 }, { - "epoch": 1.09, - "learning_rate": 0.00013628074501914465, - "loss": 0.0356, + "epoch": 0.65, + "learning_rate": 0.00020230545318419743, + "loss": 0.0426, "step": 100910 }, { - "epoch": 1.09, - "learning_rate": 0.0001362645207346356, - "loss": 0.0403, + "epoch": 0.65, + "learning_rate": 0.00020229577182984048, + "loss": 0.0442, "step": 100920 }, { - "epoch": 1.09, - "learning_rate": 0.00013624829645012655, - "loss": 0.0406, + "epoch": 0.65, + "learning_rate": 0.00020228609047548356, + "loss": 0.0427, "step": 100930 }, { - "epoch": 1.09, - "learning_rate": 0.0001362320721656175, - "loss": 0.0387, + "epoch": 0.65, + "learning_rate": 0.00020227640912112664, + "loss": 0.0494, "step": 100940 }, { - "epoch": 1.09, - "learning_rate": 0.00013621584788110842, - "loss": 0.0348, + "epoch": 0.65, + "learning_rate": 0.00020226672776676972, + "loss": 0.0436, "step": 100950 }, { - "epoch": 1.09, - "learning_rate": 0.00013619962359659937, - "loss": 0.0359, + "epoch": 0.65, + "learning_rate": 0.00020225704641241277, + "loss": 0.0447, "step": 100960 }, { - "epoch": 1.09, - "learning_rate": 0.00013618339931209032, - "loss": 0.037, + "epoch": 0.65, + "learning_rate": 0.00020224736505805582, + "loss": 0.0379, "step": 100970 }, { - "epoch": 1.09, - "learning_rate": 0.00013616717502758127, - "loss": 0.0341, + "epoch": 0.65, + "learning_rate": 0.0002022376837036989, + "loss": 0.0522, "step": 100980 }, { - "epoch": 1.09, - "learning_rate": 0.00013615095074307222, - "loss": 0.0347, + "epoch": 0.65, + "learning_rate": 0.00020222800234934196, + "loss": 0.0512, "step": 100990 }, { - "epoch": 1.09, - "learning_rate": 0.00013613472645856317, - "loss": 0.0424, + "epoch": 0.65, + "learning_rate": 0.00020221832099498504, + "loss": 0.0519, "step": 101000 }, { - "epoch": 1.09, - "eval_cer": 0.9212515085494778, - "eval_loss": 0.028364714235067368, - "eval_runtime": 118.8214, - "eval_samples_per_second": 16.832, - "eval_steps_per_second": 4.208, + "epoch": 0.65, + "eval_cer": 0.9199032877640945, + "eval_loss": 0.030138300731778145, + "eval_runtime": 119.833, + "eval_samples_per_second": 16.69, + "eval_steps_per_second": 4.172, "step": 101000 }, { - "epoch": 1.09, - "learning_rate": 0.00013611850217405412, - "loss": 0.0392, + "epoch": 0.65, + "learning_rate": 0.00020220863964062812, + "loss": 0.0599, "step": 101010 }, { - "epoch": 1.09, - "learning_rate": 0.00013610227788954507, - "loss": 0.0385, + "epoch": 0.65, + "learning_rate": 0.0002021989582862712, + "loss": 0.0476, "step": 101020 }, { - "epoch": 1.09, - "learning_rate": 0.00013608605360503602, - "loss": 0.0356, + "epoch": 0.65, + "learning_rate": 0.00020218927693191425, + "loss": 0.0482, "step": 101030 }, { - "epoch": 1.09, - "learning_rate": 0.00013606982932052694, - "loss": 0.0386, + "epoch": 0.65, + "learning_rate": 0.0002021795955775573, + "loss": 0.0523, "step": 101040 }, { - "epoch": 1.09, - "learning_rate": 0.0001360536050360179, - "loss": 0.0336, + "epoch": 0.65, + "learning_rate": 0.00020216991422320038, + "loss": 0.0426, "step": 101050 }, { - "epoch": 1.09, - "learning_rate": 0.00013603738075150884, - "loss": 0.0397, + "epoch": 0.65, + "learning_rate": 0.00020216023286884343, + "loss": 0.0457, "step": 101060 }, { - "epoch": 1.09, - "learning_rate": 0.0001360211564669998, - "loss": 0.0381, + "epoch": 0.65, + "learning_rate": 0.0002021505515144865, + "loss": 0.046, "step": 101070 }, { - "epoch": 1.09, - "learning_rate": 0.00013600493218249074, - "loss": 0.0322, + "epoch": 0.65, + "learning_rate": 0.0002021408701601296, + "loss": 0.0539, "step": 101080 }, { - "epoch": 1.09, - "learning_rate": 0.0001359887078979817, - "loss": 0.0421, + "epoch": 0.65, + "learning_rate": 0.00020213118880577267, + "loss": 0.0463, "step": 101090 }, { - "epoch": 1.09, - "learning_rate": 0.00013597248361347264, - "loss": 0.0348, + "epoch": 0.65, + "learning_rate": 0.00020212150745141572, + "loss": 0.0446, "step": 101100 }, { - "epoch": 1.09, - "learning_rate": 0.0001359562593289636, - "loss": 0.0414, + "epoch": 0.65, + "learning_rate": 0.00020211182609705878, + "loss": 0.0498, "step": 101110 }, { - "epoch": 1.09, - "learning_rate": 0.00013594003504445454, - "loss": 0.037, + "epoch": 0.65, + "learning_rate": 0.00020210214474270183, + "loss": 0.0477, "step": 101120 }, { - "epoch": 1.09, - "learning_rate": 0.00013592381075994546, - "loss": 0.0407, + "epoch": 0.65, + "learning_rate": 0.0002020924633883449, + "loss": 0.059, "step": 101130 }, { - "epoch": 1.09, - "learning_rate": 0.0001359075864754364, - "loss": 0.0382, + "epoch": 0.65, + "learning_rate": 0.000202082782033988, + "loss": 0.0476, "step": 101140 }, { - "epoch": 1.09, - "learning_rate": 0.00013589136219092736, - "loss": 0.0371, + "epoch": 0.65, + "learning_rate": 0.00020207310067963107, + "loss": 0.0507, "step": 101150 }, { - "epoch": 1.09, - "learning_rate": 0.0001358751379064183, - "loss": 0.0398, + "epoch": 0.65, + "learning_rate": 0.00020206341932527412, + "loss": 0.0497, "step": 101160 }, { - "epoch": 1.09, - "learning_rate": 0.00013585891362190926, - "loss": 0.0359, + "epoch": 0.65, + "learning_rate": 0.0002020537379709172, + "loss": 0.0494, "step": 101170 }, { - "epoch": 1.09, - "learning_rate": 0.0001358426893374002, - "loss": 0.0378, + "epoch": 0.65, + "learning_rate": 0.00020204405661656025, + "loss": 0.0454, "step": 101180 }, { - "epoch": 1.09, - "learning_rate": 0.00013582646505289116, - "loss": 0.0428, + "epoch": 0.65, + "learning_rate": 0.0002020343752622033, + "loss": 0.0415, "step": 101190 }, { - "epoch": 1.09, - "learning_rate": 0.0001358102407683821, - "loss": 0.0341, + "epoch": 0.65, + "learning_rate": 0.0002020246939078464, + "loss": 0.0486, "step": 101200 }, { - "epoch": 1.09, - "learning_rate": 0.00013579401648387306, - "loss": 0.0373, + "epoch": 0.65, + "learning_rate": 0.00020201501255348947, + "loss": 0.0479, "step": 101210 }, { - "epoch": 1.09, - "learning_rate": 0.00013577779219936398, - "loss": 0.0417, + "epoch": 0.65, + "learning_rate": 0.00020200533119913255, + "loss": 0.0552, "step": 101220 }, { - "epoch": 1.09, - "learning_rate": 0.00013576156791485493, - "loss": 0.0405, + "epoch": 0.65, + "learning_rate": 0.0002019956498447756, + "loss": 0.049, "step": 101230 }, { - "epoch": 1.1, - "learning_rate": 0.00013574534363034588, - "loss": 0.0442, + "epoch": 0.65, + "learning_rate": 0.00020198596849041868, + "loss": 0.0444, "step": 101240 }, { - "epoch": 1.1, - "learning_rate": 0.00013572911934583683, - "loss": 0.043, + "epoch": 0.65, + "learning_rate": 0.00020197628713606173, + "loss": 0.0546, "step": 101250 }, { - "epoch": 1.1, - "learning_rate": 0.00013571289506132778, - "loss": 0.0398, + "epoch": 0.65, + "learning_rate": 0.00020196660578170478, + "loss": 0.0489, "step": 101260 }, { - "epoch": 1.1, - "learning_rate": 0.00013569667077681873, - "loss": 0.0372, + "epoch": 0.65, + "learning_rate": 0.00020195692442734786, + "loss": 0.0573, "step": 101270 }, { - "epoch": 1.1, - "learning_rate": 0.00013568044649230968, - "loss": 0.0356, + "epoch": 0.65, + "learning_rate": 0.00020194724307299094, + "loss": 0.0459, "step": 101280 }, { - "epoch": 1.1, - "learning_rate": 0.00013566422220780063, - "loss": 0.0368, + "epoch": 0.65, + "learning_rate": 0.00020193756171863402, + "loss": 0.0447, "step": 101290 }, { - "epoch": 1.1, - "learning_rate": 0.00013564799792329158, - "loss": 0.0346, + "epoch": 0.65, + "learning_rate": 0.00020192788036427708, + "loss": 0.044, "step": 101300 }, { - "epoch": 1.1, - "learning_rate": 0.0001356317736387825, - "loss": 0.0405, + "epoch": 0.65, + "learning_rate": 0.00020191819900992016, + "loss": 0.041, "step": 101310 }, { - "epoch": 1.1, - "learning_rate": 0.00013561554935427345, - "loss": 0.0382, + "epoch": 0.65, + "learning_rate": 0.00020190851765556318, + "loss": 0.0466, "step": 101320 }, { - "epoch": 1.1, - "learning_rate": 0.0001355993250697644, - "loss": 0.0346, + "epoch": 0.65, + "learning_rate": 0.00020189883630120626, + "loss": 0.0431, "step": 101330 }, { - "epoch": 1.1, - "learning_rate": 0.00013558310078525535, - "loss": 0.0401, + "epoch": 0.65, + "learning_rate": 0.00020188915494684934, + "loss": 0.046, "step": 101340 }, { - "epoch": 1.1, - "learning_rate": 0.0001355668765007463, - "loss": 0.0336, + "epoch": 0.65, + "learning_rate": 0.00020187947359249242, + "loss": 0.0419, "step": 101350 }, { - "epoch": 1.1, - "learning_rate": 0.00013555065221623725, - "loss": 0.033, + "epoch": 0.65, + "learning_rate": 0.00020186979223813547, + "loss": 0.0424, "step": 101360 }, { - "epoch": 1.1, - "learning_rate": 0.0001355344279317282, - "loss": 0.0387, + "epoch": 0.65, + "learning_rate": 0.00020186011088377855, + "loss": 0.0457, "step": 101370 }, { - "epoch": 1.1, - "learning_rate": 0.00013551820364721915, - "loss": 0.0329, + "epoch": 0.65, + "learning_rate": 0.00020185042952942163, + "loss": 0.0436, "step": 101380 }, { - "epoch": 1.1, - "learning_rate": 0.0001355019793627101, - "loss": 0.0358, + "epoch": 0.65, + "learning_rate": 0.00020184074817506466, + "loss": 0.0501, "step": 101390 }, { - "epoch": 1.1, - "learning_rate": 0.00013548575507820102, - "loss": 0.0379, + "epoch": 0.65, + "learning_rate": 0.00020183106682070774, + "loss": 0.0508, "step": 101400 }, { - "epoch": 1.1, - "learning_rate": 0.00013546953079369197, - "loss": 0.0345, + "epoch": 0.65, + "learning_rate": 0.00020182138546635082, + "loss": 0.044, "step": 101410 }, { - "epoch": 1.1, - "learning_rate": 0.00013545330650918292, - "loss": 0.0373, + "epoch": 0.65, + "learning_rate": 0.0002018117041119939, + "loss": 0.0464, "step": 101420 }, { - "epoch": 1.1, - "learning_rate": 0.00013543708222467387, - "loss": 0.0407, + "epoch": 0.65, + "learning_rate": 0.00020180202275763695, + "loss": 0.0426, "step": 101430 }, { - "epoch": 1.1, - "learning_rate": 0.00013542085794016482, - "loss": 0.0326, + "epoch": 0.65, + "learning_rate": 0.00020179234140328003, + "loss": 0.0502, "step": 101440 }, { - "epoch": 1.1, - "learning_rate": 0.00013540463365565577, - "loss": 0.0384, + "epoch": 0.65, + "learning_rate": 0.0002017826600489231, + "loss": 0.0464, "step": 101450 }, { - "epoch": 1.1, - "learning_rate": 0.00013538840937114672, - "loss": 0.0412, + "epoch": 0.65, + "learning_rate": 0.00020177297869456614, + "loss": 0.052, "step": 101460 }, { - "epoch": 1.1, - "learning_rate": 0.00013537218508663767, - "loss": 0.0397, + "epoch": 0.65, + "learning_rate": 0.00020176329734020922, + "loss": 0.0515, "step": 101470 }, { - "epoch": 1.1, - "learning_rate": 0.00013535596080212862, - "loss": 0.0414, + "epoch": 0.65, + "learning_rate": 0.0002017536159858523, + "loss": 0.0408, "step": 101480 }, { - "epoch": 1.1, - "learning_rate": 0.00013533973651761957, - "loss": 0.0362, + "epoch": 0.66, + "learning_rate": 0.00020174393463149538, + "loss": 0.0485, "step": 101490 }, { - "epoch": 1.1, - "learning_rate": 0.0001353235122331105, - "loss": 0.035, + "epoch": 0.66, + "learning_rate": 0.00020173425327713843, + "loss": 0.0456, "step": 101500 }, { - "epoch": 1.1, - "learning_rate": 0.00013530728794860144, - "loss": 0.0339, + "epoch": 0.66, + "learning_rate": 0.0002017245719227815, + "loss": 0.0555, "step": 101510 }, { - "epoch": 1.1, - "learning_rate": 0.0001352910636640924, - "loss": 0.041, + "epoch": 0.66, + "learning_rate": 0.0002017148905684246, + "loss": 0.053, "step": 101520 }, { - "epoch": 1.1, - "learning_rate": 0.00013527483937958334, - "loss": 0.0359, + "epoch": 0.66, + "learning_rate": 0.00020170520921406761, + "loss": 0.0429, "step": 101530 }, { - "epoch": 1.1, - "learning_rate": 0.0001352586150950743, - "loss": 0.0398, + "epoch": 0.66, + "learning_rate": 0.0002016955278597107, + "loss": 0.0441, "step": 101540 }, { - "epoch": 1.1, - "learning_rate": 0.00013524239081056524, - "loss": 0.0339, + "epoch": 0.66, + "learning_rate": 0.00020168584650535377, + "loss": 0.0464, "step": 101550 }, { - "epoch": 1.1, - "learning_rate": 0.0001352261665260562, - "loss": 0.0378, + "epoch": 0.66, + "learning_rate": 0.00020167616515099683, + "loss": 0.0408, "step": 101560 }, { - "epoch": 1.1, - "learning_rate": 0.00013520994224154714, - "loss": 0.0345, + "epoch": 0.66, + "learning_rate": 0.0002016664837966399, + "loss": 0.0533, "step": 101570 }, { - "epoch": 1.1, - "learning_rate": 0.0001351937179570381, - "loss": 0.0377, + "epoch": 0.66, + "learning_rate": 0.00020165680244228299, + "loss": 0.0524, "step": 101580 }, { - "epoch": 1.1, - "learning_rate": 0.00013517749367252901, - "loss": 0.0406, + "epoch": 0.66, + "learning_rate": 0.00020164712108792607, + "loss": 0.0496, "step": 101590 }, { - "epoch": 1.1, - "learning_rate": 0.00013516126938801996, - "loss": 0.0372, + "epoch": 0.66, + "learning_rate": 0.0002016374397335691, + "loss": 0.0488, "step": 101600 }, { - "epoch": 1.1, - "learning_rate": 0.0001351450451035109, - "loss": 0.04, + "epoch": 0.66, + "learning_rate": 0.00020162775837921217, + "loss": 0.0467, "step": 101610 }, { - "epoch": 1.1, - "learning_rate": 0.00013512882081900186, - "loss": 0.0321, + "epoch": 0.66, + "learning_rate": 0.00020161807702485525, + "loss": 0.0403, "step": 101620 }, { - "epoch": 1.1, - "learning_rate": 0.0001351125965344928, - "loss": 0.0341, + "epoch": 0.66, + "learning_rate": 0.0002016083956704983, + "loss": 0.0476, "step": 101630 }, { - "epoch": 1.1, - "learning_rate": 0.00013509637224998376, - "loss": 0.0382, + "epoch": 0.66, + "learning_rate": 0.00020159871431614138, + "loss": 0.0473, "step": 101640 }, { - "epoch": 1.1, - "learning_rate": 0.0001350801479654747, - "loss": 0.0363, + "epoch": 0.66, + "learning_rate": 0.00020158903296178446, + "loss": 0.0501, "step": 101650 }, { - "epoch": 1.1, - "learning_rate": 0.00013506392368096566, - "loss": 0.0321, + "epoch": 0.66, + "learning_rate": 0.00020157935160742754, + "loss": 0.0409, "step": 101660 }, { - "epoch": 1.1, - "learning_rate": 0.0001350476993964566, - "loss": 0.0351, + "epoch": 0.66, + "learning_rate": 0.00020156967025307057, + "loss": 0.0457, "step": 101670 }, { - "epoch": 1.1, - "learning_rate": 0.00013503147511194753, - "loss": 0.0344, + "epoch": 0.66, + "learning_rate": 0.00020155998889871365, + "loss": 0.0567, "step": 101680 }, { - "epoch": 1.1, - "learning_rate": 0.00013501525082743848, - "loss": 0.0312, + "epoch": 0.66, + "learning_rate": 0.00020155030754435673, + "loss": 0.0499, "step": 101690 }, { - "epoch": 1.1, - "learning_rate": 0.00013499902654292943, - "loss": 0.0366, + "epoch": 0.66, + "learning_rate": 0.00020154062618999978, + "loss": 0.049, "step": 101700 }, { - "epoch": 1.1, - "learning_rate": 0.00013498280225842038, - "loss": 0.04, + "epoch": 0.66, + "learning_rate": 0.00020153094483564286, + "loss": 0.0486, "step": 101710 }, { - "epoch": 1.1, - "learning_rate": 0.00013496657797391133, - "loss": 0.0351, + "epoch": 0.66, + "learning_rate": 0.00020152126348128594, + "loss": 0.041, "step": 101720 }, { - "epoch": 1.1, - "learning_rate": 0.00013495035368940228, - "loss": 0.0374, + "epoch": 0.66, + "learning_rate": 0.000201511582126929, + "loss": 0.0416, "step": 101730 }, { - "epoch": 1.1, - "learning_rate": 0.00013493412940489323, - "loss": 0.0379, + "epoch": 0.66, + "learning_rate": 0.00020150190077257205, + "loss": 0.0488, "step": 101740 }, { - "epoch": 1.1, - "learning_rate": 0.00013491790512038418, - "loss": 0.0402, + "epoch": 0.66, + "learning_rate": 0.00020149221941821513, + "loss": 0.0576, "step": 101750 }, { - "epoch": 1.1, - "learning_rate": 0.00013490168083587513, - "loss": 0.0353, + "epoch": 0.66, + "learning_rate": 0.00020148253806385818, + "loss": 0.0483, "step": 101760 }, { - "epoch": 1.1, - "learning_rate": 0.00013488545655136606, - "loss": 0.0375, + "epoch": 0.66, + "learning_rate": 0.00020147285670950126, + "loss": 0.0514, "step": 101770 }, { - "epoch": 1.1, - "learning_rate": 0.000134869232266857, - "loss": 0.0362, + "epoch": 0.66, + "learning_rate": 0.00020146317535514434, + "loss": 0.0441, "step": 101780 }, { - "epoch": 1.1, - "learning_rate": 0.00013485300798234796, - "loss": 0.0384, + "epoch": 0.66, + "learning_rate": 0.00020145349400078742, + "loss": 0.0463, "step": 101790 }, { - "epoch": 1.1, - "learning_rate": 0.0001348367836978389, - "loss": 0.0355, + "epoch": 0.66, + "learning_rate": 0.00020144381264643047, + "loss": 0.0533, "step": 101800 }, { - "epoch": 1.1, - "learning_rate": 0.00013482055941332985, - "loss": 0.043, + "epoch": 0.66, + "learning_rate": 0.00020143413129207352, + "loss": 0.0484, "step": 101810 }, { - "epoch": 1.1, - "learning_rate": 0.0001348043351288208, - "loss": 0.039, + "epoch": 0.66, + "learning_rate": 0.0002014244499377166, + "loss": 0.0462, "step": 101820 }, { - "epoch": 1.1, - "learning_rate": 0.00013478811084431175, - "loss": 0.0366, + "epoch": 0.66, + "learning_rate": 0.00020141476858335966, + "loss": 0.048, "step": 101830 }, { - "epoch": 1.1, - "learning_rate": 0.0001347718865598027, - "loss": 0.0345, + "epoch": 0.66, + "learning_rate": 0.00020140508722900273, + "loss": 0.0459, "step": 101840 }, { - "epoch": 1.1, - "learning_rate": 0.00013475566227529365, - "loss": 0.0352, + "epoch": 0.66, + "learning_rate": 0.00020139540587464581, + "loss": 0.0627, "step": 101850 }, { - "epoch": 1.1, - "learning_rate": 0.00013473943799078458, - "loss": 0.0416, + "epoch": 0.66, + "learning_rate": 0.0002013857245202889, + "loss": 0.0418, "step": 101860 }, { - "epoch": 1.1, - "learning_rate": 0.00013472321370627553, - "loss": 0.0403, + "epoch": 0.66, + "learning_rate": 0.00020137604316593195, + "loss": 0.0499, "step": 101870 }, { - "epoch": 1.1, - "learning_rate": 0.00013470698942176648, - "loss": 0.0428, + "epoch": 0.66, + "learning_rate": 0.000201366361811575, + "loss": 0.046, "step": 101880 }, { - "epoch": 1.1, - "learning_rate": 0.00013469076513725743, - "loss": 0.0386, + "epoch": 0.66, + "learning_rate": 0.00020135668045721808, + "loss": 0.0447, "step": 101890 }, { - "epoch": 1.1, - "learning_rate": 0.00013467454085274838, - "loss": 0.0393, + "epoch": 0.66, + "learning_rate": 0.00020134699910286113, + "loss": 0.0471, "step": 101900 }, { - "epoch": 1.1, - "learning_rate": 0.00013465831656823933, - "loss": 0.0356, + "epoch": 0.66, + "learning_rate": 0.0002013373177485042, + "loss": 0.0522, "step": 101910 }, { - "epoch": 1.1, - "learning_rate": 0.00013464209228373028, - "loss": 0.0391, + "epoch": 0.66, + "learning_rate": 0.0002013276363941473, + "loss": 0.0463, "step": 101920 }, { - "epoch": 1.1, - "learning_rate": 0.00013462586799922122, - "loss": 0.0406, + "epoch": 0.66, + "learning_rate": 0.00020131795503979034, + "loss": 0.0388, "step": 101930 }, { - "epoch": 1.1, - "learning_rate": 0.00013460964371471217, - "loss": 0.0373, + "epoch": 0.66, + "learning_rate": 0.00020130827368543342, + "loss": 0.0439, "step": 101940 }, { - "epoch": 1.1, - "learning_rate": 0.0001345934194302031, - "loss": 0.0351, + "epoch": 0.66, + "learning_rate": 0.00020129859233107648, + "loss": 0.0471, "step": 101950 }, { - "epoch": 1.1, - "learning_rate": 0.00013457719514569405, - "loss": 0.0453, + "epoch": 0.66, + "learning_rate": 0.00020128891097671953, + "loss": 0.0507, "step": 101960 }, { - "epoch": 1.1, - "learning_rate": 0.000134560970861185, - "loss": 0.0311, + "epoch": 0.66, + "learning_rate": 0.0002012792296223626, + "loss": 0.0431, "step": 101970 }, { - "epoch": 1.1, - "learning_rate": 0.00013454474657667595, - "loss": 0.0385, + "epoch": 0.66, + "learning_rate": 0.0002012695482680057, + "loss": 0.0494, "step": 101980 }, { - "epoch": 1.1, - "learning_rate": 0.0001345285222921669, - "loss": 0.0322, + "epoch": 0.66, + "learning_rate": 0.00020125986691364877, + "loss": 0.0458, "step": 101990 }, { - "epoch": 1.1, - "learning_rate": 0.00013451229800765785, - "loss": 0.0357, + "epoch": 0.66, + "learning_rate": 0.00020125018555929182, + "loss": 0.0417, "step": 102000 }, { - "epoch": 1.1, - "eval_cer": 0.9211446069466606, - "eval_loss": 0.02821805141866207, - "eval_runtime": 119.0387, - "eval_samples_per_second": 16.801, - "eval_steps_per_second": 4.2, + "epoch": 0.66, + "eval_cer": 0.9199168455541746, + "eval_loss": 0.030525721609592438, + "eval_runtime": 119.742, + "eval_samples_per_second": 16.703, + "eval_steps_per_second": 4.176, "step": 102000 }, { - "epoch": 1.1, - "learning_rate": 0.0001344960737231488, - "loss": 0.039, + "epoch": 0.66, + "learning_rate": 0.0002012405042049349, + "loss": 0.05, "step": 102010 }, { - "epoch": 1.1, - "learning_rate": 0.00013447984943863975, - "loss": 0.0335, + "epoch": 0.66, + "learning_rate": 0.00020123082285057795, + "loss": 0.0474, "step": 102020 }, { - "epoch": 1.1, - "learning_rate": 0.0001344636251541307, - "loss": 0.0372, + "epoch": 0.66, + "learning_rate": 0.000201221141496221, + "loss": 0.0494, "step": 102030 }, { - "epoch": 1.1, - "learning_rate": 0.00013444740086962162, - "loss": 0.0316, + "epoch": 0.66, + "learning_rate": 0.0002012114601418641, + "loss": 0.0406, "step": 102040 }, { - "epoch": 1.1, - "learning_rate": 0.00013443117658511257, - "loss": 0.0381, + "epoch": 0.66, + "learning_rate": 0.00020120177878750717, + "loss": 0.0457, "step": 102050 }, { - "epoch": 1.1, - "learning_rate": 0.00013441495230060352, - "loss": 0.0359, + "epoch": 0.66, + "learning_rate": 0.00020119209743315025, + "loss": 0.0478, "step": 102060 }, { - "epoch": 1.1, - "learning_rate": 0.00013439872801609447, - "loss": 0.033, + "epoch": 0.66, + "learning_rate": 0.0002011824160787933, + "loss": 0.0457, "step": 102070 }, { - "epoch": 1.1, - "learning_rate": 0.00013438250373158544, - "loss": 0.0323, + "epoch": 0.66, + "learning_rate": 0.00020117273472443638, + "loss": 0.0444, "step": 102080 }, { - "epoch": 1.1, - "learning_rate": 0.00013436627944707637, - "loss": 0.0341, + "epoch": 0.66, + "learning_rate": 0.00020116305337007943, + "loss": 0.0518, "step": 102090 }, { - "epoch": 1.1, - "learning_rate": 0.00013435005516256732, - "loss": 0.0372, + "epoch": 0.66, + "learning_rate": 0.00020115337201572248, + "loss": 0.0436, "step": 102100 }, { - "epoch": 1.1, - "learning_rate": 0.00013433383087805827, - "loss": 0.0382, + "epoch": 0.66, + "learning_rate": 0.00020114369066136556, + "loss": 0.0449, "step": 102110 }, { - "epoch": 1.1, - "learning_rate": 0.00013431760659354922, - "loss": 0.0435, + "epoch": 0.66, + "learning_rate": 0.00020113400930700864, + "loss": 0.0486, "step": 102120 }, { - "epoch": 1.1, - "learning_rate": 0.00013430138230904017, - "loss": 0.034, + "epoch": 0.66, + "learning_rate": 0.0002011243279526517, + "loss": 0.0433, "step": 102130 }, { - "epoch": 1.1, - "learning_rate": 0.00013428515802453112, - "loss": 0.0319, + "epoch": 0.66, + "learning_rate": 0.00020111464659829478, + "loss": 0.0478, "step": 102140 }, { - "epoch": 1.1, - "learning_rate": 0.00013426893374002207, - "loss": 0.0336, + "epoch": 0.66, + "learning_rate": 0.00020110496524393786, + "loss": 0.0522, "step": 102150 }, { - "epoch": 1.1, - "learning_rate": 0.00013425270945551302, - "loss": 0.0383, + "epoch": 0.66, + "learning_rate": 0.00020109528388958088, + "loss": 0.0468, "step": 102160 }, { - "epoch": 1.11, - "learning_rate": 0.00013423648517100397, - "loss": 0.0389, + "epoch": 0.66, + "learning_rate": 0.00020108560253522396, + "loss": 0.0452, "step": 102170 }, { - "epoch": 1.11, - "learning_rate": 0.00013422026088649491, - "loss": 0.034, + "epoch": 0.66, + "learning_rate": 0.00020107592118086704, + "loss": 0.0551, "step": 102180 }, { - "epoch": 1.11, - "learning_rate": 0.00013420403660198584, - "loss": 0.0383, + "epoch": 0.66, + "learning_rate": 0.00020106623982651012, + "loss": 0.0455, "step": 102190 }, { - "epoch": 1.11, - "learning_rate": 0.0001341878123174768, - "loss": 0.0368, + "epoch": 0.66, + "learning_rate": 0.00020105655847215317, + "loss": 0.0429, "step": 102200 }, { - "epoch": 1.11, - "learning_rate": 0.00013417158803296774, - "loss": 0.0376, + "epoch": 0.66, + "learning_rate": 0.00020104687711779625, + "loss": 0.0448, "step": 102210 }, { - "epoch": 1.11, - "learning_rate": 0.0001341553637484587, - "loss": 0.0366, + "epoch": 0.66, + "learning_rate": 0.00020103719576343933, + "loss": 0.0562, "step": 102220 }, { - "epoch": 1.11, - "learning_rate": 0.00013413913946394964, - "loss": 0.0363, + "epoch": 0.66, + "learning_rate": 0.00020102751440908236, + "loss": 0.0449, "step": 102230 }, { - "epoch": 1.11, - "learning_rate": 0.00013412291517944059, - "loss": 0.0373, + "epoch": 0.66, + "learning_rate": 0.00020101783305472544, + "loss": 0.0485, "step": 102240 }, { - "epoch": 1.11, - "learning_rate": 0.00013410669089493154, - "loss": 0.0386, + "epoch": 0.66, + "learning_rate": 0.00020100815170036852, + "loss": 0.0474, "step": 102250 }, { - "epoch": 1.11, - "learning_rate": 0.00013409046661042249, - "loss": 0.0319, + "epoch": 0.66, + "learning_rate": 0.0002009984703460116, + "loss": 0.0434, "step": 102260 }, { - "epoch": 1.11, - "learning_rate": 0.00013407424232591344, - "loss": 0.0412, + "epoch": 0.66, + "learning_rate": 0.00020098878899165465, + "loss": 0.0497, "step": 102270 }, { - "epoch": 1.11, - "learning_rate": 0.00013405801804140436, - "loss": 0.0341, + "epoch": 0.66, + "learning_rate": 0.00020097910763729773, + "loss": 0.0483, "step": 102280 }, { - "epoch": 1.11, - "learning_rate": 0.0001340417937568953, - "loss": 0.035, + "epoch": 0.66, + "learning_rate": 0.0002009694262829408, + "loss": 0.0473, "step": 102290 }, { - "epoch": 1.11, - "learning_rate": 0.00013402556947238626, - "loss": 0.0375, + "epoch": 0.66, + "learning_rate": 0.00020095974492858384, + "loss": 0.0439, "step": 102300 }, { - "epoch": 1.11, - "learning_rate": 0.0001340093451878772, - "loss": 0.0342, + "epoch": 0.66, + "learning_rate": 0.00020095006357422692, + "loss": 0.0493, "step": 102310 }, { - "epoch": 1.11, - "learning_rate": 0.00013399312090336816, - "loss": 0.0344, + "epoch": 0.66, + "learning_rate": 0.00020094038221987, + "loss": 0.0524, "step": 102320 }, { - "epoch": 1.11, - "learning_rate": 0.0001339768966188591, - "loss": 0.0311, + "epoch": 0.66, + "learning_rate": 0.00020093070086551305, + "loss": 0.0437, "step": 102330 }, { - "epoch": 1.11, - "learning_rate": 0.00013396067233435006, - "loss": 0.0302, + "epoch": 0.66, + "learning_rate": 0.00020092101951115613, + "loss": 0.0463, "step": 102340 }, { - "epoch": 1.11, - "learning_rate": 0.000133944448049841, - "loss": 0.0377, + "epoch": 0.66, + "learning_rate": 0.0002009113381567992, + "loss": 0.0506, "step": 102350 }, { - "epoch": 1.11, - "learning_rate": 0.00013392822376533196, - "loss": 0.0343, + "epoch": 0.66, + "learning_rate": 0.0002009016568024423, + "loss": 0.0425, "step": 102360 }, { - "epoch": 1.11, - "learning_rate": 0.00013391199948082288, - "loss": 0.0358, + "epoch": 0.66, + "learning_rate": 0.0002008919754480853, + "loss": 0.0461, "step": 102370 }, { - "epoch": 1.11, - "learning_rate": 0.00013389577519631383, - "loss": 0.0313, + "epoch": 0.66, + "learning_rate": 0.0002008822940937284, + "loss": 0.0437, "step": 102380 }, { - "epoch": 1.11, - "learning_rate": 0.00013387955091180478, - "loss": 0.0374, + "epoch": 0.66, + "learning_rate": 0.00020087261273937147, + "loss": 0.0471, "step": 102390 }, { - "epoch": 1.11, - "learning_rate": 0.00013386332662729573, - "loss": 0.0349, + "epoch": 0.66, + "learning_rate": 0.00020086293138501453, + "loss": 0.0465, "step": 102400 }, { - "epoch": 1.11, - "learning_rate": 0.00013384710234278668, - "loss": 0.0351, + "epoch": 0.66, + "learning_rate": 0.0002008532500306576, + "loss": 0.0482, "step": 102410 }, { - "epoch": 1.11, - "learning_rate": 0.00013383087805827763, - "loss": 0.0351, + "epoch": 0.66, + "learning_rate": 0.00020084356867630069, + "loss": 0.039, "step": 102420 }, { - "epoch": 1.11, - "learning_rate": 0.00013381465377376858, - "loss": 0.038, + "epoch": 0.66, + "learning_rate": 0.00020083388732194377, + "loss": 0.0457, "step": 102430 }, { - "epoch": 1.11, - "learning_rate": 0.00013379842948925953, + "epoch": 0.66, + "learning_rate": 0.0002008242059675868, "loss": 0.0401, "step": 102440 }, { - "epoch": 1.11, - "learning_rate": 0.00013378220520475048, - "loss": 0.038, + "epoch": 0.66, + "learning_rate": 0.00020081452461322987, + "loss": 0.052, "step": 102450 }, { - "epoch": 1.11, - "learning_rate": 0.0001337659809202414, - "loss": 0.0385, + "epoch": 0.66, + "learning_rate": 0.00020080484325887295, + "loss": 0.047, "step": 102460 }, { - "epoch": 1.11, - "learning_rate": 0.00013374975663573235, - "loss": 0.0369, + "epoch": 0.66, + "learning_rate": 0.000200795161904516, + "loss": 0.0437, "step": 102470 }, { - "epoch": 1.11, - "learning_rate": 0.0001337335323512233, - "loss": 0.0357, + "epoch": 0.66, + "learning_rate": 0.00020078548055015908, + "loss": 0.044, "step": 102480 }, { - "epoch": 1.11, - "learning_rate": 0.00013371730806671425, - "loss": 0.0321, + "epoch": 0.66, + "learning_rate": 0.00020077579919580216, + "loss": 0.0462, "step": 102490 }, { - "epoch": 1.11, - "learning_rate": 0.0001337010837822052, - "loss": 0.0316, + "epoch": 0.66, + "learning_rate": 0.00020076611784144522, + "loss": 0.0457, "step": 102500 }, { - "epoch": 1.11, - "learning_rate": 0.00013368485949769615, - "loss": 0.0356, + "epoch": 0.66, + "learning_rate": 0.00020075643648708827, + "loss": 0.0513, "step": 102510 }, { - "epoch": 1.11, - "learning_rate": 0.0001336686352131871, - "loss": 0.0338, + "epoch": 0.66, + "learning_rate": 0.00020074675513273135, + "loss": 0.0517, "step": 102520 }, { - "epoch": 1.11, - "learning_rate": 0.00013365241092867805, - "loss": 0.0387, + "epoch": 0.66, + "learning_rate": 0.0002007370737783744, + "loss": 0.0463, "step": 102530 }, { - "epoch": 1.11, - "learning_rate": 0.000133636186644169, - "loss": 0.0401, + "epoch": 0.66, + "learning_rate": 0.00020072739242401748, + "loss": 0.0493, "step": 102540 }, { - "epoch": 1.11, - "learning_rate": 0.00013361996235965992, - "loss": 0.0347, + "epoch": 0.66, + "learning_rate": 0.00020071771106966056, + "loss": 0.0418, "step": 102550 }, { - "epoch": 1.11, - "learning_rate": 0.00013360373807515087, - "loss": 0.031, + "epoch": 0.66, + "learning_rate": 0.00020070802971530364, + "loss": 0.0437, "step": 102560 }, { - "epoch": 1.11, - "learning_rate": 0.00013358751379064182, - "loss": 0.038, + "epoch": 0.66, + "learning_rate": 0.0002006983483609467, + "loss": 0.0427, "step": 102570 }, { - "epoch": 1.11, - "learning_rate": 0.00013357128950613277, - "loss": 0.0361, + "epoch": 0.66, + "learning_rate": 0.00020068866700658975, + "loss": 0.0472, "step": 102580 }, { - "epoch": 1.11, - "learning_rate": 0.00013355506522162372, - "loss": 0.0343, + "epoch": 0.66, + "learning_rate": 0.00020067898565223282, + "loss": 0.0449, "step": 102590 }, { - "epoch": 1.11, - "learning_rate": 0.00013353884093711467, - "loss": 0.0365, + "epoch": 0.66, + "learning_rate": 0.00020066930429787588, + "loss": 0.0486, "step": 102600 }, { - "epoch": 1.11, - "learning_rate": 0.00013352261665260562, - "loss": 0.0315, + "epoch": 0.66, + "learning_rate": 0.00020065962294351896, + "loss": 0.0511, "step": 102610 }, { - "epoch": 1.11, - "learning_rate": 0.00013350639236809657, - "loss": 0.0287, + "epoch": 0.66, + "learning_rate": 0.00020064994158916204, + "loss": 0.0461, "step": 102620 }, { - "epoch": 1.11, - "learning_rate": 0.00013349016808358752, - "loss": 0.0334, + "epoch": 0.66, + "learning_rate": 0.00020064026023480512, + "loss": 0.0518, "step": 102630 }, { - "epoch": 1.11, - "learning_rate": 0.00013347394379907844, - "loss": 0.0332, + "epoch": 0.66, + "learning_rate": 0.00020063057888044817, + "loss": 0.0511, "step": 102640 }, { - "epoch": 1.11, - "learning_rate": 0.0001334577195145694, - "loss": 0.0405, + "epoch": 0.66, + "learning_rate": 0.00020062089752609122, + "loss": 0.0422, "step": 102650 }, { - "epoch": 1.11, - "learning_rate": 0.00013344149523006034, - "loss": 0.0373, + "epoch": 0.66, + "learning_rate": 0.0002006112161717343, + "loss": 0.0449, "step": 102660 }, { - "epoch": 1.11, - "learning_rate": 0.0001334252709455513, - "loss": 0.0318, + "epoch": 0.66, + "learning_rate": 0.00020060153481737735, + "loss": 0.0436, "step": 102670 }, { - "epoch": 1.11, - "learning_rate": 0.00013340904666104224, - "loss": 0.0406, + "epoch": 0.66, + "learning_rate": 0.00020059185346302043, + "loss": 0.049, "step": 102680 }, { - "epoch": 1.11, - "learning_rate": 0.0001333928223765332, - "loss": 0.0296, + "epoch": 0.66, + "learning_rate": 0.00020058217210866351, + "loss": 0.0406, "step": 102690 }, { - "epoch": 1.11, - "learning_rate": 0.00013337659809202414, - "loss": 0.0348, + "epoch": 0.66, + "learning_rate": 0.0002005724907543066, + "loss": 0.0473, "step": 102700 }, { - "epoch": 1.11, - "learning_rate": 0.0001333603738075151, - "loss": 0.0352, + "epoch": 0.66, + "learning_rate": 0.00020056280939994965, + "loss": 0.0431, "step": 102710 }, { - "epoch": 1.11, - "learning_rate": 0.00013334414952300604, - "loss": 0.0394, + "epoch": 0.66, + "learning_rate": 0.0002005531280455927, + "loss": 0.0457, "step": 102720 }, { - "epoch": 1.11, - "learning_rate": 0.00013332792523849696, - "loss": 0.035, + "epoch": 0.66, + "learning_rate": 0.00020054344669123575, + "loss": 0.0441, "step": 102730 }, { - "epoch": 1.11, - "learning_rate": 0.0001333117009539879, - "loss": 0.0309, + "epoch": 0.66, + "learning_rate": 0.00020053376533687883, + "loss": 0.0397, "step": 102740 }, { - "epoch": 1.11, - "learning_rate": 0.00013329547666947886, - "loss": 0.0396, + "epoch": 0.66, + "learning_rate": 0.0002005240839825219, + "loss": 0.0469, "step": 102750 }, { - "epoch": 1.11, - "learning_rate": 0.0001332792523849698, - "loss": 0.0405, + "epoch": 0.66, + "learning_rate": 0.000200514402628165, + "loss": 0.0437, "step": 102760 }, { - "epoch": 1.11, - "learning_rate": 0.00013326302810046076, - "loss": 0.0383, + "epoch": 0.66, + "learning_rate": 0.00020050472127380804, + "loss": 0.0456, "step": 102770 }, { - "epoch": 1.11, - "learning_rate": 0.0001332468038159517, - "loss": 0.0369, + "epoch": 0.66, + "learning_rate": 0.00020049503991945112, + "loss": 0.0407, "step": 102780 }, { - "epoch": 1.11, - "learning_rate": 0.00013323057953144266, - "loss": 0.0332, + "epoch": 0.66, + "learning_rate": 0.00020048535856509418, + "loss": 0.0487, "step": 102790 }, { - "epoch": 1.11, - "learning_rate": 0.0001332143552469336, - "loss": 0.0392, + "epoch": 0.66, + "learning_rate": 0.00020047567721073723, + "loss": 0.0377, "step": 102800 }, { - "epoch": 1.11, - "learning_rate": 0.00013319813096242456, - "loss": 0.031, + "epoch": 0.66, + "learning_rate": 0.0002004659958563803, + "loss": 0.0434, "step": 102810 }, { - "epoch": 1.11, - "learning_rate": 0.00013318190667791548, - "loss": 0.0395, + "epoch": 0.66, + "learning_rate": 0.0002004563145020234, + "loss": 0.046, "step": 102820 }, { - "epoch": 1.11, - "learning_rate": 0.00013316568239340643, - "loss": 0.0322, + "epoch": 0.66, + "learning_rate": 0.00020044663314766647, + "loss": 0.0498, "step": 102830 }, { - "epoch": 1.11, - "learning_rate": 0.00013314945810889738, - "loss": 0.0328, + "epoch": 0.66, + "learning_rate": 0.00020043695179330952, + "loss": 0.0477, "step": 102840 }, { - "epoch": 1.11, - "learning_rate": 0.00013313323382438833, - "loss": 0.0347, + "epoch": 0.66, + "learning_rate": 0.0002004272704389526, + "loss": 0.0487, "step": 102850 }, { - "epoch": 1.11, - "learning_rate": 0.00013311700953987928, - "loss": 0.0353, + "epoch": 0.66, + "learning_rate": 0.00020041758908459565, + "loss": 0.0491, "step": 102860 }, { - "epoch": 1.11, - "learning_rate": 0.00013310078525537023, - "loss": 0.0391, + "epoch": 0.66, + "learning_rate": 0.0002004079077302387, + "loss": 0.0535, "step": 102870 }, { - "epoch": 1.11, - "learning_rate": 0.00013308456097086118, - "loss": 0.042, + "epoch": 0.66, + "learning_rate": 0.0002003982263758818, + "loss": 0.045, "step": 102880 }, { - "epoch": 1.11, - "learning_rate": 0.00013306833668635213, - "loss": 0.0386, + "epoch": 0.66, + "learning_rate": 0.00020038854502152487, + "loss": 0.0431, "step": 102890 }, { - "epoch": 1.11, - "learning_rate": 0.00013305211240184308, - "loss": 0.0342, + "epoch": 0.66, + "learning_rate": 0.00020037886366716795, + "loss": 0.0458, "step": 102900 }, { - "epoch": 1.11, - "learning_rate": 0.000133035888117334, - "loss": 0.043, + "epoch": 0.66, + "learning_rate": 0.000200369182312811, + "loss": 0.045, "step": 102910 }, { - "epoch": 1.11, - "learning_rate": 0.00013301966383282495, - "loss": 0.0352, + "epoch": 0.66, + "learning_rate": 0.00020035950095845408, + "loss": 0.0491, "step": 102920 }, { - "epoch": 1.11, - "learning_rate": 0.0001330034395483159, - "loss": 0.0335, + "epoch": 0.66, + "learning_rate": 0.0002003498196040971, + "loss": 0.0508, "step": 102930 }, { - "epoch": 1.11, - "learning_rate": 0.00013298721526380685, - "loss": 0.0351, + "epoch": 0.66, + "learning_rate": 0.00020034013824974018, + "loss": 0.0462, "step": 102940 }, { - "epoch": 1.11, - "learning_rate": 0.0001329709909792978, - "loss": 0.0366, + "epoch": 0.66, + "learning_rate": 0.00020033045689538326, + "loss": 0.0458, "step": 102950 }, { - "epoch": 1.11, - "learning_rate": 0.00013295476669478875, - "loss": 0.0341, + "epoch": 0.66, + "learning_rate": 0.00020032077554102634, + "loss": 0.0471, "step": 102960 }, { - "epoch": 1.11, - "learning_rate": 0.0001329385424102797, - "loss": 0.0395, + "epoch": 0.66, + "learning_rate": 0.0002003110941866694, + "loss": 0.0428, "step": 102970 }, { - "epoch": 1.11, - "learning_rate": 0.00013292231812577065, - "loss": 0.04, + "epoch": 0.66, + "learning_rate": 0.00020030141283231248, + "loss": 0.0529, "step": 102980 }, { - "epoch": 1.11, - "learning_rate": 0.0001329060938412616, - "loss": 0.0316, + "epoch": 0.66, + "learning_rate": 0.00020029173147795556, + "loss": 0.053, "step": 102990 }, { - "epoch": 1.11, - "learning_rate": 0.00013288986955675253, - "loss": 0.0413, + "epoch": 0.66, + "learning_rate": 0.00020028205012359858, + "loss": 0.0456, "step": 103000 }, { - "epoch": 1.11, - "eval_cer": 0.9210960153090163, - "eval_loss": 0.028240669518709183, - "eval_runtime": 119.0594, - "eval_samples_per_second": 16.798, - "eval_steps_per_second": 4.2, + "epoch": 0.66, + "eval_cer": 0.919939441870975, + "eval_loss": 0.030785538256168365, + "eval_runtime": 119.6928, + "eval_samples_per_second": 16.709, + "eval_steps_per_second": 4.177, "step": 103000 }, { - "epoch": 1.11, - "learning_rate": 0.00013287364527224347, - "loss": 0.0315, + "epoch": 0.66, + "learning_rate": 0.00020027236876924166, + "loss": 0.0453, "step": 103010 }, { - "epoch": 1.11, - "learning_rate": 0.00013285742098773442, - "loss": 0.0472, + "epoch": 0.66, + "learning_rate": 0.00020026268741488474, + "loss": 0.0431, "step": 103020 }, { - "epoch": 1.11, - "learning_rate": 0.00013284119670322537, - "loss": 0.0375, + "epoch": 0.66, + "learning_rate": 0.00020025300606052782, + "loss": 0.0539, "step": 103030 }, { - "epoch": 1.11, - "learning_rate": 0.00013282497241871632, - "loss": 0.0345, + "epoch": 0.67, + "learning_rate": 0.00020024332470617087, + "loss": 0.0385, "step": 103040 }, { - "epoch": 1.11, - "learning_rate": 0.00013280874813420727, - "loss": 0.0336, + "epoch": 0.67, + "learning_rate": 0.00020023364335181395, + "loss": 0.0449, "step": 103050 }, { - "epoch": 1.11, - "learning_rate": 0.00013279252384969822, - "loss": 0.0354, + "epoch": 0.67, + "learning_rate": 0.00020022396199745703, + "loss": 0.053, "step": 103060 }, { - "epoch": 1.11, - "learning_rate": 0.00013277629956518917, - "loss": 0.032, + "epoch": 0.67, + "learning_rate": 0.00020021428064310006, + "loss": 0.0456, "step": 103070 }, { - "epoch": 1.11, - "learning_rate": 0.00013276007528068012, - "loss": 0.0291, + "epoch": 0.67, + "learning_rate": 0.00020020459928874314, + "loss": 0.0492, "step": 103080 }, { - "epoch": 1.12, - "learning_rate": 0.00013274385099617105, - "loss": 0.0346, + "epoch": 0.67, + "learning_rate": 0.00020019491793438622, + "loss": 0.043, "step": 103090 }, { - "epoch": 1.12, - "learning_rate": 0.000132727626711662, - "loss": 0.0419, + "epoch": 0.67, + "learning_rate": 0.0002001852365800293, + "loss": 0.0574, "step": 103100 }, { - "epoch": 1.12, - "learning_rate": 0.00013271140242715295, - "loss": 0.0362, + "epoch": 0.67, + "learning_rate": 0.00020017555522567235, + "loss": 0.0475, "step": 103110 }, { - "epoch": 1.12, - "learning_rate": 0.0001326951781426439, - "loss": 0.0407, + "epoch": 0.67, + "learning_rate": 0.00020016587387131543, + "loss": 0.0429, "step": 103120 }, { - "epoch": 1.12, - "learning_rate": 0.00013267895385813484, - "loss": 0.0373, + "epoch": 0.67, + "learning_rate": 0.0002001561925169585, + "loss": 0.0534, "step": 103130 }, { - "epoch": 1.12, - "learning_rate": 0.0001326627295736258, - "loss": 0.0352, + "epoch": 0.67, + "learning_rate": 0.00020014651116260154, + "loss": 0.046, "step": 103140 }, { - "epoch": 1.12, - "learning_rate": 0.00013264650528911674, - "loss": 0.0364, + "epoch": 0.67, + "learning_rate": 0.00020013682980824462, + "loss": 0.0478, "step": 103150 }, { - "epoch": 1.12, - "learning_rate": 0.0001326302810046077, - "loss": 0.041, + "epoch": 0.67, + "learning_rate": 0.0002001271484538877, + "loss": 0.0435, "step": 103160 }, { - "epoch": 1.12, - "learning_rate": 0.00013261405672009864, - "loss": 0.042, + "epoch": 0.67, + "learning_rate": 0.00020011746709953075, + "loss": 0.0449, "step": 103170 }, { - "epoch": 1.12, - "learning_rate": 0.00013259783243558957, - "loss": 0.0389, + "epoch": 0.67, + "learning_rate": 0.00020010778574517383, + "loss": 0.0477, "step": 103180 }, { - "epoch": 1.12, - "learning_rate": 0.00013258160815108052, - "loss": 0.039, + "epoch": 0.67, + "learning_rate": 0.0002000981043908169, + "loss": 0.0385, "step": 103190 }, { - "epoch": 1.12, - "learning_rate": 0.00013256538386657147, - "loss": 0.0358, + "epoch": 0.67, + "learning_rate": 0.00020008842303646, + "loss": 0.0444, "step": 103200 }, { - "epoch": 1.12, - "learning_rate": 0.00013254915958206242, - "loss": 0.0366, + "epoch": 0.67, + "learning_rate": 0.000200078741682103, + "loss": 0.045, "step": 103210 }, { - "epoch": 1.12, - "learning_rate": 0.00013253293529755337, - "loss": 0.0362, + "epoch": 0.67, + "learning_rate": 0.0002000690603277461, + "loss": 0.0497, "step": 103220 }, { - "epoch": 1.12, - "learning_rate": 0.00013251671101304432, - "loss": 0.0365, + "epoch": 0.67, + "learning_rate": 0.00020005937897338917, + "loss": 0.0449, "step": 103230 }, { - "epoch": 1.12, - "learning_rate": 0.00013250048672853527, - "loss": 0.0426, + "epoch": 0.67, + "learning_rate": 0.00020004969761903223, + "loss": 0.0404, "step": 103240 }, { - "epoch": 1.12, - "learning_rate": 0.00013248426244402622, - "loss": 0.0351, + "epoch": 0.67, + "learning_rate": 0.0002000400162646753, + "loss": 0.0503, "step": 103250 }, { - "epoch": 1.12, - "learning_rate": 0.00013246803815951716, - "loss": 0.0402, + "epoch": 0.67, + "learning_rate": 0.00020003033491031838, + "loss": 0.0449, "step": 103260 }, { - "epoch": 1.12, - "learning_rate": 0.0001324518138750081, - "loss": 0.0348, + "epoch": 0.67, + "learning_rate": 0.00020002065355596146, + "loss": 0.0496, "step": 103270 }, { - "epoch": 1.12, - "learning_rate": 0.00013243558959049904, - "loss": 0.034, + "epoch": 0.67, + "learning_rate": 0.0002000109722016045, + "loss": 0.0493, "step": 103280 }, { - "epoch": 1.12, - "learning_rate": 0.00013241936530599, - "loss": 0.0387, + "epoch": 0.67, + "learning_rate": 0.00020000129084724757, + "loss": 0.0462, "step": 103290 }, { - "epoch": 1.12, - "learning_rate": 0.00013240314102148094, - "loss": 0.0362, + "epoch": 0.67, + "learning_rate": 0.00019999160949289065, + "loss": 0.0509, "step": 103300 }, { - "epoch": 1.12, - "learning_rate": 0.0001323869167369719, - "loss": 0.0317, + "epoch": 0.67, + "learning_rate": 0.0001999819281385337, + "loss": 0.0542, "step": 103310 }, { - "epoch": 1.12, - "learning_rate": 0.00013237069245246284, - "loss": 0.0326, + "epoch": 0.67, + "learning_rate": 0.00019997224678417678, + "loss": 0.0417, "step": 103320 }, { - "epoch": 1.12, - "learning_rate": 0.00013235446816795379, - "loss": 0.0394, + "epoch": 0.67, + "learning_rate": 0.00019996256542981986, + "loss": 0.0477, "step": 103330 }, { - "epoch": 1.12, - "learning_rate": 0.00013233824388344474, - "loss": 0.0385, + "epoch": 0.67, + "learning_rate": 0.00019995288407546291, + "loss": 0.0455, "step": 103340 }, { - "epoch": 1.12, - "learning_rate": 0.00013232201959893569, - "loss": 0.0328, + "epoch": 0.67, + "learning_rate": 0.00019994320272110597, + "loss": 0.0551, "step": 103350 }, { - "epoch": 1.12, - "learning_rate": 0.0001323057953144266, - "loss": 0.0413, + "epoch": 0.67, + "learning_rate": 0.00019993352136674905, + "loss": 0.0482, "step": 103360 }, { - "epoch": 1.12, - "learning_rate": 0.00013228957102991756, - "loss": 0.0359, + "epoch": 0.67, + "learning_rate": 0.0001999238400123921, + "loss": 0.05, "step": 103370 }, { - "epoch": 1.12, - "learning_rate": 0.0001322733467454085, - "loss": 0.0352, + "epoch": 0.67, + "learning_rate": 0.00019991415865803518, + "loss": 0.0518, "step": 103380 }, { - "epoch": 1.12, - "learning_rate": 0.00013225712246089946, - "loss": 0.0363, + "epoch": 0.67, + "learning_rate": 0.00019990447730367826, + "loss": 0.0447, "step": 103390 }, { - "epoch": 1.12, - "learning_rate": 0.0001322408981763904, - "loss": 0.04, + "epoch": 0.67, + "learning_rate": 0.00019989479594932134, + "loss": 0.0438, "step": 103400 }, { - "epoch": 1.12, - "learning_rate": 0.00013222467389188136, - "loss": 0.0306, + "epoch": 0.67, + "learning_rate": 0.0001998851145949644, + "loss": 0.0516, "step": 103410 }, { - "epoch": 1.12, - "learning_rate": 0.0001322084496073723, - "loss": 0.0352, + "epoch": 0.67, + "learning_rate": 0.00019987543324060744, + "loss": 0.0451, "step": 103420 }, { - "epoch": 1.12, - "learning_rate": 0.00013219222532286326, - "loss": 0.0323, + "epoch": 0.67, + "learning_rate": 0.00019986575188625052, + "loss": 0.0448, "step": 103430 }, { - "epoch": 1.12, - "learning_rate": 0.0001321760010383542, - "loss": 0.0402, + "epoch": 0.67, + "learning_rate": 0.00019985607053189358, + "loss": 0.0439, "step": 103440 }, { - "epoch": 1.12, - "learning_rate": 0.00013215977675384513, - "loss": 0.0376, + "epoch": 0.67, + "learning_rate": 0.00019984638917753666, + "loss": 0.043, "step": 103450 }, { - "epoch": 1.12, - "learning_rate": 0.00013214355246933608, - "loss": 0.0372, + "epoch": 0.67, + "learning_rate": 0.00019983670782317974, + "loss": 0.0479, "step": 103460 }, { - "epoch": 1.12, - "learning_rate": 0.00013212732818482703, - "loss": 0.0362, + "epoch": 0.67, + "learning_rate": 0.00019982702646882282, + "loss": 0.0421, "step": 103470 }, { - "epoch": 1.12, - "learning_rate": 0.00013211110390031798, - "loss": 0.0332, + "epoch": 0.67, + "learning_rate": 0.00019981734511446587, + "loss": 0.0508, "step": 103480 }, { - "epoch": 1.12, - "learning_rate": 0.00013209487961580893, - "loss": 0.0363, + "epoch": 0.67, + "learning_rate": 0.00019980766376010892, + "loss": 0.0456, "step": 103490 }, { - "epoch": 1.12, - "learning_rate": 0.00013207865533129988, - "loss": 0.0401, + "epoch": 0.67, + "learning_rate": 0.000199797982405752, + "loss": 0.0461, "step": 103500 }, { - "epoch": 1.12, - "learning_rate": 0.00013206243104679083, - "loss": 0.0369, + "epoch": 0.67, + "learning_rate": 0.00019978830105139505, + "loss": 0.0471, "step": 103510 }, { - "epoch": 1.12, - "learning_rate": 0.00013204620676228178, - "loss": 0.04, + "epoch": 0.67, + "learning_rate": 0.00019977861969703813, + "loss": 0.0466, "step": 103520 }, { - "epoch": 1.12, - "learning_rate": 0.00013202998247777273, - "loss": 0.0353, + "epoch": 0.67, + "learning_rate": 0.00019976893834268121, + "loss": 0.0526, "step": 103530 }, { - "epoch": 1.12, - "learning_rate": 0.00013201375819326365, - "loss": 0.0373, + "epoch": 0.67, + "learning_rate": 0.00019975925698832427, + "loss": 0.0476, "step": 103540 }, { - "epoch": 1.12, - "learning_rate": 0.0001319975339087546, - "loss": 0.0328, + "epoch": 0.67, + "learning_rate": 0.00019974957563396735, + "loss": 0.0433, "step": 103550 }, { - "epoch": 1.12, - "learning_rate": 0.00013198130962424555, - "loss": 0.0396, + "epoch": 0.67, + "learning_rate": 0.0001997398942796104, + "loss": 0.0464, "step": 103560 }, { - "epoch": 1.12, - "learning_rate": 0.0001319650853397365, - "loss": 0.0349, + "epoch": 0.67, + "learning_rate": 0.00019973021292525345, + "loss": 0.043, "step": 103570 }, { - "epoch": 1.12, - "learning_rate": 0.00013194886105522745, - "loss": 0.0375, + "epoch": 0.67, + "learning_rate": 0.00019972053157089653, + "loss": 0.0409, "step": 103580 }, { - "epoch": 1.12, - "learning_rate": 0.0001319326367707184, - "loss": 0.036, + "epoch": 0.67, + "learning_rate": 0.0001997108502165396, + "loss": 0.0412, "step": 103590 }, { - "epoch": 1.12, - "learning_rate": 0.00013191641248620935, - "loss": 0.0333, + "epoch": 0.67, + "learning_rate": 0.0001997011688621827, + "loss": 0.0462, "step": 103600 }, { - "epoch": 1.12, - "learning_rate": 0.0001319001882017003, - "loss": 0.0345, + "epoch": 0.67, + "learning_rate": 0.00019969148750782574, + "loss": 0.0477, "step": 103610 }, { - "epoch": 1.12, - "learning_rate": 0.00013188396391719125, - "loss": 0.0353, + "epoch": 0.67, + "learning_rate": 0.00019968180615346882, + "loss": 0.049, "step": 103620 }, { - "epoch": 1.12, - "learning_rate": 0.0001318677396326822, - "loss": 0.0347, + "epoch": 0.67, + "learning_rate": 0.00019967212479911188, + "loss": 0.0448, "step": 103630 }, { - "epoch": 1.12, - "learning_rate": 0.00013185151534817312, - "loss": 0.0317, + "epoch": 0.67, + "learning_rate": 0.00019966244344475493, + "loss": 0.0502, "step": 103640 }, { - "epoch": 1.12, - "learning_rate": 0.00013183529106366407, - "loss": 0.0304, + "epoch": 0.67, + "learning_rate": 0.000199652762090398, + "loss": 0.0501, "step": 103650 }, { - "epoch": 1.12, - "learning_rate": 0.00013181906677915502, - "loss": 0.0348, + "epoch": 0.67, + "learning_rate": 0.0001996430807360411, + "loss": 0.0457, "step": 103660 }, { - "epoch": 1.12, - "learning_rate": 0.00013180284249464597, - "loss": 0.0318, + "epoch": 0.67, + "learning_rate": 0.00019963339938168417, + "loss": 0.0539, "step": 103670 }, { - "epoch": 1.12, - "learning_rate": 0.00013178661821013692, - "loss": 0.0313, + "epoch": 0.67, + "learning_rate": 0.00019962371802732722, + "loss": 0.0468, "step": 103680 }, { - "epoch": 1.12, - "learning_rate": 0.00013177039392562787, - "loss": 0.0401, + "epoch": 0.67, + "learning_rate": 0.0001996140366729703, + "loss": 0.0504, "step": 103690 }, { - "epoch": 1.12, - "learning_rate": 0.00013175416964111882, - "loss": 0.0367, + "epoch": 0.67, + "learning_rate": 0.00019960435531861335, + "loss": 0.0448, "step": 103700 }, { - "epoch": 1.12, - "learning_rate": 0.00013173794535660977, - "loss": 0.0418, + "epoch": 0.67, + "learning_rate": 0.0001995946739642564, + "loss": 0.0468, "step": 103710 }, { - "epoch": 1.12, - "learning_rate": 0.00013172172107210072, - "loss": 0.0341, + "epoch": 0.67, + "learning_rate": 0.00019958499260989949, + "loss": 0.0459, "step": 103720 }, { - "epoch": 1.12, - "learning_rate": 0.00013170549678759164, - "loss": 0.0346, + "epoch": 0.67, + "learning_rate": 0.00019957531125554257, + "loss": 0.045, "step": 103730 }, { - "epoch": 1.12, - "learning_rate": 0.0001316892725030826, - "loss": 0.0418, + "epoch": 0.67, + "learning_rate": 0.00019956562990118562, + "loss": 0.0521, "step": 103740 }, { - "epoch": 1.12, - "learning_rate": 0.00013167304821857354, - "loss": 0.0326, + "epoch": 0.67, + "learning_rate": 0.0001995559485468287, + "loss": 0.046, "step": 103750 }, { - "epoch": 1.12, - "learning_rate": 0.0001316568239340645, - "loss": 0.0284, + "epoch": 0.67, + "learning_rate": 0.00019954626719247178, + "loss": 0.0451, "step": 103760 }, { - "epoch": 1.12, - "learning_rate": 0.00013164059964955544, - "loss": 0.0428, + "epoch": 0.67, + "learning_rate": 0.0001995365858381148, + "loss": 0.0448, "step": 103770 }, { - "epoch": 1.12, - "learning_rate": 0.0001316243753650464, - "loss": 0.036, + "epoch": 0.67, + "learning_rate": 0.00019952690448375788, + "loss": 0.0449, "step": 103780 }, { - "epoch": 1.12, - "learning_rate": 0.00013160815108053734, - "loss": 0.0367, + "epoch": 0.67, + "learning_rate": 0.00019951722312940096, + "loss": 0.0422, "step": 103790 }, { - "epoch": 1.12, - "learning_rate": 0.0001315919267960283, - "loss": 0.0358, + "epoch": 0.67, + "learning_rate": 0.00019950754177504404, + "loss": 0.0552, "step": 103800 }, { - "epoch": 1.12, - "learning_rate": 0.00013157570251151924, - "loss": 0.0384, + "epoch": 0.67, + "learning_rate": 0.0001994978604206871, + "loss": 0.0502, "step": 103810 }, { - "epoch": 1.12, - "learning_rate": 0.00013155947822701016, - "loss": 0.0408, + "epoch": 0.67, + "learning_rate": 0.00019948817906633018, + "loss": 0.0495, "step": 103820 }, { - "epoch": 1.12, - "learning_rate": 0.0001315432539425011, - "loss": 0.0373, + "epoch": 0.67, + "learning_rate": 0.00019947849771197326, + "loss": 0.0425, "step": 103830 }, { - "epoch": 1.12, - "learning_rate": 0.00013152702965799206, - "loss": 0.0333, + "epoch": 0.67, + "learning_rate": 0.00019946881635761628, + "loss": 0.0587, "step": 103840 }, { - "epoch": 1.12, - "learning_rate": 0.000131510805373483, - "loss": 0.0403, + "epoch": 0.67, + "learning_rate": 0.00019945913500325936, + "loss": 0.0421, "step": 103850 }, { - "epoch": 1.12, - "learning_rate": 0.00013149458108897396, - "loss": 0.0373, + "epoch": 0.67, + "learning_rate": 0.00019944945364890244, + "loss": 0.0538, "step": 103860 }, { - "epoch": 1.12, - "learning_rate": 0.0001314783568044649, - "loss": 0.035, + "epoch": 0.67, + "learning_rate": 0.00019943977229454552, + "loss": 0.0457, "step": 103870 }, { - "epoch": 1.12, - "learning_rate": 0.00013146213251995586, - "loss": 0.0336, + "epoch": 0.67, + "learning_rate": 0.00019943009094018857, + "loss": 0.0452, "step": 103880 }, { - "epoch": 1.12, - "learning_rate": 0.0001314459082354468, - "loss": 0.033, + "epoch": 0.67, + "learning_rate": 0.00019942040958583165, + "loss": 0.0477, "step": 103890 }, { - "epoch": 1.12, - "learning_rate": 0.00013142968395093776, - "loss": 0.0319, + "epoch": 0.67, + "learning_rate": 0.00019941072823147473, + "loss": 0.0479, "step": 103900 }, { - "epoch": 1.12, - "learning_rate": 0.00013141345966642868, - "loss": 0.0392, + "epoch": 0.67, + "learning_rate": 0.00019940104687711776, + "loss": 0.0428, "step": 103910 }, { - "epoch": 1.12, - "learning_rate": 0.00013139723538191963, - "loss": 0.0329, + "epoch": 0.67, + "learning_rate": 0.00019939136552276084, + "loss": 0.0481, "step": 103920 }, { - "epoch": 1.12, - "learning_rate": 0.00013138101109741058, - "loss": 0.0375, + "epoch": 0.67, + "learning_rate": 0.00019938168416840392, + "loss": 0.0473, "step": 103930 }, { - "epoch": 1.12, - "learning_rate": 0.00013136478681290153, - "loss": 0.0341, + "epoch": 0.67, + "learning_rate": 0.00019937200281404697, + "loss": 0.0503, "step": 103940 }, { - "epoch": 1.12, - "learning_rate": 0.00013134856252839248, - "loss": 0.0346, + "epoch": 0.67, + "learning_rate": 0.00019936232145969005, + "loss": 0.0473, "step": 103950 }, { - "epoch": 1.12, - "learning_rate": 0.00013133233824388343, - "loss": 0.0361, + "epoch": 0.67, + "learning_rate": 0.00019935264010533313, + "loss": 0.0426, "step": 103960 }, { - "epoch": 1.12, - "learning_rate": 0.00013131611395937438, - "loss": 0.0409, + "epoch": 0.67, + "learning_rate": 0.0001993429587509762, + "loss": 0.0507, "step": 103970 }, { - "epoch": 1.12, - "learning_rate": 0.00013129988967486533, - "loss": 0.0339, + "epoch": 0.67, + "learning_rate": 0.00019933327739661924, + "loss": 0.0548, "step": 103980 }, { - "epoch": 1.12, - "learning_rate": 0.00013128366539035628, - "loss": 0.0371, + "epoch": 0.67, + "learning_rate": 0.00019932359604226232, + "loss": 0.0506, "step": 103990 }, { - "epoch": 1.12, - "learning_rate": 0.0001312674411058472, - "loss": 0.0348, + "epoch": 0.67, + "learning_rate": 0.0001993139146879054, + "loss": 0.046, "step": 104000 }, { - "epoch": 1.12, - "eval_cer": 0.921156092242831, - "eval_loss": 0.027890626341104507, - "eval_runtime": 118.8637, - "eval_samples_per_second": 16.826, - "eval_steps_per_second": 4.206, + "epoch": 0.67, + "eval_cer": 0.9198345949610214, + "eval_loss": 0.03151978179812431, + "eval_runtime": 120.1984, + "eval_samples_per_second": 16.639, + "eval_steps_per_second": 4.16, "step": 104000 }, { - "epoch": 1.12, - "learning_rate": 0.00013125121682133815, - "loss": 0.0351, + "epoch": 0.67, + "learning_rate": 0.00019930423333354845, + "loss": 0.0484, "step": 104010 }, { - "epoch": 1.13, - "learning_rate": 0.0001312349925368291, - "loss": 0.0447, + "epoch": 0.67, + "learning_rate": 0.00019929455197919153, + "loss": 0.0488, "step": 104020 }, { - "epoch": 1.13, - "learning_rate": 0.00013121876825232005, - "loss": 0.0339, + "epoch": 0.67, + "learning_rate": 0.0001992848706248346, + "loss": 0.0434, "step": 104030 }, { - "epoch": 1.13, - "learning_rate": 0.000131202543967811, - "loss": 0.036, + "epoch": 0.67, + "learning_rate": 0.0001992751892704777, + "loss": 0.0429, "step": 104040 }, { - "epoch": 1.13, - "learning_rate": 0.00013118631968330195, - "loss": 0.0342, + "epoch": 0.67, + "learning_rate": 0.0001992655079161207, + "loss": 0.0523, "step": 104050 }, { - "epoch": 1.13, - "learning_rate": 0.0001311700953987929, - "loss": 0.0323, + "epoch": 0.67, + "learning_rate": 0.0001992558265617638, + "loss": 0.0472, "step": 104060 }, { - "epoch": 1.13, - "learning_rate": 0.00013115387111428385, - "loss": 0.0385, + "epoch": 0.67, + "learning_rate": 0.00019924614520740687, + "loss": 0.0426, "step": 104070 }, { - "epoch": 1.13, - "learning_rate": 0.0001311376468297748, - "loss": 0.0397, + "epoch": 0.67, + "learning_rate": 0.00019923646385304992, + "loss": 0.0503, "step": 104080 }, { - "epoch": 1.13, - "learning_rate": 0.00013112142254526572, - "loss": 0.0319, + "epoch": 0.67, + "learning_rate": 0.000199226782498693, + "loss": 0.0488, "step": 104090 }, { - "epoch": 1.13, - "learning_rate": 0.00013110519826075667, - "loss": 0.0357, + "epoch": 0.67, + "learning_rate": 0.00019921710114433608, + "loss": 0.0456, "step": 104100 }, { - "epoch": 1.13, - "learning_rate": 0.00013108897397624762, - "loss": 0.0413, + "epoch": 0.67, + "learning_rate": 0.00019920741978997914, + "loss": 0.0545, "step": 104110 }, { - "epoch": 1.13, - "learning_rate": 0.00013107274969173857, - "loss": 0.0303, + "epoch": 0.67, + "learning_rate": 0.0001991977384356222, + "loss": 0.0459, "step": 104120 }, { - "epoch": 1.13, - "learning_rate": 0.00013105652540722952, - "loss": 0.0366, + "epoch": 0.67, + "learning_rate": 0.00019918805708126527, + "loss": 0.0473, "step": 104130 }, { - "epoch": 1.13, - "learning_rate": 0.00013104030112272047, - "loss": 0.037, + "epoch": 0.67, + "learning_rate": 0.00019917837572690832, + "loss": 0.0519, "step": 104140 }, { - "epoch": 1.13, - "learning_rate": 0.00013102407683821142, - "loss": 0.0376, + "epoch": 0.67, + "learning_rate": 0.0001991686943725514, + "loss": 0.0419, "step": 104150 }, { - "epoch": 1.13, - "learning_rate": 0.00013100785255370237, - "loss": 0.038, + "epoch": 0.67, + "learning_rate": 0.00019915901301819448, + "loss": 0.0441, "step": 104160 }, { - "epoch": 1.13, - "learning_rate": 0.00013099162826919332, - "loss": 0.0337, + "epoch": 0.67, + "learning_rate": 0.00019914933166383756, + "loss": 0.0503, "step": 104170 }, { - "epoch": 1.13, - "learning_rate": 0.00013097540398468425, - "loss": 0.0405, + "epoch": 0.67, + "learning_rate": 0.00019913965030948061, + "loss": 0.0429, "step": 104180 }, { - "epoch": 1.13, - "learning_rate": 0.0001309591797001752, - "loss": 0.0368, + "epoch": 0.67, + "learning_rate": 0.00019912996895512367, + "loss": 0.0415, "step": 104190 }, { - "epoch": 1.13, - "learning_rate": 0.00013094295541566615, - "loss": 0.0354, + "epoch": 0.67, + "learning_rate": 0.00019912028760076675, + "loss": 0.0483, "step": 104200 }, { - "epoch": 1.13, - "learning_rate": 0.0001309267311311571, - "loss": 0.0374, + "epoch": 0.67, + "learning_rate": 0.0001991106062464098, + "loss": 0.0472, "step": 104210 }, { - "epoch": 1.13, - "learning_rate": 0.00013091050684664804, - "loss": 0.0374, + "epoch": 0.67, + "learning_rate": 0.00019910092489205288, + "loss": 0.0502, "step": 104220 }, { - "epoch": 1.13, - "learning_rate": 0.000130894282562139, - "loss": 0.0456, + "epoch": 0.67, + "learning_rate": 0.00019909124353769596, + "loss": 0.0432, "step": 104230 }, { - "epoch": 1.13, - "learning_rate": 0.00013087805827762994, - "loss": 0.0304, + "epoch": 0.67, + "learning_rate": 0.00019908156218333904, + "loss": 0.0469, "step": 104240 }, { - "epoch": 1.13, - "learning_rate": 0.0001308618339931209, - "loss": 0.0313, + "epoch": 0.67, + "learning_rate": 0.0001990718808289821, + "loss": 0.0381, "step": 104250 }, { - "epoch": 1.13, - "learning_rate": 0.00013084560970861184, - "loss": 0.0385, + "epoch": 0.67, + "learning_rate": 0.00019906219947462514, + "loss": 0.0454, "step": 104260 }, { - "epoch": 1.13, - "learning_rate": 0.00013082938542410277, - "loss": 0.036, + "epoch": 0.67, + "learning_rate": 0.00019905251812026822, + "loss": 0.0431, "step": 104270 }, { - "epoch": 1.13, - "learning_rate": 0.00013081316113959372, - "loss": 0.0345, + "epoch": 0.67, + "learning_rate": 0.00019904283676591128, + "loss": 0.0448, "step": 104280 }, { - "epoch": 1.13, - "learning_rate": 0.00013079693685508467, - "loss": 0.0307, + "epoch": 0.67, + "learning_rate": 0.00019903315541155436, + "loss": 0.0461, "step": 104290 }, { - "epoch": 1.13, - "learning_rate": 0.00013078071257057562, - "loss": 0.0431, + "epoch": 0.67, + "learning_rate": 0.00019902347405719744, + "loss": 0.0426, "step": 104300 }, { - "epoch": 1.13, - "learning_rate": 0.00013076448828606657, - "loss": 0.0436, + "epoch": 0.67, + "learning_rate": 0.0001990137927028405, + "loss": 0.0491, "step": 104310 }, { - "epoch": 1.13, - "learning_rate": 0.00013074826400155752, - "loss": 0.0316, + "epoch": 0.67, + "learning_rate": 0.00019900411134848357, + "loss": 0.0424, "step": 104320 }, { - "epoch": 1.13, - "learning_rate": 0.00013073203971704847, - "loss": 0.0395, + "epoch": 0.67, + "learning_rate": 0.00019899442999412662, + "loss": 0.0415, "step": 104330 }, { - "epoch": 1.13, - "learning_rate": 0.00013071581543253941, - "loss": 0.0425, + "epoch": 0.67, + "learning_rate": 0.00019898474863976967, + "loss": 0.0472, "step": 104340 }, { - "epoch": 1.13, - "learning_rate": 0.00013069959114803036, - "loss": 0.0388, + "epoch": 0.67, + "learning_rate": 0.00019897506728541275, + "loss": 0.0414, "step": 104350 }, { - "epoch": 1.13, - "learning_rate": 0.0001306833668635213, - "loss": 0.0384, + "epoch": 0.67, + "learning_rate": 0.00019896538593105583, + "loss": 0.0419, "step": 104360 }, { - "epoch": 1.13, - "learning_rate": 0.00013066714257901224, - "loss": 0.0367, + "epoch": 0.67, + "learning_rate": 0.00019895570457669891, + "loss": 0.0448, "step": 104370 }, { - "epoch": 1.13, - "learning_rate": 0.0001306509182945032, - "loss": 0.0437, + "epoch": 0.67, + "learning_rate": 0.00019894602322234197, + "loss": 0.0532, "step": 104380 }, { - "epoch": 1.13, - "learning_rate": 0.00013063469400999414, - "loss": 0.0384, + "epoch": 0.67, + "learning_rate": 0.00019893634186798505, + "loss": 0.0494, "step": 104390 }, { - "epoch": 1.13, - "learning_rate": 0.00013061846972548509, - "loss": 0.04, + "epoch": 0.67, + "learning_rate": 0.0001989266605136281, + "loss": 0.043, "step": 104400 }, { - "epoch": 1.13, - "learning_rate": 0.00013060224544097604, - "loss": 0.0324, + "epoch": 0.67, + "learning_rate": 0.00019891697915927115, + "loss": 0.0467, "step": 104410 }, { - "epoch": 1.13, - "learning_rate": 0.00013058602115646699, - "loss": 0.0342, + "epoch": 0.67, + "learning_rate": 0.00019890729780491423, + "loss": 0.0483, "step": 104420 }, { - "epoch": 1.13, - "learning_rate": 0.00013056979687195794, - "loss": 0.0366, + "epoch": 0.67, + "learning_rate": 0.0001988976164505573, + "loss": 0.046, "step": 104430 }, { - "epoch": 1.13, - "learning_rate": 0.00013055357258744889, - "loss": 0.043, + "epoch": 0.67, + "learning_rate": 0.0001988879350962004, + "loss": 0.059, "step": 104440 }, { - "epoch": 1.13, - "learning_rate": 0.00013053734830293984, - "loss": 0.0388, + "epoch": 0.67, + "learning_rate": 0.00019887825374184344, + "loss": 0.0463, "step": 104450 }, { - "epoch": 1.13, - "learning_rate": 0.00013052112401843078, - "loss": 0.0352, + "epoch": 0.67, + "learning_rate": 0.00019886857238748652, + "loss": 0.052, "step": 104460 }, { - "epoch": 1.13, - "learning_rate": 0.00013050489973392173, - "loss": 0.0361, + "epoch": 0.67, + "learning_rate": 0.00019885889103312958, + "loss": 0.0453, "step": 104470 }, { - "epoch": 1.13, - "learning_rate": 0.00013048867544941268, - "loss": 0.0328, + "epoch": 0.67, + "learning_rate": 0.00019884920967877263, + "loss": 0.0435, "step": 104480 }, { - "epoch": 1.13, - "learning_rate": 0.00013047245116490363, - "loss": 0.0364, + "epoch": 0.67, + "learning_rate": 0.0001988395283244157, + "loss": 0.0487, "step": 104490 }, { - "epoch": 1.13, - "learning_rate": 0.00013045622688039458, - "loss": 0.0387, + "epoch": 0.67, + "learning_rate": 0.0001988298469700588, + "loss": 0.0392, "step": 104500 }, { - "epoch": 1.13, - "learning_rate": 0.0001304400025958855, - "loss": 0.0357, + "epoch": 0.67, + "learning_rate": 0.00019882016561570184, + "loss": 0.0453, "step": 104510 }, { - "epoch": 1.13, - "learning_rate": 0.00013042377831137646, - "loss": 0.0297, + "epoch": 0.67, + "learning_rate": 0.00019881048426134492, + "loss": 0.0477, "step": 104520 }, { - "epoch": 1.13, - "learning_rate": 0.0001304075540268674, - "loss": 0.0393, + "epoch": 0.67, + "learning_rate": 0.000198800802906988, + "loss": 0.0454, "step": 104530 }, { - "epoch": 1.13, - "learning_rate": 0.00013039132974235836, - "loss": 0.03, + "epoch": 0.67, + "learning_rate": 0.00019879112155263103, + "loss": 0.0488, "step": 104540 }, { - "epoch": 1.13, - "learning_rate": 0.0001303751054578493, - "loss": 0.0381, + "epoch": 0.67, + "learning_rate": 0.0001987814401982741, + "loss": 0.0453, "step": 104550 }, { - "epoch": 1.13, - "learning_rate": 0.00013035888117334026, - "loss": 0.0339, + "epoch": 0.67, + "learning_rate": 0.00019877175884391719, + "loss": 0.043, "step": 104560 }, { - "epoch": 1.13, - "learning_rate": 0.0001303426568888312, - "loss": 0.0298, + "epoch": 0.67, + "learning_rate": 0.00019876207748956027, + "loss": 0.0474, "step": 104570 }, { - "epoch": 1.13, - "learning_rate": 0.00013032643260432216, - "loss": 0.0402, + "epoch": 0.67, + "learning_rate": 0.00019875239613520332, + "loss": 0.0489, "step": 104580 }, { - "epoch": 1.13, - "learning_rate": 0.0001303102083198131, - "loss": 0.0356, + "epoch": 0.68, + "learning_rate": 0.0001987427147808464, + "loss": 0.045, "step": 104590 }, { - "epoch": 1.13, - "learning_rate": 0.00013029398403530403, - "loss": 0.0348, + "epoch": 0.68, + "learning_rate": 0.00019873303342648948, + "loss": 0.049, "step": 104600 }, { - "epoch": 1.13, - "learning_rate": 0.00013027775975079498, - "loss": 0.0319, + "epoch": 0.68, + "learning_rate": 0.0001987233520721325, + "loss": 0.0406, "step": 104610 }, { - "epoch": 1.13, - "learning_rate": 0.00013026153546628593, - "loss": 0.0335, + "epoch": 0.68, + "learning_rate": 0.00019871367071777558, + "loss": 0.0459, "step": 104620 }, { - "epoch": 1.13, - "learning_rate": 0.00013024531118177688, - "loss": 0.0379, + "epoch": 0.68, + "learning_rate": 0.00019870398936341866, + "loss": 0.0438, "step": 104630 }, { - "epoch": 1.13, - "learning_rate": 0.00013022908689726783, - "loss": 0.0332, + "epoch": 0.68, + "learning_rate": 0.00019869430800906174, + "loss": 0.05, "step": 104640 }, { - "epoch": 1.13, - "learning_rate": 0.00013021286261275878, - "loss": 0.0323, + "epoch": 0.68, + "learning_rate": 0.0001986846266547048, + "loss": 0.0446, "step": 104650 }, { - "epoch": 1.13, - "learning_rate": 0.00013019663832824973, - "loss": 0.0345, + "epoch": 0.68, + "learning_rate": 0.00019867494530034788, + "loss": 0.0481, "step": 104660 }, { - "epoch": 1.13, - "learning_rate": 0.00013018041404374068, - "loss": 0.0385, + "epoch": 0.68, + "learning_rate": 0.00019866526394599095, + "loss": 0.0437, "step": 104670 }, { - "epoch": 1.13, - "learning_rate": 0.00013016418975923163, - "loss": 0.0438, + "epoch": 0.68, + "learning_rate": 0.00019865558259163398, + "loss": 0.0435, "step": 104680 }, { - "epoch": 1.13, - "learning_rate": 0.00013014796547472255, - "loss": 0.038, + "epoch": 0.68, + "learning_rate": 0.00019864590123727706, + "loss": 0.0496, "step": 104690 }, { - "epoch": 1.13, - "learning_rate": 0.0001301317411902135, - "loss": 0.0366, + "epoch": 0.68, + "learning_rate": 0.00019863621988292014, + "loss": 0.0501, "step": 104700 }, { - "epoch": 1.13, - "learning_rate": 0.00013011551690570445, - "loss": 0.0354, + "epoch": 0.68, + "learning_rate": 0.0001986265385285632, + "loss": 0.0471, "step": 104710 }, { - "epoch": 1.13, - "learning_rate": 0.0001300992926211954, - "loss": 0.0404, + "epoch": 0.68, + "learning_rate": 0.00019861685717420627, + "loss": 0.0542, "step": 104720 }, { - "epoch": 1.13, - "learning_rate": 0.00013008306833668635, - "loss": 0.0331, + "epoch": 0.68, + "learning_rate": 0.00019860717581984935, + "loss": 0.0464, "step": 104730 }, { - "epoch": 1.13, - "learning_rate": 0.0001300668440521773, - "loss": 0.0361, + "epoch": 0.68, + "learning_rate": 0.00019859749446549243, + "loss": 0.0493, "step": 104740 }, { - "epoch": 1.13, - "learning_rate": 0.00013005061976766825, - "loss": 0.0331, + "epoch": 0.68, + "learning_rate": 0.00019858781311113546, + "loss": 0.0648, "step": 104750 }, { - "epoch": 1.13, - "learning_rate": 0.0001300343954831592, - "loss": 0.0438, + "epoch": 0.68, + "learning_rate": 0.00019857813175677854, + "loss": 0.0541, "step": 104760 }, { - "epoch": 1.13, - "learning_rate": 0.00013001817119865015, - "loss": 0.0375, + "epoch": 0.68, + "learning_rate": 0.00019856845040242162, + "loss": 0.0464, "step": 104770 }, { - "epoch": 1.13, - "learning_rate": 0.00013000194691414107, - "loss": 0.0378, + "epoch": 0.68, + "learning_rate": 0.00019855876904806467, + "loss": 0.0438, "step": 104780 }, { - "epoch": 1.13, - "learning_rate": 0.00012998572262963202, - "loss": 0.0387, + "epoch": 0.68, + "learning_rate": 0.00019854908769370775, + "loss": 0.0574, "step": 104790 }, { - "epoch": 1.13, - "learning_rate": 0.00012996949834512297, - "loss": 0.0354, + "epoch": 0.68, + "learning_rate": 0.00019853940633935083, + "loss": 0.0437, "step": 104800 }, { - "epoch": 1.13, - "learning_rate": 0.00012995327406061392, - "loss": 0.034, + "epoch": 0.68, + "learning_rate": 0.0001985297249849939, + "loss": 0.047, "step": 104810 }, { - "epoch": 1.13, - "learning_rate": 0.00012993704977610487, - "loss": 0.0355, + "epoch": 0.68, + "learning_rate": 0.00019852004363063694, + "loss": 0.0438, "step": 104820 }, { - "epoch": 1.13, - "learning_rate": 0.00012992082549159582, - "loss": 0.0311, + "epoch": 0.68, + "learning_rate": 0.00019851036227628001, + "loss": 0.0442, "step": 104830 }, { - "epoch": 1.13, - "learning_rate": 0.00012990460120708677, - "loss": 0.0429, + "epoch": 0.68, + "learning_rate": 0.0001985006809219231, + "loss": 0.0443, "step": 104840 }, { - "epoch": 1.13, - "learning_rate": 0.00012988837692257772, - "loss": 0.0381, + "epoch": 0.68, + "learning_rate": 0.00019849099956756615, + "loss": 0.046, "step": 104850 }, { - "epoch": 1.13, - "learning_rate": 0.00012987215263806867, - "loss": 0.0333, + "epoch": 0.68, + "learning_rate": 0.00019848131821320923, + "loss": 0.0413, "step": 104860 }, { - "epoch": 1.13, - "learning_rate": 0.0001298559283535596, - "loss": 0.037, + "epoch": 0.68, + "learning_rate": 0.0001984716368588523, + "loss": 0.0451, "step": 104870 }, { - "epoch": 1.13, - "learning_rate": 0.00012983970406905054, - "loss": 0.0361, + "epoch": 0.68, + "learning_rate": 0.0001984619555044954, + "loss": 0.0453, "step": 104880 }, { - "epoch": 1.13, - "learning_rate": 0.0001298234797845415, - "loss": 0.0417, + "epoch": 0.68, + "learning_rate": 0.0001984522741501384, + "loss": 0.0459, "step": 104890 }, { - "epoch": 1.13, - "learning_rate": 0.00012980725550003244, - "loss": 0.0321, + "epoch": 0.68, + "learning_rate": 0.0001984425927957815, + "loss": 0.049, "step": 104900 }, { - "epoch": 1.13, - "learning_rate": 0.0001297910312155234, - "loss": 0.0326, + "epoch": 0.68, + "learning_rate": 0.00019843291144142454, + "loss": 0.0482, "step": 104910 }, { - "epoch": 1.13, - "learning_rate": 0.00012977480693101434, - "loss": 0.0371, + "epoch": 0.68, + "learning_rate": 0.00019842323008706762, + "loss": 0.0448, "step": 104920 }, { - "epoch": 1.13, - "learning_rate": 0.0001297585826465053, - "loss": 0.038, + "epoch": 0.68, + "learning_rate": 0.0001984135487327107, + "loss": 0.0473, "step": 104930 }, { - "epoch": 1.14, - "learning_rate": 0.00012974235836199624, - "loss": 0.0341, + "epoch": 0.68, + "learning_rate": 0.00019840386737835378, + "loss": 0.0512, "step": 104940 }, { - "epoch": 1.14, - "learning_rate": 0.0001297261340774872, - "loss": 0.0363, + "epoch": 0.68, + "learning_rate": 0.00019839418602399684, + "loss": 0.0436, "step": 104950 }, { - "epoch": 1.14, - "learning_rate": 0.0001297099097929781, - "loss": 0.0374, + "epoch": 0.68, + "learning_rate": 0.0001983845046696399, + "loss": 0.0489, "step": 104960 }, { - "epoch": 1.14, - "learning_rate": 0.00012969368550846906, - "loss": 0.0336, + "epoch": 0.68, + "learning_rate": 0.00019837482331528297, + "loss": 0.0526, "step": 104970 }, { - "epoch": 1.14, - "learning_rate": 0.00012967746122396, - "loss": 0.0354, + "epoch": 0.68, + "learning_rate": 0.00019836514196092602, + "loss": 0.0395, "step": 104980 }, { - "epoch": 1.14, - "learning_rate": 0.00012966123693945096, - "loss": 0.0367, + "epoch": 0.68, + "learning_rate": 0.0001983554606065691, + "loss": 0.0449, "step": 104990 }, { - "epoch": 1.14, - "learning_rate": 0.0001296450126549419, - "loss": 0.0363, + "epoch": 0.68, + "learning_rate": 0.00019834577925221218, + "loss": 0.0462, "step": 105000 }, { - "epoch": 1.14, - "eval_cer": 0.9211666940546807, - "eval_loss": 0.02789819799363613, - "eval_runtime": 119.0331, - "eval_samples_per_second": 16.802, - "eval_steps_per_second": 4.201, + "epoch": 0.68, + "eval_cer": 0.9199078070274546, + "eval_loss": 0.03056810237467289, + "eval_runtime": 119.7885, + "eval_samples_per_second": 16.696, + "eval_steps_per_second": 4.174, "step": 105000 }, { - "epoch": 1.14, - "learning_rate": 0.00012962878837043286, - "loss": 0.0382, + "epoch": 0.68, + "learning_rate": 0.00019833609789785526, + "loss": 0.0445, "step": 105010 }, { - "epoch": 1.14, - "learning_rate": 0.0001296125640859238, - "loss": 0.0377, + "epoch": 0.68, + "learning_rate": 0.00019832641654349831, + "loss": 0.044, "step": 105020 }, { - "epoch": 1.14, - "learning_rate": 0.00012959633980141476, - "loss": 0.0474, + "epoch": 0.68, + "learning_rate": 0.00019831673518914137, + "loss": 0.0484, "step": 105030 }, { - "epoch": 1.14, - "learning_rate": 0.0001295801155169057, - "loss": 0.0389, + "epoch": 0.68, + "learning_rate": 0.00019830705383478445, + "loss": 0.042, "step": 105040 }, { - "epoch": 1.14, - "learning_rate": 0.00012956389123239663, - "loss": 0.0401, + "epoch": 0.68, + "learning_rate": 0.0001982973724804275, + "loss": 0.0496, "step": 105050 }, { - "epoch": 1.14, - "learning_rate": 0.00012954766694788758, - "loss": 0.0314, + "epoch": 0.68, + "learning_rate": 0.00019828769112607058, + "loss": 0.0528, "step": 105060 }, { - "epoch": 1.14, - "learning_rate": 0.00012953144266337853, - "loss": 0.0356, + "epoch": 0.68, + "learning_rate": 0.00019827800977171366, + "loss": 0.052, "step": 105070 }, { - "epoch": 1.14, - "learning_rate": 0.00012951521837886948, - "loss": 0.0361, + "epoch": 0.68, + "learning_rate": 0.00019826832841735674, + "loss": 0.0502, "step": 105080 }, { - "epoch": 1.14, - "learning_rate": 0.00012949899409436043, - "loss": 0.0324, + "epoch": 0.68, + "learning_rate": 0.0001982586470629998, + "loss": 0.0518, "step": 105090 }, { - "epoch": 1.14, - "learning_rate": 0.00012948276980985138, - "loss": 0.033, + "epoch": 0.68, + "learning_rate": 0.00019824896570864284, + "loss": 0.0435, "step": 105100 }, { - "epoch": 1.14, - "learning_rate": 0.00012946654552534233, - "loss": 0.0396, + "epoch": 0.68, + "learning_rate": 0.0001982392843542859, + "loss": 0.0513, "step": 105110 }, { - "epoch": 1.14, - "learning_rate": 0.00012945032124083328, - "loss": 0.039, + "epoch": 0.68, + "learning_rate": 0.00019822960299992898, + "loss": 0.0521, "step": 105120 }, { - "epoch": 1.14, - "learning_rate": 0.00012943409695632423, - "loss": 0.0315, + "epoch": 0.68, + "learning_rate": 0.00019821992164557206, + "loss": 0.0479, "step": 105130 }, { - "epoch": 1.14, - "learning_rate": 0.00012941787267181515, - "loss": 0.0342, + "epoch": 0.68, + "learning_rate": 0.00019821024029121514, + "loss": 0.0433, "step": 105140 }, { - "epoch": 1.14, - "learning_rate": 0.0001294016483873061, - "loss": 0.0367, + "epoch": 0.68, + "learning_rate": 0.0001982005589368582, + "loss": 0.0464, "step": 105150 }, { - "epoch": 1.14, - "learning_rate": 0.00012938542410279705, - "loss": 0.0375, + "epoch": 0.68, + "learning_rate": 0.00019819087758250127, + "loss": 0.0426, "step": 105160 }, { - "epoch": 1.14, - "learning_rate": 0.000129369199818288, - "loss": 0.0305, + "epoch": 0.68, + "learning_rate": 0.00019818119622814432, + "loss": 0.0509, "step": 105170 }, { - "epoch": 1.14, - "learning_rate": 0.00012935297553377895, - "loss": 0.0331, + "epoch": 0.68, + "learning_rate": 0.00019817151487378737, + "loss": 0.0454, "step": 105180 }, { - "epoch": 1.14, - "learning_rate": 0.0001293367512492699, - "loss": 0.0337, + "epoch": 0.68, + "learning_rate": 0.00019816183351943045, + "loss": 0.0409, "step": 105190 }, { - "epoch": 1.14, - "learning_rate": 0.00012932052696476085, - "loss": 0.0426, + "epoch": 0.68, + "learning_rate": 0.00019815215216507353, + "loss": 0.0365, "step": 105200 }, { - "epoch": 1.14, - "learning_rate": 0.0001293043026802518, - "loss": 0.0345, + "epoch": 0.68, + "learning_rate": 0.0001981424708107166, + "loss": 0.042, "step": 105210 }, { - "epoch": 1.14, - "learning_rate": 0.00012928807839574275, - "loss": 0.0407, + "epoch": 0.68, + "learning_rate": 0.00019813278945635967, + "loss": 0.0501, "step": 105220 }, { - "epoch": 1.14, - "learning_rate": 0.00012927185411123367, - "loss": 0.0331, + "epoch": 0.68, + "learning_rate": 0.00019812310810200275, + "loss": 0.0458, "step": 105230 }, { - "epoch": 1.14, - "learning_rate": 0.00012925562982672462, - "loss": 0.038, + "epoch": 0.68, + "learning_rate": 0.0001981134267476458, + "loss": 0.049, "step": 105240 }, { - "epoch": 1.14, - "learning_rate": 0.00012923940554221557, - "loss": 0.0393, + "epoch": 0.68, + "learning_rate": 0.00019810374539328885, + "loss": 0.0502, "step": 105250 }, { - "epoch": 1.14, - "learning_rate": 0.00012922318125770652, - "loss": 0.0389, + "epoch": 0.68, + "learning_rate": 0.00019809406403893193, + "loss": 0.0521, "step": 105260 }, { - "epoch": 1.14, - "learning_rate": 0.00012920695697319747, - "loss": 0.0363, + "epoch": 0.68, + "learning_rate": 0.000198084382684575, + "loss": 0.0469, "step": 105270 }, { - "epoch": 1.14, - "learning_rate": 0.00012919073268868842, - "loss": 0.0315, + "epoch": 0.68, + "learning_rate": 0.0001980747013302181, + "loss": 0.0429, "step": 105280 }, { - "epoch": 1.14, - "learning_rate": 0.00012917450840417937, - "loss": 0.0374, + "epoch": 0.68, + "learning_rate": 0.00019806501997586114, + "loss": 0.0412, "step": 105290 }, { - "epoch": 1.14, - "learning_rate": 0.00012915828411967032, - "loss": 0.0335, + "epoch": 0.68, + "learning_rate": 0.00019805533862150422, + "loss": 0.0457, "step": 105300 }, { - "epoch": 1.14, - "learning_rate": 0.00012914205983516127, - "loss": 0.0371, + "epoch": 0.68, + "learning_rate": 0.00019804565726714725, + "loss": 0.0476, "step": 105310 }, { - "epoch": 1.14, - "learning_rate": 0.0001291258355506522, - "loss": 0.029, + "epoch": 0.68, + "learning_rate": 0.00019803597591279033, + "loss": 0.0517, "step": 105320 }, { - "epoch": 1.14, - "learning_rate": 0.00012910961126614314, - "loss": 0.0405, + "epoch": 0.68, + "learning_rate": 0.0001980262945584334, + "loss": 0.0448, "step": 105330 }, { - "epoch": 1.14, - "learning_rate": 0.0001290933869816341, - "loss": 0.0301, + "epoch": 0.68, + "learning_rate": 0.0001980166132040765, + "loss": 0.0541, "step": 105340 }, { - "epoch": 1.14, - "learning_rate": 0.00012907716269712504, - "loss": 0.0386, + "epoch": 0.68, + "learning_rate": 0.00019800693184971954, + "loss": 0.0424, "step": 105350 }, { - "epoch": 1.14, - "learning_rate": 0.000129060938412616, - "loss": 0.0322, + "epoch": 0.68, + "learning_rate": 0.00019799725049536262, + "loss": 0.0456, "step": 105360 }, { - "epoch": 1.14, - "learning_rate": 0.00012904471412810694, - "loss": 0.0349, + "epoch": 0.68, + "learning_rate": 0.0001979875691410057, + "loss": 0.0446, "step": 105370 }, { - "epoch": 1.14, - "learning_rate": 0.0001290284898435979, - "loss": 0.0371, + "epoch": 0.68, + "learning_rate": 0.00019797788778664873, + "loss": 0.0518, "step": 105380 }, { - "epoch": 1.14, - "learning_rate": 0.00012901226555908884, - "loss": 0.0324, + "epoch": 0.68, + "learning_rate": 0.0001979682064322918, + "loss": 0.0506, "step": 105390 }, { - "epoch": 1.14, - "learning_rate": 0.0001289960412745798, - "loss": 0.0357, + "epoch": 0.68, + "learning_rate": 0.00019795852507793489, + "loss": 0.0506, "step": 105400 }, { - "epoch": 1.14, - "learning_rate": 0.00012897981699007072, - "loss": 0.037, + "epoch": 0.68, + "learning_rate": 0.00019794884372357797, + "loss": 0.0509, "step": 105410 }, { - "epoch": 1.14, - "learning_rate": 0.00012896359270556166, - "loss": 0.0366, + "epoch": 0.68, + "learning_rate": 0.00019793916236922102, + "loss": 0.0425, "step": 105420 }, { - "epoch": 1.14, - "learning_rate": 0.00012894736842105261, - "loss": 0.0291, + "epoch": 0.68, + "learning_rate": 0.0001979294810148641, + "loss": 0.0419, "step": 105430 }, { - "epoch": 1.14, - "learning_rate": 0.00012893114413654356, - "loss": 0.0307, + "epoch": 0.68, + "learning_rate": 0.00019791979966050718, + "loss": 0.0399, "step": 105440 }, { - "epoch": 1.14, - "learning_rate": 0.00012891491985203451, - "loss": 0.0369, + "epoch": 0.68, + "learning_rate": 0.0001979101183061502, + "loss": 0.0511, "step": 105450 }, { - "epoch": 1.14, - "learning_rate": 0.00012889869556752546, - "loss": 0.0421, + "epoch": 0.68, + "learning_rate": 0.00019790043695179328, + "loss": 0.0478, "step": 105460 }, { - "epoch": 1.14, - "learning_rate": 0.00012888247128301641, - "loss": 0.0384, + "epoch": 0.68, + "learning_rate": 0.00019789075559743636, + "loss": 0.0446, "step": 105470 }, { - "epoch": 1.14, - "learning_rate": 0.00012886624699850736, - "loss": 0.0415, + "epoch": 0.68, + "learning_rate": 0.00019788107424307944, + "loss": 0.0486, "step": 105480 }, { - "epoch": 1.14, - "learning_rate": 0.0001288500227139983, - "loss": 0.0338, + "epoch": 0.68, + "learning_rate": 0.0001978713928887225, + "loss": 0.0412, "step": 105490 }, { - "epoch": 1.14, - "learning_rate": 0.00012883379842948924, - "loss": 0.038, + "epoch": 0.68, + "learning_rate": 0.00019786171153436557, + "loss": 0.0442, "step": 105500 }, { - "epoch": 1.14, - "learning_rate": 0.00012881757414498019, - "loss": 0.039, + "epoch": 0.68, + "learning_rate": 0.00019785203018000865, + "loss": 0.0457, "step": 105510 }, { - "epoch": 1.14, - "learning_rate": 0.00012880134986047114, - "loss": 0.0493, + "epoch": 0.68, + "learning_rate": 0.00019784234882565168, + "loss": 0.0432, "step": 105520 }, { - "epoch": 1.14, - "learning_rate": 0.00012878512557596209, - "loss": 0.0331, + "epoch": 0.68, + "learning_rate": 0.00019783266747129476, + "loss": 0.0508, "step": 105530 }, { - "epoch": 1.14, - "learning_rate": 0.00012876890129145303, - "loss": 0.0365, + "epoch": 0.68, + "learning_rate": 0.00019782298611693784, + "loss": 0.0436, "step": 105540 }, { - "epoch": 1.14, - "learning_rate": 0.00012875267700694398, - "loss": 0.037, + "epoch": 0.68, + "learning_rate": 0.0001978133047625809, + "loss": 0.0444, "step": 105550 }, { - "epoch": 1.14, - "learning_rate": 0.00012873645272243493, - "loss": 0.0369, + "epoch": 0.68, + "learning_rate": 0.00019780362340822397, + "loss": 0.0447, "step": 105560 }, { - "epoch": 1.14, - "learning_rate": 0.00012872022843792588, - "loss": 0.0406, + "epoch": 0.68, + "learning_rate": 0.00019779394205386705, + "loss": 0.0464, "step": 105570 }, { - "epoch": 1.14, - "learning_rate": 0.00012870400415341683, - "loss": 0.0323, + "epoch": 0.68, + "learning_rate": 0.00019778426069951013, + "loss": 0.044, "step": 105580 }, { - "epoch": 1.14, - "learning_rate": 0.00012868777986890776, - "loss": 0.0324, + "epoch": 0.68, + "learning_rate": 0.00019777457934515316, + "loss": 0.0476, "step": 105590 }, { - "epoch": 1.14, - "learning_rate": 0.0001286715555843987, - "loss": 0.0426, + "epoch": 0.68, + "learning_rate": 0.00019776489799079624, + "loss": 0.0448, "step": 105600 }, { - "epoch": 1.14, - "learning_rate": 0.00012865533129988966, - "loss": 0.0296, + "epoch": 0.68, + "learning_rate": 0.00019775521663643932, + "loss": 0.0463, "step": 105610 }, { - "epoch": 1.14, - "learning_rate": 0.0001286391070153806, - "loss": 0.0326, + "epoch": 0.68, + "learning_rate": 0.00019774553528208237, + "loss": 0.0431, "step": 105620 }, { - "epoch": 1.14, - "learning_rate": 0.00012862288273087156, - "loss": 0.0311, + "epoch": 0.68, + "learning_rate": 0.00019773585392772545, + "loss": 0.0436, "step": 105630 }, { - "epoch": 1.14, - "learning_rate": 0.0001286066584463625, - "loss": 0.0407, + "epoch": 0.68, + "learning_rate": 0.00019772617257336853, + "loss": 0.0422, "step": 105640 }, { - "epoch": 1.14, - "learning_rate": 0.00012859043416185346, - "loss": 0.0408, + "epoch": 0.68, + "learning_rate": 0.0001977164912190116, + "loss": 0.0436, "step": 105650 }, { - "epoch": 1.14, - "learning_rate": 0.0001285742098773444, - "loss": 0.0312, + "epoch": 0.68, + "learning_rate": 0.00019770680986465463, + "loss": 0.0449, "step": 105660 }, { - "epoch": 1.14, - "learning_rate": 0.00012855798559283535, - "loss": 0.04, + "epoch": 0.68, + "learning_rate": 0.00019769712851029771, + "loss": 0.0476, "step": 105670 }, { - "epoch": 1.14, - "learning_rate": 0.00012854176130832628, - "loss": 0.0336, + "epoch": 0.68, + "learning_rate": 0.0001976874471559408, + "loss": 0.0415, "step": 105680 }, { - "epoch": 1.14, - "learning_rate": 0.00012852553702381723, - "loss": 0.04, + "epoch": 0.68, + "learning_rate": 0.00019767776580158385, + "loss": 0.0437, "step": 105690 }, { - "epoch": 1.14, - "learning_rate": 0.00012850931273930818, - "loss": 0.0331, + "epoch": 0.68, + "learning_rate": 0.00019766808444722693, + "loss": 0.0412, "step": 105700 }, { - "epoch": 1.14, - "learning_rate": 0.00012849308845479913, - "loss": 0.0366, + "epoch": 0.68, + "learning_rate": 0.00019765840309287, + "loss": 0.0442, "step": 105710 }, { - "epoch": 1.14, - "learning_rate": 0.00012847686417029008, - "loss": 0.0338, + "epoch": 0.68, + "learning_rate": 0.00019764872173851306, + "loss": 0.0374, "step": 105720 }, { - "epoch": 1.14, - "learning_rate": 0.00012846063988578103, - "loss": 0.0313, + "epoch": 0.68, + "learning_rate": 0.0001976390403841561, + "loss": 0.0426, "step": 105730 }, { - "epoch": 1.14, - "learning_rate": 0.00012844441560127198, - "loss": 0.0386, + "epoch": 0.68, + "learning_rate": 0.0001976293590297992, + "loss": 0.0382, "step": 105740 }, { - "epoch": 1.14, - "learning_rate": 0.00012842819131676293, - "loss": 0.039, + "epoch": 0.68, + "learning_rate": 0.00019761967767544224, + "loss": 0.0536, "step": 105750 }, { - "epoch": 1.14, - "learning_rate": 0.00012841196703225388, - "loss": 0.036, + "epoch": 0.68, + "learning_rate": 0.00019760999632108532, + "loss": 0.0467, "step": 105760 }, { - "epoch": 1.14, - "learning_rate": 0.00012839574274774483, - "loss": 0.0362, + "epoch": 0.68, + "learning_rate": 0.0001976003149667284, + "loss": 0.0438, "step": 105770 }, { - "epoch": 1.14, - "learning_rate": 0.00012837951846323575, - "loss": 0.0359, + "epoch": 0.68, + "learning_rate": 0.00019759063361237148, + "loss": 0.0414, "step": 105780 }, { - "epoch": 1.14, - "learning_rate": 0.0001283632941787267, - "loss": 0.0309, + "epoch": 0.68, + "learning_rate": 0.00019758095225801454, + "loss": 0.0432, "step": 105790 }, { - "epoch": 1.14, - "learning_rate": 0.00012834706989421765, - "loss": 0.03, + "epoch": 0.68, + "learning_rate": 0.0001975712709036576, + "loss": 0.0428, "step": 105800 }, { - "epoch": 1.14, - "learning_rate": 0.0001283308456097086, - "loss": 0.0377, + "epoch": 0.68, + "learning_rate": 0.00019756158954930067, + "loss": 0.0461, "step": 105810 }, { - "epoch": 1.14, - "learning_rate": 0.00012831462132519955, - "loss": 0.0373, + "epoch": 0.68, + "learning_rate": 0.00019755190819494372, + "loss": 0.0384, "step": 105820 }, { - "epoch": 1.14, - "learning_rate": 0.0001282983970406905, - "loss": 0.0338, + "epoch": 0.68, + "learning_rate": 0.0001975422268405868, + "loss": 0.0476, "step": 105830 }, { - "epoch": 1.14, - "learning_rate": 0.00012828217275618145, - "loss": 0.0288, + "epoch": 0.68, + "learning_rate": 0.00019753254548622988, + "loss": 0.0458, "step": 105840 }, { - "epoch": 1.14, - "learning_rate": 0.0001282659484716724, - "loss": 0.0419, + "epoch": 0.68, + "learning_rate": 0.00019752286413187296, + "loss": 0.0425, "step": 105850 }, { - "epoch": 1.14, - "learning_rate": 0.00012824972418716335, - "loss": 0.0375, + "epoch": 0.68, + "learning_rate": 0.00019751318277751601, + "loss": 0.0498, "step": 105860 }, { - "epoch": 1.15, - "learning_rate": 0.00012823349990265427, - "loss": 0.034, + "epoch": 0.68, + "learning_rate": 0.00019750350142315907, + "loss": 0.0381, "step": 105870 }, { - "epoch": 1.15, - "learning_rate": 0.00012821727561814522, - "loss": 0.04, + "epoch": 0.68, + "learning_rate": 0.00019749382006880215, + "loss": 0.0466, "step": 105880 }, { - "epoch": 1.15, - "learning_rate": 0.00012820105133363617, - "loss": 0.0333, + "epoch": 0.68, + "learning_rate": 0.0001974841387144452, + "loss": 0.05, "step": 105890 }, { - "epoch": 1.15, - "learning_rate": 0.00012818482704912712, - "loss": 0.0343, + "epoch": 0.68, + "learning_rate": 0.00019747445736008828, + "loss": 0.0443, "step": 105900 }, { - "epoch": 1.15, - "learning_rate": 0.00012816860276461807, - "loss": 0.0331, + "epoch": 0.68, + "learning_rate": 0.00019746477600573136, + "loss": 0.0505, "step": 105910 }, { - "epoch": 1.15, - "learning_rate": 0.00012815237848010902, - "loss": 0.0338, + "epoch": 0.68, + "learning_rate": 0.0001974550946513744, + "loss": 0.0454, "step": 105920 }, { - "epoch": 1.15, - "learning_rate": 0.00012813615419559997, - "loss": 0.0327, + "epoch": 0.68, + "learning_rate": 0.0001974454132970175, + "loss": 0.045, "step": 105930 }, { - "epoch": 1.15, - "learning_rate": 0.00012811992991109092, - "loss": 0.0313, + "epoch": 0.68, + "learning_rate": 0.00019743573194266054, + "loss": 0.0447, "step": 105940 }, { - "epoch": 1.15, - "learning_rate": 0.00012810370562658187, - "loss": 0.0319, + "epoch": 0.68, + "learning_rate": 0.0001974260505883036, + "loss": 0.0446, "step": 105950 }, { - "epoch": 1.15, - "learning_rate": 0.0001280874813420728, - "loss": 0.0345, + "epoch": 0.68, + "learning_rate": 0.00019741636923394668, + "loss": 0.0502, "step": 105960 }, { - "epoch": 1.15, - "learning_rate": 0.00012807125705756374, - "loss": 0.0335, + "epoch": 0.68, + "learning_rate": 0.00019740668787958976, + "loss": 0.0462, "step": 105970 }, { - "epoch": 1.15, - "learning_rate": 0.0001280550327730547, - "loss": 0.0368, + "epoch": 0.68, + "learning_rate": 0.00019739700652523284, + "loss": 0.0506, "step": 105980 }, { - "epoch": 1.15, - "learning_rate": 0.00012803880848854564, - "loss": 0.0399, + "epoch": 0.68, + "learning_rate": 0.0001973873251708759, + "loss": 0.0446, "step": 105990 }, { - "epoch": 1.15, - "learning_rate": 0.0001280225842040366, - "loss": 0.0329, + "epoch": 0.68, + "learning_rate": 0.00019737764381651897, + "loss": 0.0478, "step": 106000 }, { - "epoch": 1.15, - "eval_cer": 0.9211101510581492, - "eval_loss": 0.02817097119987011, - "eval_runtime": 118.7157, - "eval_samples_per_second": 16.847, - "eval_steps_per_second": 4.212, + "epoch": 0.68, + "eval_cer": 0.9198834030053101, + "eval_loss": 0.03057784214615822, + "eval_runtime": 119.7766, + "eval_samples_per_second": 16.698, + "eval_steps_per_second": 4.174, "step": 106000 }, { - "epoch": 1.15, - "learning_rate": 0.00012800635991952754, - "loss": 0.039, + "epoch": 0.68, + "learning_rate": 0.00019736796246216202, + "loss": 0.0508, "step": 106010 }, { - "epoch": 1.15, - "learning_rate": 0.0001279901356350185, - "loss": 0.0332, + "epoch": 0.68, + "learning_rate": 0.00019735828110780507, + "loss": 0.0506, "step": 106020 }, { - "epoch": 1.15, - "learning_rate": 0.00012797391135050944, - "loss": 0.0374, + "epoch": 0.68, + "learning_rate": 0.00019734859975344815, + "loss": 0.0585, "step": 106030 }, { - "epoch": 1.15, - "learning_rate": 0.0001279576870660004, - "loss": 0.033, + "epoch": 0.68, + "learning_rate": 0.00019733891839909123, + "loss": 0.0429, "step": 106040 }, { - "epoch": 1.15, - "learning_rate": 0.0001279414627814913, - "loss": 0.0399, + "epoch": 0.68, + "learning_rate": 0.0001973292370447343, + "loss": 0.0612, "step": 106050 }, { - "epoch": 1.15, - "learning_rate": 0.00012792523849698226, - "loss": 0.0453, + "epoch": 0.68, + "learning_rate": 0.00019731955569037737, + "loss": 0.0439, "step": 106060 }, { - "epoch": 1.15, - "learning_rate": 0.0001279090142124732, - "loss": 0.0388, + "epoch": 0.68, + "learning_rate": 0.00019730987433602045, + "loss": 0.0429, "step": 106070 }, { - "epoch": 1.15, - "learning_rate": 0.00012789278992796416, - "loss": 0.034, + "epoch": 0.68, + "learning_rate": 0.0001973001929816635, + "loss": 0.049, "step": 106080 }, { - "epoch": 1.15, - "learning_rate": 0.0001278765656434551, - "loss": 0.0356, + "epoch": 0.68, + "learning_rate": 0.00019729051162730655, + "loss": 0.0503, "step": 106090 }, { - "epoch": 1.15, - "learning_rate": 0.00012786034135894606, - "loss": 0.0348, + "epoch": 0.68, + "learning_rate": 0.00019728083027294963, + "loss": 0.0428, "step": 106100 }, { - "epoch": 1.15, - "learning_rate": 0.000127844117074437, - "loss": 0.037, + "epoch": 0.68, + "learning_rate": 0.0001972711489185927, + "loss": 0.0523, "step": 106110 }, { - "epoch": 1.15, - "learning_rate": 0.00012782789278992796, - "loss": 0.035, + "epoch": 0.68, + "learning_rate": 0.00019726146756423576, + "loss": 0.0468, "step": 106120 }, { - "epoch": 1.15, - "learning_rate": 0.0001278116685054189, - "loss": 0.035, + "epoch": 0.68, + "learning_rate": 0.00019725178620987884, + "loss": 0.0592, "step": 106130 }, { - "epoch": 1.15, - "learning_rate": 0.00012779544422090983, - "loss": 0.0357, + "epoch": 0.69, + "learning_rate": 0.00019724210485552192, + "loss": 0.0529, "step": 106140 }, { - "epoch": 1.15, - "learning_rate": 0.00012777921993640078, - "loss": 0.0379, + "epoch": 0.69, + "learning_rate": 0.00019723242350116495, + "loss": 0.0456, "step": 106150 }, { - "epoch": 1.15, - "learning_rate": 0.00012776299565189173, - "loss": 0.0348, + "epoch": 0.69, + "learning_rate": 0.00019722274214680803, + "loss": 0.0392, "step": 106160 }, { - "epoch": 1.15, - "learning_rate": 0.00012774677136738268, - "loss": 0.0349, + "epoch": 0.69, + "learning_rate": 0.0001972130607924511, + "loss": 0.0455, "step": 106170 }, { - "epoch": 1.15, - "learning_rate": 0.00012773054708287363, - "loss": 0.0357, + "epoch": 0.69, + "learning_rate": 0.0001972033794380942, + "loss": 0.0412, "step": 106180 }, { - "epoch": 1.15, - "learning_rate": 0.00012771432279836458, - "loss": 0.0332, + "epoch": 0.69, + "learning_rate": 0.00019719369808373724, + "loss": 0.0545, "step": 106190 }, { - "epoch": 1.15, - "learning_rate": 0.00012769809851385553, - "loss": 0.0299, + "epoch": 0.69, + "learning_rate": 0.00019718401672938032, + "loss": 0.0455, "step": 106200 }, { - "epoch": 1.15, - "learning_rate": 0.00012768187422934648, - "loss": 0.036, + "epoch": 0.69, + "learning_rate": 0.0001971743353750234, + "loss": 0.045, "step": 106210 }, { - "epoch": 1.15, - "learning_rate": 0.00012766564994483743, - "loss": 0.0373, + "epoch": 0.69, + "learning_rate": 0.00019716465402066643, + "loss": 0.0501, "step": 106220 }, { - "epoch": 1.15, - "learning_rate": 0.00012764942566032835, - "loss": 0.0328, + "epoch": 0.69, + "learning_rate": 0.0001971549726663095, + "loss": 0.0429, "step": 106230 }, { - "epoch": 1.15, - "learning_rate": 0.0001276332013758193, - "loss": 0.0328, + "epoch": 0.69, + "learning_rate": 0.00019714529131195258, + "loss": 0.0431, "step": 106240 }, { - "epoch": 1.15, - "learning_rate": 0.00012761697709131025, - "loss": 0.0372, + "epoch": 0.69, + "learning_rate": 0.00019713560995759566, + "loss": 0.0506, "step": 106250 }, { - "epoch": 1.15, - "learning_rate": 0.0001276007528068012, - "loss": 0.0307, - "step": 106260 + "epoch": 0.69, + "learning_rate": 0.00019712592860323872, + "loss": 0.0416, + "step": 106260 }, { - "epoch": 1.15, - "learning_rate": 0.00012758452852229215, - "loss": 0.0417, + "epoch": 0.69, + "learning_rate": 0.0001971162472488818, + "loss": 0.0491, "step": 106270 }, { - "epoch": 1.15, - "learning_rate": 0.0001275683042377831, - "loss": 0.0349, + "epoch": 0.69, + "learning_rate": 0.00019710656589452488, + "loss": 0.0544, "step": 106280 }, { - "epoch": 1.15, - "learning_rate": 0.00012755207995327405, - "loss": 0.0307, + "epoch": 0.69, + "learning_rate": 0.0001970968845401679, + "loss": 0.0469, "step": 106290 }, { - "epoch": 1.15, - "learning_rate": 0.000127535855668765, - "loss": 0.0314, + "epoch": 0.69, + "learning_rate": 0.00019708720318581098, + "loss": 0.0618, "step": 106300 }, { - "epoch": 1.15, - "learning_rate": 0.00012751963138425595, - "loss": 0.0296, + "epoch": 0.69, + "learning_rate": 0.00019707752183145406, + "loss": 0.0434, "step": 106310 }, { - "epoch": 1.15, - "learning_rate": 0.00012750340709974687, - "loss": 0.0401, + "epoch": 0.69, + "learning_rate": 0.00019706784047709711, + "loss": 0.0393, "step": 106320 }, { - "epoch": 1.15, - "learning_rate": 0.00012748718281523782, - "loss": 0.0325, + "epoch": 0.69, + "learning_rate": 0.0001970581591227402, + "loss": 0.0445, "step": 106330 }, { - "epoch": 1.15, - "learning_rate": 0.00012747095853072877, - "loss": 0.0343, + "epoch": 0.69, + "learning_rate": 0.00019704847776838327, + "loss": 0.0399, "step": 106340 }, { - "epoch": 1.15, - "learning_rate": 0.00012745473424621972, - "loss": 0.0368, + "epoch": 0.69, + "learning_rate": 0.00019703879641402635, + "loss": 0.0418, "step": 106350 }, { - "epoch": 1.15, - "learning_rate": 0.00012743850996171067, - "loss": 0.0345, + "epoch": 0.69, + "learning_rate": 0.00019702911505966938, + "loss": 0.0479, "step": 106360 }, { - "epoch": 1.15, - "learning_rate": 0.00012742228567720162, - "loss": 0.0397, + "epoch": 0.69, + "learning_rate": 0.00019701943370531246, + "loss": 0.052, "step": 106370 }, { - "epoch": 1.15, - "learning_rate": 0.00012740606139269257, - "loss": 0.0411, + "epoch": 0.69, + "learning_rate": 0.00019700975235095554, + "loss": 0.0491, "step": 106380 }, { - "epoch": 1.15, - "learning_rate": 0.00012738983710818352, - "loss": 0.0387, + "epoch": 0.69, + "learning_rate": 0.0001970000709965986, + "loss": 0.0462, "step": 106390 }, { - "epoch": 1.15, - "learning_rate": 0.00012737361282367447, - "loss": 0.0372, + "epoch": 0.69, + "learning_rate": 0.00019699038964224167, + "loss": 0.0465, "step": 106400 }, { - "epoch": 1.15, - "learning_rate": 0.0001273573885391654, - "loss": 0.0388, + "epoch": 0.69, + "learning_rate": 0.00019698070828788475, + "loss": 0.0498, "step": 106410 }, { - "epoch": 1.15, - "learning_rate": 0.00012734116425465634, - "loss": 0.0287, + "epoch": 0.69, + "learning_rate": 0.00019697102693352783, + "loss": 0.0431, "step": 106420 }, { - "epoch": 1.15, - "learning_rate": 0.0001273249399701473, - "loss": 0.0391, + "epoch": 0.69, + "learning_rate": 0.00019696134557917086, + "loss": 0.0543, "step": 106430 }, { - "epoch": 1.15, - "learning_rate": 0.00012730871568563824, - "loss": 0.0344, + "epoch": 0.69, + "learning_rate": 0.00019695166422481394, + "loss": 0.0443, "step": 106440 }, { - "epoch": 1.15, - "learning_rate": 0.0001272924914011292, - "loss": 0.0277, + "epoch": 0.69, + "learning_rate": 0.00019694198287045702, + "loss": 0.0451, "step": 106450 }, { - "epoch": 1.15, - "learning_rate": 0.00012727626711662014, - "loss": 0.0316, + "epoch": 0.69, + "learning_rate": 0.00019693230151610007, + "loss": 0.0453, "step": 106460 }, { - "epoch": 1.15, - "learning_rate": 0.0001272600428321111, - "loss": 0.0399, + "epoch": 0.69, + "learning_rate": 0.00019692262016174315, + "loss": 0.0432, "step": 106470 }, { - "epoch": 1.15, - "learning_rate": 0.00012724381854760204, - "loss": 0.0392, + "epoch": 0.69, + "learning_rate": 0.00019691293880738623, + "loss": 0.0466, "step": 106480 }, { - "epoch": 1.15, - "learning_rate": 0.000127227594263093, - "loss": 0.0327, + "epoch": 0.69, + "learning_rate": 0.00019690325745302928, + "loss": 0.0459, "step": 106490 }, { - "epoch": 1.15, - "learning_rate": 0.00012721136997858391, - "loss": 0.0382, + "epoch": 0.69, + "learning_rate": 0.00019689357609867233, + "loss": 0.046, "step": 106500 }, { - "epoch": 1.15, - "learning_rate": 0.00012719514569407486, - "loss": 0.0365, + "epoch": 0.69, + "learning_rate": 0.00019688389474431541, + "loss": 0.0432, "step": 106510 }, { - "epoch": 1.15, - "learning_rate": 0.00012717892140956581, - "loss": 0.0416, + "epoch": 0.69, + "learning_rate": 0.00019687421338995847, + "loss": 0.0447, "step": 106520 }, { - "epoch": 1.15, - "learning_rate": 0.00012716269712505676, - "loss": 0.0327, + "epoch": 0.69, + "learning_rate": 0.00019686453203560155, + "loss": 0.0431, "step": 106530 }, { - "epoch": 1.15, - "learning_rate": 0.00012714647284054771, - "loss": 0.0387, + "epoch": 0.69, + "learning_rate": 0.00019685485068124463, + "loss": 0.0478, "step": 106540 }, { - "epoch": 1.15, - "learning_rate": 0.00012713024855603866, - "loss": 0.0366, + "epoch": 0.69, + "learning_rate": 0.0001968451693268877, + "loss": 0.0414, "step": 106550 }, { - "epoch": 1.15, - "learning_rate": 0.0001271140242715296, - "loss": 0.035, + "epoch": 0.69, + "learning_rate": 0.00019683548797253076, + "loss": 0.0518, "step": 106560 }, { - "epoch": 1.15, - "learning_rate": 0.00012709779998702056, - "loss": 0.0317, + "epoch": 0.69, + "learning_rate": 0.0001968258066181738, + "loss": 0.0495, "step": 106570 }, { - "epoch": 1.15, - "learning_rate": 0.0001270815757025115, - "loss": 0.0362, + "epoch": 0.69, + "learning_rate": 0.0001968161252638169, + "loss": 0.0461, "step": 106580 }, { - "epoch": 1.15, - "learning_rate": 0.00012706535141800244, - "loss": 0.036, + "epoch": 0.69, + "learning_rate": 0.00019680644390945994, + "loss": 0.0522, "step": 106590 }, { - "epoch": 1.15, - "learning_rate": 0.00012704912713349339, - "loss": 0.035, + "epoch": 0.69, + "learning_rate": 0.00019679676255510302, + "loss": 0.0511, "step": 106600 }, { - "epoch": 1.15, - "learning_rate": 0.00012703290284898434, - "loss": 0.0322, + "epoch": 0.69, + "learning_rate": 0.0001967870812007461, + "loss": 0.0493, "step": 106610 }, { - "epoch": 1.15, - "learning_rate": 0.00012701667856447528, - "loss": 0.0284, + "epoch": 0.69, + "learning_rate": 0.00019677739984638918, + "loss": 0.0489, "step": 106620 }, { - "epoch": 1.15, - "learning_rate": 0.00012700045427996623, - "loss": 0.0351, + "epoch": 0.69, + "learning_rate": 0.00019676771849203224, + "loss": 0.0434, "step": 106630 }, { - "epoch": 1.15, - "learning_rate": 0.00012698422999545718, - "loss": 0.0352, + "epoch": 0.69, + "learning_rate": 0.0001967580371376753, + "loss": 0.0419, "step": 106640 }, { - "epoch": 1.15, - "learning_rate": 0.00012696800571094813, - "loss": 0.0375, + "epoch": 0.69, + "learning_rate": 0.00019674835578331837, + "loss": 0.0449, "step": 106650 }, { - "epoch": 1.15, - "learning_rate": 0.00012695178142643908, - "loss": 0.0338, + "epoch": 0.69, + "learning_rate": 0.00019673867442896142, + "loss": 0.0512, "step": 106660 }, { - "epoch": 1.15, - "learning_rate": 0.00012693555714193003, - "loss": 0.0391, + "epoch": 0.69, + "learning_rate": 0.0001967289930746045, + "loss": 0.0501, "step": 106670 }, { - "epoch": 1.15, - "learning_rate": 0.00012691933285742096, - "loss": 0.0389, + "epoch": 0.69, + "learning_rate": 0.00019671931172024758, + "loss": 0.0555, "step": 106680 }, { - "epoch": 1.15, - "learning_rate": 0.0001269031085729119, - "loss": 0.0378, + "epoch": 0.69, + "learning_rate": 0.00019670963036589063, + "loss": 0.0446, "step": 106690 }, { - "epoch": 1.15, - "learning_rate": 0.00012688688428840286, - "loss": 0.0364, + "epoch": 0.69, + "learning_rate": 0.0001966999490115337, + "loss": 0.0518, "step": 106700 }, { - "epoch": 1.15, - "learning_rate": 0.0001268706600038938, - "loss": 0.0369, + "epoch": 0.69, + "learning_rate": 0.00019669026765717677, + "loss": 0.045, "step": 106710 }, { - "epoch": 1.15, - "learning_rate": 0.00012685443571938476, - "loss": 0.0392, + "epoch": 0.69, + "learning_rate": 0.00019668058630281982, + "loss": 0.0484, "step": 106720 }, { - "epoch": 1.15, - "learning_rate": 0.0001268382114348757, - "loss": 0.0327, + "epoch": 0.69, + "learning_rate": 0.0001966709049484629, + "loss": 0.0467, "step": 106730 }, { - "epoch": 1.15, - "learning_rate": 0.00012682198715036666, - "loss": 0.0387, + "epoch": 0.69, + "learning_rate": 0.00019666122359410598, + "loss": 0.041, "step": 106740 }, { - "epoch": 1.15, - "learning_rate": 0.0001268057628658576, - "loss": 0.0371, + "epoch": 0.69, + "learning_rate": 0.00019665154223974906, + "loss": 0.0454, "step": 106750 }, { - "epoch": 1.15, - "learning_rate": 0.00012678953858134855, - "loss": 0.0339, + "epoch": 0.69, + "learning_rate": 0.0001966418608853921, + "loss": 0.0439, "step": 106760 }, { - "epoch": 1.15, - "learning_rate": 0.0001267733142968395, - "loss": 0.0323, + "epoch": 0.69, + "learning_rate": 0.00019663217953103516, + "loss": 0.0424, "step": 106770 }, { - "epoch": 1.15, - "learning_rate": 0.00012675709001233045, - "loss": 0.0375, + "epoch": 0.69, + "learning_rate": 0.00019662249817667824, + "loss": 0.0413, "step": 106780 }, { - "epoch": 1.16, - "learning_rate": 0.0001267408657278214, - "loss": 0.035, + "epoch": 0.69, + "learning_rate": 0.0001966128168223213, + "loss": 0.0457, "step": 106790 }, { - "epoch": 1.16, - "learning_rate": 0.00012672464144331235, - "loss": 0.0305, + "epoch": 0.69, + "learning_rate": 0.00019660313546796438, + "loss": 0.0395, "step": 106800 }, { - "epoch": 1.16, - "learning_rate": 0.0001267084171588033, - "loss": 0.0315, + "epoch": 0.69, + "learning_rate": 0.00019659345411360746, + "loss": 0.0538, "step": 106810 }, { - "epoch": 1.16, - "learning_rate": 0.00012669219287429425, - "loss": 0.0321, + "epoch": 0.69, + "learning_rate": 0.00019658377275925054, + "loss": 0.0418, "step": 106820 }, { - "epoch": 1.16, - "learning_rate": 0.00012667596858978518, - "loss": 0.031, + "epoch": 0.69, + "learning_rate": 0.0001965740914048936, + "loss": 0.046, "step": 106830 }, { - "epoch": 1.16, - "learning_rate": 0.00012665974430527613, - "loss": 0.0359, + "epoch": 0.69, + "learning_rate": 0.00019656441005053664, + "loss": 0.0454, "step": 106840 }, { - "epoch": 1.16, - "learning_rate": 0.00012664352002076708, - "loss": 0.0298, + "epoch": 0.69, + "learning_rate": 0.00019655472869617972, + "loss": 0.0533, "step": 106850 }, { - "epoch": 1.16, - "learning_rate": 0.00012662729573625803, - "loss": 0.0405, + "epoch": 0.69, + "learning_rate": 0.00019654504734182277, + "loss": 0.0457, "step": 106860 }, { - "epoch": 1.16, - "learning_rate": 0.00012661107145174897, - "loss": 0.0361, + "epoch": 0.69, + "learning_rate": 0.00019653536598746585, + "loss": 0.1217, "step": 106870 }, { - "epoch": 1.16, - "learning_rate": 0.00012659484716723992, - "loss": 0.0425, + "epoch": 0.69, + "learning_rate": 0.00019652568463310893, + "loss": 0.0501, "step": 106880 }, { - "epoch": 1.16, - "learning_rate": 0.00012657862288273087, - "loss": 0.0411, + "epoch": 0.69, + "learning_rate": 0.000196516003278752, + "loss": 0.0533, "step": 106890 }, { - "epoch": 1.16, - "learning_rate": 0.00012656239859822182, - "loss": 0.0316, + "epoch": 0.69, + "learning_rate": 0.00019650632192439507, + "loss": 0.0463, "step": 106900 }, { - "epoch": 1.16, - "learning_rate": 0.00012654617431371277, - "loss": 0.0359, + "epoch": 0.69, + "learning_rate": 0.00019649664057003812, + "loss": 0.0432, "step": 106910 }, { - "epoch": 1.16, - "learning_rate": 0.0001265299500292037, - "loss": 0.0304, + "epoch": 0.69, + "learning_rate": 0.00019648695921568117, + "loss": 0.0494, "step": 106920 }, { - "epoch": 1.16, - "learning_rate": 0.00012651372574469465, - "loss": 0.0337, + "epoch": 0.69, + "learning_rate": 0.00019647727786132425, + "loss": 0.0406, "step": 106930 }, { - "epoch": 1.16, - "learning_rate": 0.0001264975014601856, - "loss": 0.0379, + "epoch": 0.69, + "learning_rate": 0.00019646759650696733, + "loss": 0.0508, "step": 106940 }, { - "epoch": 1.16, - "learning_rate": 0.00012648127717567655, - "loss": 0.0378, + "epoch": 0.69, + "learning_rate": 0.0001964579151526104, + "loss": 0.0455, "step": 106950 }, { - "epoch": 1.16, - "learning_rate": 0.0001264650528911675, - "loss": 0.0393, + "epoch": 0.69, + "learning_rate": 0.00019644823379825346, + "loss": 0.0402, "step": 106960 }, { - "epoch": 1.16, - "learning_rate": 0.00012644882860665845, - "loss": 0.0351, + "epoch": 0.69, + "learning_rate": 0.00019643855244389654, + "loss": 0.0482, "step": 106970 }, { - "epoch": 1.16, - "learning_rate": 0.0001264326043221494, - "loss": 0.0344, + "epoch": 0.69, + "learning_rate": 0.0001964288710895396, + "loss": 0.0958, "step": 106980 }, { - "epoch": 1.16, - "learning_rate": 0.00012641638003764035, - "loss": 0.0352, + "epoch": 0.69, + "learning_rate": 0.00019641918973518265, + "loss": 0.056, "step": 106990 }, { - "epoch": 1.16, - "learning_rate": 0.0001264001557531313, - "loss": 0.0438, + "epoch": 0.69, + "learning_rate": 0.00019640950838082573, + "loss": 0.0456, "step": 107000 }, { - "epoch": 1.16, - "eval_cer": 0.9212391397689865, - "eval_loss": 0.02793010324239731, - "eval_runtime": 118.945, - "eval_samples_per_second": 16.814, - "eval_steps_per_second": 4.204, + "epoch": 0.69, + "eval_cer": 0.9199249802282228, + "eval_loss": 0.03076346032321453, + "eval_runtime": 119.7637, + "eval_samples_per_second": 16.7, + "eval_steps_per_second": 4.175, "step": 107000 }, { - "epoch": 1.16, - "learning_rate": 0.00012638393146862222, - "loss": 0.0312, + "epoch": 0.69, + "learning_rate": 0.0001963998270264688, + "loss": 0.0391, "step": 107010 }, { - "epoch": 1.16, - "learning_rate": 0.00012636770718411317, - "loss": 0.0368, + "epoch": 0.69, + "learning_rate": 0.0001963901456721119, + "loss": 0.0503, "step": 107020 }, { - "epoch": 1.16, - "learning_rate": 0.00012635148289960412, - "loss": 0.0411, + "epoch": 0.69, + "learning_rate": 0.00019638046431775494, + "loss": 0.0497, "step": 107030 }, { - "epoch": 1.16, - "learning_rate": 0.00012633525861509507, - "loss": 0.0367, + "epoch": 0.69, + "learning_rate": 0.00019637078296339802, + "loss": 0.0553, "step": 107040 }, { - "epoch": 1.16, - "learning_rate": 0.00012631903433058602, - "loss": 0.0342, + "epoch": 0.69, + "learning_rate": 0.00019636110160904107, + "loss": 0.0503, "step": 107050 }, { - "epoch": 1.16, - "learning_rate": 0.00012630281004607697, - "loss": 0.0349, + "epoch": 0.69, + "learning_rate": 0.00019635142025468412, + "loss": 0.0498, "step": 107060 }, { - "epoch": 1.16, - "learning_rate": 0.00012628658576156792, - "loss": 0.0347, + "epoch": 0.69, + "learning_rate": 0.0001963417389003272, + "loss": 0.0547, "step": 107070 }, { - "epoch": 1.16, - "learning_rate": 0.00012627036147705887, - "loss": 0.0377, + "epoch": 0.69, + "learning_rate": 0.00019633205754597028, + "loss": 0.0447, "step": 107080 }, { - "epoch": 1.16, - "learning_rate": 0.00012625413719254982, - "loss": 0.0382, + "epoch": 0.69, + "learning_rate": 0.00019632237619161336, + "loss": 0.0471, "step": 107090 }, { - "epoch": 1.16, - "learning_rate": 0.00012623791290804074, - "loss": 0.0444, + "epoch": 0.69, + "learning_rate": 0.00019631269483725642, + "loss": 0.0451, "step": 107100 }, { - "epoch": 1.16, - "learning_rate": 0.0001262216886235317, - "loss": 0.0311, + "epoch": 0.69, + "learning_rate": 0.0001963030134828995, + "loss": 0.0459, "step": 107110 }, { - "epoch": 1.16, - "learning_rate": 0.00012620546433902264, - "loss": 0.0338, + "epoch": 0.69, + "learning_rate": 0.00019629333212854252, + "loss": 0.0442, "step": 107120 }, { - "epoch": 1.16, - "learning_rate": 0.0001261892400545136, - "loss": 0.0301, + "epoch": 0.69, + "learning_rate": 0.0001962836507741856, + "loss": 0.0466, "step": 107130 }, { - "epoch": 1.16, - "learning_rate": 0.00012617301577000454, - "loss": 0.0365, + "epoch": 0.69, + "learning_rate": 0.00019627396941982868, + "loss": 0.0467, "step": 107140 }, { - "epoch": 1.16, - "learning_rate": 0.0001261567914854955, - "loss": 0.0384, + "epoch": 0.69, + "learning_rate": 0.00019626428806547176, + "loss": 0.0502, "step": 107150 }, { - "epoch": 1.16, - "learning_rate": 0.00012614056720098644, - "loss": 0.0366, + "epoch": 0.69, + "learning_rate": 0.00019625460671111481, + "loss": 0.046, "step": 107160 }, { - "epoch": 1.16, - "learning_rate": 0.0001261243429164774, - "loss": 0.0337, + "epoch": 0.69, + "learning_rate": 0.0001962449253567579, + "loss": 0.0436, "step": 107170 }, { - "epoch": 1.16, - "learning_rate": 0.00012610811863196834, - "loss": 0.037, + "epoch": 0.69, + "learning_rate": 0.00019623524400240097, + "loss": 0.0418, "step": 107180 }, { - "epoch": 1.16, - "learning_rate": 0.00012609189434745926, - "loss": 0.0309, + "epoch": 0.69, + "learning_rate": 0.000196225562648044, + "loss": 0.0431, "step": 107190 }, { - "epoch": 1.16, - "learning_rate": 0.0001260756700629502, - "loss": 0.0372, + "epoch": 0.69, + "learning_rate": 0.00019621588129368708, + "loss": 0.0433, "step": 107200 }, { - "epoch": 1.16, - "learning_rate": 0.00012605944577844116, - "loss": 0.0332, + "epoch": 0.69, + "learning_rate": 0.00019620619993933016, + "loss": 0.0463, "step": 107210 }, { - "epoch": 1.16, - "learning_rate": 0.0001260432214939321, - "loss": 0.0372, + "epoch": 0.69, + "learning_rate": 0.00019619651858497324, + "loss": 0.0439, "step": 107220 }, { - "epoch": 1.16, - "learning_rate": 0.00012602699720942306, - "loss": 0.0298, + "epoch": 0.69, + "learning_rate": 0.0001961868372306163, + "loss": 0.0467, "step": 107230 }, { - "epoch": 1.16, - "learning_rate": 0.000126010772924914, - "loss": 0.0323, + "epoch": 0.69, + "learning_rate": 0.00019617715587625937, + "loss": 0.0598, "step": 107240 }, { - "epoch": 1.16, - "learning_rate": 0.00012599454864040496, - "loss": 0.0355, + "epoch": 0.69, + "learning_rate": 0.00019616747452190245, + "loss": 0.0482, "step": 107250 }, { - "epoch": 1.16, - "learning_rate": 0.0001259783243558959, - "loss": 0.0339, + "epoch": 0.69, + "learning_rate": 0.00019615779316754548, + "loss": 0.0456, "step": 107260 }, { - "epoch": 1.16, - "learning_rate": 0.00012596210007138686, - "loss": 0.039, + "epoch": 0.69, + "learning_rate": 0.00019614811181318856, + "loss": 0.0545, "step": 107270 }, { - "epoch": 1.16, - "learning_rate": 0.00012594587578687778, - "loss": 0.0299, + "epoch": 0.69, + "learning_rate": 0.00019613843045883164, + "loss": 0.0454, "step": 107280 }, { - "epoch": 1.16, - "learning_rate": 0.00012592965150236873, - "loss": 0.0364, + "epoch": 0.69, + "learning_rate": 0.00019612874910447472, + "loss": 0.04, "step": 107290 }, { - "epoch": 1.16, - "learning_rate": 0.00012591342721785968, - "loss": 0.0346, + "epoch": 0.69, + "learning_rate": 0.00019611906775011777, + "loss": 0.0416, "step": 107300 }, { - "epoch": 1.16, - "learning_rate": 0.00012589720293335063, - "loss": 0.0346, + "epoch": 0.69, + "learning_rate": 0.00019610938639576085, + "loss": 0.0554, "step": 107310 }, { - "epoch": 1.16, - "learning_rate": 0.00012588097864884158, - "loss": 0.0366, + "epoch": 0.69, + "learning_rate": 0.00019609970504140393, + "loss": 0.0473, "step": 107320 }, { - "epoch": 1.16, - "learning_rate": 0.00012586475436433253, - "loss": 0.0332, + "epoch": 0.69, + "learning_rate": 0.00019609002368704695, + "loss": 0.046, "step": 107330 }, { - "epoch": 1.16, - "learning_rate": 0.00012584853007982348, - "loss": 0.0412, + "epoch": 0.69, + "learning_rate": 0.00019608034233269003, + "loss": 0.044, "step": 107340 }, { - "epoch": 1.16, - "learning_rate": 0.00012583230579531443, - "loss": 0.0335, + "epoch": 0.69, + "learning_rate": 0.00019607066097833311, + "loss": 0.0415, "step": 107350 }, { - "epoch": 1.16, - "learning_rate": 0.00012581608151080538, - "loss": 0.0323, + "epoch": 0.69, + "learning_rate": 0.00019606097962397617, + "loss": 0.0453, "step": 107360 }, { - "epoch": 1.16, - "learning_rate": 0.0001257998572262963, - "loss": 0.0424, + "epoch": 0.69, + "learning_rate": 0.00019605129826961925, + "loss": 0.0457, "step": 107370 }, { - "epoch": 1.16, - "learning_rate": 0.00012578363294178725, - "loss": 0.0339, + "epoch": 0.69, + "learning_rate": 0.00019604161691526233, + "loss": 0.0437, "step": 107380 }, { - "epoch": 1.16, - "learning_rate": 0.0001257674086572782, - "loss": 0.035, + "epoch": 0.69, + "learning_rate": 0.0001960319355609054, + "loss": 0.045, "step": 107390 }, { - "epoch": 1.16, - "learning_rate": 0.00012575118437276915, - "loss": 0.0328, + "epoch": 0.69, + "learning_rate": 0.00019602225420654843, + "loss": 0.0422, "step": 107400 }, { - "epoch": 1.16, - "learning_rate": 0.0001257349600882601, - "loss": 0.0383, + "epoch": 0.69, + "learning_rate": 0.0001960125728521915, + "loss": 0.0469, "step": 107410 }, { - "epoch": 1.16, - "learning_rate": 0.00012571873580375105, - "loss": 0.0307, + "epoch": 0.69, + "learning_rate": 0.0001960028914978346, + "loss": 0.0472, "step": 107420 }, { - "epoch": 1.16, - "learning_rate": 0.000125702511519242, - "loss": 0.0423, + "epoch": 0.69, + "learning_rate": 0.00019599321014347764, + "loss": 0.0535, "step": 107430 }, { - "epoch": 1.16, - "learning_rate": 0.00012568628723473295, - "loss": 0.0334, + "epoch": 0.69, + "learning_rate": 0.00019598352878912072, + "loss": 0.0453, "step": 107440 }, { - "epoch": 1.16, - "learning_rate": 0.0001256700629502239, - "loss": 0.0337, + "epoch": 0.69, + "learning_rate": 0.0001959738474347638, + "loss": 0.0432, "step": 107450 }, { - "epoch": 1.16, - "learning_rate": 0.00012565383866571482, - "loss": 0.0351, + "epoch": 0.69, + "learning_rate": 0.00019596416608040688, + "loss": 0.051, "step": 107460 }, { - "epoch": 1.16, - "learning_rate": 0.00012563761438120577, - "loss": 0.0324, + "epoch": 0.69, + "learning_rate": 0.0001959544847260499, + "loss": 0.0443, "step": 107470 }, { - "epoch": 1.16, - "learning_rate": 0.00012562139009669672, - "loss": 0.0353, + "epoch": 0.69, + "learning_rate": 0.000195944803371693, + "loss": 0.043, "step": 107480 }, { - "epoch": 1.16, - "learning_rate": 0.00012560516581218767, - "loss": 0.0341, + "epoch": 0.69, + "learning_rate": 0.00019593512201733607, + "loss": 0.0442, "step": 107490 }, { - "epoch": 1.16, - "learning_rate": 0.00012558894152767862, - "loss": 0.0345, + "epoch": 0.69, + "learning_rate": 0.00019592544066297912, + "loss": 0.0516, "step": 107500 }, { - "epoch": 1.16, - "learning_rate": 0.00012557271724316957, - "loss": 0.0415, + "epoch": 0.69, + "learning_rate": 0.0001959157593086222, + "loss": 0.043, "step": 107510 }, { - "epoch": 1.16, - "learning_rate": 0.00012555649295866052, - "loss": 0.0352, + "epoch": 0.69, + "learning_rate": 0.00019590607795426528, + "loss": 0.0432, "step": 107520 }, { - "epoch": 1.16, - "learning_rate": 0.00012554026867415147, - "loss": 0.0286, + "epoch": 0.69, + "learning_rate": 0.00019589639659990833, + "loss": 0.0405, "step": 107530 }, { - "epoch": 1.16, - "learning_rate": 0.00012552404438964242, - "loss": 0.0357, + "epoch": 0.69, + "learning_rate": 0.00019588671524555139, + "loss": 0.0459, "step": 107540 }, { - "epoch": 1.16, - "learning_rate": 0.00012550782010513334, - "loss": 0.0324, + "epoch": 0.69, + "learning_rate": 0.00019587703389119447, + "loss": 0.0482, "step": 107550 }, { - "epoch": 1.16, - "learning_rate": 0.0001254915958206243, - "loss": 0.0327, + "epoch": 0.69, + "learning_rate": 0.00019586735253683752, + "loss": 0.0427, "step": 107560 }, { - "epoch": 1.16, - "learning_rate": 0.00012547537153611524, - "loss": 0.0328, + "epoch": 0.69, + "learning_rate": 0.0001958576711824806, + "loss": 0.0536, "step": 107570 }, { - "epoch": 1.16, - "learning_rate": 0.0001254591472516062, - "loss": 0.0334, + "epoch": 0.69, + "learning_rate": 0.00019584798982812368, + "loss": 0.0398, "step": 107580 }, { - "epoch": 1.16, - "learning_rate": 0.00012544292296709714, - "loss": 0.0423, + "epoch": 0.69, + "learning_rate": 0.00019583830847376676, + "loss": 0.0457, "step": 107590 }, { - "epoch": 1.16, - "learning_rate": 0.0001254266986825881, - "loss": 0.0351, + "epoch": 0.69, + "learning_rate": 0.0001958286271194098, + "loss": 0.0677, "step": 107600 }, { - "epoch": 1.16, - "learning_rate": 0.00012541047439807904, - "loss": 0.0347, + "epoch": 0.69, + "learning_rate": 0.00019581894576505286, + "loss": 0.0438, "step": 107610 }, { - "epoch": 1.16, - "learning_rate": 0.00012539425011357, - "loss": 0.0381, + "epoch": 0.69, + "learning_rate": 0.00019580926441069594, + "loss": 0.047, "step": 107620 }, { - "epoch": 1.16, - "learning_rate": 0.00012537802582906094, - "loss": 0.0328, + "epoch": 0.69, + "learning_rate": 0.000195799583056339, + "loss": 0.0427, "step": 107630 }, { - "epoch": 1.16, - "learning_rate": 0.00012536180154455186, - "loss": 0.0305, + "epoch": 0.69, + "learning_rate": 0.00019578990170198208, + "loss": 0.0457, "step": 107640 }, { - "epoch": 1.16, - "learning_rate": 0.0001253455772600428, - "loss": 0.0295, + "epoch": 0.69, + "learning_rate": 0.00019578022034762516, + "loss": 0.0456, "step": 107650 }, { - "epoch": 1.16, - "learning_rate": 0.00012532935297553376, - "loss": 0.0351, + "epoch": 0.69, + "learning_rate": 0.00019577053899326823, + "loss": 0.0555, "step": 107660 }, { - "epoch": 1.16, - "learning_rate": 0.0001253131286910247, - "loss": 0.0365, + "epoch": 0.69, + "learning_rate": 0.0001957608576389113, + "loss": 0.049, "step": 107670 }, { - "epoch": 1.16, - "learning_rate": 0.00012529690440651566, - "loss": 0.0324, + "epoch": 0.69, + "learning_rate": 0.00019575117628455434, + "loss": 0.0445, "step": 107680 }, { - "epoch": 1.16, - "learning_rate": 0.0001252806801220066, - "loss": 0.0365, + "epoch": 0.7, + "learning_rate": 0.00019574149493019742, + "loss": 0.0455, "step": 107690 }, { - "epoch": 1.16, - "learning_rate": 0.00012526445583749756, - "loss": 0.0355, + "epoch": 0.7, + "learning_rate": 0.00019573181357584047, + "loss": 0.0425, "step": 107700 }, { - "epoch": 1.16, - "learning_rate": 0.0001252482315529885, - "loss": 0.0316, + "epoch": 0.7, + "learning_rate": 0.00019572213222148355, + "loss": 0.0489, "step": 107710 }, { - "epoch": 1.17, - "learning_rate": 0.00012523200726847946, - "loss": 0.0383, + "epoch": 0.7, + "learning_rate": 0.00019571245086712663, + "loss": 0.0452, "step": 107720 }, { - "epoch": 1.17, - "learning_rate": 0.00012521578298397038, - "loss": 0.0304, + "epoch": 0.7, + "learning_rate": 0.00019570276951276968, + "loss": 0.0449, "step": 107730 }, { - "epoch": 1.17, - "learning_rate": 0.00012519955869946133, - "loss": 0.034, + "epoch": 0.7, + "learning_rate": 0.00019569308815841276, + "loss": 0.062, "step": 107740 }, { - "epoch": 1.17, - "learning_rate": 0.00012518333441495228, - "loss": 0.0412, + "epoch": 0.7, + "learning_rate": 0.00019568340680405582, + "loss": 0.0558, "step": 107750 }, { - "epoch": 1.17, - "learning_rate": 0.00012516711013044323, - "loss": 0.0367, + "epoch": 0.7, + "learning_rate": 0.00019567372544969887, + "loss": 0.0446, "step": 107760 }, { - "epoch": 1.17, - "learning_rate": 0.00012515088584593418, - "loss": 0.0357, + "epoch": 0.7, + "learning_rate": 0.00019566404409534195, + "loss": 0.0442, "step": 107770 }, { - "epoch": 1.17, - "learning_rate": 0.00012513466156142513, - "loss": 0.036, + "epoch": 0.7, + "learning_rate": 0.00019565436274098503, + "loss": 0.0446, "step": 107780 }, { - "epoch": 1.17, - "learning_rate": 0.00012511843727691608, - "loss": 0.0359, + "epoch": 0.7, + "learning_rate": 0.0001956446813866281, + "loss": 0.0386, "step": 107790 }, { - "epoch": 1.17, - "learning_rate": 0.00012510221299240703, - "loss": 0.0303, + "epoch": 0.7, + "learning_rate": 0.00019563500003227116, + "loss": 0.0495, "step": 107800 }, { - "epoch": 1.17, - "learning_rate": 0.00012508598870789798, - "loss": 0.0379, + "epoch": 0.7, + "learning_rate": 0.00019562531867791424, + "loss": 0.0402, "step": 107810 }, { - "epoch": 1.17, - "learning_rate": 0.0001250697644233889, - "loss": 0.0346, + "epoch": 0.7, + "learning_rate": 0.0001956156373235573, + "loss": 0.0413, "step": 107820 }, { - "epoch": 1.17, - "learning_rate": 0.00012505354013887985, - "loss": 0.0396, + "epoch": 0.7, + "learning_rate": 0.00019560595596920035, + "loss": 0.0529, "step": 107830 }, { - "epoch": 1.17, - "learning_rate": 0.0001250373158543708, - "loss": 0.0323, + "epoch": 0.7, + "learning_rate": 0.00019559627461484343, + "loss": 0.0431, "step": 107840 }, { - "epoch": 1.17, - "learning_rate": 0.00012502109156986175, - "loss": 0.0363, + "epoch": 0.7, + "learning_rate": 0.0001955865932604865, + "loss": 0.0563, "step": 107850 }, { - "epoch": 1.17, - "learning_rate": 0.0001250048672853527, - "loss": 0.0404, + "epoch": 0.7, + "learning_rate": 0.0001955769119061296, + "loss": 0.0563, "step": 107860 }, { - "epoch": 1.17, - "learning_rate": 0.00012498864300084365, - "loss": 0.0388, + "epoch": 0.7, + "learning_rate": 0.00019556723055177264, + "loss": 0.0424, "step": 107870 }, { - "epoch": 1.17, - "learning_rate": 0.0001249724187163346, - "loss": 0.0401, + "epoch": 0.7, + "learning_rate": 0.00019555754919741572, + "loss": 0.0392, "step": 107880 }, { - "epoch": 1.17, - "learning_rate": 0.00012495619443182555, - "loss": 0.0365, + "epoch": 0.7, + "learning_rate": 0.00019554786784305877, + "loss": 0.0493, "step": 107890 }, { - "epoch": 1.17, - "learning_rate": 0.0001249399701473165, - "loss": 0.0368, + "epoch": 0.7, + "learning_rate": 0.00019553818648870182, + "loss": 0.0463, "step": 107900 }, { - "epoch": 1.17, - "learning_rate": 0.00012492374586280745, - "loss": 0.0319, + "epoch": 0.7, + "learning_rate": 0.0001955285051343449, + "loss": 0.043, "step": 107910 }, { - "epoch": 1.17, - "learning_rate": 0.00012490752157829838, - "loss": 0.0376, + "epoch": 0.7, + "learning_rate": 0.00019551882377998798, + "loss": 0.0525, "step": 107920 }, { - "epoch": 1.17, - "learning_rate": 0.00012489129729378933, - "loss": 0.037, + "epoch": 0.7, + "learning_rate": 0.00019550914242563104, + "loss": 0.0453, "step": 107930 }, { - "epoch": 1.17, - "learning_rate": 0.00012487507300928028, - "loss": 0.0408, + "epoch": 0.7, + "learning_rate": 0.00019549946107127412, + "loss": 0.0496, "step": 107940 }, { - "epoch": 1.17, - "learning_rate": 0.00012485884872477122, - "loss": 0.0314, + "epoch": 0.7, + "learning_rate": 0.0001954897797169172, + "loss": 0.0443, "step": 107950 }, { - "epoch": 1.17, - "learning_rate": 0.00012484262444026217, - "loss": 0.0368, + "epoch": 0.7, + "learning_rate": 0.00019548009836256022, + "loss": 0.0442, "step": 107960 }, { - "epoch": 1.17, - "learning_rate": 0.00012482640015575312, - "loss": 0.0334, + "epoch": 0.7, + "learning_rate": 0.0001954704170082033, + "loss": 0.0589, "step": 107970 }, { - "epoch": 1.17, - "learning_rate": 0.00012481017587124407, - "loss": 0.0344, + "epoch": 0.7, + "learning_rate": 0.00019546073565384638, + "loss": 0.0403, "step": 107980 }, { - "epoch": 1.17, - "learning_rate": 0.00012479395158673502, - "loss": 0.0325, + "epoch": 0.7, + "learning_rate": 0.00019545105429948946, + "loss": 0.043, "step": 107990 }, { - "epoch": 1.17, - "learning_rate": 0.00012477772730222597, - "loss": 0.037, + "epoch": 0.7, + "learning_rate": 0.00019544137294513251, + "loss": 0.0433, "step": 108000 }, { - "epoch": 1.17, - "eval_cer": 0.9211587426957933, - "eval_loss": 0.02736649662256241, - "eval_runtime": 118.6945, - "eval_samples_per_second": 16.85, - "eval_steps_per_second": 4.212, + "epoch": 0.7, + "eval_cer": 0.9200207886114563, + "eval_loss": 0.030186787247657776, + "eval_runtime": 119.9054, + "eval_samples_per_second": 16.68, + "eval_steps_per_second": 4.17, "step": 108000 }, { - "epoch": 1.17, - "learning_rate": 0.0001247615030177169, - "loss": 0.0331, + "epoch": 0.7, + "learning_rate": 0.0001954316915907756, + "loss": 0.0465, "step": 108010 }, { - "epoch": 1.17, - "learning_rate": 0.00012474527873320785, - "loss": 0.0319, + "epoch": 0.7, + "learning_rate": 0.00019542201023641867, + "loss": 0.0443, "step": 108020 }, { - "epoch": 1.17, - "learning_rate": 0.0001247290544486988, - "loss": 0.0322, + "epoch": 0.7, + "learning_rate": 0.0001954123288820617, + "loss": 0.0405, "step": 108030 }, { - "epoch": 1.17, - "learning_rate": 0.00012471283016418975, - "loss": 0.0383, + "epoch": 0.7, + "learning_rate": 0.00019540264752770478, + "loss": 0.0418, "step": 108040 }, { - "epoch": 1.17, - "learning_rate": 0.0001246966058796807, - "loss": 0.0367, + "epoch": 0.7, + "learning_rate": 0.00019539296617334786, + "loss": 0.0472, "step": 108050 }, { - "epoch": 1.17, - "learning_rate": 0.00012468038159517165, - "loss": 0.0309, + "epoch": 0.7, + "learning_rate": 0.00019538328481899094, + "loss": 0.0409, "step": 108060 }, { - "epoch": 1.17, - "learning_rate": 0.0001246641573106626, - "loss": 0.0274, + "epoch": 0.7, + "learning_rate": 0.000195373603464634, + "loss": 0.0472, "step": 108070 }, { - "epoch": 1.17, - "learning_rate": 0.00012464793302615354, - "loss": 0.0359, + "epoch": 0.7, + "learning_rate": 0.00019536392211027707, + "loss": 0.0436, "step": 108080 }, { - "epoch": 1.17, - "learning_rate": 0.0001246317087416445, - "loss": 0.0366, + "epoch": 0.7, + "learning_rate": 0.00019535424075592015, + "loss": 0.0471, "step": 108090 }, { - "epoch": 1.17, - "learning_rate": 0.00012461548445713542, - "loss": 0.0346, + "epoch": 0.7, + "learning_rate": 0.00019534455940156318, + "loss": 0.0443, "step": 108100 }, { - "epoch": 1.17, - "learning_rate": 0.00012459926017262637, - "loss": 0.0362, + "epoch": 0.7, + "learning_rate": 0.00019533487804720626, + "loss": 0.0473, "step": 108110 }, { - "epoch": 1.17, - "learning_rate": 0.00012458303588811732, - "loss": 0.0315, + "epoch": 0.7, + "learning_rate": 0.00019532519669284934, + "loss": 0.0452, "step": 108120 }, { - "epoch": 1.17, - "learning_rate": 0.00012456681160360827, - "loss": 0.0335, + "epoch": 0.7, + "learning_rate": 0.0001953155153384924, + "loss": 0.0505, "step": 108130 }, { - "epoch": 1.17, - "learning_rate": 0.00012455058731909922, - "loss": 0.0371, + "epoch": 0.7, + "learning_rate": 0.00019530583398413547, + "loss": 0.0456, "step": 108140 }, { - "epoch": 1.17, - "learning_rate": 0.00012453436303459017, - "loss": 0.0398, + "epoch": 0.7, + "learning_rate": 0.00019529615262977855, + "loss": 0.0455, "step": 108150 }, { - "epoch": 1.17, - "learning_rate": 0.00012451813875008112, - "loss": 0.0343, + "epoch": 0.7, + "learning_rate": 0.00019528647127542163, + "loss": 0.0414, "step": 108160 }, { - "epoch": 1.17, - "learning_rate": 0.00012450191446557207, - "loss": 0.0411, + "epoch": 0.7, + "learning_rate": 0.00019527678992106465, + "loss": 0.0433, "step": 108170 }, { - "epoch": 1.17, - "learning_rate": 0.00012448569018106302, - "loss": 0.0363, + "epoch": 0.7, + "learning_rate": 0.00019526710856670773, + "loss": 0.0397, "step": 108180 }, { - "epoch": 1.17, - "learning_rate": 0.00012446946589655394, - "loss": 0.0383, + "epoch": 0.7, + "learning_rate": 0.0001952574272123508, + "loss": 0.0482, "step": 108190 }, { - "epoch": 1.17, - "learning_rate": 0.0001244532416120449, - "loss": 0.0322, + "epoch": 0.7, + "learning_rate": 0.00019524774585799387, + "loss": 0.0464, "step": 108200 }, { - "epoch": 1.17, - "learning_rate": 0.00012443701732753584, - "loss": 0.0327, + "epoch": 0.7, + "learning_rate": 0.00019523806450363695, + "loss": 0.0442, "step": 108210 }, { - "epoch": 1.17, - "learning_rate": 0.0001244207930430268, - "loss": 0.0396, + "epoch": 0.7, + "learning_rate": 0.00019522838314928003, + "loss": 0.0598, "step": 108220 }, { - "epoch": 1.17, - "learning_rate": 0.00012440456875851774, - "loss": 0.0281, + "epoch": 0.7, + "learning_rate": 0.0001952187017949231, + "loss": 0.0421, "step": 108230 }, { - "epoch": 1.17, - "learning_rate": 0.0001243883444740087, - "loss": 0.0358, + "epoch": 0.7, + "learning_rate": 0.00019520902044056613, + "loss": 0.0427, "step": 108240 }, { - "epoch": 1.17, - "learning_rate": 0.00012437212018949964, - "loss": 0.0328, + "epoch": 0.7, + "learning_rate": 0.0001951993390862092, + "loss": 0.0499, "step": 108250 }, { - "epoch": 1.17, - "learning_rate": 0.0001243558959049906, - "loss": 0.0402, + "epoch": 0.7, + "learning_rate": 0.0001951896577318523, + "loss": 0.054, "step": 108260 }, { - "epoch": 1.17, - "learning_rate": 0.00012433967162048154, - "loss": 0.0298, + "epoch": 0.7, + "learning_rate": 0.00019517997637749534, + "loss": 0.053, "step": 108270 }, { - "epoch": 1.17, - "learning_rate": 0.00012432344733597246, - "loss": 0.0415, + "epoch": 0.7, + "learning_rate": 0.00019517029502313842, + "loss": 0.0446, "step": 108280 }, { - "epoch": 1.17, - "learning_rate": 0.0001243072230514634, - "loss": 0.0397, + "epoch": 0.7, + "learning_rate": 0.0001951606136687815, + "loss": 0.0442, "step": 108290 }, { - "epoch": 1.17, - "learning_rate": 0.00012429099876695436, - "loss": 0.0387, + "epoch": 0.7, + "learning_rate": 0.00019515093231442456, + "loss": 0.0542, "step": 108300 }, { - "epoch": 1.17, - "learning_rate": 0.0001242747744824453, - "loss": 0.0377, + "epoch": 0.7, + "learning_rate": 0.0001951412509600676, + "loss": 0.05, "step": 108310 }, { - "epoch": 1.17, - "learning_rate": 0.00012425855019793626, - "loss": 0.0401, + "epoch": 0.7, + "learning_rate": 0.0001951315696057107, + "loss": 0.0442, "step": 108320 }, { - "epoch": 1.17, - "learning_rate": 0.0001242423259134272, - "loss": 0.0518, + "epoch": 0.7, + "learning_rate": 0.00019512188825135374, + "loss": 0.0403, "step": 108330 }, { - "epoch": 1.17, - "learning_rate": 0.00012422610162891816, - "loss": 0.0335, + "epoch": 0.7, + "learning_rate": 0.00019511220689699682, + "loss": 0.0435, "step": 108340 }, { - "epoch": 1.17, - "learning_rate": 0.0001242098773444091, - "loss": 0.0436, + "epoch": 0.7, + "learning_rate": 0.0001951025255426399, + "loss": 0.041, "step": 108350 }, { - "epoch": 1.17, - "learning_rate": 0.00012419365305990006, - "loss": 0.0341, + "epoch": 0.7, + "learning_rate": 0.00019509284418828298, + "loss": 0.0455, "step": 108360 }, { - "epoch": 1.17, - "learning_rate": 0.00012417742877539098, - "loss": 0.0361, + "epoch": 0.7, + "learning_rate": 0.00019508316283392603, + "loss": 0.0439, "step": 108370 }, { - "epoch": 1.17, - "learning_rate": 0.00012416120449088193, - "loss": 0.0398, + "epoch": 0.7, + "learning_rate": 0.00019507348147956909, + "loss": 0.0426, "step": 108380 }, { - "epoch": 1.17, - "learning_rate": 0.00012414498020637288, - "loss": 0.0344, + "epoch": 0.7, + "learning_rate": 0.00019506380012521217, + "loss": 0.0454, "step": 108390 }, { - "epoch": 1.17, - "learning_rate": 0.00012412875592186383, - "loss": 0.0333, + "epoch": 0.7, + "learning_rate": 0.00019505411877085522, + "loss": 0.0466, "step": 108400 }, { - "epoch": 1.17, - "learning_rate": 0.00012411253163735478, - "loss": 0.0389, + "epoch": 0.7, + "learning_rate": 0.0001950444374164983, + "loss": 0.0445, "step": 108410 }, { - "epoch": 1.17, - "learning_rate": 0.00012409630735284573, - "loss": 0.0339, + "epoch": 0.7, + "learning_rate": 0.00019503475606214138, + "loss": 0.0436, "step": 108420 }, { - "epoch": 1.17, - "learning_rate": 0.00012408008306833668, - "loss": 0.0401, + "epoch": 0.7, + "learning_rate": 0.00019502507470778446, + "loss": 0.0428, "step": 108430 }, { - "epoch": 1.17, - "learning_rate": 0.00012406385878382763, - "loss": 0.0393, + "epoch": 0.7, + "learning_rate": 0.0001950153933534275, + "loss": 0.0439, "step": 108440 }, { - "epoch": 1.17, - "learning_rate": 0.00012404763449931858, - "loss": 0.0306, + "epoch": 0.7, + "learning_rate": 0.00019500571199907056, + "loss": 0.0427, "step": 108450 }, { - "epoch": 1.17, - "learning_rate": 0.0001240314102148095, - "loss": 0.0404, + "epoch": 0.7, + "learning_rate": 0.00019499603064471364, + "loss": 0.0552, "step": 108460 }, { - "epoch": 1.17, - "learning_rate": 0.00012401518593030045, - "loss": 0.0382, + "epoch": 0.7, + "learning_rate": 0.0001949863492903567, + "loss": 0.0447, "step": 108470 }, { - "epoch": 1.17, - "learning_rate": 0.0001239989616457914, - "loss": 0.0352, + "epoch": 0.7, + "learning_rate": 0.00019497666793599977, + "loss": 0.042, "step": 108480 }, { - "epoch": 1.17, - "learning_rate": 0.00012398273736128235, - "loss": 0.0363, + "epoch": 0.7, + "learning_rate": 0.00019496698658164285, + "loss": 0.0468, "step": 108490 }, { - "epoch": 1.17, - "learning_rate": 0.0001239665130767733, - "loss": 0.0334, + "epoch": 0.7, + "learning_rate": 0.0001949573052272859, + "loss": 0.0542, "step": 108500 }, { - "epoch": 1.17, - "learning_rate": 0.00012395028879226425, - "loss": 0.0328, + "epoch": 0.7, + "learning_rate": 0.000194947623872929, + "loss": 0.0579, "step": 108510 }, { - "epoch": 1.17, - "learning_rate": 0.0001239340645077552, - "loss": 0.0333, + "epoch": 0.7, + "learning_rate": 0.00019493794251857204, + "loss": 0.0489, "step": 108520 }, { - "epoch": 1.17, - "learning_rate": 0.00012391784022324615, - "loss": 0.0333, + "epoch": 0.7, + "learning_rate": 0.0001949282611642151, + "loss": 0.0478, "step": 108530 }, { - "epoch": 1.17, - "learning_rate": 0.0001239016159387371, - "loss": 0.0326, + "epoch": 0.7, + "learning_rate": 0.00019491857980985817, + "loss": 0.0593, "step": 108540 }, { - "epoch": 1.17, - "learning_rate": 0.00012388539165422802, - "loss": 0.0387, + "epoch": 0.7, + "learning_rate": 0.00019490889845550125, + "loss": 0.0502, "step": 108550 }, { - "epoch": 1.17, - "learning_rate": 0.00012386916736971897, - "loss": 0.0307, + "epoch": 0.7, + "learning_rate": 0.00019489921710114433, + "loss": 0.0473, "step": 108560 }, { - "epoch": 1.17, - "learning_rate": 0.00012385294308520992, - "loss": 0.0449, + "epoch": 0.7, + "learning_rate": 0.00019488953574678738, + "loss": 0.0459, "step": 108570 }, { - "epoch": 1.17, - "learning_rate": 0.00012383671880070087, - "loss": 0.0374, + "epoch": 0.7, + "learning_rate": 0.00019487985439243046, + "loss": 0.0483, "step": 108580 }, { - "epoch": 1.17, - "learning_rate": 0.00012382049451619182, - "loss": 0.0343, + "epoch": 0.7, + "learning_rate": 0.00019487017303807352, + "loss": 0.0596, "step": 108590 }, { - "epoch": 1.17, - "learning_rate": 0.00012380427023168277, - "loss": 0.0379, + "epoch": 0.7, + "learning_rate": 0.00019486049168371657, + "loss": 0.0416, "step": 108600 }, { - "epoch": 1.17, - "learning_rate": 0.00012378804594717372, + "epoch": 0.7, + "learning_rate": 0.00019485081032935965, "loss": 0.0439, "step": 108610 }, { - "epoch": 1.17, - "learning_rate": 0.00012377182166266467, - "loss": 0.0345, + "epoch": 0.7, + "learning_rate": 0.00019484112897500273, + "loss": 0.0489, "step": 108620 }, { - "epoch": 1.17, - "learning_rate": 0.00012375559737815562, - "loss": 0.0345, + "epoch": 0.7, + "learning_rate": 0.0001948314476206458, + "loss": 0.0441, "step": 108630 }, { - "epoch": 1.18, - "learning_rate": 0.00012373937309364654, - "loss": 0.0332, + "epoch": 0.7, + "learning_rate": 0.00019482176626628886, + "loss": 0.0441, "step": 108640 }, { - "epoch": 1.18, - "learning_rate": 0.0001237231488091375, - "loss": 0.0308, + "epoch": 0.7, + "learning_rate": 0.00019481208491193194, + "loss": 0.0512, "step": 108650 }, { - "epoch": 1.18, - "learning_rate": 0.00012370692452462844, - "loss": 0.0371, + "epoch": 0.7, + "learning_rate": 0.000194802403557575, + "loss": 0.0438, "step": 108660 }, { - "epoch": 1.18, - "learning_rate": 0.0001236907002401194, - "loss": 0.0357, + "epoch": 0.7, + "learning_rate": 0.00019479272220321805, + "loss": 0.0451, "step": 108670 }, { - "epoch": 1.18, - "learning_rate": 0.00012367447595561034, - "loss": 0.0356, + "epoch": 0.7, + "learning_rate": 0.00019478304084886113, + "loss": 0.0467, "step": 108680 }, { - "epoch": 1.18, - "learning_rate": 0.0001236582516711013, - "loss": 0.0373, + "epoch": 0.7, + "learning_rate": 0.0001947733594945042, + "loss": 0.0405, "step": 108690 }, { - "epoch": 1.18, - "learning_rate": 0.00012364202738659224, - "loss": 0.034, + "epoch": 0.7, + "learning_rate": 0.00019476367814014726, + "loss": 0.0518, "step": 108700 }, { - "epoch": 1.18, - "learning_rate": 0.0001236258031020832, - "loss": 0.0371, + "epoch": 0.7, + "learning_rate": 0.00019475399678579034, + "loss": 0.0486, "step": 108710 }, { - "epoch": 1.18, - "learning_rate": 0.00012360957881757414, - "loss": 0.0362, + "epoch": 0.7, + "learning_rate": 0.00019474431543143342, + "loss": 0.0474, "step": 108720 }, { - "epoch": 1.18, - "learning_rate": 0.00012359335453306506, - "loss": 0.0328, + "epoch": 0.7, + "learning_rate": 0.00019473463407707644, + "loss": 0.0381, "step": 108730 }, { - "epoch": 1.18, - "learning_rate": 0.000123577130248556, - "loss": 0.0343, + "epoch": 0.7, + "learning_rate": 0.00019472495272271952, + "loss": 0.0455, "step": 108740 }, { - "epoch": 1.18, - "learning_rate": 0.00012356090596404696, - "loss": 0.0303, + "epoch": 0.7, + "learning_rate": 0.0001947152713683626, + "loss": 0.0521, "step": 108750 }, { - "epoch": 1.18, - "learning_rate": 0.0001235446816795379, - "loss": 0.0394, + "epoch": 0.7, + "learning_rate": 0.00019470559001400568, + "loss": 0.0405, "step": 108760 }, { - "epoch": 1.18, - "learning_rate": 0.00012352845739502886, - "loss": 0.0326, + "epoch": 0.7, + "learning_rate": 0.00019469590865964874, + "loss": 0.0482, "step": 108770 }, { - "epoch": 1.18, - "learning_rate": 0.0001235122331105198, - "loss": 0.0349, + "epoch": 0.7, + "learning_rate": 0.00019468622730529182, + "loss": 0.0408, "step": 108780 }, { - "epoch": 1.18, - "learning_rate": 0.00012349600882601076, - "loss": 0.0368, + "epoch": 0.7, + "learning_rate": 0.0001946765459509349, + "loss": 0.0498, "step": 108790 }, { - "epoch": 1.18, - "learning_rate": 0.0001234797845415017, - "loss": 0.0307, + "epoch": 0.7, + "learning_rate": 0.00019466686459657792, + "loss": 0.0428, "step": 108800 }, { - "epoch": 1.18, - "learning_rate": 0.00012346356025699266, - "loss": 0.0305, + "epoch": 0.7, + "learning_rate": 0.000194657183242221, + "loss": 0.0442, "step": 108810 }, { - "epoch": 1.18, - "learning_rate": 0.00012344733597248358, - "loss": 0.0411, + "epoch": 0.7, + "learning_rate": 0.00019464750188786408, + "loss": 0.0456, "step": 108820 }, { - "epoch": 1.18, - "learning_rate": 0.00012343111168797453, - "loss": 0.0353, + "epoch": 0.7, + "learning_rate": 0.00019463782053350716, + "loss": 0.048, "step": 108830 }, { - "epoch": 1.18, - "learning_rate": 0.00012341488740346548, - "loss": 0.033, + "epoch": 0.7, + "learning_rate": 0.00019462813917915021, + "loss": 0.0477, "step": 108840 }, { - "epoch": 1.18, - "learning_rate": 0.00012339866311895643, - "loss": 0.0321, + "epoch": 0.7, + "learning_rate": 0.0001946184578247933, + "loss": 0.0567, "step": 108850 }, { - "epoch": 1.18, - "learning_rate": 0.00012338243883444738, - "loss": 0.0302, + "epoch": 0.7, + "learning_rate": 0.00019460877647043637, + "loss": 0.0451, "step": 108860 }, { - "epoch": 1.18, - "learning_rate": 0.00012336621454993833, - "loss": 0.0318, + "epoch": 0.7, + "learning_rate": 0.0001945990951160794, + "loss": 0.047, "step": 108870 }, { - "epoch": 1.18, - "learning_rate": 0.00012334999026542928, - "loss": 0.033, + "epoch": 0.7, + "learning_rate": 0.00019458941376172248, + "loss": 0.0414, "step": 108880 }, { - "epoch": 1.18, - "learning_rate": 0.00012333376598092023, - "loss": 0.0323, + "epoch": 0.7, + "learning_rate": 0.00019457973240736556, + "loss": 0.0427, "step": 108890 }, { - "epoch": 1.18, - "learning_rate": 0.00012331754169641118, - "loss": 0.042, + "epoch": 0.7, + "learning_rate": 0.0001945700510530086, + "loss": 0.046, "step": 108900 }, { - "epoch": 1.18, - "learning_rate": 0.0001233013174119021, - "loss": 0.0335, + "epoch": 0.7, + "learning_rate": 0.0001945603696986517, + "loss": 0.045, "step": 108910 }, { - "epoch": 1.18, - "learning_rate": 0.00012328509312739305, - "loss": 0.0316, + "epoch": 0.7, + "learning_rate": 0.00019455068834429477, + "loss": 0.0528, "step": 108920 }, { - "epoch": 1.18, - "learning_rate": 0.000123268868842884, - "loss": 0.0359, + "epoch": 0.7, + "learning_rate": 0.00019454100698993785, + "loss": 0.0459, "step": 108930 }, { - "epoch": 1.18, - "learning_rate": 0.00012325264455837495, - "loss": 0.0416, + "epoch": 0.7, + "learning_rate": 0.00019453132563558088, + "loss": 0.0386, "step": 108940 }, { - "epoch": 1.18, - "learning_rate": 0.0001232364202738659, - "loss": 0.0342, + "epoch": 0.7, + "learning_rate": 0.00019452164428122396, + "loss": 0.0472, "step": 108950 }, { - "epoch": 1.18, - "learning_rate": 0.00012322019598935685, - "loss": 0.044, + "epoch": 0.7, + "learning_rate": 0.00019451196292686704, + "loss": 0.0456, "step": 108960 }, { - "epoch": 1.18, - "learning_rate": 0.0001232039717048478, - "loss": 0.033, + "epoch": 0.7, + "learning_rate": 0.0001945022815725101, + "loss": 0.0564, "step": 108970 }, { - "epoch": 1.18, - "learning_rate": 0.00012318774742033875, - "loss": 0.03, + "epoch": 0.7, + "learning_rate": 0.00019449260021815317, + "loss": 0.0496, "step": 108980 }, { - "epoch": 1.18, - "learning_rate": 0.0001231715231358297, - "loss": 0.035, + "epoch": 0.7, + "learning_rate": 0.00019448291886379625, + "loss": 0.0491, "step": 108990 }, { - "epoch": 1.18, - "learning_rate": 0.00012315529885132063, - "loss": 0.0311, + "epoch": 0.7, + "learning_rate": 0.00019447323750943933, + "loss": 0.0498, "step": 109000 }, { - "epoch": 1.18, - "eval_cer": 0.9211675775390015, - "eval_loss": 0.027750546112656593, - "eval_runtime": 119.0437, - "eval_samples_per_second": 16.801, - "eval_steps_per_second": 4.2, + "epoch": 0.7, + "eval_cer": 0.9199918653259519, + "eval_loss": 0.029607662931084633, + "eval_runtime": 119.9769, + "eval_samples_per_second": 16.67, + "eval_steps_per_second": 4.167, "step": 109000 }, { - "epoch": 1.18, - "learning_rate": 0.00012313907456681158, - "loss": 0.0297, + "epoch": 0.7, + "learning_rate": 0.00019446355615508235, + "loss": 0.0528, "step": 109010 }, { - "epoch": 1.18, - "learning_rate": 0.00012312285028230253, - "loss": 0.0385, + "epoch": 0.7, + "learning_rate": 0.00019445387480072543, + "loss": 0.0442, "step": 109020 }, { - "epoch": 1.18, - "learning_rate": 0.00012310662599779347, - "loss": 0.0367, + "epoch": 0.7, + "learning_rate": 0.0001944441934463685, + "loss": 0.0491, "step": 109030 }, { - "epoch": 1.18, - "learning_rate": 0.00012309040171328442, - "loss": 0.0362, + "epoch": 0.7, + "learning_rate": 0.00019443451209201157, + "loss": 0.0482, "step": 109040 }, { - "epoch": 1.18, - "learning_rate": 0.00012307417742877537, - "loss": 0.0323, + "epoch": 0.7, + "learning_rate": 0.00019442483073765465, + "loss": 0.0472, "step": 109050 }, { - "epoch": 1.18, - "learning_rate": 0.00012305795314426632, - "loss": 0.0429, + "epoch": 0.7, + "learning_rate": 0.00019441514938329773, + "loss": 0.0502, "step": 109060 }, { - "epoch": 1.18, - "learning_rate": 0.00012304172885975727, - "loss": 0.0396, + "epoch": 0.7, + "learning_rate": 0.0001944054680289408, + "loss": 0.0439, "step": 109070 }, { - "epoch": 1.18, - "learning_rate": 0.00012302550457524822, - "loss": 0.0313, + "epoch": 0.7, + "learning_rate": 0.00019439578667458383, + "loss": 0.0465, "step": 109080 }, { - "epoch": 1.18, - "learning_rate": 0.00012300928029073915, - "loss": 0.0328, + "epoch": 0.7, + "learning_rate": 0.0001943861053202269, + "loss": 0.049, "step": 109090 }, { - "epoch": 1.18, - "learning_rate": 0.0001229930560062301, - "loss": 0.0318, + "epoch": 0.7, + "learning_rate": 0.00019437642396586996, + "loss": 0.0409, "step": 109100 }, { - "epoch": 1.18, - "learning_rate": 0.00012297683172172105, - "loss": 0.038, + "epoch": 0.7, + "learning_rate": 0.00019436674261151304, + "loss": 0.0475, "step": 109110 }, { - "epoch": 1.18, - "learning_rate": 0.00012296060743721202, - "loss": 0.0353, + "epoch": 0.7, + "learning_rate": 0.00019435706125715612, + "loss": 0.0451, "step": 109120 }, { - "epoch": 1.18, - "learning_rate": 0.00012294438315270297, - "loss": 0.0336, + "epoch": 0.7, + "learning_rate": 0.0001943473799027992, + "loss": 0.0473, "step": 109130 }, { - "epoch": 1.18, - "learning_rate": 0.00012292815886819392, - "loss": 0.0354, + "epoch": 0.7, + "learning_rate": 0.00019433769854844226, + "loss": 0.0415, "step": 109140 }, { - "epoch": 1.18, - "learning_rate": 0.00012291193458368485, - "loss": 0.0307, + "epoch": 0.7, + "learning_rate": 0.0001943280171940853, + "loss": 0.0438, "step": 109150 }, { - "epoch": 1.18, - "learning_rate": 0.0001228957102991758, - "loss": 0.0439, + "epoch": 0.7, + "learning_rate": 0.0001943183358397284, + "loss": 0.0478, "step": 109160 }, { - "epoch": 1.18, - "learning_rate": 0.00012287948601466674, - "loss": 0.0347, + "epoch": 0.7, + "learning_rate": 0.00019430865448537144, + "loss": 0.0409, "step": 109170 }, { - "epoch": 1.18, - "learning_rate": 0.0001228632617301577, - "loss": 0.0373, + "epoch": 0.7, + "learning_rate": 0.00019429897313101452, + "loss": 0.0411, "step": 109180 }, { - "epoch": 1.18, - "learning_rate": 0.00012284703744564864, - "loss": 0.0337, + "epoch": 0.7, + "learning_rate": 0.0001942892917766576, + "loss": 0.0472, "step": 109190 }, { - "epoch": 1.18, - "learning_rate": 0.0001228308131611396, - "loss": 0.0356, + "epoch": 0.7, + "learning_rate": 0.00019427961042230068, + "loss": 0.0402, "step": 109200 }, { - "epoch": 1.18, - "learning_rate": 0.00012281458887663054, - "loss": 0.0339, + "epoch": 0.7, + "learning_rate": 0.00019426992906794373, + "loss": 0.037, "step": 109210 }, { - "epoch": 1.18, - "learning_rate": 0.0001227983645921215, - "loss": 0.0313, + "epoch": 0.7, + "learning_rate": 0.00019426024771358678, + "loss": 0.0575, "step": 109220 }, { - "epoch": 1.18, - "learning_rate": 0.00012278214030761244, - "loss": 0.0439, + "epoch": 0.7, + "learning_rate": 0.00019425056635922986, + "loss": 0.0434, "step": 109230 }, { - "epoch": 1.18, - "learning_rate": 0.00012276591602310337, - "loss": 0.0338, + "epoch": 0.71, + "learning_rate": 0.00019424088500487292, + "loss": 0.0483, "step": 109240 }, { - "epoch": 1.18, - "learning_rate": 0.00012274969173859432, - "loss": 0.039, + "epoch": 0.71, + "learning_rate": 0.000194231203650516, + "loss": 0.045, "step": 109250 }, { - "epoch": 1.18, - "learning_rate": 0.00012273346745408527, - "loss": 0.0348, + "epoch": 0.71, + "learning_rate": 0.00019422152229615908, + "loss": 0.0456, "step": 109260 }, { - "epoch": 1.18, - "learning_rate": 0.00012271724316957622, - "loss": 0.0401, + "epoch": 0.71, + "learning_rate": 0.00019421184094180216, + "loss": 0.04, "step": 109270 }, { - "epoch": 1.18, - "learning_rate": 0.00012270101888506716, - "loss": 0.0324, + "epoch": 0.71, + "learning_rate": 0.0001942021595874452, + "loss": 0.0437, "step": 109280 }, { - "epoch": 1.18, - "learning_rate": 0.00012268479460055811, - "loss": 0.0305, + "epoch": 0.71, + "learning_rate": 0.00019419247823308826, + "loss": 0.0465, "step": 109290 }, { - "epoch": 1.18, - "learning_rate": 0.00012266857031604906, - "loss": 0.0404, + "epoch": 0.71, + "learning_rate": 0.00019418279687873131, + "loss": 0.0493, "step": 109300 }, { - "epoch": 1.18, - "learning_rate": 0.00012265234603154001, - "loss": 0.0358, + "epoch": 0.71, + "learning_rate": 0.0001941731155243744, + "loss": 0.0401, "step": 109310 }, { - "epoch": 1.18, - "learning_rate": 0.00012263612174703096, - "loss": 0.0382, + "epoch": 0.71, + "learning_rate": 0.00019416343417001747, + "loss": 0.0469, "step": 109320 }, { - "epoch": 1.18, - "learning_rate": 0.0001226198974625219, - "loss": 0.0387, + "epoch": 0.71, + "learning_rate": 0.00019415375281566055, + "loss": 0.0452, "step": 109330 }, { - "epoch": 1.18, - "learning_rate": 0.00012260367317801284, - "loss": 0.0391, + "epoch": 0.71, + "learning_rate": 0.0001941440714613036, + "loss": 0.048, "step": 109340 }, { - "epoch": 1.18, - "learning_rate": 0.00012258744889350379, - "loss": 0.034, + "epoch": 0.71, + "learning_rate": 0.0001941343901069467, + "loss": 0.0446, "step": 109350 }, { - "epoch": 1.18, - "learning_rate": 0.00012257122460899474, - "loss": 0.0386, + "epoch": 0.71, + "learning_rate": 0.00019412470875258974, + "loss": 0.0439, "step": 109360 }, { - "epoch": 1.18, - "learning_rate": 0.00012255500032448569, - "loss": 0.0354, + "epoch": 0.71, + "learning_rate": 0.0001941150273982328, + "loss": 0.0436, "step": 109370 }, { - "epoch": 1.18, - "learning_rate": 0.00012253877603997664, - "loss": 0.036, + "epoch": 0.71, + "learning_rate": 0.00019410534604387587, + "loss": 0.0428, "step": 109380 }, { - "epoch": 1.18, - "learning_rate": 0.00012252255175546759, - "loss": 0.0323, + "epoch": 0.71, + "learning_rate": 0.00019409566468951895, + "loss": 0.0441, "step": 109390 }, { - "epoch": 1.18, - "learning_rate": 0.00012250632747095854, - "loss": 0.0331, + "epoch": 0.71, + "learning_rate": 0.00019408598333516203, + "loss": 0.0452, "step": 109400 }, { - "epoch": 1.18, - "learning_rate": 0.00012249010318644948, - "loss": 0.0376, + "epoch": 0.71, + "learning_rate": 0.00019407630198080508, + "loss": 0.0535, "step": 109410 }, { - "epoch": 1.18, - "learning_rate": 0.0001224738789019404, - "loss": 0.0281, + "epoch": 0.71, + "learning_rate": 0.00019406662062644816, + "loss": 0.0437, "step": 109420 }, { - "epoch": 1.18, - "learning_rate": 0.00012245765461743136, - "loss": 0.0331, + "epoch": 0.71, + "learning_rate": 0.00019405693927209122, + "loss": 0.0414, "step": 109430 }, { - "epoch": 1.18, - "learning_rate": 0.0001224414303329223, - "loss": 0.0304, + "epoch": 0.71, + "learning_rate": 0.00019404725791773427, + "loss": 0.0478, "step": 109440 }, { - "epoch": 1.18, - "learning_rate": 0.00012242520604841326, - "loss": 0.0351, + "epoch": 0.71, + "learning_rate": 0.00019403757656337735, + "loss": 0.0475, "step": 109450 }, { - "epoch": 1.18, - "learning_rate": 0.0001224089817639042, - "loss": 0.0378, + "epoch": 0.71, + "learning_rate": 0.00019402789520902043, + "loss": 0.0453, "step": 109460 }, { - "epoch": 1.18, - "learning_rate": 0.00012239275747939516, - "loss": 0.0413, + "epoch": 0.71, + "learning_rate": 0.0001940182138546635, + "loss": 0.0451, "step": 109470 }, { - "epoch": 1.18, - "learning_rate": 0.0001223765331948861, - "loss": 0.0349, + "epoch": 0.71, + "learning_rate": 0.00019400853250030656, + "loss": 0.0429, "step": 109480 }, { - "epoch": 1.18, - "learning_rate": 0.00012236030891037706, - "loss": 0.0355, + "epoch": 0.71, + "learning_rate": 0.00019399885114594964, + "loss": 0.0477, "step": 109490 }, { - "epoch": 1.18, - "learning_rate": 0.000122344084625868, - "loss": 0.0373, + "epoch": 0.71, + "learning_rate": 0.00019398916979159267, + "loss": 0.0436, "step": 109500 }, { - "epoch": 1.18, - "learning_rate": 0.00012232786034135893, - "loss": 0.0368, + "epoch": 0.71, + "learning_rate": 0.00019397948843723575, + "loss": 0.0439, "step": 109510 }, { - "epoch": 1.18, - "learning_rate": 0.00012231163605684988, - "loss": 0.0388, + "epoch": 0.71, + "learning_rate": 0.00019396980708287883, + "loss": 0.0513, "step": 109520 }, { - "epoch": 1.18, - "learning_rate": 0.00012229541177234083, - "loss": 0.0336, + "epoch": 0.71, + "learning_rate": 0.0001939601257285219, + "loss": 0.0403, "step": 109530 }, { - "epoch": 1.18, - "learning_rate": 0.00012227918748783178, - "loss": 0.0344, + "epoch": 0.71, + "learning_rate": 0.00019395044437416496, + "loss": 0.0436, "step": 109540 }, { - "epoch": 1.18, - "learning_rate": 0.00012226296320332273, - "loss": 0.0291, + "epoch": 0.71, + "learning_rate": 0.00019394076301980804, + "loss": 0.0428, "step": 109550 }, { - "epoch": 1.19, - "learning_rate": 0.00012224673891881368, - "loss": 0.0355, + "epoch": 0.71, + "learning_rate": 0.00019393108166545112, + "loss": 0.0418, "step": 109560 }, { - "epoch": 1.19, - "learning_rate": 0.00012223051463430463, - "loss": 0.0338, + "epoch": 0.71, + "learning_rate": 0.00019392140031109414, + "loss": 0.0461, "step": 109570 }, { - "epoch": 1.19, - "learning_rate": 0.00012221429034979558, - "loss": 0.0344, + "epoch": 0.71, + "learning_rate": 0.00019391171895673722, + "loss": 0.043, "step": 109580 }, { - "epoch": 1.19, - "learning_rate": 0.00012219806606528653, - "loss": 0.0377, + "epoch": 0.71, + "learning_rate": 0.0001939020376023803, + "loss": 0.0503, "step": 109590 }, { - "epoch": 1.19, - "learning_rate": 0.00012218184178077745, - "loss": 0.0399, + "epoch": 0.71, + "learning_rate": 0.00019389235624802338, + "loss": 0.0462, "step": 109600 }, { - "epoch": 1.19, - "learning_rate": 0.0001221656174962684, - "loss": 0.0327, + "epoch": 0.71, + "learning_rate": 0.00019388267489366644, + "loss": 0.0442, "step": 109610 }, { - "epoch": 1.19, - "learning_rate": 0.00012214939321175935, - "loss": 0.0333, + "epoch": 0.71, + "learning_rate": 0.00019387299353930952, + "loss": 0.0473, "step": 109620 }, { - "epoch": 1.19, - "learning_rate": 0.0001221331689272503, - "loss": 0.0323, + "epoch": 0.71, + "learning_rate": 0.0001938633121849526, + "loss": 0.0449, "step": 109630 }, { - "epoch": 1.19, - "learning_rate": 0.00012211694464274125, - "loss": 0.0382, + "epoch": 0.71, + "learning_rate": 0.00019385363083059562, + "loss": 0.043, "step": 109640 }, { - "epoch": 1.19, - "learning_rate": 0.0001221007203582322, - "loss": 0.0317, + "epoch": 0.71, + "learning_rate": 0.0001938439494762387, + "loss": 0.05, "step": 109650 }, { - "epoch": 1.19, - "learning_rate": 0.00012208449607372315, - "loss": 0.0298, + "epoch": 0.71, + "learning_rate": 0.00019383426812188178, + "loss": 0.0477, "step": 109660 }, { - "epoch": 1.19, - "learning_rate": 0.00012206827178921408, - "loss": 0.0361, + "epoch": 0.71, + "learning_rate": 0.00019382458676752486, + "loss": 0.0442, "step": 109670 }, { - "epoch": 1.19, - "learning_rate": 0.00012205204750470503, - "loss": 0.0321, + "epoch": 0.71, + "learning_rate": 0.0001938149054131679, + "loss": 0.0544, "step": 109680 }, { - "epoch": 1.19, - "learning_rate": 0.00012203582322019598, - "loss": 0.0299, + "epoch": 0.71, + "learning_rate": 0.000193805224058811, + "loss": 0.0467, "step": 109690 }, { - "epoch": 1.19, - "learning_rate": 0.00012201959893568693, - "loss": 0.037, + "epoch": 0.71, + "learning_rate": 0.00019379554270445407, + "loss": 0.0454, "step": 109700 }, { - "epoch": 1.19, - "learning_rate": 0.00012200337465117788, - "loss": 0.0328, + "epoch": 0.71, + "learning_rate": 0.0001937858613500971, + "loss": 0.0363, "step": 109710 }, { - "epoch": 1.19, - "learning_rate": 0.00012198715036666882, - "loss": 0.0345, + "epoch": 0.71, + "learning_rate": 0.00019377617999574018, + "loss": 0.0465, "step": 109720 }, { - "epoch": 1.19, - "learning_rate": 0.00012197092608215977, - "loss": 0.0351, + "epoch": 0.71, + "learning_rate": 0.00019376649864138326, + "loss": 0.0532, "step": 109730 }, { - "epoch": 1.19, - "learning_rate": 0.00012195470179765072, - "loss": 0.0362, + "epoch": 0.71, + "learning_rate": 0.0001937568172870263, + "loss": 0.0488, "step": 109740 }, { - "epoch": 1.19, - "learning_rate": 0.00012193847751314167, - "loss": 0.0319, + "epoch": 0.71, + "learning_rate": 0.0001937471359326694, + "loss": 0.0425, "step": 109750 }, { - "epoch": 1.19, - "learning_rate": 0.0001219222532286326, - "loss": 0.0361, + "epoch": 0.71, + "learning_rate": 0.00019373745457831247, + "loss": 0.0417, "step": 109760 }, { - "epoch": 1.19, - "learning_rate": 0.00012190602894412355, - "loss": 0.0414, + "epoch": 0.71, + "learning_rate": 0.00019372777322395555, + "loss": 0.0455, "step": 109770 }, { - "epoch": 1.19, - "learning_rate": 0.0001218898046596145, - "loss": 0.0343, + "epoch": 0.71, + "learning_rate": 0.00019371809186959858, + "loss": 0.0434, "step": 109780 }, { - "epoch": 1.19, - "learning_rate": 0.00012187358037510545, - "loss": 0.0396, + "epoch": 0.71, + "learning_rate": 0.00019370841051524166, + "loss": 0.0473, "step": 109790 }, { - "epoch": 1.19, - "learning_rate": 0.0001218573560905964, - "loss": 0.0406, + "epoch": 0.71, + "learning_rate": 0.00019369872916088474, + "loss": 0.0492, "step": 109800 }, { - "epoch": 1.19, - "learning_rate": 0.00012184113180608734, - "loss": 0.0383, + "epoch": 0.71, + "learning_rate": 0.0001936890478065278, + "loss": 0.0462, "step": 109810 }, { - "epoch": 1.19, - "learning_rate": 0.00012182490752157829, - "loss": 0.033, + "epoch": 0.71, + "learning_rate": 0.00019367936645217087, + "loss": 0.0459, "step": 109820 }, { - "epoch": 1.19, - "learning_rate": 0.00012180868323706924, - "loss": 0.0368, + "epoch": 0.71, + "learning_rate": 0.00019366968509781395, + "loss": 0.0463, "step": 109830 }, { - "epoch": 1.19, - "learning_rate": 0.00012179245895256019, - "loss": 0.0348, + "epoch": 0.71, + "learning_rate": 0.00019366000374345703, + "loss": 0.0465, "step": 109840 }, { - "epoch": 1.19, - "learning_rate": 0.00012177623466805113, - "loss": 0.0394, + "epoch": 0.71, + "learning_rate": 0.00019365032238910005, + "loss": 0.0424, "step": 109850 }, { - "epoch": 1.19, - "learning_rate": 0.00012176001038354208, - "loss": 0.0358, + "epoch": 0.71, + "learning_rate": 0.00019364064103474313, + "loss": 0.0487, "step": 109860 }, { - "epoch": 1.19, - "learning_rate": 0.00012174378609903303, - "loss": 0.0317, + "epoch": 0.71, + "learning_rate": 0.0001936309596803862, + "loss": 0.0479, "step": 109870 }, { - "epoch": 1.19, - "learning_rate": 0.00012172756181452398, - "loss": 0.0392, + "epoch": 0.71, + "learning_rate": 0.00019362127832602927, + "loss": 0.0448, "step": 109880 }, { - "epoch": 1.19, - "learning_rate": 0.00012171133753001492, - "loss": 0.0398, + "epoch": 0.71, + "learning_rate": 0.00019361159697167234, + "loss": 0.0443, "step": 109890 }, { - "epoch": 1.19, - "learning_rate": 0.00012169511324550586, - "loss": 0.0339, + "epoch": 0.71, + "learning_rate": 0.00019360191561731542, + "loss": 0.0416, "step": 109900 }, { - "epoch": 1.19, - "learning_rate": 0.00012167888896099681, - "loss": 0.0348, + "epoch": 0.71, + "learning_rate": 0.00019359223426295848, + "loss": 0.0449, "step": 109910 }, { - "epoch": 1.19, - "learning_rate": 0.00012166266467648776, - "loss": 0.0366, + "epoch": 0.71, + "learning_rate": 0.00019358255290860153, + "loss": 0.0525, "step": 109920 }, { - "epoch": 1.19, - "learning_rate": 0.00012164644039197871, - "loss": 0.0336, + "epoch": 0.71, + "learning_rate": 0.0001935728715542446, + "loss": 0.0449, "step": 109930 }, { - "epoch": 1.19, - "learning_rate": 0.00012163021610746965, - "loss": 0.0383, + "epoch": 0.71, + "learning_rate": 0.00019356319019988766, + "loss": 0.0482, "step": 109940 }, { - "epoch": 1.19, - "learning_rate": 0.0001216139918229606, - "loss": 0.0321, + "epoch": 0.71, + "learning_rate": 0.00019355350884553074, + "loss": 0.0433, "step": 109950 }, { - "epoch": 1.19, - "learning_rate": 0.00012159776753845155, - "loss": 0.0324, + "epoch": 0.71, + "learning_rate": 0.00019354382749117382, + "loss": 0.0441, "step": 109960 }, { - "epoch": 1.19, - "learning_rate": 0.0001215815432539425, - "loss": 0.0367, + "epoch": 0.71, + "learning_rate": 0.0001935341461368169, + "loss": 0.0452, "step": 109970 }, { - "epoch": 1.19, - "learning_rate": 0.00012156531896943345, - "loss": 0.039, + "epoch": 0.71, + "learning_rate": 0.00019352446478245995, + "loss": 0.0496, "step": 109980 }, { - "epoch": 1.19, - "learning_rate": 0.00012154909468492438, - "loss": 0.0419, + "epoch": 0.71, + "learning_rate": 0.000193514783428103, + "loss": 0.0451, "step": 109990 }, { - "epoch": 1.19, - "learning_rate": 0.00012153287040041533, - "loss": 0.0297, + "epoch": 0.71, + "learning_rate": 0.0001935051020737461, + "loss": 0.0438, "step": 110000 }, { - "epoch": 1.19, - "eval_cer": 0.9211772958665303, - "eval_loss": 0.027520321309566498, - "eval_runtime": 118.987, - "eval_samples_per_second": 16.809, - "eval_steps_per_second": 4.202, + "epoch": 0.71, + "eval_cer": 0.9199584227770873, + "eval_loss": 0.03002985194325447, + "eval_runtime": 120.0419, + "eval_samples_per_second": 16.661, + "eval_steps_per_second": 4.165, "step": 110000 }, { - "epoch": 1.19, - "learning_rate": 0.00012151664611590628, - "loss": 0.0346, + "epoch": 0.71, + "learning_rate": 0.00019349542071938914, + "loss": 0.0396, "step": 110010 }, { - "epoch": 1.19, - "learning_rate": 0.00012150042183139723, - "loss": 0.0388, + "epoch": 0.71, + "learning_rate": 0.00019348573936503222, + "loss": 0.0466, "step": 110020 }, { - "epoch": 1.19, - "learning_rate": 0.00012148419754688817, - "loss": 0.0389, + "epoch": 0.71, + "learning_rate": 0.0001934760580106753, + "loss": 0.0454, "step": 110030 }, { - "epoch": 1.19, - "learning_rate": 0.00012146797326237912, - "loss": 0.0352, + "epoch": 0.71, + "learning_rate": 0.00019346637665631838, + "loss": 0.0444, "step": 110040 }, { - "epoch": 1.19, - "learning_rate": 0.00012145174897787007, - "loss": 0.0409, + "epoch": 0.71, + "learning_rate": 0.00019345669530196143, + "loss": 0.0507, "step": 110050 }, { - "epoch": 1.19, - "learning_rate": 0.00012143552469336102, - "loss": 0.0351, + "epoch": 0.71, + "learning_rate": 0.00019344701394760448, + "loss": 0.044, "step": 110060 }, { - "epoch": 1.19, - "learning_rate": 0.00012141930040885197, - "loss": 0.036, + "epoch": 0.71, + "learning_rate": 0.00019343733259324756, + "loss": 0.0466, "step": 110070 }, { - "epoch": 1.19, - "learning_rate": 0.0001214030761243429, - "loss": 0.0293, + "epoch": 0.71, + "learning_rate": 0.00019342765123889062, + "loss": 0.0463, "step": 110080 }, { - "epoch": 1.19, - "learning_rate": 0.00012138685183983385, - "loss": 0.0329, + "epoch": 0.71, + "learning_rate": 0.0001934179698845337, + "loss": 0.0482, "step": 110090 }, { - "epoch": 1.19, - "learning_rate": 0.0001213706275553248, + "epoch": 0.71, + "learning_rate": 0.00019340828853017678, "loss": 0.0388, "step": 110100 }, { - "epoch": 1.19, - "learning_rate": 0.00012135440327081575, - "loss": 0.0307, + "epoch": 0.71, + "learning_rate": 0.00019339860717581983, + "loss": 0.0411, "step": 110110 }, { - "epoch": 1.19, - "learning_rate": 0.00012133817898630669, - "loss": 0.0415, + "epoch": 0.71, + "learning_rate": 0.0001933889258214629, + "loss": 0.0433, "step": 110120 }, { - "epoch": 1.19, - "learning_rate": 0.00012132195470179764, - "loss": 0.0296, + "epoch": 0.71, + "learning_rate": 0.00019337924446710596, + "loss": 0.0462, "step": 110130 }, { - "epoch": 1.19, - "learning_rate": 0.00012130573041728859, - "loss": 0.0332, + "epoch": 0.71, + "learning_rate": 0.00019336956311274901, + "loss": 0.0451, "step": 110140 }, { - "epoch": 1.19, - "learning_rate": 0.00012128950613277954, - "loss": 0.0343, + "epoch": 0.71, + "learning_rate": 0.0001933598817583921, + "loss": 0.0431, "step": 110150 }, { - "epoch": 1.19, - "learning_rate": 0.00012127328184827049, - "loss": 0.0356, + "epoch": 0.71, + "learning_rate": 0.00019335020040403517, + "loss": 0.0468, "step": 110160 }, { - "epoch": 1.19, - "learning_rate": 0.00012125705756376142, - "loss": 0.0316, + "epoch": 0.71, + "learning_rate": 0.00019334051904967825, + "loss": 0.0383, "step": 110170 }, { - "epoch": 1.19, - "learning_rate": 0.00012124083327925237, - "loss": 0.0316, + "epoch": 0.71, + "learning_rate": 0.0001933308376953213, + "loss": 0.0474, "step": 110180 }, { - "epoch": 1.19, - "learning_rate": 0.00012122460899474332, - "loss": 0.0303, + "epoch": 0.71, + "learning_rate": 0.00019332115634096439, + "loss": 0.0518, "step": 110190 }, { - "epoch": 1.19, - "learning_rate": 0.00012120838471023427, - "loss": 0.038, + "epoch": 0.71, + "learning_rate": 0.00019331147498660744, + "loss": 0.0441, "step": 110200 }, { - "epoch": 1.19, - "learning_rate": 0.00012119216042572521, - "loss": 0.0289, + "epoch": 0.71, + "learning_rate": 0.0001933017936322505, + "loss": 0.0443, "step": 110210 }, { - "epoch": 1.19, - "learning_rate": 0.00012117593614121616, - "loss": 0.0409, + "epoch": 0.71, + "learning_rate": 0.00019329211227789357, + "loss": 0.0388, "step": 110220 }, { - "epoch": 1.19, - "learning_rate": 0.00012115971185670711, - "loss": 0.0348, + "epoch": 0.71, + "learning_rate": 0.00019328243092353665, + "loss": 0.0473, "step": 110230 }, { - "epoch": 1.19, - "learning_rate": 0.00012114348757219806, - "loss": 0.0326, + "epoch": 0.71, + "learning_rate": 0.00019327274956917973, + "loss": 0.0465, "step": 110240 }, { - "epoch": 1.19, - "learning_rate": 0.00012112726328768901, - "loss": 0.0322, + "epoch": 0.71, + "learning_rate": 0.00019326306821482278, + "loss": 0.0501, "step": 110250 }, { - "epoch": 1.19, - "learning_rate": 0.00012111103900317994, - "loss": 0.0327, + "epoch": 0.71, + "learning_rate": 0.00019325338686046586, + "loss": 0.0412, "step": 110260 }, { - "epoch": 1.19, - "learning_rate": 0.0001210948147186709, - "loss": 0.034, + "epoch": 0.71, + "learning_rate": 0.00019324370550610892, + "loss": 0.0447, "step": 110270 }, { - "epoch": 1.19, - "learning_rate": 0.00012107859043416184, - "loss": 0.0348, + "epoch": 0.71, + "learning_rate": 0.00019323402415175197, + "loss": 0.0488, "step": 110280 }, { - "epoch": 1.19, - "learning_rate": 0.0001210623661496528, - "loss": 0.0329, + "epoch": 0.71, + "learning_rate": 0.00019322434279739505, + "loss": 0.0419, "step": 110290 }, { - "epoch": 1.19, - "learning_rate": 0.00012104614186514373, - "loss": 0.0314, + "epoch": 0.71, + "learning_rate": 0.00019321466144303813, + "loss": 0.0418, "step": 110300 }, { - "epoch": 1.19, - "learning_rate": 0.00012102991758063468, - "loss": 0.0325, + "epoch": 0.71, + "learning_rate": 0.00019320498008868118, + "loss": 0.0406, "step": 110310 }, { - "epoch": 1.19, - "learning_rate": 0.00012101369329612563, - "loss": 0.0311, + "epoch": 0.71, + "learning_rate": 0.00019319529873432426, + "loss": 0.0432, "step": 110320 }, { - "epoch": 1.19, - "learning_rate": 0.00012099746901161658, - "loss": 0.0345, + "epoch": 0.71, + "learning_rate": 0.00019318561737996734, + "loss": 0.047, "step": 110330 }, { - "epoch": 1.19, - "learning_rate": 0.00012098124472710753, - "loss": 0.033, + "epoch": 0.71, + "learning_rate": 0.00019317593602561037, + "loss": 0.0459, "step": 110340 }, { - "epoch": 1.19, - "learning_rate": 0.00012096502044259847, - "loss": 0.0374, + "epoch": 0.71, + "learning_rate": 0.00019316625467125345, + "loss": 0.0427, "step": 110350 }, { - "epoch": 1.19, - "learning_rate": 0.00012094879615808941, - "loss": 0.0386, + "epoch": 0.71, + "learning_rate": 0.00019315657331689653, + "loss": 0.0523, "step": 110360 }, { - "epoch": 1.19, - "learning_rate": 0.00012093257187358036, - "loss": 0.0364, + "epoch": 0.71, + "learning_rate": 0.0001931468919625396, + "loss": 0.0417, "step": 110370 }, { - "epoch": 1.19, - "learning_rate": 0.00012091634758907131, - "loss": 0.0349, + "epoch": 0.71, + "learning_rate": 0.00019313721060818266, + "loss": 0.0483, "step": 110380 }, { - "epoch": 1.19, - "learning_rate": 0.00012090012330456226, - "loss": 0.0286, + "epoch": 0.71, + "learning_rate": 0.00019312752925382574, + "loss": 0.0418, "step": 110390 }, { - "epoch": 1.19, - "learning_rate": 0.0001208838990200532, - "loss": 0.0344, + "epoch": 0.71, + "learning_rate": 0.00019311784789946882, + "loss": 0.0415, "step": 110400 }, { - "epoch": 1.19, - "learning_rate": 0.00012086767473554415, - "loss": 0.0366, + "epoch": 0.71, + "learning_rate": 0.00019310816654511184, + "loss": 0.0433, "step": 110410 }, { - "epoch": 1.19, - "learning_rate": 0.0001208514504510351, - "loss": 0.0403, + "epoch": 0.71, + "learning_rate": 0.00019309848519075492, + "loss": 0.0446, "step": 110420 }, { - "epoch": 1.19, - "learning_rate": 0.00012083522616652605, - "loss": 0.0305, + "epoch": 0.71, + "learning_rate": 0.000193088803836398, + "loss": 0.0409, "step": 110430 }, { - "epoch": 1.19, - "learning_rate": 0.00012081900188201699, - "loss": 0.0276, + "epoch": 0.71, + "learning_rate": 0.00019307912248204108, + "loss": 0.0446, "step": 110440 }, { - "epoch": 1.19, - "learning_rate": 0.00012080277759750794, - "loss": 0.0336, + "epoch": 0.71, + "learning_rate": 0.00019306944112768414, + "loss": 0.0416, "step": 110450 }, { - "epoch": 1.19, - "learning_rate": 0.00012078655331299889, - "loss": 0.0337, + "epoch": 0.71, + "learning_rate": 0.00019305975977332722, + "loss": 0.0485, "step": 110460 }, { - "epoch": 1.19, - "learning_rate": 0.00012077032902848984, - "loss": 0.0397, + "epoch": 0.71, + "learning_rate": 0.0001930500784189703, + "loss": 0.0475, "step": 110470 }, { - "epoch": 1.19, - "learning_rate": 0.00012075410474398079, - "loss": 0.0324, + "epoch": 0.71, + "learning_rate": 0.00019304039706461332, + "loss": 0.0458, "step": 110480 }, { - "epoch": 1.2, - "learning_rate": 0.00012073788045947172, - "loss": 0.0336, + "epoch": 0.71, + "learning_rate": 0.0001930307157102564, + "loss": 0.0489, "step": 110490 }, { - "epoch": 1.2, - "learning_rate": 0.00012072165617496267, - "loss": 0.03, + "epoch": 0.71, + "learning_rate": 0.00019302103435589948, + "loss": 0.05, "step": 110500 }, { - "epoch": 1.2, - "learning_rate": 0.00012070543189045362, - "loss": 0.0338, + "epoch": 0.71, + "learning_rate": 0.00019301135300154253, + "loss": 0.0462, "step": 110510 }, { - "epoch": 1.2, - "learning_rate": 0.00012068920760594457, - "loss": 0.0335, + "epoch": 0.71, + "learning_rate": 0.0001930016716471856, + "loss": 0.0541, "step": 110520 }, { - "epoch": 1.2, - "learning_rate": 0.00012067298332143551, - "loss": 0.0343, + "epoch": 0.71, + "learning_rate": 0.0001929919902928287, + "loss": 0.0507, "step": 110530 }, { - "epoch": 1.2, - "learning_rate": 0.00012065675903692646, - "loss": 0.0386, + "epoch": 0.71, + "learning_rate": 0.00019298230893847177, + "loss": 0.0448, "step": 110540 }, { - "epoch": 1.2, - "learning_rate": 0.0001206405347524174, - "loss": 0.0341, + "epoch": 0.71, + "learning_rate": 0.0001929726275841148, + "loss": 0.0495, "step": 110550 }, { - "epoch": 1.2, - "learning_rate": 0.00012062431046790836, - "loss": 0.0325, + "epoch": 0.71, + "learning_rate": 0.00019296294622975788, + "loss": 0.0449, "step": 110560 }, { - "epoch": 1.2, - "learning_rate": 0.0001206080861833993, - "loss": 0.0302, + "epoch": 0.71, + "learning_rate": 0.00019295326487540096, + "loss": 0.0409, "step": 110570 }, { - "epoch": 1.2, - "learning_rate": 0.00012059186189889024, - "loss": 0.0376, + "epoch": 0.71, + "learning_rate": 0.000192943583521044, + "loss": 0.045, "step": 110580 }, { - "epoch": 1.2, - "learning_rate": 0.00012057563761438119, - "loss": 0.0335, + "epoch": 0.71, + "learning_rate": 0.0001929339021666871, + "loss": 0.0416, "step": 110590 }, { - "epoch": 1.2, - "learning_rate": 0.00012055941332987214, - "loss": 0.0369, + "epoch": 0.71, + "learning_rate": 0.00019292422081233017, + "loss": 0.0423, "step": 110600 }, { - "epoch": 1.2, - "learning_rate": 0.00012054318904536309, - "loss": 0.032, + "epoch": 0.71, + "learning_rate": 0.00019291453945797325, + "loss": 0.0483, "step": 110610 }, { - "epoch": 1.2, - "learning_rate": 0.00012052696476085403, - "loss": 0.0354, + "epoch": 0.71, + "learning_rate": 0.00019290485810361628, + "loss": 0.0465, "step": 110620 }, { - "epoch": 1.2, - "learning_rate": 0.00012051074047634498, - "loss": 0.0429, + "epoch": 0.71, + "learning_rate": 0.00019289517674925936, + "loss": 0.0421, "step": 110630 }, { - "epoch": 1.2, - "learning_rate": 0.00012049451619183593, - "loss": 0.037, + "epoch": 0.71, + "learning_rate": 0.00019288549539490243, + "loss": 0.045, "step": 110640 }, { - "epoch": 1.2, - "learning_rate": 0.00012047829190732688, - "loss": 0.0363, + "epoch": 0.71, + "learning_rate": 0.0001928758140405455, + "loss": 0.0443, "step": 110650 }, { - "epoch": 1.2, - "learning_rate": 0.00012046206762281783, - "loss": 0.0307, + "epoch": 0.71, + "learning_rate": 0.00019286613268618857, + "loss": 0.0508, "step": 110660 }, { - "epoch": 1.2, - "learning_rate": 0.00012044584333830876, - "loss": 0.0372, + "epoch": 0.71, + "learning_rate": 0.00019285645133183165, + "loss": 0.0437, "step": 110670 }, { - "epoch": 1.2, - "learning_rate": 0.00012042961905379971, - "loss": 0.0377, + "epoch": 0.71, + "learning_rate": 0.0001928467699774747, + "loss": 0.0412, "step": 110680 }, { - "epoch": 1.2, - "learning_rate": 0.00012041339476929066, - "loss": 0.0379, + "epoch": 0.71, + "learning_rate": 0.00019283708862311775, + "loss": 0.0423, "step": 110690 }, { - "epoch": 1.2, - "learning_rate": 0.00012039717048478161, - "loss": 0.03, + "epoch": 0.71, + "learning_rate": 0.00019282740726876083, + "loss": 0.0502, "step": 110700 }, { - "epoch": 1.2, - "learning_rate": 0.00012038094620027255, - "loss": 0.0363, + "epoch": 0.71, + "learning_rate": 0.00019281772591440389, + "loss": 0.0432, "step": 110710 }, { - "epoch": 1.2, - "learning_rate": 0.0001203647219157635, - "loss": 0.0312, + "epoch": 0.71, + "learning_rate": 0.00019280804456004696, + "loss": 0.048, "step": 110720 }, { - "epoch": 1.2, - "learning_rate": 0.00012034849763125445, - "loss": 0.0353, + "epoch": 0.71, + "learning_rate": 0.00019279836320569004, + "loss": 0.0437, "step": 110730 }, { - "epoch": 1.2, - "learning_rate": 0.0001203322733467454, - "loss": 0.0401, + "epoch": 0.71, + "learning_rate": 0.00019278868185133312, + "loss": 0.0429, "step": 110740 }, { - "epoch": 1.2, - "learning_rate": 0.00012031604906223635, - "loss": 0.0353, + "epoch": 0.71, + "learning_rate": 0.00019277900049697618, + "loss": 0.0432, "step": 110750 }, { - "epoch": 1.2, - "learning_rate": 0.00012029982477772728, - "loss": 0.0381, + "epoch": 0.71, + "learning_rate": 0.00019276931914261923, + "loss": 0.0437, "step": 110760 }, { - "epoch": 1.2, - "learning_rate": 0.00012028360049321823, - "loss": 0.0369, + "epoch": 0.71, + "learning_rate": 0.0001927596377882623, + "loss": 0.0428, "step": 110770 }, { - "epoch": 1.2, - "learning_rate": 0.00012026737620870918, - "loss": 0.0372, + "epoch": 0.71, + "learning_rate": 0.00019274995643390536, + "loss": 0.0472, "step": 110780 }, { - "epoch": 1.2, - "learning_rate": 0.00012025115192420013, - "loss": 0.0294, + "epoch": 0.72, + "learning_rate": 0.00019274027507954844, + "loss": 0.0481, "step": 110790 }, { - "epoch": 1.2, - "learning_rate": 0.00012023492763969107, - "loss": 0.0375, + "epoch": 0.72, + "learning_rate": 0.00019273059372519152, + "loss": 0.041, "step": 110800 }, { - "epoch": 1.2, - "learning_rate": 0.00012021870335518202, - "loss": 0.0363, + "epoch": 0.72, + "learning_rate": 0.0001927209123708346, + "loss": 0.0449, "step": 110810 }, { - "epoch": 1.2, - "learning_rate": 0.00012020247907067297, - "loss": 0.042, + "epoch": 0.72, + "learning_rate": 0.00019271123101647765, + "loss": 0.0432, "step": 110820 }, { - "epoch": 1.2, - "learning_rate": 0.00012018625478616392, - "loss": 0.0363, + "epoch": 0.72, + "learning_rate": 0.0001927015496621207, + "loss": 0.0447, "step": 110830 }, { - "epoch": 1.2, - "learning_rate": 0.00012017003050165487, - "loss": 0.0404, + "epoch": 0.72, + "learning_rate": 0.0001926918683077638, + "loss": 0.049, "step": 110840 }, { - "epoch": 1.2, - "learning_rate": 0.0001201538062171458, - "loss": 0.0343, + "epoch": 0.72, + "learning_rate": 0.00019268218695340684, + "loss": 0.0471, "step": 110850 }, { - "epoch": 1.2, - "learning_rate": 0.00012013758193263675, - "loss": 0.034, + "epoch": 0.72, + "learning_rate": 0.00019267250559904992, + "loss": 0.0501, "step": 110860 }, { - "epoch": 1.2, - "learning_rate": 0.0001201213576481277, - "loss": 0.0385, + "epoch": 0.72, + "learning_rate": 0.000192662824244693, + "loss": 0.0427, "step": 110870 }, { - "epoch": 1.2, - "learning_rate": 0.00012010513336361865, - "loss": 0.0351, + "epoch": 0.72, + "learning_rate": 0.00019265314289033605, + "loss": 0.0418, "step": 110880 }, { - "epoch": 1.2, - "learning_rate": 0.00012008890907910959, - "loss": 0.0355, + "epoch": 0.72, + "learning_rate": 0.00019264346153597913, + "loss": 0.0426, "step": 110890 }, { - "epoch": 1.2, - "learning_rate": 0.00012007268479460054, - "loss": 0.0337, + "epoch": 0.72, + "learning_rate": 0.00019263378018162218, + "loss": 0.0437, "step": 110900 }, { - "epoch": 1.2, - "learning_rate": 0.00012005646051009149, - "loss": 0.0322, + "epoch": 0.72, + "learning_rate": 0.00019262409882726524, + "loss": 0.0497, "step": 110910 }, { - "epoch": 1.2, - "learning_rate": 0.00012004023622558244, - "loss": 0.037, + "epoch": 0.72, + "learning_rate": 0.00019261441747290832, + "loss": 0.0482, "step": 110920 }, { - "epoch": 1.2, - "learning_rate": 0.00012002401194107339, - "loss": 0.0344, + "epoch": 0.72, + "learning_rate": 0.0001926047361185514, + "loss": 0.051, "step": 110930 }, { - "epoch": 1.2, - "learning_rate": 0.00012000778765656433, - "loss": 0.0297, + "epoch": 0.72, + "learning_rate": 0.00019259505476419448, + "loss": 0.0467, "step": 110940 }, { - "epoch": 1.2, - "learning_rate": 0.00011999156337205528, - "loss": 0.0343, + "epoch": 0.72, + "learning_rate": 0.00019258537340983753, + "loss": 0.048, "step": 110950 }, { - "epoch": 1.2, - "learning_rate": 0.00011997533908754623, - "loss": 0.038, + "epoch": 0.72, + "learning_rate": 0.0001925756920554806, + "loss": 0.0423, "step": 110960 }, { - "epoch": 1.2, - "learning_rate": 0.00011995911480303717, - "loss": 0.0377, + "epoch": 0.72, + "learning_rate": 0.00019256601070112366, + "loss": 0.0476, "step": 110970 }, { - "epoch": 1.2, - "learning_rate": 0.00011994289051852811, - "loss": 0.0323, + "epoch": 0.72, + "learning_rate": 0.00019255632934676671, + "loss": 0.0432, "step": 110980 }, { - "epoch": 1.2, - "learning_rate": 0.00011992666623401906, - "loss": 0.031, + "epoch": 0.72, + "learning_rate": 0.0001925466479924098, + "loss": 0.0551, "step": 110990 }, { - "epoch": 1.2, - "learning_rate": 0.00011991044194951001, - "loss": 0.0323, + "epoch": 0.72, + "learning_rate": 0.00019253696663805287, + "loss": 0.0394, "step": 111000 }, { - "epoch": 1.2, - "eval_cer": 0.9211631601173974, - "eval_loss": 0.027129851281642914, - "eval_runtime": 119.0086, - "eval_samples_per_second": 16.806, - "eval_steps_per_second": 4.201, + "epoch": 0.72, + "eval_cer": 0.9198192294655971, + "eval_loss": 0.029867488890886307, + "eval_runtime": 119.9464, + "eval_samples_per_second": 16.674, + "eval_steps_per_second": 4.169, "step": 111000 }, { - "epoch": 1.2, - "learning_rate": 0.00011989421766500096, - "loss": 0.0307, + "epoch": 0.72, + "learning_rate": 0.00019252728528369595, + "loss": 0.0482, "step": 111010 }, { - "epoch": 1.2, - "learning_rate": 0.00011987799338049191, - "loss": 0.0366, + "epoch": 0.72, + "learning_rate": 0.000192517603929339, + "loss": 0.041, "step": 111020 }, { - "epoch": 1.2, - "learning_rate": 0.00011986176909598285, - "loss": 0.0389, + "epoch": 0.72, + "learning_rate": 0.00019250792257498209, + "loss": 0.0401, "step": 111030 }, { - "epoch": 1.2, - "learning_rate": 0.0001198455448114738, - "loss": 0.0314, + "epoch": 0.72, + "learning_rate": 0.00019249824122062514, + "loss": 0.0507, "step": 111040 }, { - "epoch": 1.2, - "learning_rate": 0.00011982932052696475, - "loss": 0.0333, + "epoch": 0.72, + "learning_rate": 0.0001924885598662682, + "loss": 0.0426, "step": 111050 }, { - "epoch": 1.2, - "learning_rate": 0.0001198130962424557, - "loss": 0.0397, + "epoch": 0.72, + "learning_rate": 0.00019247887851191127, + "loss": 0.0454, "step": 111060 }, { - "epoch": 1.2, - "learning_rate": 0.00011979687195794663, - "loss": 0.0405, + "epoch": 0.72, + "learning_rate": 0.00019246919715755435, + "loss": 0.0521, "step": 111070 }, { - "epoch": 1.2, - "learning_rate": 0.00011978064767343758, - "loss": 0.0345, + "epoch": 0.72, + "learning_rate": 0.0001924595158031974, + "loss": 0.0407, "step": 111080 }, { - "epoch": 1.2, - "learning_rate": 0.00011976442338892853, - "loss": 0.0325, + "epoch": 0.72, + "learning_rate": 0.00019244983444884048, + "loss": 0.044, "step": 111090 }, { - "epoch": 1.2, - "learning_rate": 0.00011974819910441948, - "loss": 0.0343, + "epoch": 0.72, + "learning_rate": 0.00019244015309448356, + "loss": 0.0473, "step": 111100 }, { - "epoch": 1.2, - "learning_rate": 0.00011973197481991043, - "loss": 0.0329, + "epoch": 0.72, + "learning_rate": 0.0001924304717401266, + "loss": 0.0464, "step": 111110 }, { - "epoch": 1.2, - "learning_rate": 0.00011971575053540137, - "loss": 0.035, + "epoch": 0.72, + "learning_rate": 0.00019242079038576967, + "loss": 0.0527, "step": 111120 }, { - "epoch": 1.2, - "learning_rate": 0.00011969952625089232, - "loss": 0.0376, + "epoch": 0.72, + "learning_rate": 0.00019241110903141275, + "loss": 0.0479, "step": 111130 }, { - "epoch": 1.2, - "learning_rate": 0.00011968330196638327, - "loss": 0.0346, + "epoch": 0.72, + "learning_rate": 0.00019240142767705583, + "loss": 0.0479, "step": 111140 }, { - "epoch": 1.2, - "learning_rate": 0.00011966707768187422, - "loss": 0.0368, + "epoch": 0.72, + "learning_rate": 0.00019239174632269888, + "loss": 0.0453, "step": 111150 }, { - "epoch": 1.2, - "learning_rate": 0.00011965085339736517, - "loss": 0.0321, + "epoch": 0.72, + "learning_rate": 0.00019238206496834196, + "loss": 0.0494, "step": 111160 }, { - "epoch": 1.2, - "learning_rate": 0.0001196346291128561, - "loss": 0.0383, + "epoch": 0.72, + "learning_rate": 0.00019237238361398504, + "loss": 0.0415, "step": 111170 }, { - "epoch": 1.2, - "learning_rate": 0.00011961840482834705, - "loss": 0.0332, + "epoch": 0.72, + "learning_rate": 0.00019236270225962807, + "loss": 0.0482, "step": 111180 }, { - "epoch": 1.2, - "learning_rate": 0.000119602180543838, - "loss": 0.0353, + "epoch": 0.72, + "learning_rate": 0.00019235302090527115, + "loss": 0.0453, "step": 111190 }, { - "epoch": 1.2, - "learning_rate": 0.00011958595625932895, - "loss": 0.0376, + "epoch": 0.72, + "learning_rate": 0.00019234333955091423, + "loss": 0.0416, "step": 111200 }, { - "epoch": 1.2, - "learning_rate": 0.00011956973197481989, - "loss": 0.0388, + "epoch": 0.72, + "learning_rate": 0.0001923336581965573, + "loss": 0.0468, "step": 111210 }, { - "epoch": 1.2, - "learning_rate": 0.00011955350769031084, - "loss": 0.0315, + "epoch": 0.72, + "learning_rate": 0.00019232397684220036, + "loss": 0.0448, "step": 111220 }, { - "epoch": 1.2, - "learning_rate": 0.00011953728340580179, - "loss": 0.0319, + "epoch": 0.72, + "learning_rate": 0.00019231429548784344, + "loss": 0.0545, "step": 111230 }, { - "epoch": 1.2, - "learning_rate": 0.00011952105912129274, - "loss": 0.0341, + "epoch": 0.72, + "learning_rate": 0.00019230461413348652, + "loss": 0.04, "step": 111240 }, { - "epoch": 1.2, - "learning_rate": 0.00011950483483678369, - "loss": 0.0445, + "epoch": 0.72, + "learning_rate": 0.00019229493277912954, + "loss": 0.044, "step": 111250 }, { - "epoch": 1.2, - "learning_rate": 0.00011948861055227462, - "loss": 0.0348, + "epoch": 0.72, + "learning_rate": 0.00019228525142477262, + "loss": 0.0456, "step": 111260 }, { - "epoch": 1.2, - "learning_rate": 0.00011947238626776557, - "loss": 0.0347, + "epoch": 0.72, + "learning_rate": 0.0001922755700704157, + "loss": 0.0393, "step": 111270 }, { - "epoch": 1.2, - "learning_rate": 0.00011945616198325652, - "loss": 0.0377, + "epoch": 0.72, + "learning_rate": 0.00019226588871605878, + "loss": 0.0394, "step": 111280 }, { - "epoch": 1.2, - "learning_rate": 0.00011943993769874747, - "loss": 0.0377, + "epoch": 0.72, + "learning_rate": 0.00019225620736170184, + "loss": 0.0564, "step": 111290 }, { - "epoch": 1.2, - "learning_rate": 0.00011942371341423841, - "loss": 0.0388, + "epoch": 0.72, + "learning_rate": 0.00019224652600734492, + "loss": 0.0453, "step": 111300 }, { - "epoch": 1.2, - "learning_rate": 0.00011940748912972936, - "loss": 0.0437, + "epoch": 0.72, + "learning_rate": 0.000192236844652988, + "loss": 0.042, "step": 111310 }, { - "epoch": 1.2, - "learning_rate": 0.00011939126484522031, - "loss": 0.0305, + "epoch": 0.72, + "learning_rate": 0.00019222716329863102, + "loss": 0.0411, "step": 111320 }, { - "epoch": 1.2, - "learning_rate": 0.00011937504056071126, - "loss": 0.0414, + "epoch": 0.72, + "learning_rate": 0.0001922174819442741, + "loss": 0.0421, "step": 111330 }, { - "epoch": 1.2, - "learning_rate": 0.00011935881627620221, - "loss": 0.033, + "epoch": 0.72, + "learning_rate": 0.00019220780058991718, + "loss": 0.0418, "step": 111340 }, { - "epoch": 1.2, - "learning_rate": 0.00011934259199169314, - "loss": 0.0287, + "epoch": 0.72, + "learning_rate": 0.00019219811923556023, + "loss": 0.046, "step": 111350 }, { - "epoch": 1.2, - "learning_rate": 0.0001193263677071841, - "loss": 0.0333, + "epoch": 0.72, + "learning_rate": 0.0001921884378812033, + "loss": 0.046, "step": 111360 }, { - "epoch": 1.2, - "learning_rate": 0.00011931014342267504, - "loss": 0.0407, + "epoch": 0.72, + "learning_rate": 0.0001921787565268464, + "loss": 0.0443, "step": 111370 }, { - "epoch": 1.2, - "learning_rate": 0.000119293919138166, - "loss": 0.0388, + "epoch": 0.72, + "learning_rate": 0.00019216907517248947, + "loss": 0.0417, "step": 111380 }, { - "epoch": 1.2, - "learning_rate": 0.00011927769485365693, - "loss": 0.0417, + "epoch": 0.72, + "learning_rate": 0.0001921593938181325, + "loss": 0.0499, "step": 111390 }, { - "epoch": 1.2, - "learning_rate": 0.00011926147056914788, - "loss": 0.032, + "epoch": 0.72, + "learning_rate": 0.00019214971246377558, + "loss": 0.0461, "step": 111400 }, { - "epoch": 1.21, - "learning_rate": 0.00011924524628463883, - "loss": 0.033, + "epoch": 0.72, + "learning_rate": 0.00019214003110941866, + "loss": 0.04, "step": 111410 }, { - "epoch": 1.21, - "learning_rate": 0.00011922902200012978, - "loss": 0.0324, + "epoch": 0.72, + "learning_rate": 0.0001921303497550617, + "loss": 0.0452, "step": 111420 }, { - "epoch": 1.21, - "learning_rate": 0.00011921279771562073, - "loss": 0.0352, + "epoch": 0.72, + "learning_rate": 0.0001921206684007048, + "loss": 0.0442, "step": 111430 }, { - "epoch": 1.21, - "learning_rate": 0.00011919657343111166, - "loss": 0.0362, + "epoch": 0.72, + "learning_rate": 0.00019211098704634787, + "loss": 0.0406, "step": 111440 }, { - "epoch": 1.21, - "learning_rate": 0.00011918034914660261, - "loss": 0.038, + "epoch": 0.72, + "learning_rate": 0.00019210130569199095, + "loss": 0.043, "step": 111450 }, { - "epoch": 1.21, - "learning_rate": 0.00011916412486209356, - "loss": 0.0309, + "epoch": 0.72, + "learning_rate": 0.00019209162433763397, + "loss": 0.0434, "step": 111460 }, { - "epoch": 1.21, - "learning_rate": 0.00011914790057758453, - "loss": 0.0331, + "epoch": 0.72, + "learning_rate": 0.00019208194298327705, + "loss": 0.0499, "step": 111470 }, { - "epoch": 1.21, - "learning_rate": 0.00011913167629307548, - "loss": 0.0379, + "epoch": 0.72, + "learning_rate": 0.00019207226162892013, + "loss": 0.0451, "step": 111480 }, { - "epoch": 1.21, - "learning_rate": 0.00011911545200856641, - "loss": 0.0295, + "epoch": 0.72, + "learning_rate": 0.0001920625802745632, + "loss": 0.0395, "step": 111490 }, { - "epoch": 1.21, - "learning_rate": 0.00011909922772405736, - "loss": 0.0355, + "epoch": 0.72, + "learning_rate": 0.00019205289892020627, + "loss": 0.0427, "step": 111500 }, { - "epoch": 1.21, - "learning_rate": 0.00011908300343954831, - "loss": 0.0347, + "epoch": 0.72, + "learning_rate": 0.00019204321756584935, + "loss": 0.0431, "step": 111510 }, { - "epoch": 1.21, - "learning_rate": 0.00011906677915503926, - "loss": 0.0377, + "epoch": 0.72, + "learning_rate": 0.0001920335362114924, + "loss": 0.0497, "step": 111520 }, { - "epoch": 1.21, - "learning_rate": 0.00011905055487053021, - "loss": 0.0376, + "epoch": 0.72, + "learning_rate": 0.00019202385485713545, + "loss": 0.0433, "step": 111530 }, { - "epoch": 1.21, - "learning_rate": 0.00011903433058602115, - "loss": 0.0375, + "epoch": 0.72, + "learning_rate": 0.00019201417350277853, + "loss": 0.0469, "step": 111540 }, { - "epoch": 1.21, - "learning_rate": 0.0001190181063015121, - "loss": 0.0302, + "epoch": 0.72, + "learning_rate": 0.00019200449214842158, + "loss": 0.0428, "step": 111550 }, { - "epoch": 1.21, - "learning_rate": 0.00011900188201700305, - "loss": 0.0347, + "epoch": 0.72, + "learning_rate": 0.00019199481079406466, + "loss": 0.0448, "step": 111560 }, { - "epoch": 1.21, - "learning_rate": 0.000118985657732494, - "loss": 0.0463, + "epoch": 0.72, + "learning_rate": 0.00019198512943970774, + "loss": 0.0434, "step": 111570 }, { - "epoch": 1.21, - "learning_rate": 0.00011896943344798493, - "loss": 0.03, + "epoch": 0.72, + "learning_rate": 0.00019197544808535082, + "loss": 0.0435, "step": 111580 }, { - "epoch": 1.21, - "learning_rate": 0.00011895320916347588, - "loss": 0.0365, + "epoch": 0.72, + "learning_rate": 0.00019196576673099388, + "loss": 0.0423, "step": 111590 }, { - "epoch": 1.21, - "learning_rate": 0.00011893698487896683, - "loss": 0.0306, + "epoch": 0.72, + "learning_rate": 0.00019195608537663693, + "loss": 0.049, "step": 111600 }, { - "epoch": 1.21, - "learning_rate": 0.00011892076059445778, - "loss": 0.0296, + "epoch": 0.72, + "learning_rate": 0.00019194640402228, + "loss": 0.0428, "step": 111610 }, { - "epoch": 1.21, - "learning_rate": 0.00011890453630994873, - "loss": 0.0349, + "epoch": 0.72, + "learning_rate": 0.00019193672266792306, + "loss": 0.0417, "step": 111620 }, { - "epoch": 1.21, - "learning_rate": 0.00011888831202543967, - "loss": 0.0291, + "epoch": 0.72, + "learning_rate": 0.00019192704131356614, + "loss": 0.0598, "step": 111630 }, { - "epoch": 1.21, - "learning_rate": 0.00011887208774093062, - "loss": 0.0331, + "epoch": 0.72, + "learning_rate": 0.00019191735995920922, + "loss": 0.0422, "step": 111640 }, { - "epoch": 1.21, - "learning_rate": 0.00011885586345642157, - "loss": 0.0449, + "epoch": 0.72, + "learning_rate": 0.0001919076786048523, + "loss": 0.0484, "step": 111650 }, { - "epoch": 1.21, - "learning_rate": 0.00011883963917191252, - "loss": 0.0333, + "epoch": 0.72, + "learning_rate": 0.00019189799725049535, + "loss": 0.0389, "step": 111660 }, { - "epoch": 1.21, - "learning_rate": 0.00011882341488740346, - "loss": 0.0285, + "epoch": 0.72, + "learning_rate": 0.0001918883158961384, + "loss": 0.0385, "step": 111670 }, { - "epoch": 1.21, - "learning_rate": 0.0001188071906028944, - "loss": 0.0369, + "epoch": 0.72, + "learning_rate": 0.00019187863454178149, + "loss": 0.0472, "step": 111680 }, { - "epoch": 1.21, - "learning_rate": 0.00011879096631838535, - "loss": 0.036, + "epoch": 0.72, + "learning_rate": 0.00019186895318742454, + "loss": 0.0393, "step": 111690 }, { - "epoch": 1.21, - "learning_rate": 0.0001187747420338763, - "loss": 0.032, + "epoch": 0.72, + "learning_rate": 0.00019185927183306762, + "loss": 0.0452, "step": 111700 }, { - "epoch": 1.21, - "learning_rate": 0.00011875851774936725, - "loss": 0.0326, + "epoch": 0.72, + "learning_rate": 0.0001918495904787107, + "loss": 0.0441, "step": 111710 }, { - "epoch": 1.21, - "learning_rate": 0.00011874229346485819, - "loss": 0.0342, + "epoch": 0.72, + "learning_rate": 0.00019183990912435375, + "loss": 0.0437, "step": 111720 }, { - "epoch": 1.21, - "learning_rate": 0.00011872606918034914, - "loss": 0.0307, + "epoch": 0.72, + "learning_rate": 0.00019183022776999683, + "loss": 0.04, "step": 111730 }, { - "epoch": 1.21, - "learning_rate": 0.00011870984489584009, - "loss": 0.0357, + "epoch": 0.72, + "learning_rate": 0.00019182054641563988, + "loss": 0.0408, "step": 111740 }, { - "epoch": 1.21, - "learning_rate": 0.00011869362061133104, - "loss": 0.0355, + "epoch": 0.72, + "learning_rate": 0.00019181086506128294, + "loss": 0.0435, "step": 111750 }, { - "epoch": 1.21, - "learning_rate": 0.00011867739632682198, - "loss": 0.0347, + "epoch": 0.72, + "learning_rate": 0.00019180118370692602, + "loss": 0.04, "step": 111760 }, { - "epoch": 1.21, - "learning_rate": 0.00011866117204231293, - "loss": 0.041, + "epoch": 0.72, + "learning_rate": 0.0001917915023525691, + "loss": 0.0442, "step": 111770 }, { - "epoch": 1.21, - "learning_rate": 0.00011864494775780388, - "loss": 0.0352, + "epoch": 0.72, + "learning_rate": 0.00019178182099821218, + "loss": 0.0456, "step": 111780 }, { - "epoch": 1.21, - "learning_rate": 0.00011862872347329483, - "loss": 0.0305, + "epoch": 0.72, + "learning_rate": 0.00019177213964385523, + "loss": 0.0445, "step": 111790 }, { - "epoch": 1.21, - "learning_rate": 0.00011861249918878578, - "loss": 0.0343, + "epoch": 0.72, + "learning_rate": 0.0001917624582894983, + "loss": 0.0428, "step": 111800 }, { - "epoch": 1.21, - "learning_rate": 0.00011859627490427671, - "loss": 0.0306, + "epoch": 0.72, + "learning_rate": 0.00019175277693514136, + "loss": 0.0394, "step": 111810 }, { - "epoch": 1.21, - "learning_rate": 0.00011858005061976766, - "loss": 0.0349, + "epoch": 0.72, + "learning_rate": 0.00019174309558078441, + "loss": 0.0453, "step": 111820 }, { - "epoch": 1.21, - "learning_rate": 0.00011856382633525861, - "loss": 0.0298, + "epoch": 0.72, + "learning_rate": 0.0001917334142264275, + "loss": 0.0555, "step": 111830 }, { - "epoch": 1.21, - "learning_rate": 0.00011854760205074956, - "loss": 0.0317, + "epoch": 0.72, + "learning_rate": 0.00019172373287207057, + "loss": 0.0481, "step": 111840 }, { - "epoch": 1.21, - "learning_rate": 0.00011853137776624051, - "loss": 0.0325, + "epoch": 0.72, + "learning_rate": 0.00019171405151771365, + "loss": 0.0483, "step": 111850 }, { - "epoch": 1.21, - "learning_rate": 0.00011851515348173145, - "loss": 0.0406, + "epoch": 0.72, + "learning_rate": 0.0001917043701633567, + "loss": 0.0435, "step": 111860 }, { - "epoch": 1.21, - "learning_rate": 0.0001184989291972224, - "loss": 0.0344, + "epoch": 0.72, + "learning_rate": 0.00019169468880899979, + "loss": 0.0461, "step": 111870 }, { - "epoch": 1.21, - "learning_rate": 0.00011848270491271335, - "loss": 0.0389, + "epoch": 0.72, + "learning_rate": 0.00019168500745464284, + "loss": 0.0487, "step": 111880 }, { - "epoch": 1.21, - "learning_rate": 0.0001184664806282043, - "loss": 0.0271, + "epoch": 0.72, + "learning_rate": 0.0001916753261002859, + "loss": 0.0439, "step": 111890 }, { - "epoch": 1.21, - "learning_rate": 0.00011845025634369523, - "loss": 0.0351, + "epoch": 0.72, + "learning_rate": 0.00019166564474592897, + "loss": 0.0557, "step": 111900 }, { - "epoch": 1.21, - "learning_rate": 0.00011843403205918618, - "loss": 0.0436, + "epoch": 0.72, + "learning_rate": 0.00019165596339157205, + "loss": 0.0461, "step": 111910 }, { - "epoch": 1.21, - "learning_rate": 0.00011841780777467713, - "loss": 0.0361, + "epoch": 0.72, + "learning_rate": 0.0001916462820372151, + "loss": 0.0546, "step": 111920 }, { - "epoch": 1.21, - "learning_rate": 0.00011840158349016808, - "loss": 0.0331, + "epoch": 0.72, + "learning_rate": 0.00019163660068285818, + "loss": 0.0468, "step": 111930 }, { - "epoch": 1.21, - "learning_rate": 0.00011838535920565903, - "loss": 0.0351, + "epoch": 0.72, + "learning_rate": 0.00019162691932850126, + "loss": 0.0425, "step": 111940 }, { - "epoch": 1.21, - "learning_rate": 0.00011836913492114997, - "loss": 0.0346, + "epoch": 0.72, + "learning_rate": 0.0001916172379741443, + "loss": 0.0417, "step": 111950 }, { - "epoch": 1.21, - "learning_rate": 0.00011835291063664092, - "loss": 0.0359, + "epoch": 0.72, + "learning_rate": 0.00019160755661978737, + "loss": 0.0421, "step": 111960 }, { - "epoch": 1.21, - "learning_rate": 0.00011833668635213187, - "loss": 0.0332, + "epoch": 0.72, + "learning_rate": 0.00019159787526543045, + "loss": 0.0493, "step": 111970 }, { - "epoch": 1.21, - "learning_rate": 0.00011832046206762282, - "loss": 0.032, + "epoch": 0.72, + "learning_rate": 0.00019158819391107353, + "loss": 0.0441, "step": 111980 }, { - "epoch": 1.21, - "learning_rate": 0.00011830423778311375, - "loss": 0.0415, + "epoch": 0.72, + "learning_rate": 0.00019157851255671658, + "loss": 0.0409, "step": 111990 }, { - "epoch": 1.21, - "learning_rate": 0.0001182880134986047, - "loss": 0.0387, + "epoch": 0.72, + "learning_rate": 0.00019156883120235966, + "loss": 0.0451, "step": 112000 }, { - "epoch": 1.21, - "eval_cer": 0.9211552087585102, - "eval_loss": 0.027456477284431458, - "eval_runtime": 119.0129, - "eval_samples_per_second": 16.805, - "eval_steps_per_second": 4.201, + "epoch": 0.72, + "eval_cer": 0.9199602304824314, + "eval_loss": 0.029715538024902344, + "eval_runtime": 120.0538, + "eval_samples_per_second": 16.659, + "eval_steps_per_second": 4.165, "step": 112000 }, { - "epoch": 1.21, - "learning_rate": 0.00011827178921409565, - "loss": 0.0379, + "epoch": 0.72, + "learning_rate": 0.00019155914984800274, + "loss": 0.0462, "step": 112010 }, { - "epoch": 1.21, - "learning_rate": 0.0001182555649295866, - "loss": 0.0367, + "epoch": 0.72, + "learning_rate": 0.00019154946849364577, + "loss": 0.0536, "step": 112020 }, { - "epoch": 1.21, - "learning_rate": 0.00011823934064507755, - "loss": 0.0311, + "epoch": 0.72, + "learning_rate": 0.00019153978713928885, + "loss": 0.0446, "step": 112030 }, { - "epoch": 1.21, - "learning_rate": 0.00011822311636056849, - "loss": 0.0395, + "epoch": 0.72, + "learning_rate": 0.00019153010578493193, + "loss": 0.0476, "step": 112040 }, { - "epoch": 1.21, - "learning_rate": 0.00011820689207605944, - "loss": 0.0353, + "epoch": 0.72, + "learning_rate": 0.000191520424430575, + "loss": 0.0523, "step": 112050 }, { - "epoch": 1.21, - "learning_rate": 0.00011819066779155039, - "loss": 0.0388, + "epoch": 0.72, + "learning_rate": 0.00019151074307621806, + "loss": 0.045, "step": 112060 }, { - "epoch": 1.21, - "learning_rate": 0.00011817444350704134, - "loss": 0.0397, + "epoch": 0.72, + "learning_rate": 0.00019150106172186114, + "loss": 0.0439, "step": 112070 }, { - "epoch": 1.21, - "learning_rate": 0.00011815821922253227, - "loss": 0.0394, + "epoch": 0.72, + "learning_rate": 0.00019149138036750422, + "loss": 0.0482, "step": 112080 }, { - "epoch": 1.21, - "learning_rate": 0.00011814199493802322, - "loss": 0.0293, + "epoch": 0.72, + "learning_rate": 0.00019148169901314724, + "loss": 0.0447, "step": 112090 }, { - "epoch": 1.21, - "learning_rate": 0.00011812577065351417, - "loss": 0.0392, + "epoch": 0.72, + "learning_rate": 0.00019147201765879032, + "loss": 0.0439, "step": 112100 }, { - "epoch": 1.21, - "learning_rate": 0.00011810954636900512, - "loss": 0.0362, + "epoch": 0.72, + "learning_rate": 0.0001914623363044334, + "loss": 0.0449, "step": 112110 }, { - "epoch": 1.21, - "learning_rate": 0.00011809332208449607, - "loss": 0.0302, + "epoch": 0.72, + "learning_rate": 0.00019145265495007646, + "loss": 0.0432, "step": 112120 }, { - "epoch": 1.21, - "learning_rate": 0.00011807709779998701, - "loss": 0.0395, + "epoch": 0.72, + "learning_rate": 0.00019144297359571953, + "loss": 0.0432, "step": 112130 }, { - "epoch": 1.21, - "learning_rate": 0.00011806087351547796, - "loss": 0.0325, + "epoch": 0.72, + "learning_rate": 0.00019143329224136261, + "loss": 0.0442, "step": 112140 }, { - "epoch": 1.21, - "learning_rate": 0.00011804464923096891, - "loss": 0.0353, + "epoch": 0.72, + "learning_rate": 0.0001914236108870057, + "loss": 0.0463, "step": 112150 }, { - "epoch": 1.21, - "learning_rate": 0.00011802842494645986, - "loss": 0.0308, + "epoch": 0.72, + "learning_rate": 0.00019141392953264872, + "loss": 0.0494, "step": 112160 }, { - "epoch": 1.21, - "learning_rate": 0.0001180122006619508, - "loss": 0.0414, + "epoch": 0.72, + "learning_rate": 0.0001914042481782918, + "loss": 0.0464, "step": 112170 }, { - "epoch": 1.21, - "learning_rate": 0.00011799597637744174, - "loss": 0.0311, + "epoch": 0.72, + "learning_rate": 0.00019139456682393488, + "loss": 0.0424, "step": 112180 }, { - "epoch": 1.21, - "learning_rate": 0.0001179797520929327, - "loss": 0.0392, + "epoch": 0.72, + "learning_rate": 0.00019138488546957793, + "loss": 0.0448, "step": 112190 }, { - "epoch": 1.21, - "learning_rate": 0.00011796352780842364, - "loss": 0.0341, + "epoch": 0.72, + "learning_rate": 0.000191375204115221, + "loss": 0.0446, "step": 112200 }, { - "epoch": 1.21, - "learning_rate": 0.0001179473035239146, - "loss": 0.0305, + "epoch": 0.72, + "learning_rate": 0.0001913655227608641, + "loss": 0.0409, "step": 112210 }, { - "epoch": 1.21, - "learning_rate": 0.00011793107923940553, - "loss": 0.0419, + "epoch": 0.72, + "learning_rate": 0.00019135584140650717, + "loss": 0.0517, "step": 112220 }, { - "epoch": 1.21, - "learning_rate": 0.00011791485495489648, - "loss": 0.0406, + "epoch": 0.72, + "learning_rate": 0.0001913461600521502, + "loss": 0.0401, "step": 112230 }, { - "epoch": 1.21, - "learning_rate": 0.00011789863067038743, - "loss": 0.0334, + "epoch": 0.72, + "learning_rate": 0.00019133647869779328, + "loss": 0.0436, "step": 112240 }, { - "epoch": 1.21, - "learning_rate": 0.00011788240638587838, - "loss": 0.0331, + "epoch": 0.72, + "learning_rate": 0.00019132679734343636, + "loss": 0.0416, "step": 112250 }, { - "epoch": 1.21, - "learning_rate": 0.00011786618210136932, - "loss": 0.0378, + "epoch": 0.72, + "learning_rate": 0.0001913171159890794, + "loss": 0.0534, "step": 112260 }, { - "epoch": 1.21, - "learning_rate": 0.00011784995781686027, - "loss": 0.0336, + "epoch": 0.72, + "learning_rate": 0.0001913074346347225, + "loss": 0.0433, "step": 112270 }, { - "epoch": 1.21, - "learning_rate": 0.00011783373353235122, - "loss": 0.036, + "epoch": 0.72, + "learning_rate": 0.00019129775328036557, + "loss": 0.0518, "step": 112280 }, { - "epoch": 1.21, - "learning_rate": 0.00011781750924784217, - "loss": 0.0323, + "epoch": 0.72, + "learning_rate": 0.00019128807192600862, + "loss": 0.046, "step": 112290 }, { - "epoch": 1.21, - "learning_rate": 0.00011780128496333311, - "loss": 0.0332, + "epoch": 0.72, + "learning_rate": 0.00019127839057165167, + "loss": 0.0449, "step": 112300 }, { - "epoch": 1.21, - "learning_rate": 0.00011778506067882405, - "loss": 0.0318, + "epoch": 0.72, + "learning_rate": 0.00019126870921729475, + "loss": 0.0435, "step": 112310 }, { - "epoch": 1.21, - "learning_rate": 0.000117768836394315, - "loss": 0.034, + "epoch": 0.72, + "learning_rate": 0.0001912590278629378, + "loss": 0.0392, "step": 112320 }, { - "epoch": 1.21, - "learning_rate": 0.00011775261210980595, - "loss": 0.038, + "epoch": 0.73, + "learning_rate": 0.0001912493465085809, + "loss": 0.0417, "step": 112330 }, { - "epoch": 1.22, - "learning_rate": 0.0001177363878252969, - "loss": 0.0346, + "epoch": 0.73, + "learning_rate": 0.00019123966515422397, + "loss": 0.0398, "step": 112340 }, { - "epoch": 1.22, - "learning_rate": 0.00011772016354078784, - "loss": 0.0259, + "epoch": 0.73, + "learning_rate": 0.00019122998379986705, + "loss": 0.0474, "step": 112350 }, { - "epoch": 1.22, - "learning_rate": 0.00011770393925627879, - "loss": 0.0358, + "epoch": 0.73, + "learning_rate": 0.0001912203024455101, + "loss": 0.0491, "step": 112360 }, { - "epoch": 1.22, - "learning_rate": 0.00011768771497176974, - "loss": 0.0322, + "epoch": 0.73, + "learning_rate": 0.00019121062109115315, + "loss": 0.039, "step": 112370 }, { - "epoch": 1.22, - "learning_rate": 0.00011767149068726069, - "loss": 0.0331, + "epoch": 0.73, + "learning_rate": 0.00019120093973679623, + "loss": 0.0477, "step": 112380 }, { - "epoch": 1.22, - "learning_rate": 0.00011765526640275164, - "loss": 0.0377, + "epoch": 0.73, + "learning_rate": 0.00019119125838243928, + "loss": 0.049, "step": 112390 }, { - "epoch": 1.22, - "learning_rate": 0.00011763904211824257, - "loss": 0.0369, + "epoch": 0.73, + "learning_rate": 0.00019118157702808236, + "loss": 0.0463, "step": 112400 }, { - "epoch": 1.22, - "learning_rate": 0.00011762281783373352, - "loss": 0.0334, + "epoch": 0.73, + "learning_rate": 0.00019117189567372544, + "loss": 0.0444, "step": 112410 }, { - "epoch": 1.22, - "learning_rate": 0.00011760659354922447, - "loss": 0.035, + "epoch": 0.73, + "learning_rate": 0.00019116221431936852, + "loss": 0.0479, "step": 112420 }, { - "epoch": 1.22, - "learning_rate": 0.00011759036926471542, - "loss": 0.0338, + "epoch": 0.73, + "learning_rate": 0.00019115253296501158, + "loss": 0.0426, "step": 112430 }, { - "epoch": 1.22, - "learning_rate": 0.00011757414498020636, - "loss": 0.0325, + "epoch": 0.73, + "learning_rate": 0.00019114285161065463, + "loss": 0.0439, "step": 112440 }, { - "epoch": 1.22, - "learning_rate": 0.00011755792069569731, - "loss": 0.0333, + "epoch": 0.73, + "learning_rate": 0.0001911331702562977, + "loss": 0.0426, "step": 112450 }, { - "epoch": 1.22, - "learning_rate": 0.00011754169641118826, - "loss": 0.0349, + "epoch": 0.73, + "learning_rate": 0.00019112348890194076, + "loss": 0.0419, "step": 112460 }, { - "epoch": 1.22, - "learning_rate": 0.0001175254721266792, - "loss": 0.0398, + "epoch": 0.73, + "learning_rate": 0.00019111380754758384, + "loss": 0.0389, "step": 112470 }, { - "epoch": 1.22, - "learning_rate": 0.00011750924784217016, - "loss": 0.0347, + "epoch": 0.73, + "learning_rate": 0.00019110412619322692, + "loss": 0.0431, "step": 112480 }, { - "epoch": 1.22, - "learning_rate": 0.00011749302355766109, - "loss": 0.0328, + "epoch": 0.73, + "learning_rate": 0.00019109444483886997, + "loss": 0.0423, "step": 112490 }, { - "epoch": 1.22, - "learning_rate": 0.00011747679927315204, - "loss": 0.0328, + "epoch": 0.73, + "learning_rate": 0.00019108476348451305, + "loss": 0.0494, "step": 112500 }, { - "epoch": 1.22, - "learning_rate": 0.00011746057498864299, - "loss": 0.0333, + "epoch": 0.73, + "learning_rate": 0.0001910750821301561, + "loss": 0.0417, "step": 112510 }, { - "epoch": 1.22, - "learning_rate": 0.00011744435070413394, - "loss": 0.0347, + "epoch": 0.73, + "learning_rate": 0.00019106540077579916, + "loss": 0.0474, "step": 112520 }, { - "epoch": 1.22, - "learning_rate": 0.00011742812641962489, - "loss": 0.0355, + "epoch": 0.73, + "learning_rate": 0.00019105571942144224, + "loss": 0.0408, "step": 112530 }, { - "epoch": 1.22, - "learning_rate": 0.00011741190213511583, - "loss": 0.0348, + "epoch": 0.73, + "learning_rate": 0.00019104603806708532, + "loss": 0.0489, "step": 112540 }, { - "epoch": 1.22, - "learning_rate": 0.00011739567785060678, - "loss": 0.0356, + "epoch": 0.73, + "learning_rate": 0.0001910363567127284, + "loss": 0.0456, "step": 112550 }, { - "epoch": 1.22, - "learning_rate": 0.00011737945356609773, - "loss": 0.0345, + "epoch": 0.73, + "learning_rate": 0.00019102667535837145, + "loss": 0.0409, "step": 112560 }, { - "epoch": 1.22, - "learning_rate": 0.00011736322928158868, - "loss": 0.038, + "epoch": 0.73, + "learning_rate": 0.00019101699400401453, + "loss": 0.0479, "step": 112570 }, { - "epoch": 1.22, - "learning_rate": 0.00011734700499707961, - "loss": 0.031, + "epoch": 0.73, + "learning_rate": 0.00019100731264965758, + "loss": 0.0423, "step": 112580 }, { - "epoch": 1.22, - "learning_rate": 0.00011733078071257056, - "loss": 0.0344, + "epoch": 0.73, + "learning_rate": 0.00019099763129530064, + "loss": 0.0472, "step": 112590 }, { - "epoch": 1.22, - "learning_rate": 0.00011731455642806151, - "loss": 0.0342, + "epoch": 0.73, + "learning_rate": 0.00019098794994094372, + "loss": 0.0415, "step": 112600 }, { - "epoch": 1.22, - "learning_rate": 0.00011729833214355246, - "loss": 0.0371, + "epoch": 0.73, + "learning_rate": 0.0001909782685865868, + "loss": 0.0419, "step": 112610 }, { - "epoch": 1.22, - "learning_rate": 0.00011728210785904341, - "loss": 0.0306, + "epoch": 0.73, + "learning_rate": 0.00019096858723222988, + "loss": 0.0424, "step": 112620 }, { - "epoch": 1.22, - "learning_rate": 0.00011726588357453435, - "loss": 0.0336, - "step": 112630 + "epoch": 0.73, + "learning_rate": 0.00019095890587787293, + "loss": 0.0436, + "step": 112630 }, { - "epoch": 1.22, - "learning_rate": 0.0001172496592900253, - "loss": 0.0315, + "epoch": 0.73, + "learning_rate": 0.000190949224523516, + "loss": 0.0462, "step": 112640 }, { - "epoch": 1.22, - "learning_rate": 0.00011723343500551625, - "loss": 0.04, + "epoch": 0.73, + "learning_rate": 0.00019093954316915906, + "loss": 0.0474, "step": 112650 }, { - "epoch": 1.22, - "learning_rate": 0.0001172172107210072, - "loss": 0.0355, + "epoch": 0.73, + "learning_rate": 0.0001909298618148021, + "loss": 0.0434, "step": 112660 }, { - "epoch": 1.22, - "learning_rate": 0.00011720098643649813, - "loss": 0.0375, + "epoch": 0.73, + "learning_rate": 0.0001909201804604452, + "loss": 0.0443, "step": 112670 }, { - "epoch": 1.22, - "learning_rate": 0.00011718476215198908, - "loss": 0.0355, + "epoch": 0.73, + "learning_rate": 0.00019091049910608827, + "loss": 0.0509, "step": 112680 }, { - "epoch": 1.22, - "learning_rate": 0.00011716853786748003, - "loss": 0.0334, + "epoch": 0.73, + "learning_rate": 0.00019090081775173133, + "loss": 0.047, "step": 112690 }, { - "epoch": 1.22, - "learning_rate": 0.00011715231358297098, - "loss": 0.0351, + "epoch": 0.73, + "learning_rate": 0.0001908911363973744, + "loss": 0.0544, "step": 112700 }, { - "epoch": 1.22, - "learning_rate": 0.00011713608929846193, - "loss": 0.0342, + "epoch": 0.73, + "learning_rate": 0.00019088145504301749, + "loss": 0.0463, "step": 112710 }, { - "epoch": 1.22, - "learning_rate": 0.00011711986501395287, - "loss": 0.0364, + "epoch": 0.73, + "learning_rate": 0.0001908717736886605, + "loss": 0.0474, "step": 112720 }, { - "epoch": 1.22, - "learning_rate": 0.00011710364072944382, - "loss": 0.0328, + "epoch": 0.73, + "learning_rate": 0.0001908620923343036, + "loss": 0.0454, "step": 112730 }, { - "epoch": 1.22, - "learning_rate": 0.00011708741644493477, - "loss": 0.0384, + "epoch": 0.73, + "learning_rate": 0.00019085241097994667, + "loss": 0.0431, "step": 112740 }, { - "epoch": 1.22, - "learning_rate": 0.00011707119216042572, - "loss": 0.0325, + "epoch": 0.73, + "learning_rate": 0.00019084272962558975, + "loss": 0.0498, "step": 112750 }, { - "epoch": 1.22, - "learning_rate": 0.00011705496787591666, - "loss": 0.0331, + "epoch": 0.73, + "learning_rate": 0.0001908330482712328, + "loss": 0.0457, "step": 112760 }, { - "epoch": 1.22, - "learning_rate": 0.0001170387435914076, - "loss": 0.0369, + "epoch": 0.73, + "learning_rate": 0.00019082336691687588, + "loss": 0.0456, "step": 112770 }, { - "epoch": 1.22, - "learning_rate": 0.00011702251930689855, - "loss": 0.034, + "epoch": 0.73, + "learning_rate": 0.00019081368556251896, + "loss": 0.0478, "step": 112780 }, { - "epoch": 1.22, - "learning_rate": 0.0001170062950223895, - "loss": 0.0343, + "epoch": 0.73, + "learning_rate": 0.000190804004208162, + "loss": 0.0431, "step": 112790 }, { - "epoch": 1.22, - "learning_rate": 0.00011699007073788045, - "loss": 0.0382, + "epoch": 0.73, + "learning_rate": 0.00019079432285380507, + "loss": 0.0408, "step": 112800 }, { - "epoch": 1.22, - "learning_rate": 0.00011697384645337139, - "loss": 0.0373, + "epoch": 0.73, + "learning_rate": 0.00019078464149944815, + "loss": 0.043, "step": 112810 }, { - "epoch": 1.22, - "learning_rate": 0.00011695762216886234, - "loss": 0.029, + "epoch": 0.73, + "learning_rate": 0.00019077496014509123, + "loss": 0.0449, "step": 112820 }, { - "epoch": 1.22, - "learning_rate": 0.00011694139788435329, - "loss": 0.0329, + "epoch": 0.73, + "learning_rate": 0.00019076527879073428, + "loss": 0.0409, "step": 112830 }, { - "epoch": 1.22, - "learning_rate": 0.00011692517359984424, - "loss": 0.0364, + "epoch": 0.73, + "learning_rate": 0.00019075559743637736, + "loss": 0.0495, "step": 112840 }, { - "epoch": 1.22, - "learning_rate": 0.00011690894931533518, - "loss": 0.0343, + "epoch": 0.73, + "learning_rate": 0.00019074591608202044, + "loss": 0.0418, "step": 112850 }, { - "epoch": 1.22, - "learning_rate": 0.00011689272503082613, - "loss": 0.0402, + "epoch": 0.73, + "learning_rate": 0.00019073623472766347, + "loss": 0.0437, "step": 112860 }, { - "epoch": 1.22, - "learning_rate": 0.00011687650074631708, - "loss": 0.0315, + "epoch": 0.73, + "learning_rate": 0.00019072655337330655, + "loss": 0.0569, "step": 112870 }, { - "epoch": 1.22, - "learning_rate": 0.00011686027646180803, - "loss": 0.0313, + "epoch": 0.73, + "learning_rate": 0.00019071687201894962, + "loss": 0.0431, "step": 112880 }, { - "epoch": 1.22, - "learning_rate": 0.00011684405217729898, - "loss": 0.0385, + "epoch": 0.73, + "learning_rate": 0.00019070719066459268, + "loss": 0.0464, "step": 112890 }, { - "epoch": 1.22, - "learning_rate": 0.00011682782789278991, - "loss": 0.0379, + "epoch": 0.73, + "learning_rate": 0.00019069750931023576, + "loss": 0.048, "step": 112900 }, { - "epoch": 1.22, - "learning_rate": 0.00011681160360828086, - "loss": 0.032, + "epoch": 0.73, + "learning_rate": 0.00019068782795587884, + "loss": 0.0527, "step": 112910 }, { - "epoch": 1.22, - "learning_rate": 0.00011679537932377181, - "loss": 0.0297, + "epoch": 0.73, + "learning_rate": 0.00019067814660152192, + "loss": 0.0505, "step": 112920 }, { - "epoch": 1.22, - "learning_rate": 0.00011677915503926276, - "loss": 0.0331, + "epoch": 0.73, + "learning_rate": 0.00019066846524716494, + "loss": 0.0491, "step": 112930 }, { - "epoch": 1.22, - "learning_rate": 0.0001167629307547537, - "loss": 0.0288, + "epoch": 0.73, + "learning_rate": 0.00019065878389280802, + "loss": 0.0478, "step": 112940 }, { - "epoch": 1.22, - "learning_rate": 0.00011674670647024465, - "loss": 0.0341, + "epoch": 0.73, + "learning_rate": 0.0001906491025384511, + "loss": 0.0469, "step": 112950 }, { - "epoch": 1.22, - "learning_rate": 0.0001167304821857356, - "loss": 0.0359, + "epoch": 0.73, + "learning_rate": 0.00019063942118409415, + "loss": 0.0416, "step": 112960 }, { - "epoch": 1.22, - "learning_rate": 0.00011671425790122655, - "loss": 0.0363, + "epoch": 0.73, + "learning_rate": 0.00019062973982973723, + "loss": 0.0427, "step": 112970 }, { - "epoch": 1.22, - "learning_rate": 0.0001166980336167175, - "loss": 0.035, + "epoch": 0.73, + "learning_rate": 0.00019062005847538031, + "loss": 0.0413, "step": 112980 }, { - "epoch": 1.22, - "learning_rate": 0.00011668180933220843, - "loss": 0.0365, + "epoch": 0.73, + "learning_rate": 0.0001906103771210234, + "loss": 0.049, "step": 112990 }, { - "epoch": 1.22, - "learning_rate": 0.00011666558504769938, - "loss": 0.0366, + "epoch": 0.73, + "learning_rate": 0.00019060069576666642, + "loss": 0.0413, "step": 113000 }, { - "epoch": 1.22, - "eval_cer": 0.9211163354483948, - "eval_loss": 0.026883266866207123, - "eval_runtime": 118.8572, - "eval_samples_per_second": 16.827, - "eval_steps_per_second": 4.207, + "epoch": 0.73, + "eval_cer": 0.9199014800587504, + "eval_loss": 0.02950255572795868, + "eval_runtime": 119.9456, + "eval_samples_per_second": 16.674, + "eval_steps_per_second": 4.169, "step": 113000 }, { - "epoch": 1.22, - "learning_rate": 0.00011664936076319033, - "loss": 0.0332, + "epoch": 0.73, + "learning_rate": 0.0001905910144123095, + "loss": 0.0461, "step": 113010 }, { - "epoch": 1.22, - "learning_rate": 0.00011663313647868128, - "loss": 0.0309, + "epoch": 0.73, + "learning_rate": 0.00019058133305795258, + "loss": 0.0446, "step": 113020 }, { - "epoch": 1.22, - "learning_rate": 0.00011661691219417222, - "loss": 0.0327, + "epoch": 0.73, + "learning_rate": 0.00019057165170359563, + "loss": 0.0394, "step": 113030 }, { - "epoch": 1.22, - "learning_rate": 0.00011660068790966317, - "loss": 0.0335, + "epoch": 0.73, + "learning_rate": 0.0001905619703492387, + "loss": 0.0436, "step": 113040 }, { - "epoch": 1.22, - "learning_rate": 0.00011658446362515412, - "loss": 0.0342, + "epoch": 0.73, + "learning_rate": 0.0001905522889948818, + "loss": 0.0434, "step": 113050 }, { - "epoch": 1.22, - "learning_rate": 0.00011656823934064507, - "loss": 0.0315, + "epoch": 0.73, + "learning_rate": 0.00019054260764052487, + "loss": 0.0493, "step": 113060 }, { - "epoch": 1.22, - "learning_rate": 0.00011655201505613602, - "loss": 0.0346, + "epoch": 0.73, + "learning_rate": 0.0001905329262861679, + "loss": 0.0428, "step": 113070 }, { - "epoch": 1.22, - "learning_rate": 0.00011653579077162695, - "loss": 0.0358, + "epoch": 0.73, + "learning_rate": 0.00019052324493181098, + "loss": 0.0406, "step": 113080 }, { - "epoch": 1.22, - "learning_rate": 0.0001165195664871179, - "loss": 0.0364, + "epoch": 0.73, + "learning_rate": 0.00019051356357745403, + "loss": 0.0519, "step": 113090 }, { - "epoch": 1.22, - "learning_rate": 0.00011650334220260885, - "loss": 0.0326, + "epoch": 0.73, + "learning_rate": 0.0001905038822230971, + "loss": 0.0481, "step": 113100 }, { - "epoch": 1.22, - "learning_rate": 0.0001164871179180998, - "loss": 0.0312, + "epoch": 0.73, + "learning_rate": 0.0001904942008687402, + "loss": 0.0429, "step": 113110 }, { - "epoch": 1.22, - "learning_rate": 0.00011647089363359074, - "loss": 0.0348, + "epoch": 0.73, + "learning_rate": 0.00019048451951438327, + "loss": 0.0403, "step": 113120 }, { - "epoch": 1.22, - "learning_rate": 0.00011645466934908169, - "loss": 0.0325, + "epoch": 0.73, + "learning_rate": 0.00019047483816002632, + "loss": 0.0461, "step": 113130 }, { - "epoch": 1.22, - "learning_rate": 0.00011643844506457264, - "loss": 0.0328, + "epoch": 0.73, + "learning_rate": 0.00019046515680566937, + "loss": 0.0431, "step": 113140 }, { - "epoch": 1.22, - "learning_rate": 0.00011642222078006359, - "loss": 0.0338, + "epoch": 0.73, + "learning_rate": 0.00019045547545131245, + "loss": 0.052, "step": 113150 }, { - "epoch": 1.22, - "learning_rate": 0.00011640599649555454, - "loss": 0.0343, + "epoch": 0.73, + "learning_rate": 0.0001904457940969555, + "loss": 0.0483, "step": 113160 }, { - "epoch": 1.22, - "learning_rate": 0.00011638977221104547, - "loss": 0.0279, + "epoch": 0.73, + "learning_rate": 0.00019043611274259859, + "loss": 0.0449, "step": 113170 }, { - "epoch": 1.22, - "learning_rate": 0.00011637354792653642, - "loss": 0.0363, + "epoch": 0.73, + "learning_rate": 0.00019042643138824167, + "loss": 0.0469, "step": 113180 }, { - "epoch": 1.22, - "learning_rate": 0.00011635732364202737, - "loss": 0.0365, + "epoch": 0.73, + "learning_rate": 0.00019041675003388475, + "loss": 0.0405, "step": 113190 }, { - "epoch": 1.22, - "learning_rate": 0.00011634109935751832, - "loss": 0.03, + "epoch": 0.73, + "learning_rate": 0.0001904070686795278, + "loss": 0.0426, "step": 113200 }, { - "epoch": 1.22, - "learning_rate": 0.00011632487507300926, - "loss": 0.032, + "epoch": 0.73, + "learning_rate": 0.00019039738732517085, + "loss": 0.0412, "step": 113210 }, { - "epoch": 1.22, - "learning_rate": 0.00011630865078850021, - "loss": 0.0352, + "epoch": 0.73, + "learning_rate": 0.00019038770597081393, + "loss": 0.0488, "step": 113220 }, { - "epoch": 1.22, - "learning_rate": 0.00011629242650399116, - "loss": 0.038, + "epoch": 0.73, + "learning_rate": 0.00019037802461645698, + "loss": 0.0483, "step": 113230 }, { - "epoch": 1.22, - "learning_rate": 0.00011627620221948211, - "loss": 0.0284, + "epoch": 0.73, + "learning_rate": 0.00019036834326210006, + "loss": 0.0421, "step": 113240 }, { - "epoch": 1.22, - "learning_rate": 0.00011625997793497306, - "loss": 0.0287, + "epoch": 0.73, + "learning_rate": 0.00019035866190774314, + "loss": 0.0421, "step": 113250 }, { - "epoch": 1.23, - "learning_rate": 0.000116243753650464, - "loss": 0.0397, + "epoch": 0.73, + "learning_rate": 0.00019034898055338622, + "loss": 0.0416, "step": 113260 }, { - "epoch": 1.23, - "learning_rate": 0.00011622752936595494, - "loss": 0.0329, + "epoch": 0.73, + "learning_rate": 0.00019033929919902928, + "loss": 0.0399, "step": 113270 }, { - "epoch": 1.23, - "learning_rate": 0.0001162113050814459, - "loss": 0.0328, + "epoch": 0.73, + "learning_rate": 0.00019032961784467233, + "loss": 0.0455, "step": 113280 }, { - "epoch": 1.23, - "learning_rate": 0.00011619508079693684, - "loss": 0.0331, + "epoch": 0.73, + "learning_rate": 0.00019031993649031538, + "loss": 0.0448, "step": 113290 }, { - "epoch": 1.23, - "learning_rate": 0.0001161788565124278, - "loss": 0.0367, + "epoch": 0.73, + "learning_rate": 0.00019031025513595846, + "loss": 0.0431, "step": 113300 }, { - "epoch": 1.23, - "learning_rate": 0.00011616263222791873, - "loss": 0.0298, + "epoch": 0.73, + "learning_rate": 0.00019030057378160154, + "loss": 0.0416, "step": 113310 }, { - "epoch": 1.23, - "learning_rate": 0.00011614640794340968, - "loss": 0.0334, + "epoch": 0.73, + "learning_rate": 0.00019029089242724462, + "loss": 0.0463, "step": 113320 }, { - "epoch": 1.23, - "learning_rate": 0.00011613018365890063, - "loss": 0.0248, + "epoch": 0.73, + "learning_rate": 0.00019028121107288767, + "loss": 0.0501, "step": 113330 }, { - "epoch": 1.23, - "learning_rate": 0.00011611395937439158, - "loss": 0.0313, + "epoch": 0.73, + "learning_rate": 0.00019027152971853075, + "loss": 0.0403, "step": 113340 }, { - "epoch": 1.23, - "learning_rate": 0.00011609773508988252, - "loss": 0.0303, + "epoch": 0.73, + "learning_rate": 0.0001902618483641738, + "loss": 0.0465, "step": 113350 }, { - "epoch": 1.23, - "learning_rate": 0.00011608151080537347, - "loss": 0.0336, + "epoch": 0.73, + "learning_rate": 0.00019025216700981686, + "loss": 0.0416, "step": 113360 }, { - "epoch": 1.23, - "learning_rate": 0.00011606528652086442, - "loss": 0.0374, + "epoch": 0.73, + "learning_rate": 0.00019024248565545994, + "loss": 0.0438, "step": 113370 }, { - "epoch": 1.23, - "learning_rate": 0.00011604906223635536, - "loss": 0.0305, + "epoch": 0.73, + "learning_rate": 0.00019023280430110302, + "loss": 0.051, "step": 113380 }, { - "epoch": 1.23, - "learning_rate": 0.00011603283795184631, - "loss": 0.0366, + "epoch": 0.73, + "learning_rate": 0.0001902231229467461, + "loss": 0.0412, "step": 113390 }, { - "epoch": 1.23, - "learning_rate": 0.00011601661366733725, - "loss": 0.0279, + "epoch": 0.73, + "learning_rate": 0.00019021344159238915, + "loss": 0.0448, "step": 113400 }, { - "epoch": 1.23, - "learning_rate": 0.0001160003893828282, - "loss": 0.0356, + "epoch": 0.73, + "learning_rate": 0.00019020376023803223, + "loss": 0.0447, "step": 113410 }, { - "epoch": 1.23, - "learning_rate": 0.00011598416509831915, - "loss": 0.0274, + "epoch": 0.73, + "learning_rate": 0.00019019407888367528, + "loss": 0.0407, "step": 113420 }, { - "epoch": 1.23, - "learning_rate": 0.0001159679408138101, - "loss": 0.0432, + "epoch": 0.73, + "learning_rate": 0.00019018439752931834, + "loss": 0.043, "step": 113430 }, { - "epoch": 1.23, - "learning_rate": 0.00011595171652930104, - "loss": 0.039, + "epoch": 0.73, + "learning_rate": 0.00019017471617496142, + "loss": 0.0373, "step": 113440 }, { - "epoch": 1.23, - "learning_rate": 0.00011593549224479199, - "loss": 0.03, + "epoch": 0.73, + "learning_rate": 0.0001901650348206045, + "loss": 0.0446, "step": 113450 }, { - "epoch": 1.23, - "learning_rate": 0.00011591926796028294, - "loss": 0.0332, + "epoch": 0.73, + "learning_rate": 0.00019015535346624758, + "loss": 0.0412, "step": 113460 }, { - "epoch": 1.23, - "learning_rate": 0.00011590304367577389, - "loss": 0.0355, + "epoch": 0.73, + "learning_rate": 0.00019014567211189063, + "loss": 0.0451, "step": 113470 }, { - "epoch": 1.23, - "learning_rate": 0.00011588681939126484, - "loss": 0.0359, + "epoch": 0.73, + "learning_rate": 0.0001901359907575337, + "loss": 0.0383, "step": 113480 }, { - "epoch": 1.23, - "learning_rate": 0.00011587059510675577, - "loss": 0.0337, + "epoch": 0.73, + "learning_rate": 0.00019012630940317673, + "loss": 0.0376, "step": 113490 }, { - "epoch": 1.23, - "learning_rate": 0.00011585437082224672, - "loss": 0.0366, + "epoch": 0.73, + "learning_rate": 0.0001901166280488198, + "loss": 0.0385, "step": 113500 }, { - "epoch": 1.23, - "learning_rate": 0.00011583814653773767, - "loss": 0.0312, + "epoch": 0.73, + "learning_rate": 0.0001901069466944629, + "loss": 0.0401, "step": 113510 }, { - "epoch": 1.23, - "learning_rate": 0.00011582192225322862, - "loss": 0.0354, + "epoch": 0.73, + "learning_rate": 0.00019009726534010597, + "loss": 0.0406, "step": 113520 }, { - "epoch": 1.23, - "learning_rate": 0.00011580569796871956, - "loss": 0.0355, + "epoch": 0.73, + "learning_rate": 0.00019008758398574903, + "loss": 0.0491, "step": 113530 }, { - "epoch": 1.23, - "learning_rate": 0.00011578947368421051, - "loss": 0.0313, + "epoch": 0.73, + "learning_rate": 0.0001900779026313921, + "loss": 0.0417, "step": 113540 }, { - "epoch": 1.23, - "learning_rate": 0.00011577324939970146, - "loss": 0.035, + "epoch": 0.73, + "learning_rate": 0.00019006822127703518, + "loss": 0.0382, "step": 113550 }, { - "epoch": 1.23, - "learning_rate": 0.0001157570251151924, - "loss": 0.0464, + "epoch": 0.73, + "learning_rate": 0.0001900585399226782, + "loss": 0.0489, "step": 113560 }, { - "epoch": 1.23, - "learning_rate": 0.00011574080083068336, - "loss": 0.0422, + "epoch": 0.73, + "learning_rate": 0.0001900488585683213, + "loss": 0.0379, "step": 113570 }, { - "epoch": 1.23, - "learning_rate": 0.00011572457654617429, - "loss": 0.0306, + "epoch": 0.73, + "learning_rate": 0.00019003917721396437, + "loss": 0.0403, "step": 113580 }, { - "epoch": 1.23, - "learning_rate": 0.00011570835226166524, - "loss": 0.0337, + "epoch": 0.73, + "learning_rate": 0.00019002949585960745, + "loss": 0.0394, "step": 113590 }, { - "epoch": 1.23, - "learning_rate": 0.00011569212797715619, - "loss": 0.0358, + "epoch": 0.73, + "learning_rate": 0.0001900198145052505, + "loss": 0.043, "step": 113600 }, { - "epoch": 1.23, - "learning_rate": 0.00011567590369264714, - "loss": 0.0364, + "epoch": 0.73, + "learning_rate": 0.00019001013315089358, + "loss": 0.0554, "step": 113610 }, { - "epoch": 1.23, - "learning_rate": 0.00011565967940813808, - "loss": 0.0344, + "epoch": 0.73, + "learning_rate": 0.00019000045179653666, + "loss": 0.0467, "step": 113620 }, { - "epoch": 1.23, - "learning_rate": 0.00011564345512362903, - "loss": 0.0376, + "epoch": 0.73, + "learning_rate": 0.0001899907704421797, + "loss": 0.0468, "step": 113630 }, { - "epoch": 1.23, - "learning_rate": 0.00011562723083911998, - "loss": 0.0407, + "epoch": 0.73, + "learning_rate": 0.00018998108908782277, + "loss": 0.0505, "step": 113640 }, { - "epoch": 1.23, - "learning_rate": 0.00011561100655461093, - "loss": 0.032, + "epoch": 0.73, + "learning_rate": 0.00018997140773346585, + "loss": 0.0403, "step": 113650 }, { - "epoch": 1.23, - "learning_rate": 0.00011559478227010188, - "loss": 0.0338, + "epoch": 0.73, + "learning_rate": 0.00018996172637910893, + "loss": 0.041, "step": 113660 }, { - "epoch": 1.23, - "learning_rate": 0.00011557855798559281, - "loss": 0.0392, + "epoch": 0.73, + "learning_rate": 0.00018995204502475198, + "loss": 0.0463, "step": 113670 }, { - "epoch": 1.23, - "learning_rate": 0.00011556233370108376, - "loss": 0.0386, + "epoch": 0.73, + "learning_rate": 0.00018994236367039506, + "loss": 0.0495, "step": 113680 }, { - "epoch": 1.23, - "learning_rate": 0.00011554610941657471, - "loss": 0.0388, + "epoch": 0.73, + "learning_rate": 0.00018993268231603809, + "loss": 0.0407, "step": 113690 }, { - "epoch": 1.23, - "learning_rate": 0.00011552988513206566, - "loss": 0.0368, + "epoch": 0.73, + "learning_rate": 0.00018992300096168116, + "loss": 0.0423, "step": 113700 }, { - "epoch": 1.23, - "learning_rate": 0.0001155136608475566, - "loss": 0.0401, + "epoch": 0.73, + "learning_rate": 0.00018991331960732424, + "loss": 0.0434, "step": 113710 }, { - "epoch": 1.23, - "learning_rate": 0.00011549743656304755, - "loss": 0.0391, + "epoch": 0.73, + "learning_rate": 0.00018990363825296732, + "loss": 0.0444, "step": 113720 }, { - "epoch": 1.23, - "learning_rate": 0.0001154812122785385, - "loss": 0.0346, + "epoch": 0.73, + "learning_rate": 0.00018989395689861038, + "loss": 0.0476, "step": 113730 }, { - "epoch": 1.23, - "learning_rate": 0.00011546498799402945, - "loss": 0.0342, + "epoch": 0.73, + "learning_rate": 0.00018988427554425346, + "loss": 0.0462, "step": 113740 }, { - "epoch": 1.23, - "learning_rate": 0.0001154487637095204, - "loss": 0.038, + "epoch": 0.73, + "learning_rate": 0.00018987459418989654, + "loss": 0.0426, "step": 113750 }, { - "epoch": 1.23, - "learning_rate": 0.00011543253942501133, - "loss": 0.04, + "epoch": 0.73, + "learning_rate": 0.00018986491283553956, + "loss": 0.0457, "step": 113760 }, { - "epoch": 1.23, - "learning_rate": 0.00011541631514050228, - "loss": 0.0355, + "epoch": 0.73, + "learning_rate": 0.00018985523148118264, + "loss": 0.0472, "step": 113770 }, { - "epoch": 1.23, - "learning_rate": 0.00011540009085599323, - "loss": 0.0346, + "epoch": 0.73, + "learning_rate": 0.00018984555012682572, + "loss": 0.0495, "step": 113780 }, { - "epoch": 1.23, - "learning_rate": 0.00011538386657148418, - "loss": 0.0319, + "epoch": 0.73, + "learning_rate": 0.0001898358687724688, + "loss": 0.0497, "step": 113790 }, { - "epoch": 1.23, - "learning_rate": 0.00011536764228697512, - "loss": 0.0367, + "epoch": 0.73, + "learning_rate": 0.00018982618741811185, + "loss": 0.0449, "step": 113800 }, { - "epoch": 1.23, - "learning_rate": 0.00011535141800246608, - "loss": 0.0359, + "epoch": 0.73, + "learning_rate": 0.00018981650606375493, + "loss": 0.0418, "step": 113810 }, { - "epoch": 1.23, - "learning_rate": 0.00011533519371795703, - "loss": 0.0395, + "epoch": 0.73, + "learning_rate": 0.00018980682470939801, + "loss": 0.0524, "step": 113820 }, { - "epoch": 1.23, - "learning_rate": 0.00011531896943344798, - "loss": 0.0363, + "epoch": 0.73, + "learning_rate": 0.00018979714335504104, + "loss": 0.046, "step": 113830 }, { - "epoch": 1.23, - "learning_rate": 0.00011530274514893893, - "loss": 0.0372, + "epoch": 0.73, + "learning_rate": 0.00018978746200068412, + "loss": 0.0441, "step": 113840 }, { - "epoch": 1.23, - "learning_rate": 0.00011528652086442988, - "loss": 0.0337, + "epoch": 0.73, + "learning_rate": 0.0001897777806463272, + "loss": 0.0424, "step": 113850 }, { - "epoch": 1.23, - "learning_rate": 0.00011527029657992082, - "loss": 0.0314, + "epoch": 0.73, + "learning_rate": 0.00018976809929197028, + "loss": 0.0403, "step": 113860 }, { - "epoch": 1.23, - "learning_rate": 0.00011525407229541177, - "loss": 0.0405, + "epoch": 0.73, + "learning_rate": 0.00018975841793761333, + "loss": 0.0441, "step": 113870 }, { - "epoch": 1.23, - "learning_rate": 0.00011523784801090272, - "loss": 0.0284, + "epoch": 0.74, + "learning_rate": 0.0001897487365832564, + "loss": 0.0366, "step": 113880 }, { - "epoch": 1.23, - "learning_rate": 0.00011522162372639367, - "loss": 0.0331, + "epoch": 0.74, + "learning_rate": 0.0001897390552288995, + "loss": 0.041, "step": 113890 }, { - "epoch": 1.23, - "learning_rate": 0.0001152053994418846, - "loss": 0.0324, + "epoch": 0.74, + "learning_rate": 0.00018972937387454252, + "loss": 0.0433, "step": 113900 }, { - "epoch": 1.23, - "learning_rate": 0.00011518917515737555, - "loss": 0.0301, + "epoch": 0.74, + "learning_rate": 0.0001897196925201856, + "loss": 0.0511, "step": 113910 }, { - "epoch": 1.23, - "learning_rate": 0.0001151729508728665, - "loss": 0.0318, + "epoch": 0.74, + "learning_rate": 0.00018971001116582868, + "loss": 0.042, "step": 113920 }, { - "epoch": 1.23, - "learning_rate": 0.00011515672658835745, - "loss": 0.0307, + "epoch": 0.74, + "learning_rate": 0.00018970032981147173, + "loss": 0.0406, "step": 113930 }, { - "epoch": 1.23, - "learning_rate": 0.0001151405023038484, - "loss": 0.0327, + "epoch": 0.74, + "learning_rate": 0.0001896906484571148, + "loss": 0.0406, "step": 113940 }, { - "epoch": 1.23, - "learning_rate": 0.00011512427801933934, - "loss": 0.0331, + "epoch": 0.74, + "learning_rate": 0.0001896809671027579, + "loss": 0.0443, "step": 113950 }, { - "epoch": 1.23, - "learning_rate": 0.00011510805373483029, - "loss": 0.0314, + "epoch": 0.74, + "learning_rate": 0.00018967128574840097, + "loss": 0.0384, "step": 113960 }, { - "epoch": 1.23, - "learning_rate": 0.00011509182945032124, - "loss": 0.0346, + "epoch": 0.74, + "learning_rate": 0.000189661604394044, + "loss": 0.0426, "step": 113970 }, { - "epoch": 1.23, - "learning_rate": 0.00011507560516581219, - "loss": 0.0386, + "epoch": 0.74, + "learning_rate": 0.00018965192303968707, + "loss": 0.0432, "step": 113980 }, { - "epoch": 1.23, - "learning_rate": 0.00011505938088130314, - "loss": 0.0359, + "epoch": 0.74, + "learning_rate": 0.00018964224168533015, + "loss": 0.0369, "step": 113990 }, { - "epoch": 1.23, - "learning_rate": 0.00011504315659679407, - "loss": 0.0345, + "epoch": 0.74, + "learning_rate": 0.0001896325603309732, + "loss": 0.0461, "step": 114000 }, { - "epoch": 1.23, - "eval_cer": 0.9211189859013572, - "eval_loss": 0.0268502589315176, - "eval_runtime": 118.9187, - "eval_samples_per_second": 16.818, - "eval_steps_per_second": 4.205, + "epoch": 0.74, + "eval_cer": 0.919810190938877, + "eval_loss": 0.030083321034908295, + "eval_runtime": 119.8896, + "eval_samples_per_second": 16.682, + "eval_steps_per_second": 4.171, "step": 114000 }, { - "epoch": 1.23, - "learning_rate": 0.00011502693231228502, - "loss": 0.0362, + "epoch": 0.74, + "learning_rate": 0.00018962287897661629, + "loss": 0.043, "step": 114010 }, { - "epoch": 1.23, - "learning_rate": 0.00011501070802777597, - "loss": 0.0378, + "epoch": 0.74, + "learning_rate": 0.00018961319762225937, + "loss": 0.047, "step": 114020 }, { - "epoch": 1.23, - "learning_rate": 0.00011499448374326692, - "loss": 0.0378, + "epoch": 0.74, + "learning_rate": 0.00018960351626790245, + "loss": 0.0419, "step": 114030 }, { - "epoch": 1.23, - "learning_rate": 0.00011497825945875786, - "loss": 0.0323, + "epoch": 0.74, + "learning_rate": 0.00018959383491354547, + "loss": 0.0448, "step": 114040 }, { - "epoch": 1.23, - "learning_rate": 0.00011496203517424881, - "loss": 0.0323, + "epoch": 0.74, + "learning_rate": 0.00018958415355918855, + "loss": 0.0412, "step": 114050 }, { - "epoch": 1.23, - "learning_rate": 0.00011494581088973976, - "loss": 0.0351, + "epoch": 0.74, + "learning_rate": 0.00018957447220483163, + "loss": 0.0393, "step": 114060 }, { - "epoch": 1.23, - "learning_rate": 0.00011492958660523071, - "loss": 0.0381, + "epoch": 0.74, + "learning_rate": 0.00018956479085047468, + "loss": 0.0463, "step": 114070 }, { - "epoch": 1.23, - "learning_rate": 0.00011491336232072166, - "loss": 0.0352, + "epoch": 0.74, + "learning_rate": 0.00018955510949611776, + "loss": 0.0368, "step": 114080 }, { - "epoch": 1.23, - "learning_rate": 0.0001148971380362126, - "loss": 0.0379, + "epoch": 0.74, + "learning_rate": 0.00018954542814176084, + "loss": 0.0632, "step": 114090 }, { - "epoch": 1.23, - "learning_rate": 0.00011488091375170354, - "loss": 0.0368, + "epoch": 0.74, + "learning_rate": 0.0001895357467874039, + "loss": 0.0382, "step": 114100 }, { - "epoch": 1.23, - "learning_rate": 0.0001148646894671945, - "loss": 0.0363, + "epoch": 0.74, + "learning_rate": 0.00018952606543304695, + "loss": 0.0487, "step": 114110 }, { - "epoch": 1.23, - "learning_rate": 0.00011484846518268544, - "loss": 0.0281, + "epoch": 0.74, + "learning_rate": 0.00018951638407869003, + "loss": 0.0396, "step": 114120 }, { - "epoch": 1.23, - "learning_rate": 0.00011483224089817638, - "loss": 0.0328, + "epoch": 0.74, + "learning_rate": 0.00018950670272433308, + "loss": 0.0452, "step": 114130 }, { - "epoch": 1.23, - "learning_rate": 0.00011481601661366733, - "loss": 0.0328, + "epoch": 0.74, + "learning_rate": 0.00018949702136997616, + "loss": 0.0442, "step": 114140 }, { - "epoch": 1.23, - "learning_rate": 0.00011479979232915828, - "loss": 0.0331, + "epoch": 0.74, + "learning_rate": 0.00018948734001561924, + "loss": 0.0398, "step": 114150 }, { - "epoch": 1.23, - "learning_rate": 0.00011478356804464923, - "loss": 0.0306, + "epoch": 0.74, + "learning_rate": 0.00018947765866126232, + "loss": 0.0459, "step": 114160 }, { - "epoch": 1.23, - "learning_rate": 0.00011476734376014018, - "loss": 0.0389, + "epoch": 0.74, + "learning_rate": 0.00018946797730690537, + "loss": 0.0428, "step": 114170 }, { - "epoch": 1.23, - "learning_rate": 0.00011475111947563112, - "loss": 0.0361, + "epoch": 0.74, + "learning_rate": 0.00018945829595254843, + "loss": 0.0535, "step": 114180 }, { - "epoch": 1.24, - "learning_rate": 0.00011473489519112207, - "loss": 0.0301, + "epoch": 0.74, + "learning_rate": 0.0001894486145981915, + "loss": 0.0451, "step": 114190 }, { - "epoch": 1.24, - "learning_rate": 0.00011471867090661302, - "loss": 0.0436, + "epoch": 0.74, + "learning_rate": 0.00018943893324383456, + "loss": 0.0481, "step": 114200 }, { - "epoch": 1.24, - "learning_rate": 0.00011470244662210397, - "loss": 0.0368, + "epoch": 0.74, + "learning_rate": 0.00018942925188947764, + "loss": 0.0446, "step": 114210 }, { - "epoch": 1.24, - "learning_rate": 0.0001146862223375949, - "loss": 0.0377, + "epoch": 0.74, + "learning_rate": 0.00018941957053512072, + "loss": 0.0477, "step": 114220 }, { - "epoch": 1.24, - "learning_rate": 0.00011466999805308585, - "loss": 0.0307, + "epoch": 0.74, + "learning_rate": 0.0001894098891807638, + "loss": 0.0409, "step": 114230 }, { - "epoch": 1.24, - "learning_rate": 0.0001146537737685768, - "loss": 0.0398, + "epoch": 0.74, + "learning_rate": 0.00018940020782640685, + "loss": 0.0461, "step": 114240 }, { - "epoch": 1.24, - "learning_rate": 0.00011463754948406775, - "loss": 0.0346, + "epoch": 0.74, + "learning_rate": 0.0001893905264720499, + "loss": 0.0428, "step": 114250 }, { - "epoch": 1.24, - "learning_rate": 0.0001146213251995587, - "loss": 0.0362, + "epoch": 0.74, + "learning_rate": 0.00018938084511769298, + "loss": 0.0426, "step": 114260 }, { - "epoch": 1.24, - "learning_rate": 0.00011460510091504964, - "loss": 0.0316, + "epoch": 0.74, + "learning_rate": 0.00018937116376333604, + "loss": 0.0399, "step": 114270 }, { - "epoch": 1.24, - "learning_rate": 0.00011458887663054059, - "loss": 0.034, + "epoch": 0.74, + "learning_rate": 0.00018936148240897912, + "loss": 0.0461, "step": 114280 }, { - "epoch": 1.24, - "learning_rate": 0.00011457265234603154, - "loss": 0.0362, + "epoch": 0.74, + "learning_rate": 0.0001893518010546222, + "loss": 0.049, "step": 114290 }, { - "epoch": 1.24, - "learning_rate": 0.00011455642806152249, - "loss": 0.0289, + "epoch": 0.74, + "learning_rate": 0.00018934211970026525, + "loss": 0.0514, "step": 114300 }, { - "epoch": 1.24, - "learning_rate": 0.00011454020377701342, - "loss": 0.0376, + "epoch": 0.74, + "learning_rate": 0.00018933243834590833, + "loss": 0.0391, "step": 114310 }, { - "epoch": 1.24, - "learning_rate": 0.00011452397949250437, - "loss": 0.0415, + "epoch": 0.74, + "learning_rate": 0.00018932275699155138, + "loss": 0.0509, "step": 114320 }, { - "epoch": 1.24, - "learning_rate": 0.00011450775520799532, - "loss": 0.0322, + "epoch": 0.74, + "learning_rate": 0.00018931307563719443, + "loss": 0.0451, "step": 114330 }, { - "epoch": 1.24, - "learning_rate": 0.00011449153092348627, - "loss": 0.0388, + "epoch": 0.74, + "learning_rate": 0.0001893033942828375, + "loss": 0.0438, "step": 114340 }, { - "epoch": 1.24, - "learning_rate": 0.00011447530663897722, - "loss": 0.0468, + "epoch": 0.74, + "learning_rate": 0.0001892937129284806, + "loss": 0.0445, "step": 114350 }, { - "epoch": 1.24, - "learning_rate": 0.00011445908235446816, - "loss": 0.0276, + "epoch": 0.74, + "learning_rate": 0.00018928403157412367, + "loss": 0.0493, "step": 114360 }, { - "epoch": 1.24, - "learning_rate": 0.00011444285806995911, - "loss": 0.0303, + "epoch": 0.74, + "learning_rate": 0.00018927435021976672, + "loss": 0.0483, "step": 114370 }, { - "epoch": 1.24, - "learning_rate": 0.00011442663378545006, - "loss": 0.0383, + "epoch": 0.74, + "learning_rate": 0.0001892646688654098, + "loss": 0.0398, "step": 114380 }, { - "epoch": 1.24, - "learning_rate": 0.00011441040950094101, - "loss": 0.0322, + "epoch": 0.74, + "learning_rate": 0.00018925498751105286, + "loss": 0.0444, "step": 114390 }, { - "epoch": 1.24, - "learning_rate": 0.00011439418521643194, - "loss": 0.0398, + "epoch": 0.74, + "learning_rate": 0.0001892453061566959, + "loss": 0.0422, "step": 114400 }, { - "epoch": 1.24, - "learning_rate": 0.00011437796093192289, - "loss": 0.0401, + "epoch": 0.74, + "learning_rate": 0.000189235624802339, + "loss": 0.0403, "step": 114410 }, { - "epoch": 1.24, - "learning_rate": 0.00011436173664741384, - "loss": 0.0336, + "epoch": 0.74, + "learning_rate": 0.00018922594344798207, + "loss": 0.0392, "step": 114420 }, { - "epoch": 1.24, - "learning_rate": 0.00011434551236290479, - "loss": 0.035, + "epoch": 0.74, + "learning_rate": 0.00018921626209362515, + "loss": 0.0517, "step": 114430 }, { - "epoch": 1.24, - "learning_rate": 0.00011432928807839574, - "loss": 0.0359, + "epoch": 0.74, + "learning_rate": 0.0001892065807392682, + "loss": 0.045, "step": 114440 }, { - "epoch": 1.24, - "learning_rate": 0.00011431306379388668, - "loss": 0.0326, + "epoch": 0.74, + "learning_rate": 0.00018919689938491128, + "loss": 0.0538, "step": 114450 }, { - "epoch": 1.24, - "learning_rate": 0.00011429683950937763, - "loss": 0.0323, + "epoch": 0.74, + "learning_rate": 0.00018918721803055433, + "loss": 0.0467, "step": 114460 }, { - "epoch": 1.24, - "learning_rate": 0.00011428061522486858, - "loss": 0.0281, + "epoch": 0.74, + "learning_rate": 0.0001891775366761974, + "loss": 0.0509, "step": 114470 }, { - "epoch": 1.24, - "learning_rate": 0.00011426439094035953, - "loss": 0.0355, + "epoch": 0.74, + "learning_rate": 0.00018916785532184047, + "loss": 0.0479, "step": 114480 }, { - "epoch": 1.24, - "learning_rate": 0.00011424816665585046, - "loss": 0.0328, + "epoch": 0.74, + "learning_rate": 0.00018915817396748355, + "loss": 0.0428, "step": 114490 }, { - "epoch": 1.24, - "learning_rate": 0.00011423194237134141, - "loss": 0.037, + "epoch": 0.74, + "learning_rate": 0.0001891484926131266, + "loss": 0.0495, "step": 114500 }, { - "epoch": 1.24, - "learning_rate": 0.00011421571808683236, - "loss": 0.0398, + "epoch": 0.74, + "learning_rate": 0.00018913881125876968, + "loss": 0.0413, "step": 114510 }, { - "epoch": 1.24, - "learning_rate": 0.00011419949380232331, - "loss": 0.0306, + "epoch": 0.74, + "learning_rate": 0.00018912912990441276, + "loss": 0.0413, "step": 114520 }, { - "epoch": 1.24, - "learning_rate": 0.00011418326951781426, - "loss": 0.0368, + "epoch": 0.74, + "learning_rate": 0.00018911944855005578, + "loss": 0.0484, "step": 114530 }, { - "epoch": 1.24, - "learning_rate": 0.0001141670452333052, - "loss": 0.0309, + "epoch": 0.74, + "learning_rate": 0.00018910976719569886, + "loss": 0.0516, "step": 114540 }, { - "epoch": 1.24, - "learning_rate": 0.00011415082094879615, - "loss": 0.0403, + "epoch": 0.74, + "learning_rate": 0.00018910008584134194, + "loss": 0.0468, "step": 114550 }, { - "epoch": 1.24, - "learning_rate": 0.0001141345966642871, - "loss": 0.0322, + "epoch": 0.74, + "learning_rate": 0.00018909040448698502, + "loss": 0.045, "step": 114560 }, { - "epoch": 1.24, - "learning_rate": 0.00011411837237977805, - "loss": 0.0323, + "epoch": 0.74, + "learning_rate": 0.00018908072313262808, + "loss": 0.043, "step": 114570 }, { - "epoch": 1.24, - "learning_rate": 0.00011410214809526898, - "loss": 0.0343, + "epoch": 0.74, + "learning_rate": 0.00018907104177827116, + "loss": 0.0516, "step": 114580 }, { - "epoch": 1.24, - "learning_rate": 0.00011408592381075993, - "loss": 0.0394, + "epoch": 0.74, + "learning_rate": 0.00018906136042391424, + "loss": 0.0496, "step": 114590 }, { - "epoch": 1.24, - "learning_rate": 0.00011406969952625088, - "loss": 0.0409, + "epoch": 0.74, + "learning_rate": 0.00018905167906955726, + "loss": 0.0509, "step": 114600 }, { - "epoch": 1.24, - "learning_rate": 0.00011405347524174183, - "loss": 0.0347, + "epoch": 0.74, + "learning_rate": 0.00018904199771520034, + "loss": 0.046, "step": 114610 }, { - "epoch": 1.24, - "learning_rate": 0.00011403725095723278, - "loss": 0.0263, + "epoch": 0.74, + "learning_rate": 0.00018903231636084342, + "loss": 0.0445, "step": 114620 }, { - "epoch": 1.24, - "learning_rate": 0.00011402102667272372, - "loss": 0.04, + "epoch": 0.74, + "learning_rate": 0.0001890226350064865, + "loss": 0.0404, "step": 114630 }, { - "epoch": 1.24, - "learning_rate": 0.00011400480238821467, - "loss": 0.033, + "epoch": 0.74, + "learning_rate": 0.00018901295365212955, + "loss": 0.0417, "step": 114640 }, { - "epoch": 1.24, - "learning_rate": 0.00011398857810370562, - "loss": 0.0301, + "epoch": 0.74, + "learning_rate": 0.00018900327229777263, + "loss": 0.04, "step": 114650 }, { - "epoch": 1.24, - "learning_rate": 0.00011397235381919657, - "loss": 0.032, + "epoch": 0.74, + "learning_rate": 0.0001889935909434157, + "loss": 0.0488, "step": 114660 }, { - "epoch": 1.24, - "learning_rate": 0.00011395612953468752, - "loss": 0.038, + "epoch": 0.74, + "learning_rate": 0.00018898390958905874, + "loss": 0.0461, "step": 114670 }, { - "epoch": 1.24, - "learning_rate": 0.00011393990525017846, - "loss": 0.0365, + "epoch": 0.74, + "learning_rate": 0.00018897422823470182, + "loss": 0.0481, "step": 114680 }, { - "epoch": 1.24, - "learning_rate": 0.0001139236809656694, - "loss": 0.0323, + "epoch": 0.74, + "learning_rate": 0.0001889645468803449, + "loss": 0.0499, "step": 114690 }, { - "epoch": 1.24, - "learning_rate": 0.00011390745668116036, - "loss": 0.0304, + "epoch": 0.74, + "learning_rate": 0.00018895486552598795, + "loss": 0.0456, "step": 114700 }, { - "epoch": 1.24, - "learning_rate": 0.0001138912323966513, - "loss": 0.0297, + "epoch": 0.74, + "learning_rate": 0.00018894518417163103, + "loss": 0.0498, "step": 114710 }, { - "epoch": 1.24, - "learning_rate": 0.00011387500811214224, - "loss": 0.0402, + "epoch": 0.74, + "learning_rate": 0.0001889355028172741, + "loss": 0.0417, "step": 114720 }, { - "epoch": 1.24, - "learning_rate": 0.00011385878382763319, - "loss": 0.0389, + "epoch": 0.74, + "learning_rate": 0.0001889258214629172, + "loss": 0.0477, "step": 114730 }, { - "epoch": 1.24, - "learning_rate": 0.00011384255954312414, - "loss": 0.0371, + "epoch": 0.74, + "learning_rate": 0.00018891614010856022, + "loss": 0.0527, "step": 114740 }, { - "epoch": 1.24, - "learning_rate": 0.00011382633525861509, - "loss": 0.0347, + "epoch": 0.74, + "learning_rate": 0.0001889064587542033, + "loss": 0.0482, "step": 114750 }, { - "epoch": 1.24, - "learning_rate": 0.00011381011097410604, - "loss": 0.0315, + "epoch": 0.74, + "learning_rate": 0.00018889677739984638, + "loss": 0.0468, "step": 114760 }, { - "epoch": 1.24, - "learning_rate": 0.00011379388668959698, - "loss": 0.0324, + "epoch": 0.74, + "learning_rate": 0.00018888709604548943, + "loss": 0.045, "step": 114770 }, { - "epoch": 1.24, - "learning_rate": 0.00011377766240508793, - "loss": 0.0301, + "epoch": 0.74, + "learning_rate": 0.0001888774146911325, + "loss": 0.0511, "step": 114780 }, { - "epoch": 1.24, - "learning_rate": 0.00011376143812057888, - "loss": 0.0353, + "epoch": 0.74, + "learning_rate": 0.0001888677333367756, + "loss": 0.0407, "step": 114790 }, { - "epoch": 1.24, - "learning_rate": 0.00011374521383606983, - "loss": 0.0382, + "epoch": 0.74, + "learning_rate": 0.00018885805198241867, + "loss": 0.0477, "step": 114800 }, { - "epoch": 1.24, - "learning_rate": 0.00011372898955156076, - "loss": 0.0366, + "epoch": 0.74, + "learning_rate": 0.0001888483706280617, + "loss": 0.0479, "step": 114810 }, { - "epoch": 1.24, - "learning_rate": 0.00011371276526705171, - "loss": 0.0338, + "epoch": 0.74, + "learning_rate": 0.00018883868927370477, + "loss": 0.0411, "step": 114820 }, { - "epoch": 1.24, - "learning_rate": 0.00011369654098254266, - "loss": 0.0384, + "epoch": 0.74, + "learning_rate": 0.00018882900791934785, + "loss": 0.0439, "step": 114830 }, { - "epoch": 1.24, - "learning_rate": 0.00011368031669803361, - "loss": 0.0354, + "epoch": 0.74, + "learning_rate": 0.0001888193265649909, + "loss": 0.0388, "step": 114840 }, { - "epoch": 1.24, - "learning_rate": 0.00011366409241352456, - "loss": 0.0329, + "epoch": 0.74, + "learning_rate": 0.00018880964521063399, + "loss": 0.0457, "step": 114850 }, { - "epoch": 1.24, - "learning_rate": 0.0001136478681290155, - "loss": 0.0373, + "epoch": 0.74, + "learning_rate": 0.00018879996385627707, + "loss": 0.0504, "step": 114860 }, { - "epoch": 1.24, - "learning_rate": 0.00011363164384450645, - "loss": 0.0365, + "epoch": 0.74, + "learning_rate": 0.00018879028250192012, + "loss": 0.0406, "step": 114870 }, { - "epoch": 1.24, - "learning_rate": 0.0001136154195599974, - "loss": 0.0314, + "epoch": 0.74, + "learning_rate": 0.00018878060114756317, + "loss": 0.0495, "step": 114880 }, { - "epoch": 1.24, - "learning_rate": 0.00011359919527548835, - "loss": 0.0282, + "epoch": 0.74, + "learning_rate": 0.00018877091979320625, + "loss": 0.0457, "step": 114890 }, { - "epoch": 1.24, - "learning_rate": 0.00011358297099097928, - "loss": 0.0305, + "epoch": 0.74, + "learning_rate": 0.0001887612384388493, + "loss": 0.0446, "step": 114900 }, { - "epoch": 1.24, - "learning_rate": 0.00011356674670647023, - "loss": 0.0403, + "epoch": 0.74, + "learning_rate": 0.00018875155708449238, + "loss": 0.0382, "step": 114910 }, { - "epoch": 1.24, - "learning_rate": 0.00011355052242196118, - "loss": 0.0348, + "epoch": 0.74, + "learning_rate": 0.00018874187573013546, + "loss": 0.0447, "step": 114920 }, { - "epoch": 1.24, - "learning_rate": 0.00011353429813745213, - "loss": 0.0363, + "epoch": 0.74, + "learning_rate": 0.00018873219437577854, + "loss": 0.0382, "step": 114930 }, { - "epoch": 1.24, - "learning_rate": 0.00011351807385294308, - "loss": 0.0349, + "epoch": 0.74, + "learning_rate": 0.0001887225130214216, + "loss": 0.0511, "step": 114940 }, { - "epoch": 1.24, - "learning_rate": 0.00011350184956843402, - "loss": 0.0363, + "epoch": 0.74, + "learning_rate": 0.00018871283166706465, + "loss": 0.0477, "step": 114950 }, { - "epoch": 1.24, - "learning_rate": 0.00011348562528392497, - "loss": 0.0315, + "epoch": 0.74, + "learning_rate": 0.00018870315031270773, + "loss": 0.0494, "step": 114960 }, { - "epoch": 1.24, - "learning_rate": 0.00011346940099941592, - "loss": 0.033, + "epoch": 0.74, + "learning_rate": 0.00018869346895835078, + "loss": 0.0484, "step": 114970 }, { - "epoch": 1.24, - "learning_rate": 0.00011345317671490687, - "loss": 0.0337, + "epoch": 0.74, + "learning_rate": 0.00018868378760399386, + "loss": 0.0438, "step": 114980 }, { - "epoch": 1.24, - "learning_rate": 0.0001134369524303978, - "loss": 0.0299, + "epoch": 0.74, + "learning_rate": 0.00018867410624963694, + "loss": 0.0483, "step": 114990 }, { - "epoch": 1.24, - "learning_rate": 0.00011342072814588875, - "loss": 0.0389, + "epoch": 0.74, + "learning_rate": 0.00018866442489528002, + "loss": 0.0501, "step": 115000 }, { - "epoch": 1.24, - "eval_cer": 0.9211401895250565, - "eval_loss": 0.026066089048981667, - "eval_runtime": 119.1119, - "eval_samples_per_second": 16.791, - "eval_steps_per_second": 4.198, + "epoch": 0.74, + "eval_cer": 0.9198960569427184, + "eval_loss": 0.02958066016435623, + "eval_runtime": 119.869, + "eval_samples_per_second": 16.685, + "eval_steps_per_second": 4.171, "step": 115000 }, { - "epoch": 1.24, - "learning_rate": 0.0001134045038613797, - "loss": 0.0429, + "epoch": 0.74, + "learning_rate": 0.00018865474354092307, + "loss": 0.0397, "step": 115010 }, { - "epoch": 1.24, - "learning_rate": 0.00011338827957687065, - "loss": 0.0318, + "epoch": 0.74, + "learning_rate": 0.00018864506218656613, + "loss": 0.0429, "step": 115020 }, { - "epoch": 1.24, - "learning_rate": 0.0001133720552923616, - "loss": 0.0331, + "epoch": 0.74, + "learning_rate": 0.0001886353808322092, + "loss": 0.0451, "step": 115030 }, { - "epoch": 1.24, - "learning_rate": 0.00011335583100785254, - "loss": 0.033, + "epoch": 0.74, + "learning_rate": 0.00018862569947785226, + "loss": 0.0384, "step": 115040 }, { - "epoch": 1.24, - "learning_rate": 0.00011333960672334349, - "loss": 0.0359, + "epoch": 0.74, + "learning_rate": 0.00018861601812349534, + "loss": 0.0432, "step": 115050 }, { - "epoch": 1.24, - "learning_rate": 0.00011332338243883444, - "loss": 0.0278, + "epoch": 0.74, + "learning_rate": 0.00018860633676913842, + "loss": 0.0445, "step": 115060 }, { - "epoch": 1.24, - "learning_rate": 0.00011330715815432539, - "loss": 0.035, + "epoch": 0.74, + "learning_rate": 0.00018859665541478147, + "loss": 0.0467, "step": 115070 }, { - "epoch": 1.24, - "learning_rate": 0.00011329093386981632, - "loss": 0.0382, + "epoch": 0.74, + "learning_rate": 0.00018858697406042455, + "loss": 0.04, "step": 115080 }, { - "epoch": 1.24, - "learning_rate": 0.00011327470958530727, - "loss": 0.0308, + "epoch": 0.74, + "learning_rate": 0.0001885772927060676, + "loss": 0.0439, "step": 115090 }, { - "epoch": 1.24, - "learning_rate": 0.00011325848530079822, - "loss": 0.0376, + "epoch": 0.74, + "learning_rate": 0.00018856761135171066, + "loss": 0.0527, "step": 115100 }, { - "epoch": 1.25, - "learning_rate": 0.00011324226101628917, - "loss": 0.0402, + "epoch": 0.74, + "learning_rate": 0.00018855792999735373, + "loss": 0.0473, "step": 115110 }, { - "epoch": 1.25, - "learning_rate": 0.00011322603673178012, - "loss": 0.0353, + "epoch": 0.74, + "learning_rate": 0.00018854824864299681, + "loss": 0.0397, "step": 115120 }, { - "epoch": 1.25, - "learning_rate": 0.00011320981244727106, - "loss": 0.0343, + "epoch": 0.74, + "learning_rate": 0.0001885385672886399, + "loss": 0.0505, "step": 115130 }, { - "epoch": 1.25, - "learning_rate": 0.00011319358816276201, - "loss": 0.0318, + "epoch": 0.74, + "learning_rate": 0.00018852888593428295, + "loss": 0.0391, "step": 115140 }, { - "epoch": 1.25, - "learning_rate": 0.00011317736387825296, - "loss": 0.0319, + "epoch": 0.74, + "learning_rate": 0.00018851920457992603, + "loss": 0.0433, "step": 115150 }, { - "epoch": 1.25, - "learning_rate": 0.00011316113959374391, - "loss": 0.031, + "epoch": 0.74, + "learning_rate": 0.00018850952322556908, + "loss": 0.0507, "step": 115160 }, { - "epoch": 1.25, - "learning_rate": 0.00011314491530923485, - "loss": 0.0394, + "epoch": 0.74, + "learning_rate": 0.00018849984187121213, + "loss": 0.0483, "step": 115170 }, { - "epoch": 1.25, - "learning_rate": 0.0001131286910247258, - "loss": 0.0366, + "epoch": 0.74, + "learning_rate": 0.0001884901605168552, + "loss": 0.0472, "step": 115180 }, { - "epoch": 1.25, - "learning_rate": 0.00011311246674021674, - "loss": 0.0406, + "epoch": 0.74, + "learning_rate": 0.0001884804791624983, + "loss": 0.0446, "step": 115190 }, { - "epoch": 1.25, - "learning_rate": 0.0001130962424557077, - "loss": 0.0358, + "epoch": 0.74, + "learning_rate": 0.00018847079780814137, + "loss": 0.0463, "step": 115200 }, { - "epoch": 1.25, - "learning_rate": 0.00011308001817119864, - "loss": 0.0355, + "epoch": 0.74, + "learning_rate": 0.00018846111645378442, + "loss": 0.0422, "step": 115210 }, { - "epoch": 1.25, - "learning_rate": 0.00011306379388668958, - "loss": 0.0396, + "epoch": 0.74, + "learning_rate": 0.0001884514350994275, + "loss": 0.0499, "step": 115220 }, { - "epoch": 1.25, - "learning_rate": 0.00011304756960218053, - "loss": 0.0311, + "epoch": 0.74, + "learning_rate": 0.00018844175374507056, + "loss": 0.0483, "step": 115230 }, { - "epoch": 1.25, - "learning_rate": 0.00011303134531767148, - "loss": 0.0418, + "epoch": 0.74, + "learning_rate": 0.0001884320723907136, + "loss": 0.0414, "step": 115240 }, { - "epoch": 1.25, - "learning_rate": 0.00011301512103316243, - "loss": 0.0328, + "epoch": 0.74, + "learning_rate": 0.0001884223910363567, + "loss": 0.0419, "step": 115250 }, { - "epoch": 1.25, - "learning_rate": 0.00011299889674865337, - "loss": 0.0365, + "epoch": 0.74, + "learning_rate": 0.00018841270968199977, + "loss": 0.0492, "step": 115260 }, { - "epoch": 1.25, - "learning_rate": 0.00011298267246414432, - "loss": 0.0331, + "epoch": 0.74, + "learning_rate": 0.00018840302832764282, + "loss": 0.0414, "step": 115270 }, { - "epoch": 1.25, - "learning_rate": 0.00011296644817963527, - "loss": 0.0387, + "epoch": 0.74, + "learning_rate": 0.0001883933469732859, + "loss": 0.048, "step": 115280 }, { - "epoch": 1.25, - "learning_rate": 0.00011295022389512622, - "loss": 0.0342, + "epoch": 0.74, + "learning_rate": 0.00018838366561892898, + "loss": 0.04, "step": 115290 }, { - "epoch": 1.25, - "learning_rate": 0.00011293399961061717, - "loss": 0.0344, + "epoch": 0.74, + "learning_rate": 0.000188373984264572, + "loss": 0.0416, "step": 115300 }, { - "epoch": 1.25, - "learning_rate": 0.0001129177753261081, - "loss": 0.0332, + "epoch": 0.74, + "learning_rate": 0.0001883643029102151, + "loss": 0.0432, "step": 115310 }, { - "epoch": 1.25, - "learning_rate": 0.00011290155104159905, - "loss": 0.0312, + "epoch": 0.74, + "learning_rate": 0.00018835462155585817, + "loss": 0.0421, "step": 115320 }, { - "epoch": 1.25, - "learning_rate": 0.00011288532675709, - "loss": 0.0344, + "epoch": 0.74, + "learning_rate": 0.00018834494020150125, + "loss": 0.0477, "step": 115330 }, { - "epoch": 1.25, - "learning_rate": 0.00011286910247258095, - "loss": 0.0333, + "epoch": 0.74, + "learning_rate": 0.0001883352588471443, + "loss": 0.0457, "step": 115340 }, { - "epoch": 1.25, - "learning_rate": 0.00011285287818807189, - "loss": 0.0322, + "epoch": 0.74, + "learning_rate": 0.00018832557749278738, + "loss": 0.046, "step": 115350 }, { - "epoch": 1.25, - "learning_rate": 0.00011283665390356284, - "loss": 0.0366, + "epoch": 0.74, + "learning_rate": 0.00018831589613843046, + "loss": 0.0444, "step": 115360 }, { - "epoch": 1.25, - "learning_rate": 0.00011282042961905379, - "loss": 0.0294, + "epoch": 0.74, + "learning_rate": 0.00018830621478407348, + "loss": 0.0462, "step": 115370 }, { - "epoch": 1.25, - "learning_rate": 0.00011280420533454474, - "loss": 0.0301, + "epoch": 0.74, + "learning_rate": 0.00018829653342971656, + "loss": 0.0431, "step": 115380 }, { - "epoch": 1.25, - "learning_rate": 0.00011278798105003569, - "loss": 0.034, + "epoch": 0.74, + "learning_rate": 0.00018828685207535964, + "loss": 0.0475, "step": 115390 }, { - "epoch": 1.25, - "learning_rate": 0.00011277175676552662, - "loss": 0.0318, + "epoch": 0.74, + "learning_rate": 0.00018827717072100272, + "loss": 0.0464, "step": 115400 }, { - "epoch": 1.25, - "learning_rate": 0.00011275553248101757, - "loss": 0.0333, + "epoch": 0.74, + "learning_rate": 0.00018826748936664578, + "loss": 0.0423, "step": 115410 }, { - "epoch": 1.25, - "learning_rate": 0.00011273930819650852, - "loss": 0.0348, + "epoch": 0.74, + "learning_rate": 0.00018825780801228886, + "loss": 0.0482, "step": 115420 }, { - "epoch": 1.25, - "learning_rate": 0.00011272308391199947, - "loss": 0.0305, + "epoch": 0.75, + "learning_rate": 0.00018824812665793194, + "loss": 0.0393, "step": 115430 }, { - "epoch": 1.25, - "learning_rate": 0.00011270685962749042, - "loss": 0.0328, + "epoch": 0.75, + "learning_rate": 0.00018823844530357496, + "loss": 0.0445, "step": 115440 }, { - "epoch": 1.25, - "learning_rate": 0.00011269063534298136, - "loss": 0.0337, + "epoch": 0.75, + "learning_rate": 0.00018822876394921804, + "loss": 0.0425, "step": 115450 }, { - "epoch": 1.25, - "learning_rate": 0.00011267441105847231, - "loss": 0.04, + "epoch": 0.75, + "learning_rate": 0.00018821908259486112, + "loss": 0.0476, "step": 115460 }, { - "epoch": 1.25, - "learning_rate": 0.00011265818677396326, - "loss": 0.0367, + "epoch": 0.75, + "learning_rate": 0.0001882094012405042, + "loss": 0.0526, "step": 115470 }, { - "epoch": 1.25, - "learning_rate": 0.0001126419624894542, - "loss": 0.0319, + "epoch": 0.75, + "learning_rate": 0.00018819971988614725, + "loss": 0.0416, "step": 115480 }, { - "epoch": 1.25, - "learning_rate": 0.00011262573820494514, - "loss": 0.0306, + "epoch": 0.75, + "learning_rate": 0.00018819003853179033, + "loss": 0.0514, "step": 115490 }, { - "epoch": 1.25, - "learning_rate": 0.00011260951392043609, - "loss": 0.0349, + "epoch": 0.75, + "learning_rate": 0.0001881803571774334, + "loss": 0.0465, "step": 115500 }, { - "epoch": 1.25, - "learning_rate": 0.00011259328963592704, - "loss": 0.0294, + "epoch": 0.75, + "learning_rate": 0.00018817067582307644, + "loss": 0.045, "step": 115510 }, { - "epoch": 1.25, - "learning_rate": 0.00011257706535141799, - "loss": 0.0379, + "epoch": 0.75, + "learning_rate": 0.00018816099446871952, + "loss": 0.0482, "step": 115520 }, { - "epoch": 1.25, - "learning_rate": 0.00011256084106690894, - "loss": 0.033, + "epoch": 0.75, + "learning_rate": 0.0001881513131143626, + "loss": 0.0514, "step": 115530 }, { - "epoch": 1.25, - "learning_rate": 0.00011254461678239988, - "loss": 0.0342, + "epoch": 0.75, + "learning_rate": 0.00018814163176000565, + "loss": 0.0459, "step": 115540 }, { - "epoch": 1.25, - "learning_rate": 0.00011252839249789083, - "loss": 0.0346, + "epoch": 0.75, + "learning_rate": 0.00018813195040564873, + "loss": 0.0449, "step": 115550 }, { - "epoch": 1.25, - "learning_rate": 0.00011251216821338178, - "loss": 0.0319, + "epoch": 0.75, + "learning_rate": 0.0001881222690512918, + "loss": 0.043, "step": 115560 }, { - "epoch": 1.25, - "learning_rate": 0.00011249594392887273, - "loss": 0.0339, + "epoch": 0.75, + "learning_rate": 0.0001881125876969349, + "loss": 0.046, "step": 115570 }, { - "epoch": 1.25, - "learning_rate": 0.00011247971964436366, - "loss": 0.0265, + "epoch": 0.75, + "learning_rate": 0.00018810290634257792, + "loss": 0.0459, "step": 115580 }, { - "epoch": 1.25, - "learning_rate": 0.00011246349535985461, - "loss": 0.0346, + "epoch": 0.75, + "learning_rate": 0.000188093224988221, + "loss": 0.0473, "step": 115590 }, { - "epoch": 1.25, - "learning_rate": 0.00011244727107534556, - "loss": 0.0306, + "epoch": 0.75, + "learning_rate": 0.00018808354363386408, + "loss": 0.0404, "step": 115600 }, { - "epoch": 1.25, - "learning_rate": 0.00011243104679083651, - "loss": 0.0283, + "epoch": 0.75, + "learning_rate": 0.00018807386227950713, + "loss": 0.0473, "step": 115610 }, { - "epoch": 1.25, - "learning_rate": 0.00011241482250632746, - "loss": 0.0275, + "epoch": 0.75, + "learning_rate": 0.0001880641809251502, + "loss": 0.0466, "step": 115620 }, { - "epoch": 1.25, - "learning_rate": 0.0001123985982218184, - "loss": 0.0333, + "epoch": 0.75, + "learning_rate": 0.0001880544995707933, + "loss": 0.0427, "step": 115630 }, { - "epoch": 1.25, - "learning_rate": 0.00011238237393730935, - "loss": 0.0263, + "epoch": 0.75, + "learning_rate": 0.00018804481821643637, + "loss": 0.0524, "step": 115640 }, { - "epoch": 1.25, - "learning_rate": 0.0001123661496528003, - "loss": 0.0319, + "epoch": 0.75, + "learning_rate": 0.0001880351368620794, + "loss": 0.0413, "step": 115650 }, { - "epoch": 1.25, - "learning_rate": 0.00011234992536829125, - "loss": 0.0436, + "epoch": 0.75, + "learning_rate": 0.00018802545550772247, + "loss": 0.0413, "step": 115660 }, { - "epoch": 1.25, - "learning_rate": 0.00011233370108378218, - "loss": 0.0332, + "epoch": 0.75, + "learning_rate": 0.00018801577415336555, + "loss": 0.0433, "step": 115670 }, { - "epoch": 1.25, - "learning_rate": 0.00011231747679927313, - "loss": 0.0404, + "epoch": 0.75, + "learning_rate": 0.0001880060927990086, + "loss": 0.0379, "step": 115680 }, { - "epoch": 1.25, - "learning_rate": 0.00011230125251476408, - "loss": 0.0223, + "epoch": 0.75, + "learning_rate": 0.00018799641144465169, + "loss": 0.0432, "step": 115690 }, { - "epoch": 1.25, - "learning_rate": 0.00011228502823025503, - "loss": 0.035, + "epoch": 0.75, + "learning_rate": 0.00018798673009029477, + "loss": 0.0468, "step": 115700 }, { - "epoch": 1.25, - "learning_rate": 0.00011226880394574598, - "loss": 0.0329, + "epoch": 0.75, + "learning_rate": 0.00018797704873593782, + "loss": 0.0406, "step": 115710 }, { - "epoch": 1.25, - "learning_rate": 0.00011225257966123692, - "loss": 0.032, + "epoch": 0.75, + "learning_rate": 0.00018796736738158087, + "loss": 0.0444, "step": 115720 }, { - "epoch": 1.25, - "learning_rate": 0.00011223635537672787, - "loss": 0.0339, + "epoch": 0.75, + "learning_rate": 0.00018795768602722395, + "loss": 0.0411, "step": 115730 }, { - "epoch": 1.25, - "learning_rate": 0.00011222013109221882, - "loss": 0.0344, + "epoch": 0.75, + "learning_rate": 0.000187948004672867, + "loss": 0.0423, "step": 115740 }, { - "epoch": 1.25, - "learning_rate": 0.00011220390680770977, - "loss": 0.0333, + "epoch": 0.75, + "learning_rate": 0.00018793832331851008, + "loss": 0.0471, "step": 115750 }, { - "epoch": 1.25, - "learning_rate": 0.0001121876825232007, - "loss": 0.0285, + "epoch": 0.75, + "learning_rate": 0.00018792864196415316, + "loss": 0.0498, "step": 115760 }, { - "epoch": 1.25, - "learning_rate": 0.00011217145823869166, - "loss": 0.0313, + "epoch": 0.75, + "learning_rate": 0.00018791896060979624, + "loss": 0.0404, "step": 115770 }, { - "epoch": 1.25, - "learning_rate": 0.0001121552339541826, - "loss": 0.0351, + "epoch": 0.75, + "learning_rate": 0.0001879092792554393, + "loss": 0.0396, "step": 115780 }, { - "epoch": 1.25, - "learning_rate": 0.00011213900966967355, - "loss": 0.0304, + "epoch": 0.75, + "learning_rate": 0.00018789959790108235, + "loss": 0.0469, "step": 115790 }, { - "epoch": 1.25, - "learning_rate": 0.0001121227853851645, - "loss": 0.0368, + "epoch": 0.75, + "learning_rate": 0.00018788991654672543, + "loss": 0.0474, "step": 115800 }, { - "epoch": 1.25, - "learning_rate": 0.00011210656110065544, - "loss": 0.0335, + "epoch": 0.75, + "learning_rate": 0.00018788023519236848, + "loss": 0.0468, "step": 115810 }, { - "epoch": 1.25, - "learning_rate": 0.00011209033681614639, - "loss": 0.036, + "epoch": 0.75, + "learning_rate": 0.00018787055383801156, + "loss": 0.0456, "step": 115820 }, { - "epoch": 1.25, - "learning_rate": 0.00011207411253163734, - "loss": 0.0329, + "epoch": 0.75, + "learning_rate": 0.00018786087248365464, + "loss": 0.0463, "step": 115830 }, { - "epoch": 1.25, - "learning_rate": 0.00011205788824712829, - "loss": 0.0313, + "epoch": 0.75, + "learning_rate": 0.00018785119112929772, + "loss": 0.0398, "step": 115840 }, { - "epoch": 1.25, - "learning_rate": 0.00011204166396261923, - "loss": 0.0305, + "epoch": 0.75, + "learning_rate": 0.00018784150977494077, + "loss": 0.0417, "step": 115850 }, { - "epoch": 1.25, - "learning_rate": 0.00011202543967811018, - "loss": 0.0368, + "epoch": 0.75, + "learning_rate": 0.00018783182842058382, + "loss": 0.0508, "step": 115860 }, { - "epoch": 1.25, - "learning_rate": 0.00011200921539360113, - "loss": 0.0401, + "epoch": 0.75, + "learning_rate": 0.0001878221470662269, + "loss": 0.0364, "step": 115870 }, { - "epoch": 1.25, - "learning_rate": 0.00011199299110909208, - "loss": 0.0367, + "epoch": 0.75, + "learning_rate": 0.00018781246571186996, + "loss": 0.0465, "step": 115880 }, { - "epoch": 1.25, - "learning_rate": 0.00011197676682458303, - "loss": 0.035, + "epoch": 0.75, + "learning_rate": 0.00018780278435751304, + "loss": 0.0414, "step": 115890 }, { - "epoch": 1.25, - "learning_rate": 0.00011196054254007396, - "loss": 0.0332, + "epoch": 0.75, + "learning_rate": 0.00018779310300315612, + "loss": 0.0414, "step": 115900 }, { - "epoch": 1.25, - "learning_rate": 0.00011194431825556491, - "loss": 0.0304, + "epoch": 0.75, + "learning_rate": 0.00018778342164879917, + "loss": 0.042, "step": 115910 }, { - "epoch": 1.25, - "learning_rate": 0.00011192809397105586, - "loss": 0.0335, + "epoch": 0.75, + "learning_rate": 0.00018777374029444225, + "loss": 0.0505, "step": 115920 }, { - "epoch": 1.25, - "learning_rate": 0.00011191186968654681, - "loss": 0.0333, + "epoch": 0.75, + "learning_rate": 0.0001877640589400853, + "loss": 0.0379, "step": 115930 }, { - "epoch": 1.25, - "learning_rate": 0.00011189564540203775, - "loss": 0.0355, + "epoch": 0.75, + "learning_rate": 0.00018775437758572835, + "loss": 0.038, "step": 115940 }, { - "epoch": 1.25, - "learning_rate": 0.0001118794211175287, - "loss": 0.0325, + "epoch": 0.75, + "learning_rate": 0.00018774469623137143, + "loss": 0.0413, "step": 115950 }, { - "epoch": 1.25, - "learning_rate": 0.00011186319683301965, - "loss": 0.0351, + "epoch": 0.75, + "learning_rate": 0.00018773501487701451, + "loss": 0.04, "step": 115960 }, { - "epoch": 1.25, - "learning_rate": 0.0001118469725485106, - "loss": 0.0308, + "epoch": 0.75, + "learning_rate": 0.0001877253335226576, + "loss": 0.0433, "step": 115970 }, { - "epoch": 1.25, - "learning_rate": 0.00011183074826400155, - "loss": 0.0336, + "epoch": 0.75, + "learning_rate": 0.00018771565216830065, + "loss": 0.0449, "step": 115980 }, { - "epoch": 1.25, - "learning_rate": 0.00011181452397949248, - "loss": 0.0391, + "epoch": 0.75, + "learning_rate": 0.00018770597081394373, + "loss": 0.0453, "step": 115990 }, { - "epoch": 1.25, - "learning_rate": 0.00011179829969498343, - "loss": 0.0381, + "epoch": 0.75, + "learning_rate": 0.00018769628945958678, + "loss": 0.0387, "step": 116000 }, { - "epoch": 1.25, - "eval_cer": 0.9211375390720941, - "eval_loss": 0.026518533006310463, - "eval_runtime": 118.8239, - "eval_samples_per_second": 16.832, - "eval_steps_per_second": 4.208, + "epoch": 0.75, + "eval_cer": 0.9199774036831997, + "eval_loss": 0.029281143099069595, + "eval_runtime": 119.7604, + "eval_samples_per_second": 16.7, + "eval_steps_per_second": 4.175, "step": 116000 }, { - "epoch": 1.25, - "learning_rate": 0.00011178207541047438, - "loss": 0.0311, + "epoch": 0.75, + "learning_rate": 0.00018768660810522983, + "loss": 0.0402, "step": 116010 }, { - "epoch": 1.25, - "learning_rate": 0.00011176585112596533, - "loss": 0.0339, + "epoch": 0.75, + "learning_rate": 0.0001876769267508729, + "loss": 0.045, "step": 116020 }, { - "epoch": 1.25, - "learning_rate": 0.00011174962684145627, - "loss": 0.0396, + "epoch": 0.75, + "learning_rate": 0.000187667245396516, + "loss": 0.0432, "step": 116030 }, { - "epoch": 1.26, - "learning_rate": 0.00011173340255694722, - "loss": 0.0334, + "epoch": 0.75, + "learning_rate": 0.00018765756404215907, + "loss": 0.0524, "step": 116040 }, { - "epoch": 1.26, - "learning_rate": 0.00011171717827243817, - "loss": 0.0428, + "epoch": 0.75, + "learning_rate": 0.00018764788268780212, + "loss": 0.0421, "step": 116050 }, { - "epoch": 1.26, - "learning_rate": 0.00011170095398792912, - "loss": 0.036, + "epoch": 0.75, + "learning_rate": 0.0001876382013334452, + "loss": 0.0395, "step": 116060 }, { - "epoch": 1.26, - "learning_rate": 0.00011168472970342007, - "loss": 0.0355, + "epoch": 0.75, + "learning_rate": 0.00018762851997908826, + "loss": 0.052, "step": 116070 }, { - "epoch": 1.26, - "learning_rate": 0.000111668505418911, - "loss": 0.0341, + "epoch": 0.75, + "learning_rate": 0.0001876188386247313, + "loss": 0.0378, "step": 116080 }, { - "epoch": 1.26, - "learning_rate": 0.00011165228113440195, - "loss": 0.0305, + "epoch": 0.75, + "learning_rate": 0.0001876091572703744, + "loss": 0.0413, "step": 116090 }, { - "epoch": 1.26, - "learning_rate": 0.0001116360568498929, - "loss": 0.0352, + "epoch": 0.75, + "learning_rate": 0.00018759947591601747, + "loss": 0.0499, "step": 116100 }, { - "epoch": 1.26, - "learning_rate": 0.00011161983256538385, - "loss": 0.037, + "epoch": 0.75, + "learning_rate": 0.00018758979456166052, + "loss": 0.0428, "step": 116110 }, { - "epoch": 1.26, - "learning_rate": 0.00011160360828087479, - "loss": 0.0325, + "epoch": 0.75, + "learning_rate": 0.0001875801132073036, + "loss": 0.044, "step": 116120 }, { - "epoch": 1.26, - "learning_rate": 0.00011158738399636574, - "loss": 0.0357, + "epoch": 0.75, + "learning_rate": 0.00018757043185294668, + "loss": 0.0529, "step": 116130 }, { - "epoch": 1.26, - "learning_rate": 0.00011157115971185669, - "loss": 0.0433, + "epoch": 0.75, + "learning_rate": 0.0001875607504985897, + "loss": 0.0461, "step": 116140 }, { - "epoch": 1.26, - "learning_rate": 0.00011155493542734764, - "loss": 0.0337, + "epoch": 0.75, + "learning_rate": 0.0001875510691442328, + "loss": 0.0361, "step": 116150 }, { - "epoch": 1.26, - "learning_rate": 0.0001115387111428386, - "loss": 0.0374, + "epoch": 0.75, + "learning_rate": 0.00018754138778987587, + "loss": 0.0396, "step": 116160 }, { - "epoch": 1.26, - "learning_rate": 0.00011152248685832955, - "loss": 0.0284, + "epoch": 0.75, + "learning_rate": 0.00018753170643551895, + "loss": 0.0433, "step": 116170 }, { - "epoch": 1.26, - "learning_rate": 0.00011150626257382049, - "loss": 0.0326, + "epoch": 0.75, + "learning_rate": 0.000187522025081162, + "loss": 0.0437, "step": 116180 }, { - "epoch": 1.26, - "learning_rate": 0.00011149003828931144, - "loss": 0.0395, + "epoch": 0.75, + "learning_rate": 0.00018751234372680508, + "loss": 0.0519, "step": 116190 }, { - "epoch": 1.26, - "learning_rate": 0.00011147381400480239, - "loss": 0.0353, + "epoch": 0.75, + "learning_rate": 0.00018750266237244816, + "loss": 0.0477, "step": 116200 }, { - "epoch": 1.26, - "learning_rate": 0.00011145758972029334, - "loss": 0.0321, + "epoch": 0.75, + "learning_rate": 0.00018749298101809118, + "loss": 0.0389, "step": 116210 }, { - "epoch": 1.26, - "learning_rate": 0.00011144136543578429, - "loss": 0.0299, + "epoch": 0.75, + "learning_rate": 0.00018748329966373426, + "loss": 0.048, "step": 116220 }, { - "epoch": 1.26, - "learning_rate": 0.00011142514115127522, - "loss": 0.0296, + "epoch": 0.75, + "learning_rate": 0.00018747361830937734, + "loss": 0.0411, "step": 116230 }, { - "epoch": 1.26, - "learning_rate": 0.00011140891686676617, - "loss": 0.0385, + "epoch": 0.75, + "learning_rate": 0.00018746393695502042, + "loss": 0.049, "step": 116240 }, { - "epoch": 1.26, - "learning_rate": 0.00011139269258225712, - "loss": 0.0321, + "epoch": 0.75, + "learning_rate": 0.00018745425560066348, + "loss": 0.0421, "step": 116250 }, { - "epoch": 1.26, - "learning_rate": 0.00011137646829774807, - "loss": 0.0341, + "epoch": 0.75, + "learning_rate": 0.00018744457424630656, + "loss": 0.0441, "step": 116260 }, { - "epoch": 1.26, - "learning_rate": 0.00011136024401323901, - "loss": 0.0365, + "epoch": 0.75, + "learning_rate": 0.00018743489289194964, + "loss": 0.043, "step": 116270 }, { - "epoch": 1.26, - "learning_rate": 0.00011134401972872996, - "loss": 0.0305, + "epoch": 0.75, + "learning_rate": 0.00018742521153759266, + "loss": 0.0435, "step": 116280 }, { - "epoch": 1.26, - "learning_rate": 0.00011132779544422091, - "loss": 0.0351, + "epoch": 0.75, + "learning_rate": 0.00018741553018323574, + "loss": 0.0413, "step": 116290 }, { - "epoch": 1.26, - "learning_rate": 0.00011131157115971186, - "loss": 0.0279, + "epoch": 0.75, + "learning_rate": 0.00018740584882887882, + "loss": 0.0423, "step": 116300 }, { - "epoch": 1.26, - "learning_rate": 0.00011129534687520281, - "loss": 0.0325, + "epoch": 0.75, + "learning_rate": 0.00018739616747452187, + "loss": 0.0456, "step": 116310 }, { - "epoch": 1.26, - "learning_rate": 0.00011127912259069374, - "loss": 0.0322, + "epoch": 0.75, + "learning_rate": 0.00018738648612016495, + "loss": 0.0456, "step": 116320 }, { - "epoch": 1.26, - "learning_rate": 0.0001112628983061847, - "loss": 0.0327, + "epoch": 0.75, + "learning_rate": 0.00018737680476580803, + "loss": 0.0479, "step": 116330 }, { - "epoch": 1.26, - "learning_rate": 0.00011124667402167564, - "loss": 0.032, + "epoch": 0.75, + "learning_rate": 0.0001873671234114511, + "loss": 0.0504, "step": 116340 }, { - "epoch": 1.26, - "learning_rate": 0.00011123044973716659, - "loss": 0.027, + "epoch": 0.75, + "learning_rate": 0.00018735744205709414, + "loss": 0.0391, "step": 116350 }, { - "epoch": 1.26, - "learning_rate": 0.00011121422545265753, - "loss": 0.0326, + "epoch": 0.75, + "learning_rate": 0.00018734776070273722, + "loss": 0.0438, "step": 116360 }, { - "epoch": 1.26, - "learning_rate": 0.00011119800116814848, - "loss": 0.0384, + "epoch": 0.75, + "learning_rate": 0.0001873380793483803, + "loss": 0.0468, "step": 116370 }, { - "epoch": 1.26, - "learning_rate": 0.00011118177688363943, - "loss": 0.032, + "epoch": 0.75, + "learning_rate": 0.00018732839799402335, + "loss": 0.0447, "step": 116380 }, { - "epoch": 1.26, - "learning_rate": 0.00011116555259913038, - "loss": 0.035, + "epoch": 0.75, + "learning_rate": 0.00018731871663966643, + "loss": 0.0428, "step": 116390 }, { - "epoch": 1.26, - "learning_rate": 0.00011114932831462133, - "loss": 0.0368, + "epoch": 0.75, + "learning_rate": 0.0001873090352853095, + "loss": 0.0439, "step": 116400 }, { - "epoch": 1.26, - "learning_rate": 0.00011113310403011226, - "loss": 0.0321, + "epoch": 0.75, + "learning_rate": 0.0001872993539309526, + "loss": 0.0468, "step": 116410 }, { - "epoch": 1.26, - "learning_rate": 0.00011111687974560321, - "loss": 0.0329, + "epoch": 0.75, + "learning_rate": 0.00018728967257659562, + "loss": 0.0399, "step": 116420 }, { - "epoch": 1.26, - "learning_rate": 0.00011110065546109416, - "loss": 0.0334, + "epoch": 0.75, + "learning_rate": 0.0001872799912222387, + "loss": 0.0414, "step": 116430 }, { - "epoch": 1.26, - "learning_rate": 0.00011108443117658511, - "loss": 0.043, - "step": 116440 + "epoch": 0.75, + "learning_rate": 0.00018727030986788178, + "loss": 0.0476, + "step": 116440 }, { - "epoch": 1.26, - "learning_rate": 0.00011106820689207605, - "loss": 0.0293, + "epoch": 0.75, + "learning_rate": 0.00018726062851352483, + "loss": 0.0436, "step": 116450 }, { - "epoch": 1.26, - "learning_rate": 0.000111051982607567, - "loss": 0.0383, + "epoch": 0.75, + "learning_rate": 0.0001872509471591679, + "loss": 0.0384, "step": 116460 }, { - "epoch": 1.26, - "learning_rate": 0.00011103575832305795, - "loss": 0.0365, + "epoch": 0.75, + "learning_rate": 0.000187241265804811, + "loss": 0.0354, "step": 116470 }, { - "epoch": 1.26, - "learning_rate": 0.0001110195340385489, - "loss": 0.0337, + "epoch": 0.75, + "learning_rate": 0.00018723158445045404, + "loss": 0.0459, "step": 116480 }, { - "epoch": 1.26, - "learning_rate": 0.00011100330975403985, - "loss": 0.0323, + "epoch": 0.75, + "learning_rate": 0.0001872219030960971, + "loss": 0.046, "step": 116490 }, { - "epoch": 1.26, - "learning_rate": 0.00011098708546953079, - "loss": 0.0416, + "epoch": 0.75, + "learning_rate": 0.00018721222174174017, + "loss": 0.0444, "step": 116500 }, { - "epoch": 1.26, - "learning_rate": 0.00011097086118502173, - "loss": 0.0293, + "epoch": 0.75, + "learning_rate": 0.00018720254038738323, + "loss": 0.0393, "step": 116510 }, { - "epoch": 1.26, - "learning_rate": 0.00011095463690051268, - "loss": 0.0257, + "epoch": 0.75, + "learning_rate": 0.0001871928590330263, + "loss": 0.0445, "step": 116520 }, { - "epoch": 1.26, - "learning_rate": 0.00011093841261600363, - "loss": 0.0459, + "epoch": 0.75, + "learning_rate": 0.00018718317767866938, + "loss": 0.0433, "step": 116530 }, { - "epoch": 1.26, - "learning_rate": 0.00011092218833149457, - "loss": 0.0261, + "epoch": 0.75, + "learning_rate": 0.00018717349632431246, + "loss": 0.042, "step": 116540 }, { - "epoch": 1.26, - "learning_rate": 0.00011090596404698552, - "loss": 0.0338, + "epoch": 0.75, + "learning_rate": 0.00018716381496995552, + "loss": 0.0393, "step": 116550 }, { - "epoch": 1.26, - "learning_rate": 0.00011088973976247647, - "loss": 0.0363, + "epoch": 0.75, + "learning_rate": 0.00018715413361559857, + "loss": 0.0366, "step": 116560 }, { - "epoch": 1.26, - "learning_rate": 0.00011087351547796742, - "loss": 0.0304, + "epoch": 0.75, + "learning_rate": 0.00018714445226124165, + "loss": 0.0467, "step": 116570 }, { - "epoch": 1.26, - "learning_rate": 0.00011085729119345837, - "loss": 0.0356, + "epoch": 0.75, + "learning_rate": 0.0001871347709068847, + "loss": 0.0381, "step": 116580 }, { - "epoch": 1.26, - "learning_rate": 0.0001108410669089493, - "loss": 0.0354, + "epoch": 0.75, + "learning_rate": 0.00018712508955252778, + "loss": 0.0444, "step": 116590 }, { - "epoch": 1.26, - "learning_rate": 0.00011082484262444026, - "loss": 0.0344, + "epoch": 0.75, + "learning_rate": 0.00018711540819817086, + "loss": 0.0478, "step": 116600 }, { - "epoch": 1.26, - "learning_rate": 0.0001108086183399312, - "loss": 0.0318, + "epoch": 0.75, + "learning_rate": 0.00018710572684381394, + "loss": 0.0406, "step": 116610 }, { - "epoch": 1.26, - "learning_rate": 0.00011079239405542216, - "loss": 0.035, + "epoch": 0.75, + "learning_rate": 0.000187096045489457, + "loss": 0.0491, "step": 116620 }, { - "epoch": 1.26, - "learning_rate": 0.00011077616977091309, - "loss": 0.0313, + "epoch": 0.75, + "learning_rate": 0.00018708636413510005, + "loss": 0.0446, "step": 116630 }, { - "epoch": 1.26, - "learning_rate": 0.00011075994548640404, - "loss": 0.0335, + "epoch": 0.75, + "learning_rate": 0.00018707668278074313, + "loss": 0.037, "step": 116640 }, { - "epoch": 1.26, - "learning_rate": 0.00011074372120189499, - "loss": 0.0325, + "epoch": 0.75, + "learning_rate": 0.00018706700142638618, + "loss": 0.0441, "step": 116650 }, { - "epoch": 1.26, - "learning_rate": 0.00011072749691738594, - "loss": 0.0377, + "epoch": 0.75, + "learning_rate": 0.00018705732007202926, + "loss": 0.0381, "step": 116660 }, { - "epoch": 1.26, - "learning_rate": 0.00011071127263287689, - "loss": 0.0278, + "epoch": 0.75, + "learning_rate": 0.00018704763871767234, + "loss": 0.0453, "step": 116670 }, { - "epoch": 1.26, - "learning_rate": 0.00011069504834836783, - "loss": 0.039, + "epoch": 0.75, + "learning_rate": 0.0001870379573633154, + "loss": 0.0459, "step": 116680 }, { - "epoch": 1.26, - "learning_rate": 0.00011067882406385878, - "loss": 0.0342, + "epoch": 0.75, + "learning_rate": 0.00018702827600895847, + "loss": 0.0397, "step": 116690 }, { - "epoch": 1.26, - "learning_rate": 0.00011066259977934973, - "loss": 0.0277, + "epoch": 0.75, + "learning_rate": 0.00018701859465460152, + "loss": 0.0481, "step": 116700 }, { - "epoch": 1.26, - "learning_rate": 0.00011064637549484068, - "loss": 0.044, + "epoch": 0.75, + "learning_rate": 0.00018700891330024458, + "loss": 0.0413, "step": 116710 }, { - "epoch": 1.26, - "learning_rate": 0.00011063015121033161, - "loss": 0.0321, + "epoch": 0.75, + "learning_rate": 0.00018699923194588766, + "loss": 0.0415, "step": 116720 }, { - "epoch": 1.26, - "learning_rate": 0.00011061392692582256, - "loss": 0.0276, + "epoch": 0.75, + "learning_rate": 0.00018698955059153074, + "loss": 0.0406, "step": 116730 }, { - "epoch": 1.26, - "learning_rate": 0.00011059770264131351, - "loss": 0.0352, + "epoch": 0.75, + "learning_rate": 0.00018697986923717382, + "loss": 0.0417, "step": 116740 }, { - "epoch": 1.26, - "learning_rate": 0.00011058147835680446, - "loss": 0.0352, + "epoch": 0.75, + "learning_rate": 0.00018697018788281687, + "loss": 0.041, "step": 116750 }, { - "epoch": 1.26, - "learning_rate": 0.00011056525407229541, - "loss": 0.034, + "epoch": 0.75, + "learning_rate": 0.00018696050652845995, + "loss": 0.042, "step": 116760 }, { - "epoch": 1.26, - "learning_rate": 0.00011054902978778635, - "loss": 0.036, + "epoch": 0.75, + "learning_rate": 0.000186950825174103, + "loss": 0.0483, "step": 116770 }, { - "epoch": 1.26, - "learning_rate": 0.0001105328055032773, - "loss": 0.0323, + "epoch": 0.75, + "learning_rate": 0.00018694114381974605, + "loss": 0.046, "step": 116780 }, { - "epoch": 1.26, - "learning_rate": 0.00011051658121876825, - "loss": 0.0373, + "epoch": 0.75, + "learning_rate": 0.00018693146246538913, + "loss": 0.0394, "step": 116790 }, { - "epoch": 1.26, - "learning_rate": 0.0001105003569342592, - "loss": 0.0435, + "epoch": 0.75, + "learning_rate": 0.00018692178111103221, + "loss": 0.0408, "step": 116800 }, { - "epoch": 1.26, - "learning_rate": 0.00011048413264975015, - "loss": 0.0356, + "epoch": 0.75, + "learning_rate": 0.0001869120997566753, + "loss": 0.0405, "step": 116810 }, { - "epoch": 1.26, - "learning_rate": 0.00011046790836524108, - "loss": 0.0279, + "epoch": 0.75, + "learning_rate": 0.00018690241840231835, + "loss": 0.0521, "step": 116820 }, { - "epoch": 1.26, - "learning_rate": 0.00011045168408073203, - "loss": 0.0354, + "epoch": 0.75, + "learning_rate": 0.00018689273704796143, + "loss": 0.0416, "step": 116830 }, { - "epoch": 1.26, - "learning_rate": 0.00011043545979622298, - "loss": 0.0343, + "epoch": 0.75, + "learning_rate": 0.00018688305569360448, + "loss": 0.0521, "step": 116840 }, { - "epoch": 1.26, - "learning_rate": 0.00011041923551171393, - "loss": 0.0352, + "epoch": 0.75, + "learning_rate": 0.00018687337433924753, + "loss": 0.0496, "step": 116850 }, { - "epoch": 1.26, - "learning_rate": 0.00011040301122720487, - "loss": 0.0307, + "epoch": 0.75, + "learning_rate": 0.0001868636929848906, + "loss": 0.0513, "step": 116860 }, { - "epoch": 1.26, - "learning_rate": 0.00011038678694269582, - "loss": 0.0304, + "epoch": 0.75, + "learning_rate": 0.0001868540116305337, + "loss": 0.0521, "step": 116870 }, { - "epoch": 1.26, - "learning_rate": 0.00011037056265818677, - "loss": 0.0307, + "epoch": 0.75, + "learning_rate": 0.00018684433027617674, + "loss": 0.0493, "step": 116880 }, { - "epoch": 1.26, - "learning_rate": 0.00011035433837367772, - "loss": 0.0308, + "epoch": 0.75, + "learning_rate": 0.00018683464892181982, + "loss": 0.041, "step": 116890 }, { - "epoch": 1.26, - "learning_rate": 0.00011033811408916867, - "loss": 0.0301, + "epoch": 0.75, + "learning_rate": 0.0001868249675674629, + "loss": 0.048, "step": 116900 }, { - "epoch": 1.26, - "learning_rate": 0.0001103218898046596, - "loss": 0.0322, + "epoch": 0.75, + "learning_rate": 0.00018681528621310593, + "loss": 0.0402, "step": 116910 }, { - "epoch": 1.26, - "learning_rate": 0.00011030566552015055, - "loss": 0.0308, + "epoch": 0.75, + "learning_rate": 0.000186805604858749, + "loss": 0.0411, "step": 116920 }, { - "epoch": 1.26, - "learning_rate": 0.0001102894412356415, - "loss": 0.0348, + "epoch": 0.75, + "learning_rate": 0.0001867959235043921, + "loss": 0.0395, "step": 116930 }, { - "epoch": 1.26, - "learning_rate": 0.00011027321695113245, - "loss": 0.0337, + "epoch": 0.75, + "learning_rate": 0.00018678624215003517, + "loss": 0.0436, "step": 116940 }, { - "epoch": 1.26, - "learning_rate": 0.00011025699266662339, - "loss": 0.0338, + "epoch": 0.75, + "learning_rate": 0.00018677656079567822, + "loss": 0.0396, "step": 116950 }, { - "epoch": 1.27, - "learning_rate": 0.00011024076838211434, - "loss": 0.032, + "epoch": 0.75, + "learning_rate": 0.0001867668794413213, + "loss": 0.0487, "step": 116960 }, { - "epoch": 1.27, - "learning_rate": 0.00011022454409760529, - "loss": 0.0256, + "epoch": 0.75, + "learning_rate": 0.00018675719808696438, + "loss": 0.0385, "step": 116970 }, { - "epoch": 1.27, - "learning_rate": 0.00011020831981309624, - "loss": 0.0341, + "epoch": 0.76, + "learning_rate": 0.0001867475167326074, + "loss": 0.0423, "step": 116980 }, { - "epoch": 1.27, - "learning_rate": 0.00011019209552858719, - "loss": 0.0365, + "epoch": 0.76, + "learning_rate": 0.00018673783537825049, + "loss": 0.0463, "step": 116990 }, { - "epoch": 1.27, - "learning_rate": 0.00011017587124407812, - "loss": 0.0324, + "epoch": 0.76, + "learning_rate": 0.00018672815402389357, + "loss": 0.0384, "step": 117000 }, { - "epoch": 1.27, - "eval_cer": 0.9211075006051868, - "eval_loss": 0.02649548277258873, - "eval_runtime": 118.8709, - "eval_samples_per_second": 16.825, - "eval_steps_per_second": 4.206, + "epoch": 0.76, + "eval_cer": 0.9199240763755507, + "eval_loss": 0.02930784970521927, + "eval_runtime": 120.0533, + "eval_samples_per_second": 16.659, + "eval_steps_per_second": 4.165, "step": 117000 }, { - "epoch": 1.27, - "learning_rate": 0.00011015964695956907, - "loss": 0.0276, + "epoch": 0.76, + "learning_rate": 0.00018671847266953665, + "loss": 0.0382, "step": 117010 }, { - "epoch": 1.27, - "learning_rate": 0.00011014342267506002, - "loss": 0.0311, + "epoch": 0.76, + "learning_rate": 0.0001867087913151797, + "loss": 0.0464, "step": 117020 }, { - "epoch": 1.27, - "learning_rate": 0.00011012719839055097, - "loss": 0.0284, + "epoch": 0.76, + "learning_rate": 0.00018669910996082278, + "loss": 0.0417, "step": 117030 }, { - "epoch": 1.27, - "learning_rate": 0.00011011097410604191, - "loss": 0.0347, + "epoch": 0.76, + "learning_rate": 0.00018668942860646586, + "loss": 0.0434, "step": 117040 }, { - "epoch": 1.27, - "learning_rate": 0.00011009474982153286, - "loss": 0.0273, + "epoch": 0.76, + "learning_rate": 0.00018667974725210888, + "loss": 0.0404, "step": 117050 }, { - "epoch": 1.27, - "learning_rate": 0.00011007852553702381, - "loss": 0.0315, + "epoch": 0.76, + "learning_rate": 0.00018667006589775196, + "loss": 0.0386, "step": 117060 }, { - "epoch": 1.27, - "learning_rate": 0.00011006230125251476, - "loss": 0.0338, + "epoch": 0.76, + "learning_rate": 0.00018666038454339504, + "loss": 0.0434, "step": 117070 }, { - "epoch": 1.27, - "learning_rate": 0.00011004607696800571, - "loss": 0.039, + "epoch": 0.76, + "learning_rate": 0.0001866507031890381, + "loss": 0.043, "step": 117080 }, { - "epoch": 1.27, - "learning_rate": 0.00011002985268349665, - "loss": 0.0353, + "epoch": 0.76, + "learning_rate": 0.00018664102183468118, + "loss": 0.0431, "step": 117090 }, { - "epoch": 1.27, - "learning_rate": 0.0001100136283989876, - "loss": 0.0294, + "epoch": 0.76, + "learning_rate": 0.00018663134048032426, + "loss": 0.0397, "step": 117100 }, { - "epoch": 1.27, - "learning_rate": 0.00010999740411447855, - "loss": 0.0352, + "epoch": 0.76, + "learning_rate": 0.00018662165912596734, + "loss": 0.0447, "step": 117110 }, { - "epoch": 1.27, - "learning_rate": 0.0001099811798299695, - "loss": 0.0362, + "epoch": 0.76, + "learning_rate": 0.00018661197777161036, + "loss": 0.0444, "step": 117120 }, { - "epoch": 1.27, - "learning_rate": 0.00010996495554546043, - "loss": 0.0315, + "epoch": 0.76, + "learning_rate": 0.00018660229641725344, + "loss": 0.0466, "step": 117130 }, { - "epoch": 1.27, - "learning_rate": 0.00010994873126095138, - "loss": 0.0349, + "epoch": 0.76, + "learning_rate": 0.00018659261506289652, + "loss": 0.0473, "step": 117140 }, { - "epoch": 1.27, - "learning_rate": 0.00010993250697644233, - "loss": 0.032, + "epoch": 0.76, + "learning_rate": 0.00018658293370853957, + "loss": 0.0521, "step": 117150 }, { - "epoch": 1.27, - "learning_rate": 0.00010991628269193328, - "loss": 0.0317, + "epoch": 0.76, + "learning_rate": 0.00018657325235418265, + "loss": 0.0432, "step": 117160 }, { - "epoch": 1.27, - "learning_rate": 0.00010990005840742423, - "loss": 0.0312, + "epoch": 0.76, + "learning_rate": 0.00018656357099982573, + "loss": 0.0385, "step": 117170 }, { - "epoch": 1.27, - "learning_rate": 0.00010988383412291517, - "loss": 0.0348, + "epoch": 0.76, + "learning_rate": 0.0001865538896454688, + "loss": 0.0412, "step": 117180 }, { - "epoch": 1.27, - "learning_rate": 0.00010986760983840612, - "loss": 0.0327, + "epoch": 0.76, + "learning_rate": 0.00018654420829111184, + "loss": 0.0438, "step": 117190 }, { - "epoch": 1.27, - "learning_rate": 0.00010985138555389707, - "loss": 0.0294, + "epoch": 0.76, + "learning_rate": 0.00018653452693675492, + "loss": 0.0441, "step": 117200 }, { - "epoch": 1.27, - "learning_rate": 0.00010983516126938802, - "loss": 0.0313, + "epoch": 0.76, + "learning_rate": 0.000186524845582398, + "loss": 0.0477, "step": 117210 }, { - "epoch": 1.27, - "learning_rate": 0.00010981893698487895, - "loss": 0.032, + "epoch": 0.76, + "learning_rate": 0.00018651516422804105, + "loss": 0.0519, "step": 117220 }, { - "epoch": 1.27, - "learning_rate": 0.0001098027127003699, - "loss": 0.0331, + "epoch": 0.76, + "learning_rate": 0.00018650548287368413, + "loss": 0.0382, "step": 117230 }, { - "epoch": 1.27, - "learning_rate": 0.00010978648841586085, - "loss": 0.0293, + "epoch": 0.76, + "learning_rate": 0.0001864958015193272, + "loss": 0.0411, "step": 117240 }, { - "epoch": 1.27, - "learning_rate": 0.0001097702641313518, - "loss": 0.0307, + "epoch": 0.76, + "learning_rate": 0.0001864861201649703, + "loss": 0.0424, "step": 117250 }, { - "epoch": 1.27, - "learning_rate": 0.00010975403984684275, - "loss": 0.0341, + "epoch": 0.76, + "learning_rate": 0.00018647643881061332, + "loss": 0.046, "step": 117260 }, { - "epoch": 1.27, - "learning_rate": 0.00010973781556233369, - "loss": 0.0312, + "epoch": 0.76, + "learning_rate": 0.0001864667574562564, + "loss": 0.0488, "step": 117270 }, { - "epoch": 1.27, - "learning_rate": 0.00010972159127782464, - "loss": 0.0307, + "epoch": 0.76, + "learning_rate": 0.00018645707610189945, + "loss": 0.0421, "step": 117280 }, { - "epoch": 1.27, - "learning_rate": 0.00010970536699331559, - "loss": 0.0328, + "epoch": 0.76, + "learning_rate": 0.00018644739474754253, + "loss": 0.0431, "step": 117290 }, { - "epoch": 1.27, - "learning_rate": 0.00010968914270880654, - "loss": 0.0306, + "epoch": 0.76, + "learning_rate": 0.0001864377133931856, + "loss": 0.0444, "step": 117300 }, { - "epoch": 1.27, - "learning_rate": 0.00010967291842429747, - "loss": 0.0313, + "epoch": 0.76, + "learning_rate": 0.0001864280320388287, + "loss": 0.0451, "step": 117310 }, { - "epoch": 1.27, - "learning_rate": 0.00010965669413978842, - "loss": 0.0345, + "epoch": 0.76, + "learning_rate": 0.00018641835068447174, + "loss": 0.0473, "step": 117320 }, { - "epoch": 1.27, - "learning_rate": 0.00010964046985527937, - "loss": 0.0304, + "epoch": 0.76, + "learning_rate": 0.0001864086693301148, + "loss": 0.0425, "step": 117330 }, { - "epoch": 1.27, - "learning_rate": 0.00010962424557077032, - "loss": 0.0339, + "epoch": 0.76, + "learning_rate": 0.00018639898797575787, + "loss": 0.0415, "step": 117340 }, { - "epoch": 1.27, - "learning_rate": 0.00010960802128626127, - "loss": 0.0366, + "epoch": 0.76, + "learning_rate": 0.00018638930662140092, + "loss": 0.0433, "step": 117350 }, { - "epoch": 1.27, - "learning_rate": 0.00010959179700175221, - "loss": 0.0335, + "epoch": 0.76, + "learning_rate": 0.000186379625267044, + "loss": 0.0424, "step": 117360 }, { - "epoch": 1.27, - "learning_rate": 0.00010957557271724316, - "loss": 0.0288, + "epoch": 0.76, + "learning_rate": 0.00018636994391268708, + "loss": 0.0372, "step": 117370 }, { - "epoch": 1.27, - "learning_rate": 0.00010955934843273411, - "loss": 0.0379, + "epoch": 0.76, + "learning_rate": 0.00018636026255833016, + "loss": 0.0391, "step": 117380 }, { - "epoch": 1.27, - "learning_rate": 0.00010954312414822506, - "loss": 0.033, + "epoch": 0.76, + "learning_rate": 0.00018635058120397322, + "loss": 0.0411, "step": 117390 }, { - "epoch": 1.27, - "learning_rate": 0.000109526899863716, - "loss": 0.0312, + "epoch": 0.76, + "learning_rate": 0.00018634089984961627, + "loss": 0.0462, "step": 117400 }, { - "epoch": 1.27, - "learning_rate": 0.00010951067557920694, - "loss": 0.0288, + "epoch": 0.76, + "learning_rate": 0.00018633121849525935, + "loss": 0.0426, "step": 117410 }, { - "epoch": 1.27, - "learning_rate": 0.00010949445129469789, - "loss": 0.0341, + "epoch": 0.76, + "learning_rate": 0.0001863215371409024, + "loss": 0.0452, "step": 117420 }, { - "epoch": 1.27, - "learning_rate": 0.00010947822701018884, - "loss": 0.0277, + "epoch": 0.76, + "learning_rate": 0.00018631185578654548, + "loss": 0.051, "step": 117430 }, { - "epoch": 1.27, - "learning_rate": 0.00010946200272567979, - "loss": 0.0358, + "epoch": 0.76, + "learning_rate": 0.00018630217443218856, + "loss": 0.0562, "step": 117440 }, { - "epoch": 1.27, - "learning_rate": 0.00010944577844117073, - "loss": 0.0325, + "epoch": 0.76, + "learning_rate": 0.00018629249307783164, + "loss": 0.0427, "step": 117450 }, { - "epoch": 1.27, - "learning_rate": 0.00010942955415666168, - "loss": 0.0365, + "epoch": 0.76, + "learning_rate": 0.0001862828117234747, + "loss": 0.044, "step": 117460 }, { - "epoch": 1.27, - "learning_rate": 0.00010941332987215263, - "loss": 0.0338, + "epoch": 0.76, + "learning_rate": 0.00018627313036911775, + "loss": 0.044, "step": 117470 }, { - "epoch": 1.27, - "learning_rate": 0.00010939710558764358, - "loss": 0.031, + "epoch": 0.76, + "learning_rate": 0.0001862634490147608, + "loss": 0.0383, "step": 117480 }, { - "epoch": 1.27, - "learning_rate": 0.00010938088130313451, - "loss": 0.0313, + "epoch": 0.76, + "learning_rate": 0.00018625376766040388, + "loss": 0.0543, "step": 117490 }, { - "epoch": 1.27, - "learning_rate": 0.00010936465701862546, - "loss": 0.0357, + "epoch": 0.76, + "learning_rate": 0.00018624408630604696, + "loss": 0.0384, "step": 117500 }, { - "epoch": 1.27, - "learning_rate": 0.00010934843273411641, - "loss": 0.0282, + "epoch": 0.76, + "learning_rate": 0.00018623440495169004, + "loss": 0.046, "step": 117510 }, { - "epoch": 1.27, - "learning_rate": 0.00010933220844960736, - "loss": 0.0336, + "epoch": 0.76, + "learning_rate": 0.0001862247235973331, + "loss": 0.0426, "step": 117520 }, { - "epoch": 1.27, - "learning_rate": 0.00010931598416509831, - "loss": 0.031, + "epoch": 0.76, + "learning_rate": 0.00018621504224297617, + "loss": 0.0499, "step": 117530 }, { - "epoch": 1.27, - "learning_rate": 0.00010929975988058925, - "loss": 0.0334, + "epoch": 0.76, + "learning_rate": 0.00018620536088861922, + "loss": 0.0437, "step": 117540 }, { - "epoch": 1.27, - "learning_rate": 0.0001092835355960802, - "loss": 0.0396, + "epoch": 0.76, + "learning_rate": 0.00018619567953426228, + "loss": 0.0583, "step": 117550 }, { - "epoch": 1.27, - "learning_rate": 0.00010926731131157115, - "loss": 0.0344, + "epoch": 0.76, + "learning_rate": 0.00018618599817990536, + "loss": 0.0443, "step": 117560 }, { - "epoch": 1.27, - "learning_rate": 0.0001092510870270621, - "loss": 0.0294, + "epoch": 0.76, + "learning_rate": 0.00018617631682554844, + "loss": 0.045, "step": 117570 }, { - "epoch": 1.27, - "learning_rate": 0.00010923486274255305, - "loss": 0.0314, + "epoch": 0.76, + "learning_rate": 0.00018616663547119152, + "loss": 0.0378, "step": 117580 }, { - "epoch": 1.27, - "learning_rate": 0.00010921863845804398, - "loss": 0.033, + "epoch": 0.76, + "learning_rate": 0.00018615695411683457, + "loss": 0.0478, "step": 117590 }, { - "epoch": 1.27, - "learning_rate": 0.00010920241417353493, - "loss": 0.0339, + "epoch": 0.76, + "learning_rate": 0.00018614727276247765, + "loss": 0.0473, "step": 117600 }, { - "epoch": 1.27, - "learning_rate": 0.00010918618988902588, - "loss": 0.0318, + "epoch": 0.76, + "learning_rate": 0.0001861375914081207, + "loss": 0.0443, "step": 117610 }, { - "epoch": 1.27, - "learning_rate": 0.00010916996560451683, - "loss": 0.0345, + "epoch": 0.76, + "learning_rate": 0.00018612791005376375, + "loss": 0.0472, "step": 117620 }, { - "epoch": 1.27, - "learning_rate": 0.00010915374132000777, - "loss": 0.0325, + "epoch": 0.76, + "learning_rate": 0.00018611822869940683, + "loss": 0.0409, "step": 117630 }, { - "epoch": 1.27, - "learning_rate": 0.00010913751703549872, - "loss": 0.032, + "epoch": 0.76, + "learning_rate": 0.00018610854734504991, + "loss": 0.0441, "step": 117640 }, { - "epoch": 1.27, - "learning_rate": 0.00010912129275098967, - "loss": 0.029, + "epoch": 0.76, + "learning_rate": 0.000186098865990693, + "loss": 0.0395, "step": 117650 }, { - "epoch": 1.27, - "learning_rate": 0.00010910506846648062, - "loss": 0.0327, + "epoch": 0.76, + "learning_rate": 0.00018608918463633605, + "loss": 0.0418, "step": 117660 }, { - "epoch": 1.27, - "learning_rate": 0.00010908884418197157, - "loss": 0.0351, + "epoch": 0.76, + "learning_rate": 0.00018607950328197913, + "loss": 0.0422, "step": 117670 }, { - "epoch": 1.27, - "learning_rate": 0.0001090726198974625, - "loss": 0.0285, + "epoch": 0.76, + "learning_rate": 0.00018606982192762215, + "loss": 0.0488, "step": 117680 }, { - "epoch": 1.27, - "learning_rate": 0.00010905639561295346, - "loss": 0.034, + "epoch": 0.76, + "learning_rate": 0.00018606014057326523, + "loss": 0.0452, "step": 117690 }, { - "epoch": 1.27, - "learning_rate": 0.0001090401713284444, - "loss": 0.034, + "epoch": 0.76, + "learning_rate": 0.0001860504592189083, + "loss": 0.0408, "step": 117700 }, { - "epoch": 1.27, - "learning_rate": 0.00010902394704393536, - "loss": 0.0376, - "step": 117710 + "epoch": 0.76, + "learning_rate": 0.0001860407778645514, + "loss": 0.0354, + "step": 117710 }, { - "epoch": 1.27, - "learning_rate": 0.00010900772275942629, - "loss": 0.0376, + "epoch": 0.76, + "learning_rate": 0.00018603109651019444, + "loss": 0.0531, "step": 117720 }, { - "epoch": 1.27, - "learning_rate": 0.00010899149847491724, - "loss": 0.0298, + "epoch": 0.76, + "learning_rate": 0.00018602141515583752, + "loss": 0.0456, "step": 117730 }, { - "epoch": 1.27, - "learning_rate": 0.00010897527419040819, - "loss": 0.0285, + "epoch": 0.76, + "learning_rate": 0.0001860117338014806, + "loss": 0.0456, "step": 117740 }, { - "epoch": 1.27, - "learning_rate": 0.00010895904990589914, - "loss": 0.0299, + "epoch": 0.76, + "learning_rate": 0.00018600205244712363, + "loss": 0.042, "step": 117750 }, { - "epoch": 1.27, - "learning_rate": 0.00010894282562139009, - "loss": 0.0355, + "epoch": 0.76, + "learning_rate": 0.0001859923710927667, + "loss": 0.0388, "step": 117760 }, { - "epoch": 1.27, - "learning_rate": 0.00010892660133688103, - "loss": 0.0325, + "epoch": 0.76, + "learning_rate": 0.0001859826897384098, + "loss": 0.0413, "step": 117770 }, { - "epoch": 1.27, - "learning_rate": 0.00010891037705237198, - "loss": 0.0325, + "epoch": 0.76, + "learning_rate": 0.00018597300838405287, + "loss": 0.0447, "step": 117780 }, { - "epoch": 1.27, - "learning_rate": 0.00010889415276786293, - "loss": 0.0316, + "epoch": 0.76, + "learning_rate": 0.00018596332702969592, + "loss": 0.041, "step": 117790 }, { - "epoch": 1.27, - "learning_rate": 0.00010887792848335388, - "loss": 0.0314, + "epoch": 0.76, + "learning_rate": 0.000185953645675339, + "loss": 0.0432, "step": 117800 }, { - "epoch": 1.27, - "learning_rate": 0.00010886170419884481, - "loss": 0.0302, + "epoch": 0.76, + "learning_rate": 0.00018594396432098208, + "loss": 0.0474, "step": 117810 }, { - "epoch": 1.27, - "learning_rate": 0.00010884547991433576, - "loss": 0.039, + "epoch": 0.76, + "learning_rate": 0.0001859342829666251, + "loss": 0.0431, "step": 117820 }, { - "epoch": 1.27, - "learning_rate": 0.00010882925562982671, - "loss": 0.0353, + "epoch": 0.76, + "learning_rate": 0.00018592460161226819, + "loss": 0.0608, "step": 117830 }, { - "epoch": 1.27, - "learning_rate": 0.00010881303134531766, - "loss": 0.0368, + "epoch": 0.76, + "learning_rate": 0.00018591492025791127, + "loss": 0.0547, "step": 117840 }, { - "epoch": 1.27, - "learning_rate": 0.00010879680706080861, - "loss": 0.0281, + "epoch": 0.76, + "learning_rate": 0.00018590523890355435, + "loss": 0.0451, "step": 117850 }, { - "epoch": 1.27, - "learning_rate": 0.00010878058277629955, - "loss": 0.0337, + "epoch": 0.76, + "learning_rate": 0.0001858955575491974, + "loss": 0.0447, "step": 117860 }, { - "epoch": 1.27, - "learning_rate": 0.0001087643584917905, - "loss": 0.0337, + "epoch": 0.76, + "learning_rate": 0.00018588587619484048, + "loss": 0.038, "step": 117870 }, { - "epoch": 1.27, - "learning_rate": 0.00010874813420728145, - "loss": 0.0294, + "epoch": 0.76, + "learning_rate": 0.00018587619484048356, + "loss": 0.0479, "step": 117880 }, { - "epoch": 1.28, - "learning_rate": 0.0001087319099227724, - "loss": 0.0406, + "epoch": 0.76, + "learning_rate": 0.00018586651348612658, + "loss": 0.0391, "step": 117890 }, { - "epoch": 1.28, - "learning_rate": 0.00010871568563826333, - "loss": 0.0319, + "epoch": 0.76, + "learning_rate": 0.00018585683213176966, + "loss": 0.0398, "step": 117900 }, { - "epoch": 1.28, - "learning_rate": 0.00010869946135375428, - "loss": 0.0343, + "epoch": 0.76, + "learning_rate": 0.00018584715077741274, + "loss": 0.0389, "step": 117910 }, { - "epoch": 1.28, - "learning_rate": 0.00010868323706924523, - "loss": 0.0316, + "epoch": 0.76, + "learning_rate": 0.0001858374694230558, + "loss": 0.0533, "step": 117920 }, { - "epoch": 1.28, - "learning_rate": 0.00010866701278473618, - "loss": 0.0317, + "epoch": 0.76, + "learning_rate": 0.00018582778806869888, + "loss": 0.0398, "step": 117930 }, { - "epoch": 1.28, - "learning_rate": 0.00010865078850022713, - "loss": 0.035, + "epoch": 0.76, + "learning_rate": 0.00018581810671434195, + "loss": 0.0422, "step": 117940 }, { - "epoch": 1.28, - "learning_rate": 0.00010863456421571807, - "loss": 0.0361, + "epoch": 0.76, + "learning_rate": 0.00018580842535998503, + "loss": 0.0522, "step": 117950 }, { - "epoch": 1.28, - "learning_rate": 0.00010861833993120902, - "loss": 0.0328, + "epoch": 0.76, + "learning_rate": 0.00018579874400562806, + "loss": 0.0393, "step": 117960 }, { - "epoch": 1.28, - "learning_rate": 0.00010860211564669997, - "loss": 0.0307, + "epoch": 0.76, + "learning_rate": 0.00018578906265127114, + "loss": 0.0408, "step": 117970 }, { - "epoch": 1.28, - "learning_rate": 0.00010858589136219092, - "loss": 0.0271, + "epoch": 0.76, + "learning_rate": 0.00018577938129691422, + "loss": 0.0437, "step": 117980 }, { - "epoch": 1.28, - "learning_rate": 0.00010856966707768185, - "loss": 0.0357, + "epoch": 0.76, + "learning_rate": 0.00018576969994255727, + "loss": 0.0415, "step": 117990 }, { - "epoch": 1.28, - "learning_rate": 0.0001085534427931728, - "loss": 0.0345, + "epoch": 0.76, + "learning_rate": 0.00018576001858820035, + "loss": 0.0492, "step": 118000 }, { - "epoch": 1.28, - "eval_cer": 0.9211940820686255, - "eval_loss": 0.025967586785554886, - "eval_runtime": 118.9614, - "eval_samples_per_second": 16.812, - "eval_steps_per_second": 4.203, + "epoch": 0.76, + "eval_cer": 0.9199322110495989, + "eval_loss": 0.029090311378240585, + "eval_runtime": 119.8047, + "eval_samples_per_second": 16.694, + "eval_steps_per_second": 4.173, "step": 118000 }, { - "epoch": 1.28, - "learning_rate": 0.00010853721850866375, - "loss": 0.0308, + "epoch": 0.76, + "learning_rate": 0.00018575033723384343, + "loss": 0.0435, "step": 118010 }, { - "epoch": 1.28, - "learning_rate": 0.0001085209942241547, - "loss": 0.0317, + "epoch": 0.76, + "learning_rate": 0.0001857406558794865, + "loss": 0.0426, "step": 118020 }, { - "epoch": 1.28, - "learning_rate": 0.00010850476993964565, - "loss": 0.0336, + "epoch": 0.76, + "learning_rate": 0.00018573097452512954, + "loss": 0.0415, "step": 118030 }, { - "epoch": 1.28, - "learning_rate": 0.00010848854565513659, - "loss": 0.0374, + "epoch": 0.76, + "learning_rate": 0.00018572129317077262, + "loss": 0.0477, "step": 118040 }, { - "epoch": 1.28, - "learning_rate": 0.00010847232137062754, - "loss": 0.0366, + "epoch": 0.76, + "learning_rate": 0.0001857116118164157, + "loss": 0.0418, "step": 118050 }, { - "epoch": 1.28, - "learning_rate": 0.00010845609708611849, - "loss": 0.032, + "epoch": 0.76, + "learning_rate": 0.00018570193046205875, + "loss": 0.0453, "step": 118060 }, { - "epoch": 1.28, - "learning_rate": 0.00010843987280160944, - "loss": 0.0337, + "epoch": 0.76, + "learning_rate": 0.00018569224910770183, + "loss": 0.046, "step": 118070 }, { - "epoch": 1.28, - "learning_rate": 0.00010842364851710037, + "epoch": 0.76, + "learning_rate": 0.0001856825677533449, "loss": 0.0414, "step": 118080 }, { - "epoch": 1.28, - "learning_rate": 0.00010840742423259132, - "loss": 0.0363, + "epoch": 0.76, + "learning_rate": 0.00018567288639898796, + "loss": 0.0435, "step": 118090 }, { - "epoch": 1.28, - "learning_rate": 0.00010839119994808227, - "loss": 0.0324, + "epoch": 0.76, + "learning_rate": 0.00018566320504463101, + "loss": 0.0465, "step": 118100 }, { - "epoch": 1.28, - "learning_rate": 0.00010837497566357322, - "loss": 0.033, + "epoch": 0.76, + "learning_rate": 0.0001856535236902741, + "loss": 0.0512, "step": 118110 }, { - "epoch": 1.28, - "learning_rate": 0.00010835875137906417, - "loss": 0.0316, + "epoch": 0.76, + "learning_rate": 0.00018564384233591715, + "loss": 0.0528, "step": 118120 }, { - "epoch": 1.28, - "learning_rate": 0.00010834252709455511, - "loss": 0.0437, + "epoch": 0.76, + "learning_rate": 0.00018563416098156023, + "loss": 0.0521, "step": 118130 }, { - "epoch": 1.28, - "learning_rate": 0.00010832630281004606, - "loss": 0.0301, + "epoch": 0.76, + "learning_rate": 0.0001856244796272033, + "loss": 0.0455, "step": 118140 }, { - "epoch": 1.28, - "learning_rate": 0.00010831007852553701, - "loss": 0.0415, + "epoch": 0.76, + "learning_rate": 0.0001856147982728464, + "loss": 0.041, "step": 118150 }, { - "epoch": 1.28, - "learning_rate": 0.00010829385424102796, - "loss": 0.0319, + "epoch": 0.76, + "learning_rate": 0.00018560511691848944, + "loss": 0.044, "step": 118160 }, { - "epoch": 1.28, - "learning_rate": 0.0001082776299565189, - "loss": 0.0304, + "epoch": 0.76, + "learning_rate": 0.0001855954355641325, + "loss": 0.0421, "step": 118170 }, { - "epoch": 1.28, - "learning_rate": 0.00010826140567200985, - "loss": 0.045, + "epoch": 0.76, + "learning_rate": 0.00018558575420977557, + "loss": 0.0497, "step": 118180 }, { - "epoch": 1.28, - "learning_rate": 0.0001082451813875008, - "loss": 0.031, + "epoch": 0.76, + "learning_rate": 0.00018557607285541862, + "loss": 0.0517, "step": 118190 }, { - "epoch": 1.28, - "learning_rate": 0.00010822895710299174, - "loss": 0.0333, + "epoch": 0.76, + "learning_rate": 0.0001855663915010617, + "loss": 0.0433, "step": 118200 }, { - "epoch": 1.28, - "learning_rate": 0.0001082127328184827, - "loss": 0.0316, + "epoch": 0.76, + "learning_rate": 0.00018555671014670478, + "loss": 0.0603, "step": 118210 }, { - "epoch": 1.28, - "learning_rate": 0.00010819650853397363, - "loss": 0.03, + "epoch": 0.76, + "learning_rate": 0.00018554702879234786, + "loss": 0.0479, "step": 118220 }, { - "epoch": 1.28, - "learning_rate": 0.00010818028424946458, - "loss": 0.0374, + "epoch": 0.76, + "learning_rate": 0.00018553734743799092, + "loss": 0.0471, "step": 118230 }, { - "epoch": 1.28, - "learning_rate": 0.00010816405996495553, - "loss": 0.038, + "epoch": 0.76, + "learning_rate": 0.00018552766608363397, + "loss": 0.054, "step": 118240 }, { - "epoch": 1.28, - "learning_rate": 0.00010814783568044648, - "loss": 0.0331, + "epoch": 0.76, + "learning_rate": 0.00018551798472927705, + "loss": 0.045, "step": 118250 }, { - "epoch": 1.28, - "learning_rate": 0.00010813161139593742, - "loss": 0.0296, + "epoch": 0.76, + "learning_rate": 0.0001855083033749201, + "loss": 0.0401, "step": 118260 }, { - "epoch": 1.28, - "learning_rate": 0.00010811538711142837, - "loss": 0.0305, + "epoch": 0.76, + "learning_rate": 0.00018549862202056318, + "loss": 0.0431, "step": 118270 }, { - "epoch": 1.28, - "learning_rate": 0.00010809916282691932, - "loss": 0.0309, + "epoch": 0.76, + "learning_rate": 0.00018548894066620626, + "loss": 0.0488, "step": 118280 }, { - "epoch": 1.28, - "learning_rate": 0.00010808293854241027, - "loss": 0.0295, + "epoch": 0.76, + "learning_rate": 0.00018547925931184931, + "loss": 0.0384, "step": 118290 }, { - "epoch": 1.28, - "learning_rate": 0.00010806671425790122, - "loss": 0.0352, + "epoch": 0.76, + "learning_rate": 0.0001854695779574924, + "loss": 0.0424, "step": 118300 }, { - "epoch": 1.28, - "learning_rate": 0.00010805048997339215, - "loss": 0.0303, + "epoch": 0.76, + "learning_rate": 0.00018545989660313545, + "loss": 0.04, "step": 118310 }, { - "epoch": 1.28, - "learning_rate": 0.0001080342656888831, - "loss": 0.029, + "epoch": 0.76, + "learning_rate": 0.0001854502152487785, + "loss": 0.0378, "step": 118320 }, { - "epoch": 1.28, - "learning_rate": 0.00010801804140437405, - "loss": 0.0317, + "epoch": 0.76, + "learning_rate": 0.00018544053389442158, + "loss": 0.0416, "step": 118330 }, { - "epoch": 1.28, - "learning_rate": 0.000108001817119865, - "loss": 0.0294, + "epoch": 0.76, + "learning_rate": 0.00018543085254006466, + "loss": 0.043, "step": 118340 }, { - "epoch": 1.28, - "learning_rate": 0.00010798559283535595, - "loss": 0.0333, + "epoch": 0.76, + "learning_rate": 0.00018542117118570774, + "loss": 0.0455, "step": 118350 }, { - "epoch": 1.28, - "learning_rate": 0.00010796936855084689, - "loss": 0.0298, + "epoch": 0.76, + "learning_rate": 0.0001854114898313508, + "loss": 0.0387, "step": 118360 }, { - "epoch": 1.28, - "learning_rate": 0.00010795314426633784, - "loss": 0.0256, + "epoch": 0.76, + "learning_rate": 0.00018540180847699387, + "loss": 0.0437, "step": 118370 }, { - "epoch": 1.28, - "learning_rate": 0.00010793691998182879, - "loss": 0.0295, + "epoch": 0.76, + "learning_rate": 0.00018539212712263692, + "loss": 0.0407, "step": 118380 }, { - "epoch": 1.28, - "learning_rate": 0.00010792069569731974, - "loss": 0.0421, + "epoch": 0.76, + "learning_rate": 0.00018538244576827998, + "loss": 0.0458, "step": 118390 }, { - "epoch": 1.28, - "learning_rate": 0.00010790447141281067, - "loss": 0.0329, + "epoch": 0.76, + "learning_rate": 0.00018537276441392306, + "loss": 0.0424, "step": 118400 }, { - "epoch": 1.28, - "learning_rate": 0.00010788824712830162, - "loss": 0.0363, + "epoch": 0.76, + "learning_rate": 0.00018536308305956614, + "loss": 0.0467, "step": 118410 }, { - "epoch": 1.28, - "learning_rate": 0.00010787202284379257, - "loss": 0.0307, + "epoch": 0.76, + "learning_rate": 0.00018535340170520922, + "loss": 0.0434, "step": 118420 }, { - "epoch": 1.28, - "learning_rate": 0.00010785579855928352, - "loss": 0.0308, + "epoch": 0.76, + "learning_rate": 0.00018534372035085227, + "loss": 0.0372, "step": 118430 }, { - "epoch": 1.28, - "learning_rate": 0.00010783957427477447, - "loss": 0.0295, + "epoch": 0.76, + "learning_rate": 0.00018533403899649535, + "loss": 0.0411, "step": 118440 }, { - "epoch": 1.28, - "learning_rate": 0.00010782334999026541, - "loss": 0.0336, + "epoch": 0.76, + "learning_rate": 0.0001853243576421384, + "loss": 0.045, "step": 118450 }, { - "epoch": 1.28, - "learning_rate": 0.00010780712570575636, - "loss": 0.0322, + "epoch": 0.76, + "learning_rate": 0.00018531467628778145, + "loss": 0.0583, "step": 118460 }, { - "epoch": 1.28, - "learning_rate": 0.00010779090142124731, - "loss": 0.0417, + "epoch": 0.76, + "learning_rate": 0.00018530499493342453, + "loss": 0.046, "step": 118470 }, { - "epoch": 1.28, - "learning_rate": 0.00010777467713673826, - "loss": 0.0322, + "epoch": 0.76, + "learning_rate": 0.0001852953135790676, + "loss": 0.0453, "step": 118480 }, { - "epoch": 1.28, - "learning_rate": 0.0001077584528522292, - "loss": 0.032, + "epoch": 0.76, + "learning_rate": 0.00018528563222471067, + "loss": 0.045, "step": 118490 }, { - "epoch": 1.28, - "learning_rate": 0.00010774222856772014, - "loss": 0.0329, + "epoch": 0.76, + "learning_rate": 0.00018527595087035375, + "loss": 0.0463, "step": 118500 }, { - "epoch": 1.28, - "learning_rate": 0.0001077260042832111, - "loss": 0.033, + "epoch": 0.76, + "learning_rate": 0.00018526626951599683, + "loss": 0.0422, "step": 118510 }, { - "epoch": 1.28, - "learning_rate": 0.00010770977999870206, - "loss": 0.033, + "epoch": 0.76, + "learning_rate": 0.00018525658816163985, + "loss": 0.043, "step": 118520 }, { - "epoch": 1.28, - "learning_rate": 0.000107693555714193, - "loss": 0.0393, + "epoch": 0.77, + "learning_rate": 0.00018524690680728293, + "loss": 0.0469, "step": 118530 }, { - "epoch": 1.28, - "learning_rate": 0.00010767733142968396, - "loss": 0.0363, + "epoch": 0.77, + "learning_rate": 0.000185237225452926, + "loss": 0.0519, "step": 118540 }, { - "epoch": 1.28, - "learning_rate": 0.00010766110714517489, - "loss": 0.0307, + "epoch": 0.77, + "learning_rate": 0.0001852275440985691, + "loss": 0.043, "step": 118550 }, { - "epoch": 1.28, - "learning_rate": 0.00010764488286066584, - "loss": 0.035, + "epoch": 0.77, + "learning_rate": 0.00018521786274421214, + "loss": 0.0503, "step": 118560 }, { - "epoch": 1.28, - "learning_rate": 0.00010762865857615679, - "loss": 0.0303, + "epoch": 0.77, + "learning_rate": 0.00018520818138985522, + "loss": 0.0489, "step": 118570 }, { - "epoch": 1.28, - "learning_rate": 0.00010761243429164774, - "loss": 0.0365, + "epoch": 0.77, + "learning_rate": 0.0001851985000354983, + "loss": 0.0428, "step": 118580 }, { - "epoch": 1.28, - "learning_rate": 0.00010759621000713868, - "loss": 0.0318, + "epoch": 0.77, + "learning_rate": 0.00018518881868114133, + "loss": 0.0446, "step": 118590 }, { - "epoch": 1.28, - "learning_rate": 0.00010757998572262963, - "loss": 0.0326, + "epoch": 0.77, + "learning_rate": 0.0001851791373267844, + "loss": 0.0462, "step": 118600 }, { - "epoch": 1.28, - "learning_rate": 0.00010756376143812058, - "loss": 0.0319, + "epoch": 0.77, + "learning_rate": 0.0001851694559724275, + "loss": 0.0415, "step": 118610 }, { - "epoch": 1.28, - "learning_rate": 0.00010754753715361153, - "loss": 0.0268, + "epoch": 0.77, + "learning_rate": 0.00018515977461807057, + "loss": 0.0438, "step": 118620 }, { - "epoch": 1.28, - "learning_rate": 0.00010753131286910248, - "loss": 0.0352, + "epoch": 0.77, + "learning_rate": 0.00018515009326371362, + "loss": 0.0414, "step": 118630 }, { - "epoch": 1.28, - "learning_rate": 0.00010751508858459341, - "loss": 0.0282, + "epoch": 0.77, + "learning_rate": 0.0001851404119093567, + "loss": 0.0468, "step": 118640 }, { - "epoch": 1.28, - "learning_rate": 0.00010749886430008436, - "loss": 0.0364, + "epoch": 0.77, + "learning_rate": 0.00018513073055499978, + "loss": 0.0438, "step": 118650 }, { - "epoch": 1.28, - "learning_rate": 0.00010748264001557531, - "loss": 0.035, + "epoch": 0.77, + "learning_rate": 0.0001851210492006428, + "loss": 0.0411, "step": 118660 }, { - "epoch": 1.28, - "learning_rate": 0.00010746641573106626, - "loss": 0.0363, + "epoch": 0.77, + "learning_rate": 0.00018511136784628589, + "loss": 0.045, "step": 118670 }, { - "epoch": 1.28, - "learning_rate": 0.0001074501914465572, - "loss": 0.0307, + "epoch": 0.77, + "learning_rate": 0.00018510168649192897, + "loss": 0.0432, "step": 118680 }, { - "epoch": 1.28, - "learning_rate": 0.00010743396716204815, - "loss": 0.0316, + "epoch": 0.77, + "learning_rate": 0.00018509200513757202, + "loss": 0.0497, "step": 118690 }, { - "epoch": 1.28, - "learning_rate": 0.0001074177428775391, - "loss": 0.0317, + "epoch": 0.77, + "learning_rate": 0.0001850823237832151, + "loss": 0.0428, "step": 118700 }, { - "epoch": 1.28, - "learning_rate": 0.00010740151859303005, - "loss": 0.0296, + "epoch": 0.77, + "learning_rate": 0.00018507264242885818, + "loss": 0.0393, "step": 118710 }, { - "epoch": 1.28, - "learning_rate": 0.000107385294308521, - "loss": 0.0346, + "epoch": 0.77, + "learning_rate": 0.00018506296107450126, + "loss": 0.0512, "step": 118720 }, { - "epoch": 1.28, - "learning_rate": 0.00010736907002401193, - "loss": 0.0363, + "epoch": 0.77, + "learning_rate": 0.00018505327972014428, + "loss": 0.0447, "step": 118730 }, { - "epoch": 1.28, - "learning_rate": 0.00010735284573950288, - "loss": 0.0342, + "epoch": 0.77, + "learning_rate": 0.00018504359836578736, + "loss": 0.0483, "step": 118740 }, { - "epoch": 1.28, - "learning_rate": 0.00010733662145499383, - "loss": 0.0314, + "epoch": 0.77, + "learning_rate": 0.00018503391701143044, + "loss": 0.0393, "step": 118750 }, { - "epoch": 1.28, - "learning_rate": 0.00010732039717048478, - "loss": 0.0346, + "epoch": 0.77, + "learning_rate": 0.0001850242356570735, + "loss": 0.0478, "step": 118760 }, { - "epoch": 1.28, - "learning_rate": 0.00010730417288597572, - "loss": 0.0295, + "epoch": 0.77, + "learning_rate": 0.00018501455430271657, + "loss": 0.0441, "step": 118770 }, { - "epoch": 1.28, - "learning_rate": 0.00010728794860146667, - "loss": 0.03, + "epoch": 0.77, + "learning_rate": 0.00018500487294835965, + "loss": 0.0389, "step": 118780 }, { - "epoch": 1.28, - "learning_rate": 0.00010727172431695762, - "loss": 0.0336, + "epoch": 0.77, + "learning_rate": 0.00018499519159400273, + "loss": 0.0435, "step": 118790 }, { - "epoch": 1.28, - "learning_rate": 0.00010725550003244857, - "loss": 0.0352, + "epoch": 0.77, + "learning_rate": 0.00018498551023964576, + "loss": 0.0473, "step": 118800 }, { - "epoch": 1.29, - "learning_rate": 0.00010723927574793952, - "loss": 0.041, + "epoch": 0.77, + "learning_rate": 0.00018497582888528884, + "loss": 0.0438, "step": 118810 }, { - "epoch": 1.29, - "learning_rate": 0.00010722305146343045, - "loss": 0.0334, + "epoch": 0.77, + "learning_rate": 0.00018496614753093192, + "loss": 0.0374, "step": 118820 }, { - "epoch": 1.29, - "learning_rate": 0.0001072068271789214, - "loss": 0.0307, + "epoch": 0.77, + "learning_rate": 0.00018495646617657497, + "loss": 0.0466, "step": 118830 }, { - "epoch": 1.29, - "learning_rate": 0.00010719060289441235, - "loss": 0.0357, + "epoch": 0.77, + "learning_rate": 0.00018494678482221805, + "loss": 0.0459, "step": 118840 }, { - "epoch": 1.29, - "learning_rate": 0.0001071743786099033, - "loss": 0.0299, + "epoch": 0.77, + "learning_rate": 0.00018493710346786113, + "loss": 0.0539, "step": 118850 }, { - "epoch": 1.29, - "learning_rate": 0.00010715815432539424, - "loss": 0.0431, + "epoch": 0.77, + "learning_rate": 0.00018492742211350418, + "loss": 0.0438, "step": 118860 }, { - "epoch": 1.29, - "learning_rate": 0.00010714193004088519, - "loss": 0.0345, + "epoch": 0.77, + "learning_rate": 0.00018491774075914724, + "loss": 0.0448, "step": 118870 }, { - "epoch": 1.29, - "learning_rate": 0.00010712570575637614, - "loss": 0.0386, + "epoch": 0.77, + "learning_rate": 0.00018490805940479032, + "loss": 0.0432, "step": 118880 }, { - "epoch": 1.29, - "learning_rate": 0.00010710948147186709, - "loss": 0.0378, + "epoch": 0.77, + "learning_rate": 0.00018489837805043337, + "loss": 0.0405, "step": 118890 }, { - "epoch": 1.29, - "learning_rate": 0.00010709325718735804, - "loss": 0.0389, + "epoch": 0.77, + "learning_rate": 0.00018488869669607645, + "loss": 0.0406, "step": 118900 }, { - "epoch": 1.29, - "learning_rate": 0.00010707703290284898, - "loss": 0.0323, + "epoch": 0.77, + "learning_rate": 0.00018487901534171953, + "loss": 0.0547, "step": 118910 }, { - "epoch": 1.29, - "learning_rate": 0.00010706080861833992, - "loss": 0.0364, + "epoch": 0.77, + "learning_rate": 0.0001848693339873626, + "loss": 0.0437, "step": 118920 }, { - "epoch": 1.29, - "learning_rate": 0.00010704458433383087, - "loss": 0.032, + "epoch": 0.77, + "learning_rate": 0.00018485965263300566, + "loss": 0.0448, "step": 118930 }, { - "epoch": 1.29, - "learning_rate": 0.00010702836004932182, - "loss": 0.0347, + "epoch": 0.77, + "learning_rate": 0.00018484997127864871, + "loss": 0.0355, "step": 118940 }, { - "epoch": 1.29, - "learning_rate": 0.00010701213576481277, - "loss": 0.0316, + "epoch": 0.77, + "learning_rate": 0.0001848402899242918, + "loss": 0.0403, "step": 118950 }, { - "epoch": 1.29, - "learning_rate": 0.00010699591148030371, - "loss": 0.0333, + "epoch": 0.77, + "learning_rate": 0.00018483060856993485, + "loss": 0.0423, "step": 118960 }, { - "epoch": 1.29, - "learning_rate": 0.00010697968719579466, - "loss": 0.0331, + "epoch": 0.77, + "learning_rate": 0.00018482092721557793, + "loss": 0.0421, "step": 118970 }, { - "epoch": 1.29, - "learning_rate": 0.00010696346291128561, - "loss": 0.0356, + "epoch": 0.77, + "learning_rate": 0.000184811245861221, + "loss": 0.0431, "step": 118980 }, { - "epoch": 1.29, - "learning_rate": 0.00010694723862677656, - "loss": 0.0284, + "epoch": 0.77, + "learning_rate": 0.00018480156450686409, + "loss": 0.0418, "step": 118990 }, { - "epoch": 1.29, - "learning_rate": 0.0001069310143422675, - "loss": 0.032, + "epoch": 0.77, + "learning_rate": 0.00018479188315250714, + "loss": 0.0415, "step": 119000 }, { - "epoch": 1.29, - "eval_cer": 0.9211366555877732, - "eval_loss": 0.026019059121608734, - "eval_runtime": 119.1348, - "eval_samples_per_second": 16.788, - "eval_steps_per_second": 4.197, + "epoch": 0.77, + "eval_cer": 0.9199755959778556, + "eval_loss": 0.028800196945667267, + "eval_runtime": 119.8883, + "eval_samples_per_second": 16.682, + "eval_steps_per_second": 4.171, "step": 119000 }, { - "epoch": 1.29, - "learning_rate": 0.00010691479005775845, - "loss": 0.037, + "epoch": 0.77, + "learning_rate": 0.0001847822017981502, + "loss": 0.0439, "step": 119010 }, { - "epoch": 1.29, - "learning_rate": 0.0001068985657732494, - "loss": 0.0312, + "epoch": 0.77, + "learning_rate": 0.00018477252044379327, + "loss": 0.044, "step": 119020 }, { - "epoch": 1.29, - "learning_rate": 0.00010688234148874035, - "loss": 0.0352, + "epoch": 0.77, + "learning_rate": 0.00018476283908943632, + "loss": 0.0408, "step": 119030 }, { - "epoch": 1.29, - "learning_rate": 0.0001068661172042313, - "loss": 0.0315, + "epoch": 0.77, + "learning_rate": 0.0001847531577350794, + "loss": 0.0408, "step": 119040 }, { - "epoch": 1.29, - "learning_rate": 0.00010684989291972223, - "loss": 0.031, + "epoch": 0.77, + "learning_rate": 0.00018474347638072248, + "loss": 0.0431, "step": 119050 }, { - "epoch": 1.29, - "learning_rate": 0.00010683366863521318, - "loss": 0.0308, + "epoch": 0.77, + "learning_rate": 0.00018473379502636554, + "loss": 0.0401, "step": 119060 }, { - "epoch": 1.29, - "learning_rate": 0.00010681744435070413, - "loss": 0.0326, + "epoch": 0.77, + "learning_rate": 0.00018472411367200862, + "loss": 0.0385, "step": 119070 }, { - "epoch": 1.29, - "learning_rate": 0.00010680122006619508, - "loss": 0.0325, + "epoch": 0.77, + "learning_rate": 0.00018471443231765167, + "loss": 0.0437, "step": 119080 }, { - "epoch": 1.29, - "learning_rate": 0.00010678499578168602, - "loss": 0.0326, + "epoch": 0.77, + "learning_rate": 0.00018470475096329472, + "loss": 0.0423, "step": 119090 }, { - "epoch": 1.29, - "learning_rate": 0.00010676877149717697, - "loss": 0.0296, + "epoch": 0.77, + "learning_rate": 0.0001846950696089378, + "loss": 0.0455, "step": 119100 }, { - "epoch": 1.29, - "learning_rate": 0.00010675254721266792, - "loss": 0.0306, + "epoch": 0.77, + "learning_rate": 0.00018468538825458088, + "loss": 0.0437, "step": 119110 }, { - "epoch": 1.29, - "learning_rate": 0.00010673632292815887, - "loss": 0.032, + "epoch": 0.77, + "learning_rate": 0.00018467570690022396, + "loss": 0.0447, "step": 119120 }, { - "epoch": 1.29, - "learning_rate": 0.00010672009864364982, - "loss": 0.0325, + "epoch": 0.77, + "learning_rate": 0.00018466602554586701, + "loss": 0.0416, "step": 119130 }, { - "epoch": 1.29, - "learning_rate": 0.00010670387435914075, - "loss": 0.0335, + "epoch": 0.77, + "learning_rate": 0.0001846563441915101, + "loss": 0.038, "step": 119140 }, { - "epoch": 1.29, - "learning_rate": 0.0001066876500746317, - "loss": 0.0281, + "epoch": 0.77, + "learning_rate": 0.00018464666283715315, + "loss": 0.0391, "step": 119150 }, { - "epoch": 1.29, - "learning_rate": 0.00010667142579012265, - "loss": 0.0284, + "epoch": 0.77, + "learning_rate": 0.0001846369814827962, + "loss": 0.0428, "step": 119160 }, { - "epoch": 1.29, - "learning_rate": 0.0001066552015056136, - "loss": 0.0282, + "epoch": 0.77, + "learning_rate": 0.00018462730012843928, + "loss": 0.0433, "step": 119170 }, { - "epoch": 1.29, - "learning_rate": 0.00010663897722110454, - "loss": 0.03, + "epoch": 0.77, + "learning_rate": 0.00018461761877408236, + "loss": 0.0441, "step": 119180 }, { - "epoch": 1.29, - "learning_rate": 0.00010662275293659549, - "loss": 0.0314, + "epoch": 0.77, + "learning_rate": 0.00018460793741972544, + "loss": 0.0464, "step": 119190 }, { - "epoch": 1.29, - "learning_rate": 0.00010660652865208644, - "loss": 0.032, + "epoch": 0.77, + "learning_rate": 0.0001845982560653685, + "loss": 0.0408, "step": 119200 }, { - "epoch": 1.29, - "learning_rate": 0.00010659030436757739, - "loss": 0.0306, + "epoch": 0.77, + "learning_rate": 0.00018458857471101157, + "loss": 0.0419, "step": 119210 }, { - "epoch": 1.29, - "learning_rate": 0.00010657408008306834, - "loss": 0.0325, + "epoch": 0.77, + "learning_rate": 0.00018457889335665462, + "loss": 0.0447, "step": 119220 }, { - "epoch": 1.29, - "learning_rate": 0.00010655785579855927, - "loss": 0.0358, + "epoch": 0.77, + "learning_rate": 0.00018456921200229768, + "loss": 0.0444, "step": 119230 }, { - "epoch": 1.29, - "learning_rate": 0.00010654163151405022, - "loss": 0.0342, + "epoch": 0.77, + "learning_rate": 0.00018455953064794076, + "loss": 0.0401, "step": 119240 }, { - "epoch": 1.29, - "learning_rate": 0.00010652540722954117, - "loss": 0.0385, + "epoch": 0.77, + "learning_rate": 0.00018454984929358384, + "loss": 0.0387, "step": 119250 }, { - "epoch": 1.29, - "learning_rate": 0.00010650918294503212, - "loss": 0.0321, + "epoch": 0.77, + "learning_rate": 0.0001845401679392269, + "loss": 0.0465, "step": 119260 }, { - "epoch": 1.29, - "learning_rate": 0.00010649295866052306, - "loss": 0.027, + "epoch": 0.77, + "learning_rate": 0.00018453048658486997, + "loss": 0.0402, "step": 119270 }, { - "epoch": 1.29, - "learning_rate": 0.00010647673437601401, - "loss": 0.0287, + "epoch": 0.77, + "learning_rate": 0.00018452080523051305, + "loss": 0.0386, "step": 119280 }, { - "epoch": 1.29, - "learning_rate": 0.00010646051009150496, - "loss": 0.0393, + "epoch": 0.77, + "learning_rate": 0.00018451112387615607, + "loss": 0.0392, "step": 119290 }, { - "epoch": 1.29, - "learning_rate": 0.00010644428580699591, - "loss": 0.0363, + "epoch": 0.77, + "learning_rate": 0.00018450144252179915, + "loss": 0.0488, "step": 119300 }, { - "epoch": 1.29, - "learning_rate": 0.00010642806152248686, - "loss": 0.0306, + "epoch": 0.77, + "learning_rate": 0.00018449176116744223, + "loss": 0.0429, "step": 119310 }, { - "epoch": 1.29, - "learning_rate": 0.0001064118372379778, - "loss": 0.0382, + "epoch": 0.77, + "learning_rate": 0.0001844820798130853, + "loss": 0.0446, "step": 119320 }, { - "epoch": 1.29, - "learning_rate": 0.00010639561295346874, + "epoch": 0.77, + "learning_rate": 0.00018447239845872837, "loss": 0.035, "step": 119330 }, { - "epoch": 1.29, - "learning_rate": 0.0001063793886689597, - "loss": 0.0298, + "epoch": 0.77, + "learning_rate": 0.00018446271710437145, + "loss": 0.0398, "step": 119340 }, { - "epoch": 1.29, - "learning_rate": 0.00010636316438445064, - "loss": 0.0309, + "epoch": 0.77, + "learning_rate": 0.00018445303575001453, + "loss": 0.0471, "step": 119350 }, { - "epoch": 1.29, - "learning_rate": 0.00010634694009994158, - "loss": 0.0306, + "epoch": 0.77, + "learning_rate": 0.00018444335439565755, + "loss": 0.0451, "step": 119360 }, { - "epoch": 1.29, - "learning_rate": 0.00010633071581543253, - "loss": 0.0392, + "epoch": 0.77, + "learning_rate": 0.00018443367304130063, + "loss": 0.0419, "step": 119370 }, { - "epoch": 1.29, - "learning_rate": 0.00010631449153092348, - "loss": 0.0337, + "epoch": 0.77, + "learning_rate": 0.0001844239916869437, + "loss": 0.0416, "step": 119380 }, { - "epoch": 1.29, - "learning_rate": 0.00010629826724641443, - "loss": 0.0395, + "epoch": 0.77, + "learning_rate": 0.0001844143103325868, + "loss": 0.0407, "step": 119390 }, { - "epoch": 1.29, - "learning_rate": 0.00010628204296190538, - "loss": 0.0297, + "epoch": 0.77, + "learning_rate": 0.00018440462897822984, + "loss": 0.0445, "step": 119400 }, { - "epoch": 1.29, - "learning_rate": 0.00010626581867739631, - "loss": 0.0292, + "epoch": 0.77, + "learning_rate": 0.00018439494762387292, + "loss": 0.0442, "step": 119410 }, { - "epoch": 1.29, - "learning_rate": 0.00010624959439288726, - "loss": 0.0327, + "epoch": 0.77, + "learning_rate": 0.000184385266269516, + "loss": 0.0394, "step": 119420 }, { - "epoch": 1.29, - "learning_rate": 0.00010623337010837821, - "loss": 0.0304, + "epoch": 0.77, + "learning_rate": 0.00018437558491515903, + "loss": 0.0458, "step": 119430 }, { - "epoch": 1.29, - "learning_rate": 0.00010621714582386916, - "loss": 0.0277, + "epoch": 0.77, + "learning_rate": 0.0001843659035608021, + "loss": 0.0444, "step": 119440 }, { - "epoch": 1.29, - "learning_rate": 0.0001062009215393601, - "loss": 0.0315, + "epoch": 0.77, + "learning_rate": 0.0001843562222064452, + "loss": 0.0406, "step": 119450 }, { - "epoch": 1.29, - "learning_rate": 0.00010618469725485105, - "loss": 0.0366, + "epoch": 0.77, + "learning_rate": 0.00018434654085208824, + "loss": 0.0389, "step": 119460 }, { - "epoch": 1.29, - "learning_rate": 0.000106168472970342, - "loss": 0.0338, + "epoch": 0.77, + "learning_rate": 0.00018433685949773132, + "loss": 0.0453, "step": 119470 }, { - "epoch": 1.29, - "learning_rate": 0.00010615224868583295, - "loss": 0.0368, + "epoch": 0.77, + "learning_rate": 0.0001843271781433744, + "loss": 0.0468, "step": 119480 }, { - "epoch": 1.29, - "learning_rate": 0.0001061360244013239, - "loss": 0.042, + "epoch": 0.77, + "learning_rate": 0.00018431749678901748, + "loss": 0.0529, "step": 119490 }, { - "epoch": 1.29, - "learning_rate": 0.00010611980011681484, - "loss": 0.0318, + "epoch": 0.77, + "learning_rate": 0.0001843078154346605, + "loss": 0.0412, "step": 119500 }, { - "epoch": 1.29, - "learning_rate": 0.00010610357583230579, - "loss": 0.035, + "epoch": 0.77, + "learning_rate": 0.00018429813408030358, + "loss": 0.0408, "step": 119510 }, { - "epoch": 1.29, - "learning_rate": 0.00010608735154779674, - "loss": 0.0339, + "epoch": 0.77, + "learning_rate": 0.00018428845272594666, + "loss": 0.0407, "step": 119520 }, { - "epoch": 1.29, - "learning_rate": 0.00010607112726328768, - "loss": 0.0276, + "epoch": 0.77, + "learning_rate": 0.00018427877137158972, + "loss": 0.0403, "step": 119530 }, { - "epoch": 1.29, - "learning_rate": 0.00010605490297877862, - "loss": 0.0335, + "epoch": 0.77, + "learning_rate": 0.0001842690900172328, + "loss": 0.0407, "step": 119540 }, { - "epoch": 1.29, - "learning_rate": 0.00010603867869426957, - "loss": 0.0322, + "epoch": 0.77, + "learning_rate": 0.00018425940866287588, + "loss": 0.0432, "step": 119550 }, { - "epoch": 1.29, - "learning_rate": 0.00010602245440976052, - "loss": 0.0373, + "epoch": 0.77, + "learning_rate": 0.00018424972730851896, + "loss": 0.0482, "step": 119560 }, { - "epoch": 1.29, - "learning_rate": 0.00010600623012525147, - "loss": 0.0323, + "epoch": 0.77, + "learning_rate": 0.00018424004595416198, + "loss": 0.0417, "step": 119570 }, { - "epoch": 1.29, - "learning_rate": 0.00010599000584074242, - "loss": 0.0343, + "epoch": 0.77, + "learning_rate": 0.00018423036459980506, + "loss": 0.047, "step": 119580 }, { - "epoch": 1.29, - "learning_rate": 0.00010597378155623336, - "loss": 0.036, + "epoch": 0.77, + "learning_rate": 0.00018422068324544814, + "loss": 0.0403, "step": 119590 }, { - "epoch": 1.29, - "learning_rate": 0.0001059575572717243, - "loss": 0.0305, + "epoch": 0.77, + "learning_rate": 0.0001842110018910912, + "loss": 0.0501, "step": 119600 }, { - "epoch": 1.29, - "learning_rate": 0.00010594133298721526, - "loss": 0.0355, + "epoch": 0.77, + "learning_rate": 0.00018420132053673427, + "loss": 0.0431, "step": 119610 }, { - "epoch": 1.29, - "learning_rate": 0.0001059251087027062, - "loss": 0.0364, + "epoch": 0.77, + "learning_rate": 0.00018419163918237735, + "loss": 0.0411, "step": 119620 }, { - "epoch": 1.29, - "learning_rate": 0.00010590888441819714, - "loss": 0.0304, + "epoch": 0.77, + "learning_rate": 0.00018418195782802043, + "loss": 0.0434, "step": 119630 }, { - "epoch": 1.29, - "learning_rate": 0.00010589266013368809, - "loss": 0.0277, + "epoch": 0.77, + "learning_rate": 0.00018417227647366346, + "loss": 0.0391, "step": 119640 }, { - "epoch": 1.29, - "learning_rate": 0.00010587643584917904, - "loss": 0.0432, + "epoch": 0.77, + "learning_rate": 0.00018416259511930654, + "loss": 0.0386, "step": 119650 }, { - "epoch": 1.29, - "learning_rate": 0.00010586021156466999, - "loss": 0.0336, + "epoch": 0.77, + "learning_rate": 0.0001841529137649496, + "loss": 0.0431, "step": 119660 }, { - "epoch": 1.29, - "learning_rate": 0.00010584398728016094, - "loss": 0.0279, + "epoch": 0.77, + "learning_rate": 0.00018414323241059267, + "loss": 0.0377, "step": 119670 }, { - "epoch": 1.29, - "learning_rate": 0.00010582776299565188, - "loss": 0.026, + "epoch": 0.77, + "learning_rate": 0.00018413355105623575, + "loss": 0.0356, "step": 119680 }, { - "epoch": 1.29, - "learning_rate": 0.00010581153871114283, - "loss": 0.035, + "epoch": 0.77, + "learning_rate": 0.00018412386970187883, + "loss": 0.0535, "step": 119690 }, { - "epoch": 1.29, - "learning_rate": 0.00010579531442663378, - "loss": 0.0325, + "epoch": 0.77, + "learning_rate": 0.00018411418834752188, + "loss": 0.0403, "step": 119700 }, { - "epoch": 1.29, - "learning_rate": 0.00010577909014212473, - "loss": 0.0295, + "epoch": 0.77, + "learning_rate": 0.00018410450699316494, + "loss": 0.0427, "step": 119710 }, { - "epoch": 1.29, - "learning_rate": 0.00010576286585761568, - "loss": 0.0335, + "epoch": 0.77, + "learning_rate": 0.00018409482563880802, + "loss": 0.0442, "step": 119720 }, { - "epoch": 1.3, - "learning_rate": 0.00010574664157310661, - "loss": 0.0356, + "epoch": 0.77, + "learning_rate": 0.00018408514428445107, + "loss": 0.0417, "step": 119730 }, { - "epoch": 1.3, - "learning_rate": 0.00010573041728859756, - "loss": 0.0339, + "epoch": 0.77, + "learning_rate": 0.00018407546293009415, + "loss": 0.0468, "step": 119740 }, { - "epoch": 1.3, - "learning_rate": 0.00010571419300408851, - "loss": 0.0301, + "epoch": 0.77, + "learning_rate": 0.00018406578157573723, + "loss": 0.0422, "step": 119750 }, { - "epoch": 1.3, - "learning_rate": 0.00010569796871957946, - "loss": 0.0302, + "epoch": 0.77, + "learning_rate": 0.0001840561002213803, + "loss": 0.0376, "step": 119760 }, { - "epoch": 1.3, - "learning_rate": 0.0001056817444350704, - "loss": 0.0335, + "epoch": 0.77, + "learning_rate": 0.00018404641886702336, + "loss": 0.0436, "step": 119770 }, { - "epoch": 1.3, - "learning_rate": 0.00010566552015056135, - "loss": 0.0412, + "epoch": 0.77, + "learning_rate": 0.00018403673751266641, + "loss": 0.0403, "step": 119780 }, { - "epoch": 1.3, - "learning_rate": 0.0001056492958660523, - "loss": 0.0396, + "epoch": 0.77, + "learning_rate": 0.0001840270561583095, + "loss": 0.0389, "step": 119790 }, { - "epoch": 1.3, - "learning_rate": 0.00010563307158154325, - "loss": 0.0321, + "epoch": 0.77, + "learning_rate": 0.00018401737480395255, + "loss": 0.0385, "step": 119800 }, { - "epoch": 1.3, - "learning_rate": 0.0001056168472970342, - "loss": 0.0307, + "epoch": 0.77, + "learning_rate": 0.00018400769344959563, + "loss": 0.0416, "step": 119810 }, { - "epoch": 1.3, - "learning_rate": 0.00010560062301252513, - "loss": 0.0315, + "epoch": 0.77, + "learning_rate": 0.0001839980120952387, + "loss": 0.0406, "step": 119820 }, { - "epoch": 1.3, - "learning_rate": 0.00010558439872801608, - "loss": 0.0376, + "epoch": 0.77, + "learning_rate": 0.00018398833074088179, + "loss": 0.038, "step": 119830 }, { - "epoch": 1.3, - "learning_rate": 0.00010556817444350703, - "loss": 0.0302, + "epoch": 0.77, + "learning_rate": 0.00018397864938652484, + "loss": 0.0409, "step": 119840 }, { - "epoch": 1.3, - "learning_rate": 0.00010555195015899798, - "loss": 0.0342, + "epoch": 0.77, + "learning_rate": 0.0001839689680321679, + "loss": 0.0442, "step": 119850 }, { - "epoch": 1.3, - "learning_rate": 0.00010553572587448892, - "loss": 0.0306, + "epoch": 0.77, + "learning_rate": 0.00018395928667781097, + "loss": 0.0424, "step": 119860 }, { - "epoch": 1.3, - "learning_rate": 0.00010551950158997987, - "loss": 0.0333, + "epoch": 0.77, + "learning_rate": 0.00018394960532345402, + "loss": 0.05, "step": 119870 }, { - "epoch": 1.3, - "learning_rate": 0.00010550327730547082, - "loss": 0.042, + "epoch": 0.77, + "learning_rate": 0.0001839399239690971, + "loss": 0.0394, "step": 119880 }, { - "epoch": 1.3, - "learning_rate": 0.00010548705302096177, - "loss": 0.031, + "epoch": 0.77, + "learning_rate": 0.00018393024261474018, + "loss": 0.0418, "step": 119890 }, { - "epoch": 1.3, - "learning_rate": 0.00010547082873645272, - "loss": 0.0346, + "epoch": 0.77, + "learning_rate": 0.00018392056126038324, + "loss": 0.0464, "step": 119900 }, { - "epoch": 1.3, - "learning_rate": 0.00010545460445194365, - "loss": 0.0351, + "epoch": 0.77, + "learning_rate": 0.00018391087990602632, + "loss": 0.0416, "step": 119910 }, { - "epoch": 1.3, - "learning_rate": 0.0001054383801674346, - "loss": 0.0342, + "epoch": 0.77, + "learning_rate": 0.00018390119855166937, + "loss": 0.0459, "step": 119920 }, { - "epoch": 1.3, - "learning_rate": 0.00010542215588292555, - "loss": 0.0323, + "epoch": 0.77, + "learning_rate": 0.00018389151719731242, + "loss": 0.0351, "step": 119930 }, { - "epoch": 1.3, - "learning_rate": 0.0001054059315984165, - "loss": 0.038, + "epoch": 0.77, + "learning_rate": 0.0001838818358429555, + "loss": 0.0469, "step": 119940 }, { - "epoch": 1.3, - "learning_rate": 0.00010538970731390744, - "loss": 0.0291, + "epoch": 0.77, + "learning_rate": 0.00018387215448859858, + "loss": 0.0426, "step": 119950 }, { - "epoch": 1.3, - "learning_rate": 0.00010537348302939839, - "loss": 0.0289, + "epoch": 0.77, + "learning_rate": 0.00018386247313424166, + "loss": 0.0497, "step": 119960 }, { - "epoch": 1.3, - "learning_rate": 0.00010535725874488934, - "loss": 0.03, + "epoch": 0.77, + "learning_rate": 0.0001838527917798847, + "loss": 0.0409, "step": 119970 }, { - "epoch": 1.3, - "learning_rate": 0.00010534103446038029, - "loss": 0.0329, + "epoch": 0.77, + "learning_rate": 0.0001838431104255278, + "loss": 0.0435, "step": 119980 }, { - "epoch": 1.3, - "learning_rate": 0.00010532481017587124, - "loss": 0.0381, + "epoch": 0.77, + "learning_rate": 0.00018383342907117085, + "loss": 0.0447, "step": 119990 }, { - "epoch": 1.3, - "learning_rate": 0.00010530858589136217, - "loss": 0.0359, + "epoch": 0.77, + "learning_rate": 0.0001838237477168139, + "loss": 0.0435, "step": 120000 }, { - "epoch": 1.3, - "eval_cer": 0.9210898309187707, - "eval_loss": 0.025903452187776566, - "eval_runtime": 119.1367, - "eval_samples_per_second": 16.787, - "eval_steps_per_second": 4.197, + "epoch": 0.77, + "eval_cer": 0.9199069031747825, + "eval_loss": 0.028599528595805168, + "eval_runtime": 120.0989, + "eval_samples_per_second": 16.653, + "eval_steps_per_second": 4.163, "step": 120000 }, { - "epoch": 1.3, - "learning_rate": 0.00010529236160685312, - "loss": 0.029, + "epoch": 0.77, + "learning_rate": 0.00018381406636245698, + "loss": 0.0421, "step": 120010 }, { - "epoch": 1.3, - "learning_rate": 0.00010527613732234407, - "loss": 0.0318, + "epoch": 0.77, + "learning_rate": 0.00018380438500810006, + "loss": 0.0465, "step": 120020 }, { - "epoch": 1.3, - "learning_rate": 0.00010525991303783502, - "loss": 0.035, + "epoch": 0.77, + "learning_rate": 0.00018379470365374314, + "loss": 0.0458, "step": 120030 }, { - "epoch": 1.3, - "learning_rate": 0.00010524368875332596, - "loss": 0.0295, + "epoch": 0.77, + "learning_rate": 0.0001837850222993862, + "loss": 0.0456, "step": 120040 }, { - "epoch": 1.3, - "learning_rate": 0.00010522746446881691, - "loss": 0.0319, + "epoch": 0.77, + "learning_rate": 0.00018377534094502927, + "loss": 0.0451, "step": 120050 }, { - "epoch": 1.3, - "learning_rate": 0.00010521124018430786, - "loss": 0.0337, + "epoch": 0.77, + "learning_rate": 0.00018376565959067232, + "loss": 0.0485, "step": 120060 }, { - "epoch": 1.3, - "learning_rate": 0.00010519501589979881, - "loss": 0.0307, + "epoch": 0.77, + "learning_rate": 0.00018375597823631538, + "loss": 0.0418, "step": 120070 }, { - "epoch": 1.3, - "learning_rate": 0.00010517879161528976, - "loss": 0.0351, + "epoch": 0.78, + "learning_rate": 0.00018374629688195846, + "loss": 0.0393, "step": 120080 }, { - "epoch": 1.3, - "learning_rate": 0.0001051625673307807, - "loss": 0.0353, + "epoch": 0.78, + "learning_rate": 0.00018373661552760154, + "loss": 0.042, "step": 120090 }, { - "epoch": 1.3, - "learning_rate": 0.00010514634304627165, - "loss": 0.0287, + "epoch": 0.78, + "learning_rate": 0.0001837269341732446, + "loss": 0.0386, "step": 120100 }, { - "epoch": 1.3, - "learning_rate": 0.0001051301187617626, - "loss": 0.0296, + "epoch": 0.78, + "learning_rate": 0.00018371725281888767, + "loss": 0.0398, "step": 120110 }, { - "epoch": 1.3, - "learning_rate": 0.00010511389447725355, - "loss": 0.0349, + "epoch": 0.78, + "learning_rate": 0.00018370757146453075, + "loss": 0.0373, "step": 120120 }, { - "epoch": 1.3, - "learning_rate": 0.00010509767019274448, - "loss": 0.0323, + "epoch": 0.78, + "learning_rate": 0.00018369789011017377, + "loss": 0.0463, "step": 120130 }, { - "epoch": 1.3, - "learning_rate": 0.00010508144590823543, - "loss": 0.0277, + "epoch": 0.78, + "learning_rate": 0.00018368820875581685, + "loss": 0.0454, "step": 120140 }, { - "epoch": 1.3, - "learning_rate": 0.00010506522162372638, - "loss": 0.0326, + "epoch": 0.78, + "learning_rate": 0.00018367852740145993, + "loss": 0.0419, "step": 120150 }, { - "epoch": 1.3, - "learning_rate": 0.00010504899733921733, - "loss": 0.0314, + "epoch": 0.78, + "learning_rate": 0.000183668846047103, + "loss": 0.0388, "step": 120160 }, { - "epoch": 1.3, - "learning_rate": 0.00010503277305470828, - "loss": 0.0313, + "epoch": 0.78, + "learning_rate": 0.00018365916469274607, + "loss": 0.0431, "step": 120170 }, { - "epoch": 1.3, - "learning_rate": 0.00010501654877019922, - "loss": 0.0339, + "epoch": 0.78, + "learning_rate": 0.00018364948333838914, + "loss": 0.0445, "step": 120180 }, { - "epoch": 1.3, - "learning_rate": 0.00010500032448569017, - "loss": 0.0398, + "epoch": 0.78, + "learning_rate": 0.00018363980198403222, + "loss": 0.0395, "step": 120190 }, { - "epoch": 1.3, - "learning_rate": 0.00010498410020118112, - "loss": 0.0361, + "epoch": 0.78, + "learning_rate": 0.00018363012062967525, + "loss": 0.0383, "step": 120200 }, { - "epoch": 1.3, - "learning_rate": 0.00010496787591667207, - "loss": 0.0325, + "epoch": 0.78, + "learning_rate": 0.00018362043927531833, + "loss": 0.0493, "step": 120210 }, { - "epoch": 1.3, - "learning_rate": 0.000104951651632163, - "loss": 0.0303, + "epoch": 0.78, + "learning_rate": 0.0001836107579209614, + "loss": 0.0434, "step": 120220 }, { - "epoch": 1.3, - "learning_rate": 0.00010493542734765395, - "loss": 0.0294, + "epoch": 0.78, + "learning_rate": 0.0001836010765666045, + "loss": 0.0404, "step": 120230 }, { - "epoch": 1.3, - "learning_rate": 0.0001049192030631449, - "loss": 0.0293, + "epoch": 0.78, + "learning_rate": 0.00018359139521224754, + "loss": 0.0461, "step": 120240 }, { - "epoch": 1.3, - "learning_rate": 0.00010490297877863585, - "loss": 0.0243, + "epoch": 0.78, + "learning_rate": 0.00018358171385789062, + "loss": 0.0441, "step": 120250 }, { - "epoch": 1.3, - "learning_rate": 0.0001048867544941268, - "loss": 0.031, + "epoch": 0.78, + "learning_rate": 0.0001835720325035337, + "loss": 0.0421, "step": 120260 }, { - "epoch": 1.3, - "learning_rate": 0.00010487053020961774, - "loss": 0.0327, + "epoch": 0.78, + "learning_rate": 0.00018356235114917673, + "loss": 0.039, "step": 120270 }, { - "epoch": 1.3, - "learning_rate": 0.00010485430592510869, - "loss": 0.033, + "epoch": 0.78, + "learning_rate": 0.0001835526697948198, + "loss": 0.0417, "step": 120280 }, { - "epoch": 1.3, - "learning_rate": 0.00010483808164059964, - "loss": 0.0267, + "epoch": 0.78, + "learning_rate": 0.0001835429884404629, + "loss": 0.0475, "step": 120290 }, { - "epoch": 1.3, - "learning_rate": 0.00010482185735609059, - "loss": 0.0298, + "epoch": 0.78, + "learning_rate": 0.00018353330708610594, + "loss": 0.0524, "step": 120300 }, { - "epoch": 1.3, - "learning_rate": 0.00010480563307158152, - "loss": 0.0289, + "epoch": 0.78, + "learning_rate": 0.00018352362573174902, + "loss": 0.0438, "step": 120310 }, { - "epoch": 1.3, - "learning_rate": 0.00010478940878707247, - "loss": 0.0296, + "epoch": 0.78, + "learning_rate": 0.0001835139443773921, + "loss": 0.0386, "step": 120320 }, { - "epoch": 1.3, - "learning_rate": 0.00010477318450256342, - "loss": 0.0352, + "epoch": 0.78, + "learning_rate": 0.00018350426302303518, + "loss": 0.0415, "step": 120330 }, { - "epoch": 1.3, - "learning_rate": 0.00010475696021805437, - "loss": 0.0329, + "epoch": 0.78, + "learning_rate": 0.0001834945816686782, + "loss": 0.0424, "step": 120340 }, { - "epoch": 1.3, - "learning_rate": 0.00010474073593354532, - "loss": 0.0366, + "epoch": 0.78, + "learning_rate": 0.00018348490031432128, + "loss": 0.0435, "step": 120350 }, { - "epoch": 1.3, - "learning_rate": 0.00010472451164903626, - "loss": 0.0315, + "epoch": 0.78, + "learning_rate": 0.00018347521895996436, + "loss": 0.0423, "step": 120360 }, { - "epoch": 1.3, - "learning_rate": 0.00010470828736452721, - "loss": 0.0341, + "epoch": 0.78, + "learning_rate": 0.00018346553760560742, + "loss": 0.046, "step": 120370 }, { - "epoch": 1.3, - "learning_rate": 0.00010469206308001816, - "loss": 0.0349, + "epoch": 0.78, + "learning_rate": 0.0001834558562512505, + "loss": 0.0389, "step": 120380 }, { - "epoch": 1.3, - "learning_rate": 0.00010467583879550911, - "loss": 0.0345, + "epoch": 0.78, + "learning_rate": 0.00018344617489689358, + "loss": 0.0478, "step": 120390 }, { - "epoch": 1.3, - "learning_rate": 0.00010465961451100004, - "loss": 0.0281, + "epoch": 0.78, + "learning_rate": 0.00018343649354253666, + "loss": 0.047, "step": 120400 }, { - "epoch": 1.3, - "learning_rate": 0.000104643390226491, - "loss": 0.0353, + "epoch": 0.78, + "learning_rate": 0.00018342681218817968, + "loss": 0.0405, "step": 120410 }, { - "epoch": 1.3, - "learning_rate": 0.00010462716594198194, - "loss": 0.0294, + "epoch": 0.78, + "learning_rate": 0.00018341713083382276, + "loss": 0.0445, "step": 120420 }, { - "epoch": 1.3, - "learning_rate": 0.00010461094165747289, - "loss": 0.043, + "epoch": 0.78, + "learning_rate": 0.00018340744947946584, + "loss": 0.0454, "step": 120430 }, { - "epoch": 1.3, - "learning_rate": 0.00010459471737296384, - "loss": 0.0307, + "epoch": 0.78, + "learning_rate": 0.0001833977681251089, + "loss": 0.0451, "step": 120440 }, { - "epoch": 1.3, - "learning_rate": 0.00010457849308845478, - "loss": 0.0303, + "epoch": 0.78, + "learning_rate": 0.00018338808677075197, + "loss": 0.0466, "step": 120450 }, { - "epoch": 1.3, - "learning_rate": 0.00010456226880394573, - "loss": 0.0296, + "epoch": 0.78, + "learning_rate": 0.00018337840541639505, + "loss": 0.0361, "step": 120460 }, { - "epoch": 1.3, - "learning_rate": 0.00010454604451943668, - "loss": 0.0319, + "epoch": 0.78, + "learning_rate": 0.0001833687240620381, + "loss": 0.0453, "step": 120470 }, { - "epoch": 1.3, - "learning_rate": 0.00010452982023492763, - "loss": 0.036, + "epoch": 0.78, + "learning_rate": 0.00018335904270768116, + "loss": 0.0406, "step": 120480 }, { - "epoch": 1.3, - "learning_rate": 0.00010451359595041858, - "loss": 0.0351, + "epoch": 0.78, + "learning_rate": 0.00018334936135332424, + "loss": 0.0453, "step": 120490 }, { - "epoch": 1.3, - "learning_rate": 0.00010449737166590951, - "loss": 0.0325, + "epoch": 0.78, + "learning_rate": 0.0001833396799989673, + "loss": 0.0433, "step": 120500 }, { - "epoch": 1.3, - "learning_rate": 0.00010448114738140046, - "loss": 0.0423, + "epoch": 0.78, + "learning_rate": 0.00018332999864461037, + "loss": 0.0478, "step": 120510 }, { - "epoch": 1.3, - "learning_rate": 0.00010446492309689141, - "loss": 0.0297, + "epoch": 0.78, + "learning_rate": 0.00018332031729025345, + "loss": 0.0473, "step": 120520 }, { - "epoch": 1.3, - "learning_rate": 0.00010444869881238236, - "loss": 0.0356, + "epoch": 0.78, + "learning_rate": 0.00018331063593589653, + "loss": 0.0444, "step": 120530 }, { - "epoch": 1.3, - "learning_rate": 0.0001044324745278733, - "loss": 0.0295, + "epoch": 0.78, + "learning_rate": 0.00018330095458153956, + "loss": 0.043, "step": 120540 }, { - "epoch": 1.3, - "learning_rate": 0.00010441625024336425, - "loss": 0.0353, + "epoch": 0.78, + "learning_rate": 0.00018329127322718264, + "loss": 0.0421, "step": 120550 }, { - "epoch": 1.3, - "learning_rate": 0.0001044000259588552, - "loss": 0.0296, + "epoch": 0.78, + "learning_rate": 0.00018328159187282572, + "loss": 0.0354, "step": 120560 }, { - "epoch": 1.3, - "learning_rate": 0.00010438380167434615, - "loss": 0.0404, + "epoch": 0.78, + "learning_rate": 0.00018327191051846877, + "loss": 0.0417, "step": 120570 }, { - "epoch": 1.3, - "learning_rate": 0.0001043675773898371, - "loss": 0.0353, + "epoch": 0.78, + "learning_rate": 0.00018326222916411185, + "loss": 0.0408, "step": 120580 }, { - "epoch": 1.3, - "learning_rate": 0.00010435135310532804, - "loss": 0.0321, + "epoch": 0.78, + "learning_rate": 0.00018325254780975493, + "loss": 0.045, "step": 120590 }, { - "epoch": 1.3, - "learning_rate": 0.00010433512882081899, - "loss": 0.0364, + "epoch": 0.78, + "learning_rate": 0.000183242866455398, + "loss": 0.0446, "step": 120600 }, { - "epoch": 1.3, - "learning_rate": 0.00010431890453630993, - "loss": 0.0404, + "epoch": 0.78, + "learning_rate": 0.00018323318510104103, + "loss": 0.052, "step": 120610 }, { - "epoch": 1.3, - "learning_rate": 0.00010430268025180088, - "loss": 0.0308, + "epoch": 0.78, + "learning_rate": 0.00018322350374668411, + "loss": 0.0372, "step": 120620 }, { - "epoch": 1.3, - "learning_rate": 0.00010428645596729182, - "loss": 0.0342, + "epoch": 0.78, + "learning_rate": 0.0001832138223923272, + "loss": 0.0393, "step": 120630 }, { - "epoch": 1.3, - "learning_rate": 0.00010427023168278277, - "loss": 0.03, + "epoch": 0.78, + "learning_rate": 0.00018320414103797025, + "loss": 0.0402, "step": 120640 }, { - "epoch": 1.3, - "learning_rate": 0.00010425400739827372, - "loss": 0.0326, + "epoch": 0.78, + "learning_rate": 0.00018319445968361333, + "loss": 0.0486, "step": 120650 }, { - "epoch": 1.31, - "learning_rate": 0.00010423778311376467, - "loss": 0.0334, + "epoch": 0.78, + "learning_rate": 0.0001831847783292564, + "loss": 0.0431, "step": 120660 }, { - "epoch": 1.31, - "learning_rate": 0.00010422155882925562, - "loss": 0.0336, + "epoch": 0.78, + "learning_rate": 0.00018317509697489946, + "loss": 0.0469, "step": 120670 }, { - "epoch": 1.31, - "learning_rate": 0.00010420533454474656, - "loss": 0.0336, + "epoch": 0.78, + "learning_rate": 0.0001831654156205425, + "loss": 0.0467, "step": 120680 }, { - "epoch": 1.31, - "learning_rate": 0.0001041891102602375, - "loss": 0.0303, + "epoch": 0.78, + "learning_rate": 0.0001831557342661856, + "loss": 0.0468, "step": 120690 }, { - "epoch": 1.31, - "learning_rate": 0.00010417288597572846, - "loss": 0.0311, + "epoch": 0.78, + "learning_rate": 0.00018314605291182864, + "loss": 0.0485, "step": 120700 }, { - "epoch": 1.31, - "learning_rate": 0.0001041566616912194, - "loss": 0.0333, + "epoch": 0.78, + "learning_rate": 0.00018313637155747172, + "loss": 0.0464, "step": 120710 }, { - "epoch": 1.31, - "learning_rate": 0.00010414043740671034, - "loss": 0.0337, + "epoch": 0.78, + "learning_rate": 0.0001831266902031148, + "loss": 0.0428, "step": 120720 }, { - "epoch": 1.31, - "learning_rate": 0.00010412421312220129, - "loss": 0.0321, + "epoch": 0.78, + "learning_rate": 0.00018311700884875788, + "loss": 0.0424, "step": 120730 }, { - "epoch": 1.31, - "learning_rate": 0.00010410798883769224, - "loss": 0.0354, + "epoch": 0.78, + "learning_rate": 0.00018310732749440094, + "loss": 0.0468, "step": 120740 }, { - "epoch": 1.31, - "learning_rate": 0.00010409176455318319, - "loss": 0.0298, + "epoch": 0.78, + "learning_rate": 0.000183097646140044, + "loss": 0.0537, "step": 120750 }, { - "epoch": 1.31, - "learning_rate": 0.00010407554026867414, - "loss": 0.034, + "epoch": 0.78, + "learning_rate": 0.00018308796478568707, + "loss": 0.0419, "step": 120760 }, { - "epoch": 1.31, - "learning_rate": 0.00010405931598416508, - "loss": 0.0311, + "epoch": 0.78, + "learning_rate": 0.00018307828343133012, + "loss": 0.0457, "step": 120770 }, { - "epoch": 1.31, - "learning_rate": 0.00010404309169965603, - "loss": 0.0297, + "epoch": 0.78, + "learning_rate": 0.0001830686020769732, + "loss": 0.0401, "step": 120780 }, { - "epoch": 1.31, - "learning_rate": 0.00010402686741514698, - "loss": 0.0362, + "epoch": 0.78, + "learning_rate": 0.00018305892072261628, + "loss": 0.0433, "step": 120790 }, { - "epoch": 1.31, - "learning_rate": 0.00010401064313063793, - "loss": 0.0344, + "epoch": 0.78, + "learning_rate": 0.00018304923936825936, + "loss": 0.0417, "step": 120800 }, { - "epoch": 1.31, - "learning_rate": 0.00010399441884612886, - "loss": 0.03, + "epoch": 0.78, + "learning_rate": 0.0001830395580139024, + "loss": 0.0378, "step": 120810 }, { - "epoch": 1.31, - "learning_rate": 0.00010397819456161981, - "loss": 0.0283, + "epoch": 0.78, + "learning_rate": 0.00018302987665954547, + "loss": 0.0405, "step": 120820 }, { - "epoch": 1.31, - "learning_rate": 0.00010396197027711076, - "loss": 0.0375, + "epoch": 0.78, + "learning_rate": 0.00018302019530518855, + "loss": 0.0407, "step": 120830 }, { - "epoch": 1.31, - "learning_rate": 0.00010394574599260171, - "loss": 0.0283, + "epoch": 0.78, + "learning_rate": 0.0001830105139508316, + "loss": 0.0481, "step": 120840 }, { - "epoch": 1.31, - "learning_rate": 0.00010392952170809268, - "loss": 0.0316, + "epoch": 0.78, + "learning_rate": 0.00018300083259647468, + "loss": 0.0488, "step": 120850 }, { - "epoch": 1.31, - "learning_rate": 0.00010391329742358362, - "loss": 0.0323, + "epoch": 0.78, + "learning_rate": 0.00018299115124211776, + "loss": 0.0399, "step": 120860 }, { - "epoch": 1.31, - "learning_rate": 0.00010389707313907456, - "loss": 0.0312, + "epoch": 0.78, + "learning_rate": 0.0001829814698877608, + "loss": 0.0413, "step": 120870 }, { - "epoch": 1.31, - "learning_rate": 0.00010388084885456551, - "loss": 0.0323, + "epoch": 0.78, + "learning_rate": 0.0001829717885334039, + "loss": 0.0407, "step": 120880 }, { - "epoch": 1.31, - "learning_rate": 0.00010386462457005646, - "loss": 0.035, + "epoch": 0.78, + "learning_rate": 0.00018296210717904694, + "loss": 0.0456, "step": 120890 }, { - "epoch": 1.31, - "learning_rate": 0.00010384840028554741, - "loss": 0.0335, + "epoch": 0.78, + "learning_rate": 0.00018295242582469, + "loss": 0.0399, "step": 120900 }, { - "epoch": 1.31, - "learning_rate": 0.00010383217600103835, - "loss": 0.0354, + "epoch": 0.78, + "learning_rate": 0.00018294274447033308, + "loss": 0.039, "step": 120910 }, { - "epoch": 1.31, - "learning_rate": 0.0001038159517165293, - "loss": 0.0394, + "epoch": 0.78, + "learning_rate": 0.00018293306311597616, + "loss": 0.0428, "step": 120920 }, { - "epoch": 1.31, - "learning_rate": 0.00010379972743202025, - "loss": 0.032, + "epoch": 0.78, + "learning_rate": 0.00018292338176161923, + "loss": 0.0397, "step": 120930 }, { - "epoch": 1.31, - "learning_rate": 0.0001037835031475112, - "loss": 0.0333, + "epoch": 0.78, + "learning_rate": 0.0001829137004072623, + "loss": 0.0413, "step": 120940 }, { - "epoch": 1.31, - "learning_rate": 0.00010376727886300215, - "loss": 0.0284, + "epoch": 0.78, + "learning_rate": 0.00018290401905290537, + "loss": 0.0439, "step": 120950 }, { - "epoch": 1.31, - "learning_rate": 0.00010375105457849308, - "loss": 0.0313, + "epoch": 0.78, + "learning_rate": 0.00018289433769854842, + "loss": 0.0413, "step": 120960 }, { - "epoch": 1.31, - "learning_rate": 0.00010373483029398403, - "loss": 0.0327, + "epoch": 0.78, + "learning_rate": 0.00018288465634419147, + "loss": 0.0514, "step": 120970 }, { - "epoch": 1.31, - "learning_rate": 0.00010371860600947498, - "loss": 0.0266, + "epoch": 0.78, + "learning_rate": 0.00018287497498983455, + "loss": 0.0476, "step": 120980 }, { - "epoch": 1.31, - "learning_rate": 0.00010370238172496593, - "loss": 0.0325, + "epoch": 0.78, + "learning_rate": 0.00018286529363547763, + "loss": 0.0417, "step": 120990 }, { - "epoch": 1.31, - "learning_rate": 0.00010368615744045687, - "loss": 0.0347, + "epoch": 0.78, + "learning_rate": 0.0001828556122811207, + "loss": 0.0423, "step": 121000 }, { - "epoch": 1.31, - "eval_cer": 0.9211896646470215, - "eval_loss": 0.025887662544846535, - "eval_runtime": 118.9033, - "eval_samples_per_second": 16.82, - "eval_steps_per_second": 4.205, + "epoch": 0.78, + "eval_cer": 0.9198309795503333, + "eval_loss": 0.02841617912054062, + "eval_runtime": 120.0158, + "eval_samples_per_second": 16.664, + "eval_steps_per_second": 4.166, "step": 121000 }, { - "epoch": 1.31, - "learning_rate": 0.00010366993315594782, - "loss": 0.035, + "epoch": 0.78, + "learning_rate": 0.00018284593092676376, + "loss": 0.0425, "step": 121010 }, { - "epoch": 1.31, - "learning_rate": 0.00010365370887143877, - "loss": 0.0284, + "epoch": 0.78, + "learning_rate": 0.00018283624957240684, + "loss": 0.0448, "step": 121020 }, { - "epoch": 1.31, - "learning_rate": 0.00010363748458692972, - "loss": 0.0318, + "epoch": 0.78, + "learning_rate": 0.0001828265682180499, + "loss": 0.0514, "step": 121030 }, { - "epoch": 1.31, - "learning_rate": 0.00010362126030242067, - "loss": 0.0279, + "epoch": 0.78, + "learning_rate": 0.00018281688686369295, + "loss": 0.0408, "step": 121040 }, { - "epoch": 1.31, - "learning_rate": 0.0001036050360179116, - "loss": 0.0286, + "epoch": 0.78, + "learning_rate": 0.00018280720550933603, + "loss": 0.0441, "step": 121050 }, { - "epoch": 1.31, - "learning_rate": 0.00010358881173340255, - "loss": 0.0359, + "epoch": 0.78, + "learning_rate": 0.0001827975241549791, + "loss": 0.0437, "step": 121060 }, { - "epoch": 1.31, - "learning_rate": 0.0001035725874488935, - "loss": 0.0389, + "epoch": 0.78, + "learning_rate": 0.00018278784280062216, + "loss": 0.0405, "step": 121070 }, { - "epoch": 1.31, - "learning_rate": 0.00010355636316438445, - "loss": 0.0318, + "epoch": 0.78, + "learning_rate": 0.00018277816144626524, + "loss": 0.048, "step": 121080 }, { - "epoch": 1.31, - "learning_rate": 0.0001035401388798754, - "loss": 0.0314, + "epoch": 0.78, + "learning_rate": 0.00018276848009190832, + "loss": 0.0421, "step": 121090 }, { - "epoch": 1.31, - "learning_rate": 0.00010352391459536634, - "loss": 0.0349, + "epoch": 0.78, + "learning_rate": 0.00018275879873755135, + "loss": 0.0439, "step": 121100 }, { - "epoch": 1.31, - "learning_rate": 0.00010350769031085729, - "loss": 0.0325, + "epoch": 0.78, + "learning_rate": 0.00018274911738319443, + "loss": 0.0408, "step": 121110 }, { - "epoch": 1.31, - "learning_rate": 0.00010349146602634824, - "loss": 0.0318, + "epoch": 0.78, + "learning_rate": 0.0001827394360288375, + "loss": 0.0439, "step": 121120 }, { - "epoch": 1.31, - "learning_rate": 0.00010347524174183919, - "loss": 0.0371, + "epoch": 0.78, + "learning_rate": 0.0001827297546744806, + "loss": 0.0491, "step": 121130 }, { - "epoch": 1.31, - "learning_rate": 0.00010345901745733012, - "loss": 0.0319, + "epoch": 0.78, + "learning_rate": 0.00018272007332012364, + "loss": 0.0431, "step": 121140 }, { - "epoch": 1.31, - "learning_rate": 0.00010344279317282107, - "loss": 0.0418, + "epoch": 0.78, + "learning_rate": 0.00018271039196576672, + "loss": 0.0407, "step": 121150 }, { - "epoch": 1.31, - "learning_rate": 0.00010342656888831202, - "loss": 0.0311, + "epoch": 0.78, + "learning_rate": 0.0001827007106114098, + "loss": 0.0556, "step": 121160 }, { - "epoch": 1.31, - "learning_rate": 0.00010341034460380297, - "loss": 0.0303, + "epoch": 0.78, + "learning_rate": 0.00018269102925705282, + "loss": 0.0461, "step": 121170 }, { - "epoch": 1.31, - "learning_rate": 0.00010339412031929392, - "loss": 0.0334, + "epoch": 0.78, + "learning_rate": 0.0001826813479026959, + "loss": 0.0419, "step": 121180 }, { - "epoch": 1.31, - "learning_rate": 0.00010337789603478486, - "loss": 0.0291, + "epoch": 0.78, + "learning_rate": 0.00018267166654833898, + "loss": 0.0469, "step": 121190 }, { - "epoch": 1.31, - "learning_rate": 0.00010336167175027581, - "loss": 0.0356, + "epoch": 0.78, + "learning_rate": 0.00018266198519398206, + "loss": 0.0383, "step": 121200 }, { - "epoch": 1.31, - "learning_rate": 0.00010334544746576676, - "loss": 0.0352, + "epoch": 0.78, + "learning_rate": 0.00018265230383962512, + "loss": 0.0427, "step": 121210 }, { - "epoch": 1.31, - "learning_rate": 0.00010332922318125771, - "loss": 0.0333, + "epoch": 0.78, + "learning_rate": 0.0001826426224852682, + "loss": 0.0391, "step": 121220 }, { - "epoch": 1.31, - "learning_rate": 0.00010331299889674864, - "loss": 0.0285, + "epoch": 0.78, + "learning_rate": 0.00018263294113091128, + "loss": 0.0412, "step": 121230 }, { - "epoch": 1.31, - "learning_rate": 0.0001032967746122396, - "loss": 0.0373, + "epoch": 0.78, + "learning_rate": 0.0001826232597765543, + "loss": 0.0437, "step": 121240 }, { - "epoch": 1.31, - "learning_rate": 0.00010328055032773054, - "loss": 0.0361, + "epoch": 0.78, + "learning_rate": 0.00018261357842219738, + "loss": 0.0408, "step": 121250 }, { - "epoch": 1.31, - "learning_rate": 0.0001032643260432215, - "loss": 0.0328, + "epoch": 0.78, + "learning_rate": 0.00018260389706784046, + "loss": 0.0429, "step": 121260 }, { - "epoch": 1.31, - "learning_rate": 0.00010324810175871244, - "loss": 0.0356, + "epoch": 0.78, + "learning_rate": 0.00018259421571348351, + "loss": 0.0444, "step": 121270 }, { - "epoch": 1.31, - "learning_rate": 0.00010323187747420338, - "loss": 0.032, + "epoch": 0.78, + "learning_rate": 0.0001825845343591266, + "loss": 0.04, "step": 121280 }, { - "epoch": 1.31, - "learning_rate": 0.00010321565318969433, - "loss": 0.0312, + "epoch": 0.78, + "learning_rate": 0.00018257485300476967, + "loss": 0.0409, "step": 121290 }, { - "epoch": 1.31, - "learning_rate": 0.00010319942890518528, - "loss": 0.0317, + "epoch": 0.78, + "learning_rate": 0.00018256517165041275, + "loss": 0.0427, "step": 121300 }, { - "epoch": 1.31, - "learning_rate": 0.00010318320462067623, - "loss": 0.0336, + "epoch": 0.78, + "learning_rate": 0.00018255549029605578, + "loss": 0.0383, "step": 121310 }, { - "epoch": 1.31, - "learning_rate": 0.00010316698033616717, - "loss": 0.0345, + "epoch": 0.78, + "learning_rate": 0.00018254580894169886, + "loss": 0.0467, "step": 121320 }, { - "epoch": 1.31, - "learning_rate": 0.00010315075605165811, - "loss": 0.0381, + "epoch": 0.78, + "learning_rate": 0.00018253612758734194, + "loss": 0.0352, "step": 121330 }, { - "epoch": 1.31, - "learning_rate": 0.00010313453176714906, - "loss": 0.031, + "epoch": 0.78, + "learning_rate": 0.000182526446232985, + "loss": 0.0466, "step": 121340 }, { - "epoch": 1.31, - "learning_rate": 0.00010311830748264001, - "loss": 0.0387, + "epoch": 0.78, + "learning_rate": 0.00018251676487862807, + "loss": 0.0392, "step": 121350 }, { - "epoch": 1.31, - "learning_rate": 0.00010310208319813096, - "loss": 0.0308, + "epoch": 0.78, + "learning_rate": 0.00018250708352427115, + "loss": 0.0391, "step": 121360 }, { - "epoch": 1.31, - "learning_rate": 0.0001030858589136219, - "loss": 0.0315, + "epoch": 0.78, + "learning_rate": 0.00018249740216991423, + "loss": 0.0451, "step": 121370 }, { - "epoch": 1.31, - "learning_rate": 0.00010306963462911285, - "loss": 0.0345, + "epoch": 0.78, + "learning_rate": 0.00018248772081555726, + "loss": 0.0386, "step": 121380 }, { - "epoch": 1.31, - "learning_rate": 0.0001030534103446038, - "loss": 0.0304, + "epoch": 0.78, + "learning_rate": 0.00018247803946120034, + "loss": 0.0392, "step": 121390 }, { - "epoch": 1.31, - "learning_rate": 0.00010303718606009475, - "loss": 0.0343, + "epoch": 0.78, + "learning_rate": 0.00018246835810684342, + "loss": 0.0516, "step": 121400 }, { - "epoch": 1.31, - "learning_rate": 0.00010302096177558569, - "loss": 0.0313, + "epoch": 0.78, + "learning_rate": 0.00018245867675248647, + "loss": 0.0395, "step": 121410 }, { - "epoch": 1.31, - "learning_rate": 0.00010300473749107664, - "loss": 0.0321, + "epoch": 0.78, + "learning_rate": 0.00018244899539812955, + "loss": 0.0409, "step": 121420 }, { - "epoch": 1.31, - "learning_rate": 0.00010298851320656759, - "loss": 0.0321, + "epoch": 0.78, + "learning_rate": 0.00018243931404377263, + "loss": 0.047, "step": 121430 }, { - "epoch": 1.31, - "learning_rate": 0.00010297228892205854, - "loss": 0.0396, + "epoch": 0.78, + "learning_rate": 0.0001824296326894157, + "loss": 0.044, "step": 121440 }, { - "epoch": 1.31, - "learning_rate": 0.00010295606463754949, - "loss": 0.0314, + "epoch": 0.78, + "learning_rate": 0.00018241995133505873, + "loss": 0.0477, "step": 121450 }, { - "epoch": 1.31, - "learning_rate": 0.00010293984035304042, - "loss": 0.0353, + "epoch": 0.78, + "learning_rate": 0.0001824102699807018, + "loss": 0.0414, "step": 121460 }, { - "epoch": 1.31, - "learning_rate": 0.00010292361606853137, - "loss": 0.0313, + "epoch": 0.78, + "learning_rate": 0.00018240058862634487, + "loss": 0.0412, "step": 121470 }, { - "epoch": 1.31, - "learning_rate": 0.00010290739178402232, - "loss": 0.0338, + "epoch": 0.78, + "learning_rate": 0.00018239090727198795, + "loss": 0.0418, "step": 121480 }, { - "epoch": 1.31, - "learning_rate": 0.00010289116749951327, - "loss": 0.0327, + "epoch": 0.78, + "learning_rate": 0.00018238122591763103, + "loss": 0.0406, "step": 121490 }, { - "epoch": 1.31, - "learning_rate": 0.00010287494321500421, - "loss": 0.0415, + "epoch": 0.78, + "learning_rate": 0.0001823715445632741, + "loss": 0.0404, "step": 121500 }, { - "epoch": 1.31, - "learning_rate": 0.00010285871893049516, - "loss": 0.0322, + "epoch": 0.78, + "learning_rate": 0.00018236186320891716, + "loss": 0.0428, "step": 121510 }, { - "epoch": 1.31, - "learning_rate": 0.0001028424946459861, - "loss": 0.0329, + "epoch": 0.78, + "learning_rate": 0.0001823521818545602, + "loss": 0.0447, "step": 121520 }, { - "epoch": 1.31, - "learning_rate": 0.00010282627036147706, - "loss": 0.0282, + "epoch": 0.78, + "learning_rate": 0.0001823425005002033, + "loss": 0.0426, "step": 121530 }, { - "epoch": 1.31, - "learning_rate": 0.000102810046076968, - "loss": 0.0349, + "epoch": 0.78, + "learning_rate": 0.00018233281914584634, + "loss": 0.0383, "step": 121540 }, { - "epoch": 1.31, - "learning_rate": 0.00010279382179245894, - "loss": 0.0322, + "epoch": 0.78, + "learning_rate": 0.00018232313779148942, + "loss": 0.0409, "step": 121550 }, { - "epoch": 1.31, - "learning_rate": 0.00010277759750794989, - "loss": 0.0343, + "epoch": 0.78, + "learning_rate": 0.0001823134564371325, + "loss": 0.0405, "step": 121560 }, { - "epoch": 1.31, - "learning_rate": 0.00010276137322344084, - "loss": 0.0326, + "epoch": 0.78, + "learning_rate": 0.00018230377508277558, + "loss": 0.037, "step": 121570 }, { - "epoch": 1.32, - "learning_rate": 0.00010274514893893179, - "loss": 0.0318, + "epoch": 0.78, + "learning_rate": 0.00018229409372841864, + "loss": 0.0405, "step": 121580 }, { - "epoch": 1.32, - "learning_rate": 0.00010272892465442273, - "loss": 0.0325, + "epoch": 0.78, + "learning_rate": 0.0001822844123740617, + "loss": 0.0409, "step": 121590 }, { - "epoch": 1.32, - "learning_rate": 0.00010271270036991368, - "loss": 0.0352, + "epoch": 0.78, + "learning_rate": 0.00018227473101970477, + "loss": 0.0355, "step": 121600 }, { - "epoch": 1.32, - "learning_rate": 0.00010269647608540463, - "loss": 0.0306, + "epoch": 0.78, + "learning_rate": 0.00018226504966534782, + "loss": 0.0528, "step": 121610 }, { - "epoch": 1.32, - "learning_rate": 0.00010268025180089558, - "loss": 0.0249, + "epoch": 0.78, + "learning_rate": 0.0001822553683109909, + "loss": 0.0413, "step": 121620 }, { - "epoch": 1.32, - "learning_rate": 0.00010266402751638653, - "loss": 0.031, + "epoch": 0.79, + "learning_rate": 0.00018224568695663398, + "loss": 0.0371, "step": 121630 }, { - "epoch": 1.32, - "learning_rate": 0.00010264780323187746, - "loss": 0.0326, + "epoch": 0.79, + "learning_rate": 0.00018223600560227706, + "loss": 0.0406, "step": 121640 }, { - "epoch": 1.32, - "learning_rate": 0.00010263157894736841, - "loss": 0.0334, + "epoch": 0.79, + "learning_rate": 0.0001822263242479201, + "loss": 0.0398, "step": 121650 }, { - "epoch": 1.32, - "learning_rate": 0.00010261535466285936, - "loss": 0.035, + "epoch": 0.79, + "learning_rate": 0.00018221664289356317, + "loss": 0.0439, "step": 121660 }, { - "epoch": 1.32, - "learning_rate": 0.00010259913037835031, - "loss": 0.0307, + "epoch": 0.79, + "learning_rate": 0.00018220696153920622, + "loss": 0.0466, "step": 121670 }, { - "epoch": 1.32, - "learning_rate": 0.00010258290609384125, - "loss": 0.0385, + "epoch": 0.79, + "learning_rate": 0.0001821972801848493, + "loss": 0.0405, "step": 121680 }, { - "epoch": 1.32, - "learning_rate": 0.0001025666818093322, - "loss": 0.0273, + "epoch": 0.79, + "learning_rate": 0.00018218759883049238, + "loss": 0.0435, "step": 121690 }, { - "epoch": 1.32, - "learning_rate": 0.00010255045752482315, - "loss": 0.0303, + "epoch": 0.79, + "learning_rate": 0.00018217791747613546, + "loss": 0.0404, "step": 121700 }, { - "epoch": 1.32, - "learning_rate": 0.0001025342332403141, - "loss": 0.0358, + "epoch": 0.79, + "learning_rate": 0.0001821682361217785, + "loss": 0.0472, "step": 121710 }, { - "epoch": 1.32, - "learning_rate": 0.00010251800895580505, - "loss": 0.031, + "epoch": 0.79, + "learning_rate": 0.0001821585547674216, + "loss": 0.0403, "step": 121720 }, { - "epoch": 1.32, - "learning_rate": 0.00010250178467129598, - "loss": 0.0271, + "epoch": 0.79, + "learning_rate": 0.00018214887341306464, + "loss": 0.0425, "step": 121730 }, { - "epoch": 1.32, - "learning_rate": 0.00010248556038678693, - "loss": 0.0305, + "epoch": 0.79, + "learning_rate": 0.0001821391920587077, + "loss": 0.0447, "step": 121740 }, { - "epoch": 1.32, - "learning_rate": 0.00010246933610227788, - "loss": 0.0341, + "epoch": 0.79, + "learning_rate": 0.00018212951070435077, + "loss": 0.0375, "step": 121750 }, { - "epoch": 1.32, - "learning_rate": 0.00010245311181776883, - "loss": 0.0351, + "epoch": 0.79, + "learning_rate": 0.00018211982934999385, + "loss": 0.0417, "step": 121760 }, { - "epoch": 1.32, - "learning_rate": 0.00010243688753325977, - "loss": 0.0332, + "epoch": 0.79, + "learning_rate": 0.00018211014799563693, + "loss": 0.0444, "step": 121770 }, { - "epoch": 1.32, - "learning_rate": 0.00010242066324875072, - "loss": 0.0294, + "epoch": 0.79, + "learning_rate": 0.00018210046664128, + "loss": 0.0414, "step": 121780 }, { - "epoch": 1.32, - "learning_rate": 0.00010240443896424167, - "loss": 0.0292, + "epoch": 0.79, + "learning_rate": 0.00018209078528692307, + "loss": 0.0475, "step": 121790 }, { - "epoch": 1.32, - "learning_rate": 0.00010238821467973262, - "loss": 0.0289, + "epoch": 0.79, + "learning_rate": 0.00018208110393256612, + "loss": 0.0436, "step": 121800 }, { - "epoch": 1.32, - "learning_rate": 0.00010237199039522357, - "loss": 0.0292, + "epoch": 0.79, + "learning_rate": 0.00018207142257820917, + "loss": 0.0433, "step": 121810 }, { - "epoch": 1.32, - "learning_rate": 0.0001023557661107145, - "loss": 0.0304, + "epoch": 0.79, + "learning_rate": 0.00018206174122385225, + "loss": 0.0383, "step": 121820 }, { - "epoch": 1.32, - "learning_rate": 0.00010233954182620545, - "loss": 0.0389, + "epoch": 0.79, + "learning_rate": 0.00018205205986949533, + "loss": 0.0402, "step": 121830 }, { - "epoch": 1.32, - "learning_rate": 0.0001023233175416964, - "loss": 0.0304, + "epoch": 0.79, + "learning_rate": 0.0001820423785151384, + "loss": 0.0479, "step": 121840 }, { - "epoch": 1.32, - "learning_rate": 0.00010230709325718735, - "loss": 0.0364, + "epoch": 0.79, + "learning_rate": 0.00018203269716078146, + "loss": 0.0493, "step": 121850 }, { - "epoch": 1.32, - "learning_rate": 0.0001022908689726783, - "loss": 0.0286, + "epoch": 0.79, + "learning_rate": 0.00018202301580642454, + "loss": 0.0417, "step": 121860 }, { - "epoch": 1.32, - "learning_rate": 0.00010227464468816924, - "loss": 0.0342, + "epoch": 0.79, + "learning_rate": 0.00018201333445206757, + "loss": 0.0447, "step": 121870 }, { - "epoch": 1.32, - "learning_rate": 0.00010225842040366019, - "loss": 0.03, + "epoch": 0.79, + "learning_rate": 0.00018200365309771065, + "loss": 0.046, "step": 121880 }, { - "epoch": 1.32, - "learning_rate": 0.00010224219611915114, - "loss": 0.0376, + "epoch": 0.79, + "learning_rate": 0.00018199397174335373, + "loss": 0.0388, "step": 121890 }, { - "epoch": 1.32, - "learning_rate": 0.00010222597183464209, - "loss": 0.0342, + "epoch": 0.79, + "learning_rate": 0.0001819842903889968, + "loss": 0.0429, "step": 121900 }, { - "epoch": 1.32, - "learning_rate": 0.00010220974755013303, - "loss": 0.0374, + "epoch": 0.79, + "learning_rate": 0.00018197460903463986, + "loss": 0.043, "step": 121910 }, { - "epoch": 1.32, - "learning_rate": 0.00010219352326562398, - "loss": 0.0296, + "epoch": 0.79, + "learning_rate": 0.00018196492768028294, + "loss": 0.0409, "step": 121920 }, { - "epoch": 1.32, - "learning_rate": 0.00010217729898111493, - "loss": 0.0292, + "epoch": 0.79, + "learning_rate": 0.00018195524632592602, + "loss": 0.0413, "step": 121930 }, { - "epoch": 1.32, - "learning_rate": 0.00010216107469660587, - "loss": 0.0353, + "epoch": 0.79, + "learning_rate": 0.00018194556497156905, + "loss": 0.036, "step": 121940 }, { - "epoch": 1.32, - "learning_rate": 0.00010214485041209682, - "loss": 0.0389, + "epoch": 0.79, + "learning_rate": 0.00018193588361721213, + "loss": 0.0408, "step": 121950 }, { - "epoch": 1.32, - "learning_rate": 0.00010212862612758776, - "loss": 0.0339, + "epoch": 0.79, + "learning_rate": 0.0001819262022628552, + "loss": 0.0478, "step": 121960 }, { - "epoch": 1.32, - "learning_rate": 0.00010211240184307871, - "loss": 0.0241, + "epoch": 0.79, + "learning_rate": 0.00018191652090849829, + "loss": 0.044, "step": 121970 }, { - "epoch": 1.32, - "learning_rate": 0.00010209617755856966, - "loss": 0.0319, + "epoch": 0.79, + "learning_rate": 0.00018190683955414134, + "loss": 0.0502, "step": 121980 }, { - "epoch": 1.32, - "learning_rate": 0.00010207995327406061, - "loss": 0.0282, + "epoch": 0.79, + "learning_rate": 0.00018189715819978442, + "loss": 0.0409, "step": 121990 }, { - "epoch": 1.32, - "learning_rate": 0.00010206372898955155, - "loss": 0.0334, + "epoch": 0.79, + "learning_rate": 0.0001818874768454275, + "loss": 0.0437, "step": 122000 }, { - "epoch": 1.32, - "eval_cer": 0.9211446069466606, - "eval_loss": 0.025309177115559578, - "eval_runtime": 118.7477, - "eval_samples_per_second": 16.842, - "eval_steps_per_second": 4.211, + "epoch": 0.79, + "eval_cer": 0.9198617105411818, + "eval_loss": 0.028577525168657303, + "eval_runtime": 120.1701, + "eval_samples_per_second": 16.643, + "eval_steps_per_second": 4.161, "step": 122000 }, { - "epoch": 1.32, - "learning_rate": 0.0001020475047050425, - "loss": 0.0333, + "epoch": 0.79, + "learning_rate": 0.00018187779549107052, + "loss": 0.0392, "step": 122010 }, { - "epoch": 1.32, - "learning_rate": 0.00010203128042053345, - "loss": 0.0345, + "epoch": 0.79, + "learning_rate": 0.0001818681141367136, + "loss": 0.0412, "step": 122020 }, { - "epoch": 1.32, - "learning_rate": 0.0001020150561360244, - "loss": 0.0296, + "epoch": 0.79, + "learning_rate": 0.00018185843278235668, + "loss": 0.0414, "step": 122030 }, { - "epoch": 1.32, - "learning_rate": 0.00010199883185151535, - "loss": 0.0349, + "epoch": 0.79, + "learning_rate": 0.00018184875142799976, + "loss": 0.049, "step": 122040 }, { - "epoch": 1.32, - "learning_rate": 0.00010198260756700628, - "loss": 0.0337, + "epoch": 0.79, + "learning_rate": 0.00018183907007364282, + "loss": 0.038, "step": 122050 }, { - "epoch": 1.32, - "learning_rate": 0.00010196638328249723, - "loss": 0.0427, + "epoch": 0.79, + "learning_rate": 0.0001818293887192859, + "loss": 0.0456, "step": 122060 }, { - "epoch": 1.32, - "learning_rate": 0.00010195015899798818, - "loss": 0.0287, + "epoch": 0.79, + "learning_rate": 0.00018181970736492898, + "loss": 0.0418, "step": 122070 }, { - "epoch": 1.32, - "learning_rate": 0.00010193393471347913, - "loss": 0.0384, + "epoch": 0.79, + "learning_rate": 0.000181810026010572, + "loss": 0.0422, "step": 122080 }, { - "epoch": 1.32, - "learning_rate": 0.00010191771042897007, - "loss": 0.0325, + "epoch": 0.79, + "learning_rate": 0.00018180034465621508, + "loss": 0.0392, "step": 122090 }, { - "epoch": 1.32, - "learning_rate": 0.00010190148614446102, - "loss": 0.0327, + "epoch": 0.79, + "learning_rate": 0.00018179066330185816, + "loss": 0.0377, "step": 122100 }, { - "epoch": 1.32, - "learning_rate": 0.00010188526185995197, - "loss": 0.0324, + "epoch": 0.79, + "learning_rate": 0.00018178098194750121, + "loss": 0.0398, "step": 122110 }, { - "epoch": 1.32, - "learning_rate": 0.00010186903757544292, - "loss": 0.033, + "epoch": 0.79, + "learning_rate": 0.0001817713005931443, + "loss": 0.0417, "step": 122120 }, { - "epoch": 1.32, - "learning_rate": 0.00010185281329093387, - "loss": 0.0357, + "epoch": 0.79, + "learning_rate": 0.00018176161923878737, + "loss": 0.0403, "step": 122130 }, { - "epoch": 1.32, - "learning_rate": 0.0001018365890064248, - "loss": 0.031, + "epoch": 0.79, + "learning_rate": 0.00018175193788443045, + "loss": 0.0431, "step": 122140 }, { - "epoch": 1.32, - "learning_rate": 0.00010182036472191575, - "loss": 0.0277, + "epoch": 0.79, + "learning_rate": 0.00018174225653007348, + "loss": 0.0439, "step": 122150 }, { - "epoch": 1.32, - "learning_rate": 0.0001018041404374067, - "loss": 0.0399, + "epoch": 0.79, + "learning_rate": 0.00018173257517571656, + "loss": 0.0469, "step": 122160 }, { - "epoch": 1.32, - "learning_rate": 0.00010178791615289765, - "loss": 0.0345, + "epoch": 0.79, + "learning_rate": 0.00018172289382135964, + "loss": 0.0407, "step": 122170 }, { - "epoch": 1.32, - "learning_rate": 0.00010177169186838859, - "loss": 0.0282, + "epoch": 0.79, + "learning_rate": 0.0001817132124670027, + "loss": 0.0426, "step": 122180 }, { - "epoch": 1.32, - "learning_rate": 0.00010175546758387954, - "loss": 0.0342, + "epoch": 0.79, + "learning_rate": 0.00018170353111264577, + "loss": 0.0447, "step": 122190 }, { - "epoch": 1.32, - "learning_rate": 0.00010173924329937049, - "loss": 0.0358, + "epoch": 0.79, + "learning_rate": 0.00018169384975828885, + "loss": 0.0438, "step": 122200 }, { - "epoch": 1.32, - "learning_rate": 0.00010172301901486144, - "loss": 0.0325, + "epoch": 0.79, + "learning_rate": 0.00018168416840393193, + "loss": 0.04, "step": 122210 }, { - "epoch": 1.32, - "learning_rate": 0.00010170679473035239, - "loss": 0.0291, + "epoch": 0.79, + "learning_rate": 0.00018167448704957496, + "loss": 0.0423, "step": 122220 }, { - "epoch": 1.32, - "learning_rate": 0.00010169057044584332, - "loss": 0.0348, + "epoch": 0.79, + "learning_rate": 0.00018166480569521804, + "loss": 0.0494, "step": 122230 }, { - "epoch": 1.32, - "learning_rate": 0.00010167434616133427, - "loss": 0.034, + "epoch": 0.79, + "learning_rate": 0.00018165512434086112, + "loss": 0.0421, "step": 122240 }, { - "epoch": 1.32, - "learning_rate": 0.00010165812187682522, - "loss": 0.0333, + "epoch": 0.79, + "learning_rate": 0.00018164544298650417, + "loss": 0.0453, "step": 122250 }, { - "epoch": 1.32, - "learning_rate": 0.00010164189759231617, - "loss": 0.0308, + "epoch": 0.79, + "learning_rate": 0.00018163576163214725, + "loss": 0.0417, "step": 122260 }, { - "epoch": 1.32, - "learning_rate": 0.00010162567330780711, - "loss": 0.0316, + "epoch": 0.79, + "learning_rate": 0.00018162608027779033, + "loss": 0.0451, "step": 122270 }, { - "epoch": 1.32, - "learning_rate": 0.00010160944902329806, - "loss": 0.0351, + "epoch": 0.79, + "learning_rate": 0.00018161639892343338, + "loss": 0.0361, "step": 122280 }, { - "epoch": 1.32, - "learning_rate": 0.00010159322473878901, - "loss": 0.0315, + "epoch": 0.79, + "learning_rate": 0.00018160671756907643, + "loss": 0.0395, "step": 122290 }, { - "epoch": 1.32, - "learning_rate": 0.00010157700045427996, - "loss": 0.031, + "epoch": 0.79, + "learning_rate": 0.0001815970362147195, + "loss": 0.0419, "step": 122300 }, { - "epoch": 1.32, - "learning_rate": 0.00010156077616977091, - "loss": 0.0324, + "epoch": 0.79, + "learning_rate": 0.00018158735486036257, + "loss": 0.0433, "step": 122310 }, { - "epoch": 1.32, - "learning_rate": 0.00010154455188526184, - "loss": 0.0324, + "epoch": 0.79, + "learning_rate": 0.00018157767350600565, + "loss": 0.0469, "step": 122320 }, { - "epoch": 1.32, - "learning_rate": 0.0001015283276007528, - "loss": 0.0313, + "epoch": 0.79, + "learning_rate": 0.00018156799215164873, + "loss": 0.0382, "step": 122330 }, { - "epoch": 1.32, - "learning_rate": 0.00010151210331624374, - "loss": 0.0265, + "epoch": 0.79, + "learning_rate": 0.0001815583107972918, + "loss": 0.041, "step": 122340 }, { - "epoch": 1.32, - "learning_rate": 0.0001014958790317347, - "loss": 0.0401, + "epoch": 0.79, + "learning_rate": 0.00018154862944293486, + "loss": 0.0466, "step": 122350 }, { - "epoch": 1.32, - "learning_rate": 0.00010147965474722563, - "loss": 0.0315, + "epoch": 0.79, + "learning_rate": 0.0001815389480885779, + "loss": 0.0423, "step": 122360 }, { - "epoch": 1.32, - "learning_rate": 0.00010146343046271658, - "loss": 0.0316, + "epoch": 0.79, + "learning_rate": 0.000181529266734221, + "loss": 0.0409, "step": 122370 }, { - "epoch": 1.32, - "learning_rate": 0.00010144720617820753, - "loss": 0.029, + "epoch": 0.79, + "learning_rate": 0.00018151958537986404, + "loss": 0.0368, "step": 122380 }, { - "epoch": 1.32, - "learning_rate": 0.00010143098189369848, - "loss": 0.0314, + "epoch": 0.79, + "learning_rate": 0.00018150990402550712, + "loss": 0.0403, "step": 122390 }, { - "epoch": 1.32, - "learning_rate": 0.00010141475760918943, - "loss": 0.033, + "epoch": 0.79, + "learning_rate": 0.0001815002226711502, + "loss": 0.0406, "step": 122400 }, { - "epoch": 1.32, - "learning_rate": 0.00010139853332468036, - "loss": 0.033, + "epoch": 0.79, + "learning_rate": 0.00018149054131679328, + "loss": 0.0427, "step": 122410 }, { - "epoch": 1.32, - "learning_rate": 0.00010138230904017131, - "loss": 0.0326, + "epoch": 0.79, + "learning_rate": 0.00018148085996243633, + "loss": 0.0399, "step": 122420 }, { - "epoch": 1.32, - "learning_rate": 0.00010136608475566226, - "loss": 0.0421, + "epoch": 0.79, + "learning_rate": 0.0001814711786080794, + "loss": 0.0492, "step": 122430 }, { - "epoch": 1.32, - "learning_rate": 0.00010134986047115321, - "loss": 0.0342, + "epoch": 0.79, + "learning_rate": 0.00018146149725372247, + "loss": 0.0457, "step": 122440 }, { - "epoch": 1.32, - "learning_rate": 0.00010133363618664415, - "loss": 0.0333, + "epoch": 0.79, + "learning_rate": 0.00018145181589936552, + "loss": 0.0567, "step": 122450 }, { - "epoch": 1.32, - "learning_rate": 0.0001013174119021351, - "loss": 0.0301, + "epoch": 0.79, + "learning_rate": 0.0001814421345450086, + "loss": 0.0425, "step": 122460 }, { - "epoch": 1.32, - "learning_rate": 0.00010130118761762605, - "loss": 0.0388, + "epoch": 0.79, + "learning_rate": 0.00018143245319065168, + "loss": 0.0411, "step": 122470 }, { - "epoch": 1.32, - "learning_rate": 0.000101284963333117, - "loss": 0.0335, + "epoch": 0.79, + "learning_rate": 0.00018142277183629473, + "loss": 0.0401, "step": 122480 }, { - "epoch": 1.32, - "learning_rate": 0.00010126873904860795, - "loss": 0.0322, + "epoch": 0.79, + "learning_rate": 0.0001814130904819378, + "loss": 0.0471, "step": 122490 }, { - "epoch": 1.32, - "learning_rate": 0.00010125251476409889, - "loss": 0.0288, + "epoch": 0.79, + "learning_rate": 0.00018140340912758086, + "loss": 0.044, "step": 122500 }, { - "epoch": 1.33, - "learning_rate": 0.00010123629047958984, - "loss": 0.0295, + "epoch": 0.79, + "learning_rate": 0.00018139372777322392, + "loss": 0.0362, "step": 122510 }, { - "epoch": 1.33, - "learning_rate": 0.00010122006619508079, - "loss": 0.034, + "epoch": 0.79, + "learning_rate": 0.000181384046418867, + "loss": 0.0564, "step": 122520 }, { - "epoch": 1.33, - "learning_rate": 0.00010120384191057174, - "loss": 0.0319, + "epoch": 0.79, + "learning_rate": 0.00018137436506451008, + "loss": 0.0446, "step": 122530 }, { - "epoch": 1.33, - "learning_rate": 0.00010118761762606267, - "loss": 0.0256, + "epoch": 0.79, + "learning_rate": 0.00018136468371015316, + "loss": 0.0444, "step": 122540 }, { - "epoch": 1.33, - "learning_rate": 0.00010117139334155362, - "loss": 0.0343, + "epoch": 0.79, + "learning_rate": 0.0001813550023557962, + "loss": 0.0431, "step": 122550 }, { - "epoch": 1.33, - "learning_rate": 0.00010115516905704457, - "loss": 0.0323, + "epoch": 0.79, + "learning_rate": 0.0001813453210014393, + "loss": 0.0413, "step": 122560 }, { - "epoch": 1.33, - "learning_rate": 0.00010113894477253552, - "loss": 0.029, + "epoch": 0.79, + "learning_rate": 0.00018133563964708234, + "loss": 0.0418, "step": 122570 }, { - "epoch": 1.33, - "learning_rate": 0.00010112272048802647, - "loss": 0.0388, + "epoch": 0.79, + "learning_rate": 0.0001813259582927254, + "loss": 0.05, "step": 122580 }, { - "epoch": 1.33, - "learning_rate": 0.0001011064962035174, - "loss": 0.0407, + "epoch": 0.79, + "learning_rate": 0.00018131627693836847, + "loss": 0.044, "step": 122590 }, { - "epoch": 1.33, - "learning_rate": 0.00010109027191900836, - "loss": 0.0259, + "epoch": 0.79, + "learning_rate": 0.00018130659558401155, + "loss": 0.0391, "step": 122600 }, { - "epoch": 1.33, - "learning_rate": 0.0001010740476344993, - "loss": 0.0314, + "epoch": 0.79, + "learning_rate": 0.00018129691422965463, + "loss": 0.0466, "step": 122610 }, { - "epoch": 1.33, - "learning_rate": 0.00010105782334999026, - "loss": 0.0297, + "epoch": 0.79, + "learning_rate": 0.0001812872328752977, + "loss": 0.0549, "step": 122620 }, { - "epoch": 1.33, - "learning_rate": 0.0001010415990654812, - "loss": 0.0291, + "epoch": 0.79, + "learning_rate": 0.00018127755152094077, + "loss": 0.0499, "step": 122630 }, { - "epoch": 1.33, - "learning_rate": 0.00010102537478097214, - "loss": 0.0378, + "epoch": 0.79, + "learning_rate": 0.00018126787016658382, + "loss": 0.0438, "step": 122640 }, { - "epoch": 1.33, - "learning_rate": 0.00010100915049646309, - "loss": 0.0306, + "epoch": 0.79, + "learning_rate": 0.00018125818881222687, + "loss": 0.0403, "step": 122650 }, { - "epoch": 1.33, - "learning_rate": 0.00010099292621195404, - "loss": 0.0332, + "epoch": 0.79, + "learning_rate": 0.00018124850745786995, + "loss": 0.0416, "step": 122660 }, { - "epoch": 1.33, - "learning_rate": 0.00010097670192744499, - "loss": 0.0334, + "epoch": 0.79, + "learning_rate": 0.00018123882610351303, + "loss": 0.035, "step": 122670 }, { - "epoch": 1.33, - "learning_rate": 0.00010096047764293593, - "loss": 0.0327, + "epoch": 0.79, + "learning_rate": 0.00018122914474915608, + "loss": 0.0451, "step": 122680 }, { - "epoch": 1.33, - "learning_rate": 0.00010094425335842688, - "loss": 0.0299, + "epoch": 0.79, + "learning_rate": 0.00018121946339479916, + "loss": 0.0402, "step": 122690 }, { - "epoch": 1.33, - "learning_rate": 0.00010092802907391783, - "loss": 0.0324, + "epoch": 0.79, + "learning_rate": 0.00018120978204044224, + "loss": 0.0413, "step": 122700 }, { - "epoch": 1.33, - "learning_rate": 0.00010091180478940878, - "loss": 0.0317, + "epoch": 0.79, + "learning_rate": 0.00018120010068608527, + "loss": 0.0393, "step": 122710 }, { - "epoch": 1.33, - "learning_rate": 0.00010089558050489973, - "loss": 0.0316, + "epoch": 0.79, + "learning_rate": 0.00018119041933172835, + "loss": 0.0445, "step": 122720 }, { - "epoch": 1.33, - "learning_rate": 0.00010087935622039066, - "loss": 0.0317, + "epoch": 0.79, + "learning_rate": 0.00018118073797737143, + "loss": 0.0408, "step": 122730 }, { - "epoch": 1.33, - "learning_rate": 0.00010086313193588161, - "loss": 0.0299, + "epoch": 0.79, + "learning_rate": 0.0001811710566230145, + "loss": 0.038, "step": 122740 }, { - "epoch": 1.33, - "learning_rate": 0.00010084690765137256, - "loss": 0.0345, + "epoch": 0.79, + "learning_rate": 0.00018116137526865756, + "loss": 0.042, "step": 122750 }, { - "epoch": 1.33, - "learning_rate": 0.00010083068336686351, - "loss": 0.0309, + "epoch": 0.79, + "learning_rate": 0.00018115169391430064, + "loss": 0.0491, "step": 122760 }, { - "epoch": 1.33, - "learning_rate": 0.00010081445908235445, - "loss": 0.0341, + "epoch": 0.79, + "learning_rate": 0.00018114201255994372, + "loss": 0.0413, "step": 122770 }, { - "epoch": 1.33, - "learning_rate": 0.0001007982347978454, - "loss": 0.0325, + "epoch": 0.79, + "learning_rate": 0.00018113233120558675, + "loss": 0.0562, "step": 122780 }, { - "epoch": 1.33, - "learning_rate": 0.00010078201051333635, - "loss": 0.0328, + "epoch": 0.79, + "learning_rate": 0.00018112264985122983, + "loss": 0.0416, "step": 122790 }, { - "epoch": 1.33, - "learning_rate": 0.0001007657862288273, - "loss": 0.0264, + "epoch": 0.79, + "learning_rate": 0.0001811129684968729, + "loss": 0.0394, "step": 122800 }, { - "epoch": 1.33, - "learning_rate": 0.00010074956194431825, - "loss": 0.0327, + "epoch": 0.79, + "learning_rate": 0.00018110328714251599, + "loss": 0.04, "step": 122810 }, { - "epoch": 1.33, - "learning_rate": 0.00010073333765980918, - "loss": 0.0292, + "epoch": 0.79, + "learning_rate": 0.00018109360578815904, + "loss": 0.0432, "step": 122820 }, { - "epoch": 1.33, - "learning_rate": 0.00010071711337530013, - "loss": 0.0396, + "epoch": 0.79, + "learning_rate": 0.00018108392443380212, + "loss": 0.0475, "step": 122830 }, { - "epoch": 1.33, - "learning_rate": 0.00010070088909079108, - "loss": 0.037, + "epoch": 0.79, + "learning_rate": 0.0001810742430794452, + "loss": 0.0402, "step": 122840 }, { - "epoch": 1.33, - "learning_rate": 0.00010068466480628203, - "loss": 0.035, + "epoch": 0.79, + "learning_rate": 0.00018106456172508822, + "loss": 0.0397, "step": 122850 }, { - "epoch": 1.33, - "learning_rate": 0.00010066844052177297, - "loss": 0.0391, + "epoch": 0.79, + "learning_rate": 0.0001810548803707313, + "loss": 0.0455, "step": 122860 }, { - "epoch": 1.33, - "learning_rate": 0.00010065221623726392, - "loss": 0.0297, + "epoch": 0.79, + "learning_rate": 0.00018104519901637438, + "loss": 0.0462, "step": 122870 }, { - "epoch": 1.33, - "learning_rate": 0.00010063599195275487, - "loss": 0.0276, + "epoch": 0.79, + "learning_rate": 0.00018103551766201744, + "loss": 0.0453, "step": 122880 }, { - "epoch": 1.33, - "learning_rate": 0.00010061976766824582, - "loss": 0.0325, + "epoch": 0.79, + "learning_rate": 0.00018102583630766052, + "loss": 0.0509, "step": 122890 }, { - "epoch": 1.33, - "learning_rate": 0.00010060354338373677, - "loss": 0.032, + "epoch": 0.79, + "learning_rate": 0.0001810161549533036, + "loss": 0.0442, "step": 122900 }, { - "epoch": 1.33, - "learning_rate": 0.0001005873190992277, - "loss": 0.027, + "epoch": 0.79, + "learning_rate": 0.00018100647359894668, + "loss": 0.0431, "step": 122910 }, { - "epoch": 1.33, - "learning_rate": 0.00010057109481471865, - "loss": 0.0302, + "epoch": 0.79, + "learning_rate": 0.0001809967922445897, + "loss": 0.042, "step": 122920 }, { - "epoch": 1.33, - "learning_rate": 0.0001005548705302096, - "loss": 0.0316, + "epoch": 0.79, + "learning_rate": 0.00018098711089023278, + "loss": 0.0471, "step": 122930 }, { - "epoch": 1.33, - "learning_rate": 0.00010053864624570055, - "loss": 0.0402, + "epoch": 0.79, + "learning_rate": 0.00018097742953587586, + "loss": 0.0413, "step": 122940 }, { - "epoch": 1.33, - "learning_rate": 0.00010052242196119149, - "loss": 0.0354, + "epoch": 0.79, + "learning_rate": 0.0001809677481815189, + "loss": 0.0395, "step": 122950 }, { - "epoch": 1.33, - "learning_rate": 0.00010050619767668244, - "loss": 0.0324, + "epoch": 0.79, + "learning_rate": 0.000180958066827162, + "loss": 0.0459, "step": 122960 }, { - "epoch": 1.33, - "learning_rate": 0.00010048997339217339, - "loss": 0.0335, + "epoch": 0.79, + "learning_rate": 0.00018094838547280507, + "loss": 0.0457, "step": 122970 }, { - "epoch": 1.33, - "learning_rate": 0.00010047374910766434, - "loss": 0.0296, + "epoch": 0.79, + "learning_rate": 0.00018093870411844815, + "loss": 0.0395, "step": 122980 }, { - "epoch": 1.33, - "learning_rate": 0.00010045752482315529, - "loss": 0.0307, + "epoch": 0.79, + "learning_rate": 0.00018092902276409118, + "loss": 0.0393, "step": 122990 }, { - "epoch": 1.33, - "learning_rate": 0.00010044130053864623, - "loss": 0.0297, + "epoch": 0.79, + "learning_rate": 0.00018091934140973426, + "loss": 0.0512, "step": 123000 }, { - "epoch": 1.33, - "eval_cer": 0.9210218026260688, - "eval_loss": 0.0259681586176157, - "eval_runtime": 118.848, - "eval_samples_per_second": 16.828, - "eval_steps_per_second": 4.207, + "epoch": 0.79, + "eval_cer": 0.9199557112190713, + "eval_loss": 0.028470169752836227, + "eval_runtime": 120.5044, + "eval_samples_per_second": 16.597, + "eval_steps_per_second": 4.149, "step": 123000 }, { - "epoch": 1.33, - "learning_rate": 0.00010042507625413718, - "loss": 0.0336, + "epoch": 0.79, + "learning_rate": 0.00018090966005537734, + "loss": 0.0497, "step": 123010 }, { - "epoch": 1.33, - "learning_rate": 0.00010040885196962812, - "loss": 0.0312, + "epoch": 0.79, + "learning_rate": 0.0001808999787010204, + "loss": 0.0392, "step": 123020 }, { - "epoch": 1.33, - "learning_rate": 0.00010039262768511907, - "loss": 0.0308, + "epoch": 0.79, + "learning_rate": 0.00018089029734666347, + "loss": 0.041, "step": 123030 }, { - "epoch": 1.33, - "learning_rate": 0.00010037640340061001, - "loss": 0.0394, + "epoch": 0.79, + "learning_rate": 0.00018088061599230655, + "loss": 0.0441, "step": 123040 }, { - "epoch": 1.33, - "learning_rate": 0.00010036017911610096, - "loss": 0.0352, + "epoch": 0.79, + "learning_rate": 0.0001808709346379496, + "loss": 0.0418, "step": 123050 }, { - "epoch": 1.33, - "learning_rate": 0.00010034395483159191, - "loss": 0.0303, + "epoch": 0.79, + "learning_rate": 0.00018086125328359266, + "loss": 0.0438, "step": 123060 }, { - "epoch": 1.33, - "learning_rate": 0.00010032773054708286, - "loss": 0.0383, + "epoch": 0.79, + "learning_rate": 0.00018085157192923574, + "loss": 0.0466, "step": 123070 }, { - "epoch": 1.33, - "learning_rate": 0.00010031150626257381, - "loss": 0.033, + "epoch": 0.79, + "learning_rate": 0.0001808418905748788, + "loss": 0.0421, "step": 123080 }, { - "epoch": 1.33, - "learning_rate": 0.00010029528197806475, - "loss": 0.0353, + "epoch": 0.79, + "learning_rate": 0.00018083220922052187, + "loss": 0.039, "step": 123090 }, { - "epoch": 1.33, - "learning_rate": 0.0001002790576935557, - "loss": 0.0332, + "epoch": 0.79, + "learning_rate": 0.00018082252786616495, + "loss": 0.0419, "step": 123100 }, { - "epoch": 1.33, - "learning_rate": 0.00010026283340904665, - "loss": 0.0267, + "epoch": 0.79, + "learning_rate": 0.00018081284651180803, + "loss": 0.0413, "step": 123110 }, { - "epoch": 1.33, - "learning_rate": 0.0001002466091245376, - "loss": 0.0302, + "epoch": 0.79, + "learning_rate": 0.00018080316515745108, + "loss": 0.0429, "step": 123120 }, { - "epoch": 1.33, - "learning_rate": 0.00010023038484002853, - "loss": 0.0313, + "epoch": 0.79, + "learning_rate": 0.00018079348380309413, + "loss": 0.0419, "step": 123130 }, { - "epoch": 1.33, - "learning_rate": 0.00010021416055551948, - "loss": 0.035, + "epoch": 0.79, + "learning_rate": 0.0001807838024487372, + "loss": 0.0502, "step": 123140 }, { - "epoch": 1.33, - "learning_rate": 0.00010019793627101043, - "loss": 0.0321, + "epoch": 0.79, + "learning_rate": 0.00018077412109438027, + "loss": 0.0367, "step": 123150 }, { - "epoch": 1.33, - "learning_rate": 0.00010018171198650138, - "loss": 0.0338, + "epoch": 0.79, + "learning_rate": 0.00018076443974002334, + "loss": 0.0345, "step": 123160 }, { - "epoch": 1.33, - "learning_rate": 0.00010016548770199233, - "loss": 0.0342, + "epoch": 0.79, + "learning_rate": 0.00018075475838566642, + "loss": 0.037, "step": 123170 }, { - "epoch": 1.33, - "learning_rate": 0.00010014926341748327, - "loss": 0.0359, + "epoch": 0.8, + "learning_rate": 0.0001807450770313095, + "loss": 0.0378, "step": 123180 }, { - "epoch": 1.33, - "learning_rate": 0.00010013303913297422, - "loss": 0.0313, + "epoch": 0.8, + "learning_rate": 0.00018073539567695256, + "loss": 0.0434, "step": 123190 }, { - "epoch": 1.33, - "learning_rate": 0.00010011681484846518, - "loss": 0.0339, + "epoch": 0.8, + "learning_rate": 0.0001807257143225956, + "loss": 0.0393, "step": 123200 }, { - "epoch": 1.33, - "learning_rate": 0.00010010059056395613, - "loss": 0.0294, + "epoch": 0.8, + "learning_rate": 0.0001807160329682387, + "loss": 0.0417, "step": 123210 }, { - "epoch": 1.33, - "learning_rate": 0.00010008436627944708, - "loss": 0.0398, + "epoch": 0.8, + "learning_rate": 0.00018070635161388174, + "loss": 0.0395, "step": 123220 }, { - "epoch": 1.33, - "learning_rate": 0.00010006814199493803, - "loss": 0.0336, + "epoch": 0.8, + "learning_rate": 0.00018069667025952482, + "loss": 0.0413, "step": 123230 }, { - "epoch": 1.33, - "learning_rate": 0.00010005191771042897, - "loss": 0.0341, + "epoch": 0.8, + "learning_rate": 0.0001806869889051679, + "loss": 0.0443, "step": 123240 }, { - "epoch": 1.33, - "learning_rate": 0.00010003569342591992, - "loss": 0.031, + "epoch": 0.8, + "learning_rate": 0.00018067730755081095, + "loss": 0.0431, "step": 123250 }, { - "epoch": 1.33, - "learning_rate": 0.00010001946914141087, - "loss": 0.0344, + "epoch": 0.8, + "learning_rate": 0.00018066762619645403, + "loss": 0.0407, "step": 123260 }, { - "epoch": 1.33, - "learning_rate": 0.00010000324485690181, - "loss": 0.0309, + "epoch": 0.8, + "learning_rate": 0.0001806579448420971, + "loss": 0.0443, "step": 123270 }, { - "epoch": 1.33, - "learning_rate": 9.998702057239275e-05, - "loss": 0.0307, + "epoch": 0.8, + "learning_rate": 0.00018064826348774014, + "loss": 0.0403, "step": 123280 }, { - "epoch": 1.33, - "learning_rate": 9.99707962878837e-05, - "loss": 0.0338, + "epoch": 0.8, + "learning_rate": 0.00018063858213338322, + "loss": 0.0446, "step": 123290 }, { - "epoch": 1.33, - "learning_rate": 9.995457200337465e-05, - "loss": 0.0303, + "epoch": 0.8, + "learning_rate": 0.0001806289007790263, + "loss": 0.0427, "step": 123300 }, { - "epoch": 1.33, - "learning_rate": 9.99383477188656e-05, - "loss": 0.0336, + "epoch": 0.8, + "learning_rate": 0.00018061921942466938, + "loss": 0.0539, "step": 123310 }, { - "epoch": 1.33, - "learning_rate": 9.992212343435655e-05, - "loss": 0.0328, + "epoch": 0.8, + "learning_rate": 0.00018060953807031243, + "loss": 0.0481, "step": 123320 }, { - "epoch": 1.33, - "learning_rate": 9.990589914984749e-05, - "loss": 0.0323, + "epoch": 0.8, + "learning_rate": 0.0001805998567159555, + "loss": 0.0467, "step": 123330 }, { - "epoch": 1.33, - "learning_rate": 9.988967486533844e-05, - "loss": 0.0324, + "epoch": 0.8, + "learning_rate": 0.00018059017536159856, + "loss": 0.0444, "step": 123340 }, { - "epoch": 1.33, - "learning_rate": 9.987345058082939e-05, - "loss": 0.0382, + "epoch": 0.8, + "learning_rate": 0.00018058049400724162, + "loss": 0.0419, "step": 123350 }, { - "epoch": 1.33, - "learning_rate": 9.985722629632034e-05, - "loss": 0.0324, + "epoch": 0.8, + "learning_rate": 0.0001805708126528847, + "loss": 0.0467, "step": 123360 }, { - "epoch": 1.33, - "learning_rate": 9.984100201181127e-05, - "loss": 0.0297, + "epoch": 0.8, + "learning_rate": 0.00018056113129852778, + "loss": 0.0411, "step": 123370 }, { - "epoch": 1.33, - "learning_rate": 9.982477772730222e-05, - "loss": 0.0293, + "epoch": 0.8, + "learning_rate": 0.00018055144994417086, + "loss": 0.0427, "step": 123380 }, { - "epoch": 1.33, - "learning_rate": 9.980855344279317e-05, - "loss": 0.0327, + "epoch": 0.8, + "learning_rate": 0.0001805417685898139, + "loss": 0.0398, "step": 123390 }, { - "epoch": 1.33, - "learning_rate": 9.979232915828412e-05, - "loss": 0.0339, + "epoch": 0.8, + "learning_rate": 0.000180532087235457, + "loss": 0.0514, "step": 123400 }, { - "epoch": 1.33, - "learning_rate": 9.977610487377507e-05, - "loss": 0.0322, + "epoch": 0.8, + "learning_rate": 0.00018052240588110004, + "loss": 0.0387, "step": 123410 }, { - "epoch": 1.33, - "learning_rate": 9.975988058926601e-05, - "loss": 0.031, + "epoch": 0.8, + "learning_rate": 0.0001805127245267431, + "loss": 0.0464, "step": 123420 }, { - "epoch": 1.34, - "learning_rate": 9.974365630475696e-05, - "loss": 0.0307, + "epoch": 0.8, + "learning_rate": 0.00018050304317238617, + "loss": 0.0445, "step": 123430 }, { - "epoch": 1.34, - "learning_rate": 9.97274320202479e-05, - "loss": 0.031, + "epoch": 0.8, + "learning_rate": 0.00018049336181802925, + "loss": 0.042, "step": 123440 }, { - "epoch": 1.34, - "learning_rate": 9.971120773573886e-05, - "loss": 0.0338, + "epoch": 0.8, + "learning_rate": 0.0001804836804636723, + "loss": 0.0413, "step": 123450 }, { - "epoch": 1.34, - "learning_rate": 9.969498345122979e-05, - "loss": 0.034, + "epoch": 0.8, + "learning_rate": 0.00018047399910931539, + "loss": 0.0454, "step": 123460 }, { - "epoch": 1.34, - "learning_rate": 9.967875916672074e-05, - "loss": 0.0289, + "epoch": 0.8, + "learning_rate": 0.00018046431775495847, + "loss": 0.0383, "step": 123470 }, { - "epoch": 1.34, - "learning_rate": 9.966253488221169e-05, - "loss": 0.0346, + "epoch": 0.8, + "learning_rate": 0.0001804546364006015, + "loss": 0.0393, "step": 123480 }, { - "epoch": 1.34, - "learning_rate": 9.964631059770264e-05, - "loss": 0.0317, + "epoch": 0.8, + "learning_rate": 0.00018044495504624457, + "loss": 0.0388, "step": 123490 }, { - "epoch": 1.34, - "learning_rate": 9.963008631319359e-05, - "loss": 0.0301, + "epoch": 0.8, + "learning_rate": 0.00018043527369188765, + "loss": 0.0455, "step": 123500 }, { - "epoch": 1.34, - "learning_rate": 9.961386202868453e-05, - "loss": 0.0305, + "epoch": 0.8, + "learning_rate": 0.00018042559233753073, + "loss": 0.0487, "step": 123510 }, { - "epoch": 1.34, - "learning_rate": 9.959763774417548e-05, - "loss": 0.0293, + "epoch": 0.8, + "learning_rate": 0.00018041591098317378, + "loss": 0.0377, "step": 123520 }, { - "epoch": 1.34, - "learning_rate": 9.958141345966643e-05, - "loss": 0.0289, + "epoch": 0.8, + "learning_rate": 0.00018040622962881686, + "loss": 0.0405, "step": 123530 }, { - "epoch": 1.34, - "learning_rate": 9.956518917515738e-05, - "loss": 0.0262, + "epoch": 0.8, + "learning_rate": 0.00018039654827445994, + "loss": 0.0439, "step": 123540 }, { - "epoch": 1.34, - "learning_rate": 9.954896489064831e-05, - "loss": 0.0336, + "epoch": 0.8, + "learning_rate": 0.00018038686692010297, + "loss": 0.0545, "step": 123550 }, { - "epoch": 1.34, - "learning_rate": 9.953274060613926e-05, - "loss": 0.0257, + "epoch": 0.8, + "learning_rate": 0.00018037718556574605, + "loss": 0.0394, "step": 123560 }, { - "epoch": 1.34, - "learning_rate": 9.951651632163021e-05, - "loss": 0.0303, + "epoch": 0.8, + "learning_rate": 0.00018036750421138913, + "loss": 0.042, "step": 123570 }, { - "epoch": 1.34, - "learning_rate": 9.950029203712116e-05, - "loss": 0.0276, + "epoch": 0.8, + "learning_rate": 0.0001803578228570322, + "loss": 0.0477, "step": 123580 }, { - "epoch": 1.34, - "learning_rate": 9.948406775261211e-05, - "loss": 0.0295, + "epoch": 0.8, + "learning_rate": 0.00018034814150267526, + "loss": 0.045, "step": 123590 }, { - "epoch": 1.34, - "learning_rate": 9.946784346810305e-05, - "loss": 0.0326, + "epoch": 0.8, + "learning_rate": 0.00018033846014831834, + "loss": 0.0394, "step": 123600 }, { - "epoch": 1.34, - "learning_rate": 9.9451619183594e-05, - "loss": 0.0313, + "epoch": 0.8, + "learning_rate": 0.00018032877879396142, + "loss": 0.0461, "step": 123610 }, { - "epoch": 1.34, - "learning_rate": 9.943539489908495e-05, - "loss": 0.0322, + "epoch": 0.8, + "learning_rate": 0.00018031909743960445, + "loss": 0.0422, "step": 123620 }, { - "epoch": 1.34, - "learning_rate": 9.94191706145759e-05, - "loss": 0.0321, + "epoch": 0.8, + "learning_rate": 0.00018030941608524753, + "loss": 0.0426, "step": 123630 }, { - "epoch": 1.34, - "learning_rate": 9.940294633006683e-05, - "loss": 0.035, + "epoch": 0.8, + "learning_rate": 0.0001802997347308906, + "loss": 0.04, "step": 123640 }, { - "epoch": 1.34, - "learning_rate": 9.938672204555778e-05, - "loss": 0.0322, + "epoch": 0.8, + "learning_rate": 0.00018029005337653366, + "loss": 0.0424, "step": 123650 }, { - "epoch": 1.34, - "learning_rate": 9.937049776104873e-05, - "loss": 0.0333, + "epoch": 0.8, + "learning_rate": 0.00018028037202217674, + "loss": 0.048, "step": 123660 }, { - "epoch": 1.34, - "learning_rate": 9.935427347653968e-05, - "loss": 0.0359, + "epoch": 0.8, + "learning_rate": 0.00018027069066781982, + "loss": 0.0471, "step": 123670 }, { - "epoch": 1.34, - "learning_rate": 9.933804919203063e-05, - "loss": 0.0318, + "epoch": 0.8, + "learning_rate": 0.0001802610093134629, + "loss": 0.0413, "step": 123680 }, { - "epoch": 1.34, - "learning_rate": 9.932182490752157e-05, - "loss": 0.0276, + "epoch": 0.8, + "learning_rate": 0.00018025132795910592, + "loss": 0.0395, "step": 123690 }, { - "epoch": 1.34, - "learning_rate": 9.930560062301252e-05, - "loss": 0.0272, + "epoch": 0.8, + "learning_rate": 0.000180241646604749, + "loss": 0.0398, "step": 123700 }, { - "epoch": 1.34, - "learning_rate": 9.928937633850347e-05, - "loss": 0.0281, + "epoch": 0.8, + "learning_rate": 0.00018023196525039208, + "loss": 0.0429, "step": 123710 }, { - "epoch": 1.34, - "learning_rate": 9.927315205399442e-05, - "loss": 0.0303, + "epoch": 0.8, + "learning_rate": 0.00018022228389603514, + "loss": 0.0391, "step": 123720 }, { - "epoch": 1.34, - "learning_rate": 9.925692776948536e-05, - "loss": 0.029, + "epoch": 0.8, + "learning_rate": 0.00018021260254167822, + "loss": 0.0376, "step": 123730 }, { - "epoch": 1.34, - "learning_rate": 9.92407034849763e-05, - "loss": 0.0283, + "epoch": 0.8, + "learning_rate": 0.0001802029211873213, + "loss": 0.0422, "step": 123740 }, { - "epoch": 1.34, - "learning_rate": 9.922447920046725e-05, - "loss": 0.0324, + "epoch": 0.8, + "learning_rate": 0.00018019323983296438, + "loss": 0.0425, "step": 123750 }, { - "epoch": 1.34, - "learning_rate": 9.92082549159582e-05, - "loss": 0.0359, + "epoch": 0.8, + "learning_rate": 0.0001801835584786074, + "loss": 0.0378, "step": 123760 }, { - "epoch": 1.34, - "learning_rate": 9.919203063144915e-05, - "loss": 0.0291, + "epoch": 0.8, + "learning_rate": 0.00018017387712425048, + "loss": 0.0423, "step": 123770 }, { - "epoch": 1.34, - "learning_rate": 9.917580634694009e-05, - "loss": 0.0393, + "epoch": 0.8, + "learning_rate": 0.00018016419576989356, + "loss": 0.0435, "step": 123780 }, { - "epoch": 1.34, - "learning_rate": 9.915958206243104e-05, - "loss": 0.0358, + "epoch": 0.8, + "learning_rate": 0.0001801545144155366, + "loss": 0.047, "step": 123790 }, { - "epoch": 1.34, - "learning_rate": 9.914335777792199e-05, - "loss": 0.0306, + "epoch": 0.8, + "learning_rate": 0.0001801448330611797, + "loss": 0.0393, "step": 123800 }, { - "epoch": 1.34, - "learning_rate": 9.912713349341294e-05, - "loss": 0.0316, + "epoch": 0.8, + "learning_rate": 0.00018013515170682277, + "loss": 0.0401, "step": 123810 }, { - "epoch": 1.34, - "learning_rate": 9.911090920890388e-05, - "loss": 0.0314, + "epoch": 0.8, + "learning_rate": 0.00018012547035246585, + "loss": 0.0382, "step": 123820 }, { - "epoch": 1.34, - "learning_rate": 9.909468492439483e-05, - "loss": 0.0329, + "epoch": 0.8, + "learning_rate": 0.00018011578899810888, + "loss": 0.0439, "step": 123830 }, { - "epoch": 1.34, - "learning_rate": 9.907846063988578e-05, - "loss": 0.0312, + "epoch": 0.8, + "learning_rate": 0.00018010610764375196, + "loss": 0.0571, "step": 123840 }, { - "epoch": 1.34, - "learning_rate": 9.906223635537673e-05, - "loss": 0.035, + "epoch": 0.8, + "learning_rate": 0.000180096426289395, + "loss": 0.052, "step": 123850 }, { - "epoch": 1.34, - "learning_rate": 9.904601207086768e-05, - "loss": 0.0306, + "epoch": 0.8, + "learning_rate": 0.0001800867449350381, + "loss": 0.0403, "step": 123860 }, { - "epoch": 1.34, - "learning_rate": 9.902978778635861e-05, - "loss": 0.0346, + "epoch": 0.8, + "learning_rate": 0.00018007706358068117, + "loss": 0.0421, "step": 123870 }, { - "epoch": 1.34, - "learning_rate": 9.901356350184956e-05, - "loss": 0.0295, + "epoch": 0.8, + "learning_rate": 0.00018006738222632425, + "loss": 0.041, "step": 123880 }, { - "epoch": 1.34, - "learning_rate": 9.899733921734051e-05, - "loss": 0.0344, + "epoch": 0.8, + "learning_rate": 0.0001800577008719673, + "loss": 0.0447, "step": 123890 }, { - "epoch": 1.34, - "learning_rate": 9.898111493283146e-05, - "loss": 0.0332, + "epoch": 0.8, + "learning_rate": 0.00018004801951761036, + "loss": 0.0358, "step": 123900 }, { - "epoch": 1.34, - "learning_rate": 9.89648906483224e-05, - "loss": 0.0288, + "epoch": 0.8, + "learning_rate": 0.00018003833816325343, + "loss": 0.0426, "step": 123910 }, { - "epoch": 1.34, - "learning_rate": 9.894866636381335e-05, - "loss": 0.03, + "epoch": 0.8, + "learning_rate": 0.0001800286568088965, + "loss": 0.0456, "step": 123920 }, { - "epoch": 1.34, - "learning_rate": 9.89324420793043e-05, - "loss": 0.0341, + "epoch": 0.8, + "learning_rate": 0.00018001897545453957, + "loss": 0.0377, "step": 123930 }, { - "epoch": 1.34, - "learning_rate": 9.891621779479525e-05, - "loss": 0.0276, + "epoch": 0.8, + "learning_rate": 0.00018000929410018265, + "loss": 0.0432, "step": 123940 }, { - "epoch": 1.34, - "learning_rate": 9.88999935102862e-05, - "loss": 0.0291, + "epoch": 0.8, + "learning_rate": 0.00017999961274582573, + "loss": 0.048, "step": 123950 }, { - "epoch": 1.34, - "learning_rate": 9.888376922577713e-05, - "loss": 0.0333, + "epoch": 0.8, + "learning_rate": 0.00017998993139146878, + "loss": 0.04, "step": 123960 }, { - "epoch": 1.34, - "learning_rate": 9.886754494126808e-05, - "loss": 0.0333, + "epoch": 0.8, + "learning_rate": 0.00017998025003711183, + "loss": 0.0436, "step": 123970 }, { - "epoch": 1.34, - "learning_rate": 9.885132065675903e-05, - "loss": 0.0333, + "epoch": 0.8, + "learning_rate": 0.0001799705686827549, + "loss": 0.0347, "step": 123980 }, { - "epoch": 1.34, - "learning_rate": 9.883509637224998e-05, - "loss": 0.0344, + "epoch": 0.8, + "learning_rate": 0.00017996088732839796, + "loss": 0.0524, "step": 123990 }, { - "epoch": 1.34, - "learning_rate": 9.881887208774093e-05, - "loss": 0.0333, + "epoch": 0.8, + "learning_rate": 0.00017995120597404104, + "loss": 0.0427, "step": 124000 }, { - "epoch": 1.34, - "eval_cer": 0.9212108682707209, - "eval_loss": 0.02509281225502491, - "eval_runtime": 118.7646, - "eval_samples_per_second": 16.84, - "eval_steps_per_second": 4.21, + "epoch": 0.8, + "eval_cer": 0.9199322110495989, + "eval_loss": 0.02851358987390995, + "eval_runtime": 120.0347, + "eval_samples_per_second": 16.662, + "eval_steps_per_second": 4.165, "step": 124000 }, { - "epoch": 1.34, - "learning_rate": 9.880264780323187e-05, - "loss": 0.0347, + "epoch": 0.8, + "learning_rate": 0.00017994152461968412, + "loss": 0.0427, "step": 124010 }, { - "epoch": 1.34, - "learning_rate": 9.878642351872282e-05, - "loss": 0.03, + "epoch": 0.8, + "learning_rate": 0.0001799318432653272, + "loss": 0.0406, "step": 124020 }, { - "epoch": 1.34, - "learning_rate": 9.877019923421377e-05, - "loss": 0.0316, + "epoch": 0.8, + "learning_rate": 0.00017992216191097026, + "loss": 0.0433, "step": 124030 }, { - "epoch": 1.34, - "learning_rate": 9.875397494970472e-05, - "loss": 0.0303, + "epoch": 0.8, + "learning_rate": 0.0001799124805566133, + "loss": 0.0464, "step": 124040 }, { - "epoch": 1.34, - "learning_rate": 9.873775066519565e-05, - "loss": 0.0346, + "epoch": 0.8, + "learning_rate": 0.0001799027992022564, + "loss": 0.0488, "step": 124050 }, { - "epoch": 1.34, - "learning_rate": 9.87215263806866e-05, - "loss": 0.0322, + "epoch": 0.8, + "learning_rate": 0.00017989311784789944, + "loss": 0.0359, "step": 124060 }, { - "epoch": 1.34, - "learning_rate": 9.870530209617755e-05, - "loss": 0.0321, + "epoch": 0.8, + "learning_rate": 0.00017988343649354252, + "loss": 0.0368, "step": 124070 }, { - "epoch": 1.34, - "learning_rate": 9.86890778116685e-05, - "loss": 0.0318, + "epoch": 0.8, + "learning_rate": 0.0001798737551391856, + "loss": 0.0484, "step": 124080 }, { - "epoch": 1.34, - "learning_rate": 9.867285352715945e-05, - "loss": 0.0311, + "epoch": 0.8, + "learning_rate": 0.00017986407378482865, + "loss": 0.0388, "step": 124090 }, { - "epoch": 1.34, - "learning_rate": 9.865662924265039e-05, - "loss": 0.0323, + "epoch": 0.8, + "learning_rate": 0.00017985439243047173, + "loss": 0.0451, "step": 124100 }, { - "epoch": 1.34, - "learning_rate": 9.864040495814134e-05, - "loss": 0.0264, + "epoch": 0.8, + "learning_rate": 0.0001798447110761148, + "loss": 0.04, "step": 124110 }, { - "epoch": 1.34, - "learning_rate": 9.862418067363229e-05, - "loss": 0.0299, + "epoch": 0.8, + "learning_rate": 0.00017983502972175784, + "loss": 0.0372, "step": 124120 }, { - "epoch": 1.34, - "learning_rate": 9.860795638912324e-05, - "loss": 0.0346, + "epoch": 0.8, + "learning_rate": 0.00017982534836740092, + "loss": 0.0458, "step": 124130 }, { - "epoch": 1.34, - "learning_rate": 9.859173210461417e-05, - "loss": 0.0366, + "epoch": 0.8, + "learning_rate": 0.000179815667013044, + "loss": 0.0421, "step": 124140 }, { - "epoch": 1.34, - "learning_rate": 9.857550782010512e-05, - "loss": 0.0359, + "epoch": 0.8, + "learning_rate": 0.00017980598565868708, + "loss": 0.039, "step": 124150 }, { - "epoch": 1.34, - "learning_rate": 9.855928353559607e-05, - "loss": 0.0307, + "epoch": 0.8, + "learning_rate": 0.00017979630430433013, + "loss": 0.0429, "step": 124160 }, { - "epoch": 1.34, - "learning_rate": 9.854305925108702e-05, - "loss": 0.033, + "epoch": 0.8, + "learning_rate": 0.0001797866229499732, + "loss": 0.0469, "step": 124170 }, { - "epoch": 1.34, - "learning_rate": 9.852683496657797e-05, - "loss": 0.0301, + "epoch": 0.8, + "learning_rate": 0.00017977694159561626, + "loss": 0.0422, "step": 124180 }, { - "epoch": 1.34, - "learning_rate": 9.851061068206891e-05, - "loss": 0.0302, + "epoch": 0.8, + "learning_rate": 0.00017976726024125932, + "loss": 0.041, "step": 124190 }, { - "epoch": 1.34, - "learning_rate": 9.849438639755986e-05, - "loss": 0.031, + "epoch": 0.8, + "learning_rate": 0.0001797575788869024, + "loss": 0.0453, "step": 124200 }, { - "epoch": 1.34, - "learning_rate": 9.847816211305081e-05, - "loss": 0.0308, + "epoch": 0.8, + "learning_rate": 0.00017974789753254548, + "loss": 0.0416, "step": 124210 }, { - "epoch": 1.34, - "learning_rate": 9.846193782854176e-05, - "loss": 0.0316, + "epoch": 0.8, + "learning_rate": 0.00017973821617818856, + "loss": 0.0487, "step": 124220 }, { - "epoch": 1.34, - "learning_rate": 9.84457135440327e-05, - "loss": 0.0277, + "epoch": 0.8, + "learning_rate": 0.0001797285348238316, + "loss": 0.0436, "step": 124230 }, { - "epoch": 1.34, - "learning_rate": 9.842948925952364e-05, - "loss": 0.0303, + "epoch": 0.8, + "learning_rate": 0.0001797188534694747, + "loss": 0.0462, "step": 124240 }, { - "epoch": 1.34, - "learning_rate": 9.84132649750146e-05, - "loss": 0.0285, + "epoch": 0.8, + "learning_rate": 0.00017970917211511774, + "loss": 0.0436, "step": 124250 }, { - "epoch": 1.34, - "learning_rate": 9.839704069050554e-05, - "loss": 0.0285, + "epoch": 0.8, + "learning_rate": 0.0001796994907607608, + "loss": 0.0456, "step": 124260 }, { - "epoch": 1.34, - "learning_rate": 9.83808164059965e-05, - "loss": 0.0342, + "epoch": 0.8, + "learning_rate": 0.00017968980940640387, + "loss": 0.0457, "step": 124270 }, { - "epoch": 1.34, - "learning_rate": 9.836459212148743e-05, - "loss": 0.0351, + "epoch": 0.8, + "learning_rate": 0.00017968012805204695, + "loss": 0.0408, "step": 124280 }, { - "epoch": 1.34, - "learning_rate": 9.834836783697838e-05, - "loss": 0.0277, + "epoch": 0.8, + "learning_rate": 0.00017967044669769, + "loss": 0.0421, "step": 124290 }, { - "epoch": 1.34, - "learning_rate": 9.833214355246933e-05, - "loss": 0.0321, + "epoch": 0.8, + "learning_rate": 0.00017966076534333309, + "loss": 0.0431, "step": 124300 }, { - "epoch": 1.34, - "learning_rate": 9.831591926796028e-05, - "loss": 0.0284, + "epoch": 0.8, + "learning_rate": 0.00017965108398897617, + "loss": 0.0403, "step": 124310 }, { - "epoch": 1.34, - "learning_rate": 9.829969498345122e-05, - "loss": 0.0305, + "epoch": 0.8, + "learning_rate": 0.0001796414026346192, + "loss": 0.0445, "step": 124320 }, { - "epoch": 1.34, - "learning_rate": 9.828347069894217e-05, - "loss": 0.0279, + "epoch": 0.8, + "learning_rate": 0.00017963172128026227, + "loss": 0.0405, "step": 124330 }, { - "epoch": 1.34, - "learning_rate": 9.826724641443312e-05, - "loss": 0.0357, + "epoch": 0.8, + "learning_rate": 0.00017962203992590535, + "loss": 0.0401, "step": 124340 }, { - "epoch": 1.34, - "learning_rate": 9.825102212992406e-05, - "loss": 0.0295, + "epoch": 0.8, + "learning_rate": 0.00017961235857154843, + "loss": 0.04, "step": 124350 }, { - "epoch": 1.35, - "learning_rate": 9.823479784541501e-05, - "loss": 0.0304, + "epoch": 0.8, + "learning_rate": 0.00017960267721719148, + "loss": 0.0392, "step": 124360 }, { - "epoch": 1.35, - "learning_rate": 9.821857356090595e-05, - "loss": 0.0345, + "epoch": 0.8, + "learning_rate": 0.00017959299586283456, + "loss": 0.0405, "step": 124370 }, { - "epoch": 1.35, - "learning_rate": 9.82023492763969e-05, - "loss": 0.0316, + "epoch": 0.8, + "learning_rate": 0.00017958331450847764, + "loss": 0.0501, "step": 124380 }, { - "epoch": 1.35, - "learning_rate": 9.818612499188785e-05, - "loss": 0.0277, + "epoch": 0.8, + "learning_rate": 0.00017957363315412067, + "loss": 0.0421, "step": 124390 }, { - "epoch": 1.35, - "learning_rate": 9.81699007073788e-05, - "loss": 0.0334, + "epoch": 0.8, + "learning_rate": 0.00017956395179976375, + "loss": 0.0413, "step": 124400 }, { - "epoch": 1.35, - "learning_rate": 9.815367642286974e-05, - "loss": 0.0379, + "epoch": 0.8, + "learning_rate": 0.00017955427044540683, + "loss": 0.0385, "step": 124410 }, { - "epoch": 1.35, - "learning_rate": 9.813745213836069e-05, - "loss": 0.0293, + "epoch": 0.8, + "learning_rate": 0.0001795445890910499, + "loss": 0.045, "step": 124420 }, { - "epoch": 1.35, - "learning_rate": 9.812122785385164e-05, - "loss": 0.0327, + "epoch": 0.8, + "learning_rate": 0.00017953490773669296, + "loss": 0.0403, "step": 124430 }, { - "epoch": 1.35, - "learning_rate": 9.810500356934259e-05, - "loss": 0.0307, + "epoch": 0.8, + "learning_rate": 0.00017952522638233604, + "loss": 0.0437, "step": 124440 }, { - "epoch": 1.35, - "learning_rate": 9.808877928483354e-05, - "loss": 0.0293, + "epoch": 0.8, + "learning_rate": 0.00017951554502797912, + "loss": 0.0403, "step": 124450 }, { - "epoch": 1.35, - "learning_rate": 9.807255500032447e-05, - "loss": 0.029, + "epoch": 0.8, + "learning_rate": 0.00017950586367362215, + "loss": 0.0444, "step": 124460 }, { - "epoch": 1.35, - "learning_rate": 9.805633071581542e-05, - "loss": 0.0325, + "epoch": 0.8, + "learning_rate": 0.00017949618231926523, + "loss": 0.0474, "step": 124470 }, { - "epoch": 1.35, - "learning_rate": 9.804010643130637e-05, - "loss": 0.0321, + "epoch": 0.8, + "learning_rate": 0.0001794865009649083, + "loss": 0.0477, "step": 124480 }, { - "epoch": 1.35, - "learning_rate": 9.802388214679732e-05, - "loss": 0.0314, + "epoch": 0.8, + "learning_rate": 0.00017947681961055136, + "loss": 0.0481, "step": 124490 }, { - "epoch": 1.35, - "learning_rate": 9.800765786228826e-05, - "loss": 0.0321, + "epoch": 0.8, + "learning_rate": 0.00017946713825619444, + "loss": 0.0429, "step": 124500 }, { - "epoch": 1.35, - "learning_rate": 9.799143357777921e-05, - "loss": 0.0354, + "epoch": 0.8, + "learning_rate": 0.00017945745690183752, + "loss": 0.044, "step": 124510 }, { - "epoch": 1.35, - "learning_rate": 9.797520929327016e-05, - "loss": 0.0304, + "epoch": 0.8, + "learning_rate": 0.0001794477755474806, + "loss": 0.0468, "step": 124520 }, { - "epoch": 1.35, - "learning_rate": 9.79589850087611e-05, - "loss": 0.0328, + "epoch": 0.8, + "learning_rate": 0.00017943809419312362, + "loss": 0.0445, "step": 124530 }, { - "epoch": 1.35, - "learning_rate": 9.794276072425206e-05, - "loss": 0.0355, + "epoch": 0.8, + "learning_rate": 0.0001794284128387667, + "loss": 0.0368, "step": 124540 }, { - "epoch": 1.35, - "learning_rate": 9.792653643974299e-05, - "loss": 0.0388, + "epoch": 0.8, + "learning_rate": 0.00017941873148440978, + "loss": 0.0411, "step": 124550 }, { - "epoch": 1.35, - "learning_rate": 9.791031215523394e-05, - "loss": 0.0301, + "epoch": 0.8, + "learning_rate": 0.00017940905013005284, + "loss": 0.0366, "step": 124560 }, { - "epoch": 1.35, - "learning_rate": 9.789408787072489e-05, - "loss": 0.037, + "epoch": 0.8, + "learning_rate": 0.00017939936877569592, + "loss": 0.0438, "step": 124570 }, { - "epoch": 1.35, - "learning_rate": 9.787786358621584e-05, - "loss": 0.0309, + "epoch": 0.8, + "learning_rate": 0.000179389687421339, + "loss": 0.0437, "step": 124580 }, { - "epoch": 1.35, - "learning_rate": 9.786163930170678e-05, - "loss": 0.0285, + "epoch": 0.8, + "learning_rate": 0.00017938000606698207, + "loss": 0.0402, "step": 124590 }, { - "epoch": 1.35, - "learning_rate": 9.784541501719773e-05, - "loss": 0.0342, + "epoch": 0.8, + "learning_rate": 0.0001793703247126251, + "loss": 0.0423, "step": 124600 }, { - "epoch": 1.35, - "learning_rate": 9.782919073268868e-05, - "loss": 0.0332, + "epoch": 0.8, + "learning_rate": 0.00017936064335826818, + "loss": 0.0489, "step": 124610 }, { - "epoch": 1.35, - "learning_rate": 9.781296644817963e-05, - "loss": 0.0328, + "epoch": 0.8, + "learning_rate": 0.00017935096200391126, + "loss": 0.0469, "step": 124620 }, { - "epoch": 1.35, - "learning_rate": 9.779674216367058e-05, - "loss": 0.036, + "epoch": 0.8, + "learning_rate": 0.0001793412806495543, + "loss": 0.0451, "step": 124630 }, { - "epoch": 1.35, - "learning_rate": 9.778051787916151e-05, - "loss": 0.0329, + "epoch": 0.8, + "learning_rate": 0.0001793315992951974, + "loss": 0.0426, "step": 124640 }, { - "epoch": 1.35, - "learning_rate": 9.776429359465246e-05, - "loss": 0.0322, + "epoch": 0.8, + "learning_rate": 0.00017932191794084047, + "loss": 0.0435, "step": 124650 }, { - "epoch": 1.35, - "learning_rate": 9.774806931014341e-05, - "loss": 0.0268, + "epoch": 0.8, + "learning_rate": 0.00017931223658648352, + "loss": 0.0416, "step": 124660 }, { - "epoch": 1.35, - "learning_rate": 9.773184502563436e-05, - "loss": 0.0302, + "epoch": 0.8, + "learning_rate": 0.00017930255523212658, + "loss": 0.042, "step": 124670 }, { - "epoch": 1.35, - "learning_rate": 9.77156207411253e-05, - "loss": 0.0351, + "epoch": 0.8, + "learning_rate": 0.00017929287387776966, + "loss": 0.0523, "step": 124680 }, { - "epoch": 1.35, - "learning_rate": 9.769939645661625e-05, - "loss": 0.0402, + "epoch": 0.8, + "learning_rate": 0.0001792831925234127, + "loss": 0.0401, "step": 124690 }, { - "epoch": 1.35, - "learning_rate": 9.76831721721072e-05, - "loss": 0.032, + "epoch": 0.8, + "learning_rate": 0.0001792735111690558, + "loss": 0.0499, "step": 124700 }, { - "epoch": 1.35, - "learning_rate": 9.766694788759815e-05, - "loss": 0.0363, + "epoch": 0.8, + "learning_rate": 0.00017926382981469887, + "loss": 0.0482, "step": 124710 }, { - "epoch": 1.35, - "learning_rate": 9.76507236030891e-05, - "loss": 0.0286, + "epoch": 0.8, + "learning_rate": 0.00017925414846034195, + "loss": 0.0429, "step": 124720 }, { - "epoch": 1.35, - "learning_rate": 9.763449931858003e-05, - "loss": 0.0313, + "epoch": 0.81, + "learning_rate": 0.000179244467105985, + "loss": 0.0513, "step": 124730 }, { - "epoch": 1.35, - "learning_rate": 9.761827503407098e-05, - "loss": 0.0313, + "epoch": 0.81, + "learning_rate": 0.00017923478575162805, + "loss": 0.0387, "step": 124740 }, { - "epoch": 1.35, - "learning_rate": 9.760205074956193e-05, - "loss": 0.0336, + "epoch": 0.81, + "learning_rate": 0.00017922510439727113, + "loss": 0.0408, "step": 124750 }, { - "epoch": 1.35, - "learning_rate": 9.758582646505288e-05, - "loss": 0.0356, + "epoch": 0.81, + "learning_rate": 0.0001792154230429142, + "loss": 0.0388, "step": 124760 }, { - "epoch": 1.35, - "learning_rate": 9.756960218054383e-05, - "loss": 0.0317, + "epoch": 0.81, + "learning_rate": 0.00017920574168855727, + "loss": 0.0441, "step": 124770 }, { - "epoch": 1.35, - "learning_rate": 9.755337789603477e-05, - "loss": 0.0311, + "epoch": 0.81, + "learning_rate": 0.00017919606033420035, + "loss": 0.0433, "step": 124780 }, { - "epoch": 1.35, - "learning_rate": 9.753715361152572e-05, - "loss": 0.0342, + "epoch": 0.81, + "learning_rate": 0.00017918637897984343, + "loss": 0.0525, "step": 124790 }, { - "epoch": 1.35, - "learning_rate": 9.752092932701667e-05, - "loss": 0.0304, + "epoch": 0.81, + "learning_rate": 0.00017917669762548648, + "loss": 0.0428, "step": 124800 }, { - "epoch": 1.35, - "learning_rate": 9.750470504250762e-05, - "loss": 0.0309, + "epoch": 0.81, + "learning_rate": 0.00017916701627112953, + "loss": 0.0408, "step": 124810 }, { - "epoch": 1.35, - "learning_rate": 9.748848075799855e-05, - "loss": 0.0352, + "epoch": 0.81, + "learning_rate": 0.0001791573349167726, + "loss": 0.0453, "step": 124820 }, { - "epoch": 1.35, - "learning_rate": 9.74722564734895e-05, - "loss": 0.0342, + "epoch": 0.81, + "learning_rate": 0.00017914765356241566, + "loss": 0.0426, "step": 124830 }, { - "epoch": 1.35, - "learning_rate": 9.745603218898045e-05, - "loss": 0.0354, + "epoch": 0.81, + "learning_rate": 0.00017913797220805874, + "loss": 0.0424, "step": 124840 }, { - "epoch": 1.35, - "learning_rate": 9.74398079044714e-05, - "loss": 0.0345, + "epoch": 0.81, + "learning_rate": 0.00017912829085370182, + "loss": 0.0411, "step": 124850 }, { - "epoch": 1.35, - "learning_rate": 9.742358361996235e-05, - "loss": 0.0304, + "epoch": 0.81, + "learning_rate": 0.00017911860949934488, + "loss": 0.0396, "step": 124860 }, { - "epoch": 1.35, - "learning_rate": 9.740735933545329e-05, - "loss": 0.035, + "epoch": 0.81, + "learning_rate": 0.00017910892814498796, + "loss": 0.039, "step": 124870 }, { - "epoch": 1.35, - "learning_rate": 9.739113505094424e-05, - "loss": 0.0361, + "epoch": 0.81, + "learning_rate": 0.000179099246790631, + "loss": 0.0395, "step": 124880 }, { - "epoch": 1.35, - "learning_rate": 9.737491076643519e-05, - "loss": 0.037, + "epoch": 0.81, + "learning_rate": 0.00017908956543627406, + "loss": 0.0391, "step": 124890 }, { - "epoch": 1.35, - "learning_rate": 9.735868648192614e-05, - "loss": 0.0284, + "epoch": 0.81, + "learning_rate": 0.00017907988408191714, + "loss": 0.0425, "step": 124900 }, { - "epoch": 1.35, - "learning_rate": 9.734246219741708e-05, - "loss": 0.0302, + "epoch": 0.81, + "learning_rate": 0.00017907020272756022, + "loss": 0.0445, "step": 124910 }, { - "epoch": 1.35, - "learning_rate": 9.732623791290803e-05, - "loss": 0.0292, + "epoch": 0.81, + "learning_rate": 0.0001790605213732033, + "loss": 0.0444, "step": 124920 }, { - "epoch": 1.35, - "learning_rate": 9.731001362839898e-05, - "loss": 0.0281, + "epoch": 0.81, + "learning_rate": 0.00017905084001884635, + "loss": 0.0433, "step": 124930 }, { - "epoch": 1.35, - "learning_rate": 9.729378934388993e-05, - "loss": 0.0349, + "epoch": 0.81, + "learning_rate": 0.00017904115866448943, + "loss": 0.0423, "step": 124940 }, { - "epoch": 1.35, - "learning_rate": 9.727756505938087e-05, - "loss": 0.034, + "epoch": 0.81, + "learning_rate": 0.00017903147731013249, + "loss": 0.0402, "step": 124950 }, { - "epoch": 1.35, - "learning_rate": 9.726134077487181e-05, - "loss": 0.032, + "epoch": 0.81, + "learning_rate": 0.00017902179595577554, + "loss": 0.0404, "step": 124960 }, { - "epoch": 1.35, - "learning_rate": 9.724511649036276e-05, - "loss": 0.0271, + "epoch": 0.81, + "learning_rate": 0.00017901211460141862, + "loss": 0.0447, "step": 124970 }, { - "epoch": 1.35, - "learning_rate": 9.722889220585371e-05, - "loss": 0.0284, + "epoch": 0.81, + "learning_rate": 0.0001790024332470617, + "loss": 0.0517, "step": 124980 }, { - "epoch": 1.35, - "learning_rate": 9.721266792134466e-05, - "loss": 0.0331, + "epoch": 0.81, + "learning_rate": 0.00017899275189270478, + "loss": 0.0411, "step": 124990 }, { - "epoch": 1.35, - "learning_rate": 9.71964436368356e-05, - "loss": 0.0303, + "epoch": 0.81, + "learning_rate": 0.00017898307053834783, + "loss": 0.0461, "step": 125000 }, { - "epoch": 1.35, - "eval_cer": 0.9211331216504901, - "eval_loss": 0.025354767218232155, - "eval_runtime": 118.9816, - "eval_samples_per_second": 16.809, - "eval_steps_per_second": 4.202, + "epoch": 0.81, + "eval_cer": 0.919931307196927, + "eval_loss": 0.028672238811850548, + "eval_runtime": 120.0797, + "eval_samples_per_second": 16.656, + "eval_steps_per_second": 4.164, "step": 125000 }, { - "epoch": 1.35, - "learning_rate": 9.718021935232655e-05, - "loss": 0.0296, + "epoch": 0.81, + "learning_rate": 0.0001789733891839909, + "loss": 0.0371, "step": 125010 }, { - "epoch": 1.35, - "learning_rate": 9.71639950678175e-05, - "loss": 0.0277, + "epoch": 0.81, + "learning_rate": 0.00017896370782963396, + "loss": 0.0457, "step": 125020 }, { - "epoch": 1.35, - "learning_rate": 9.714777078330845e-05, - "loss": 0.03, + "epoch": 0.81, + "learning_rate": 0.00017895402647527702, + "loss": 0.0354, "step": 125030 }, { - "epoch": 1.35, - "learning_rate": 9.71315464987994e-05, - "loss": 0.0337, + "epoch": 0.81, + "learning_rate": 0.0001789443451209201, + "loss": 0.0426, "step": 125040 }, { - "epoch": 1.35, - "learning_rate": 9.711532221429033e-05, - "loss": 0.0276, + "epoch": 0.81, + "learning_rate": 0.00017893466376656318, + "loss": 0.0381, "step": 125050 }, { - "epoch": 1.35, - "learning_rate": 9.709909792978128e-05, - "loss": 0.0296, + "epoch": 0.81, + "learning_rate": 0.00017892498241220623, + "loss": 0.0444, "step": 125060 }, { - "epoch": 1.35, - "learning_rate": 9.708287364527223e-05, - "loss": 0.0316, + "epoch": 0.81, + "learning_rate": 0.0001789153010578493, + "loss": 0.0395, "step": 125070 }, { - "epoch": 1.35, - "learning_rate": 9.706664936076318e-05, - "loss": 0.0305, + "epoch": 0.81, + "learning_rate": 0.0001789056197034924, + "loss": 0.042, "step": 125080 }, { - "epoch": 1.35, - "learning_rate": 9.705042507625412e-05, - "loss": 0.0274, + "epoch": 0.81, + "learning_rate": 0.00017889593834913541, + "loss": 0.0374, "step": 125090 }, { - "epoch": 1.35, - "learning_rate": 9.703420079174507e-05, - "loss": 0.0287, + "epoch": 0.81, + "learning_rate": 0.0001788862569947785, + "loss": 0.0452, "step": 125100 }, { - "epoch": 1.35, - "learning_rate": 9.701797650723602e-05, - "loss": 0.0306, + "epoch": 0.81, + "learning_rate": 0.00017887657564042157, + "loss": 0.0428, "step": 125110 }, { - "epoch": 1.35, - "learning_rate": 9.700175222272697e-05, - "loss": 0.0296, + "epoch": 0.81, + "learning_rate": 0.00017886689428606465, + "loss": 0.041, "step": 125120 }, { - "epoch": 1.35, - "learning_rate": 9.698552793821792e-05, - "loss": 0.0333, + "epoch": 0.81, + "learning_rate": 0.0001788572129317077, + "loss": 0.0412, "step": 125130 }, { - "epoch": 1.35, - "learning_rate": 9.696930365370885e-05, - "loss": 0.0285, + "epoch": 0.81, + "learning_rate": 0.00017884753157735079, + "loss": 0.0368, "step": 125140 }, { - "epoch": 1.35, - "learning_rate": 9.69530793691998e-05, - "loss": 0.0296, + "epoch": 0.81, + "learning_rate": 0.00017883785022299387, + "loss": 0.0437, "step": 125150 }, { - "epoch": 1.35, - "learning_rate": 9.693685508469075e-05, - "loss": 0.0284, + "epoch": 0.81, + "learning_rate": 0.0001788281688686369, + "loss": 0.0453, "step": 125160 }, { - "epoch": 1.35, - "learning_rate": 9.69206308001817e-05, - "loss": 0.0328, + "epoch": 0.81, + "learning_rate": 0.00017881848751427997, + "loss": 0.0439, "step": 125170 }, { - "epoch": 1.35, - "learning_rate": 9.690440651567264e-05, - "loss": 0.0292, + "epoch": 0.81, + "learning_rate": 0.00017880880615992305, + "loss": 0.0397, "step": 125180 }, { - "epoch": 1.35, - "learning_rate": 9.688818223116359e-05, - "loss": 0.0293, + "epoch": 0.81, + "learning_rate": 0.00017879912480556613, + "loss": 0.0423, "step": 125190 }, { - "epoch": 1.35, - "learning_rate": 9.687195794665454e-05, - "loss": 0.0401, + "epoch": 0.81, + "learning_rate": 0.00017878944345120918, + "loss": 0.0392, "step": 125200 }, { - "epoch": 1.35, - "learning_rate": 9.685573366214549e-05, - "loss": 0.0311, + "epoch": 0.81, + "learning_rate": 0.00017877976209685226, + "loss": 0.0431, "step": 125210 }, { - "epoch": 1.35, - "learning_rate": 9.683950937763644e-05, - "loss": 0.0292, + "epoch": 0.81, + "learning_rate": 0.00017877008074249534, + "loss": 0.0365, "step": 125220 }, { - "epoch": 1.35, - "learning_rate": 9.682328509312737e-05, - "loss": 0.0283, + "epoch": 0.81, + "learning_rate": 0.00017876039938813837, + "loss": 0.0379, "step": 125230 }, { - "epoch": 1.35, - "learning_rate": 9.680706080861832e-05, - "loss": 0.0278, + "epoch": 0.81, + "learning_rate": 0.00017875071803378145, + "loss": 0.0404, "step": 125240 }, { - "epoch": 1.35, - "learning_rate": 9.679083652410927e-05, - "loss": 0.0306, + "epoch": 0.81, + "learning_rate": 0.00017874103667942453, + "loss": 0.047, "step": 125250 }, { - "epoch": 1.35, - "learning_rate": 9.677461223960022e-05, - "loss": 0.0327, + "epoch": 0.81, + "learning_rate": 0.00017873135532506758, + "loss": 0.0412, "step": 125260 }, { - "epoch": 1.35, - "learning_rate": 9.675838795509116e-05, - "loss": 0.0298, + "epoch": 0.81, + "learning_rate": 0.00017872167397071066, + "loss": 0.0474, "step": 125270 }, { - "epoch": 1.36, - "learning_rate": 9.674216367058211e-05, - "loss": 0.0365, + "epoch": 0.81, + "learning_rate": 0.00017871199261635374, + "loss": 0.0445, "step": 125280 }, { - "epoch": 1.36, - "learning_rate": 9.672593938607306e-05, - "loss": 0.037, + "epoch": 0.81, + "learning_rate": 0.00017870231126199682, + "loss": 0.0489, "step": 125290 }, { - "epoch": 1.36, - "learning_rate": 9.670971510156401e-05, - "loss": 0.0283, + "epoch": 0.81, + "learning_rate": 0.00017869262990763985, + "loss": 0.0441, "step": 125300 }, { - "epoch": 1.36, - "learning_rate": 9.669349081705496e-05, - "loss": 0.033, + "epoch": 0.81, + "learning_rate": 0.00017868294855328293, + "loss": 0.0384, "step": 125310 }, { - "epoch": 1.36, - "learning_rate": 9.66772665325459e-05, - "loss": 0.0297, + "epoch": 0.81, + "learning_rate": 0.000178673267198926, + "loss": 0.0399, "step": 125320 }, { - "epoch": 1.36, - "learning_rate": 9.666104224803684e-05, - "loss": 0.0307, + "epoch": 0.81, + "learning_rate": 0.00017866358584456906, + "loss": 0.0445, "step": 125330 }, { - "epoch": 1.36, - "learning_rate": 9.66448179635278e-05, - "loss": 0.0309, + "epoch": 0.81, + "learning_rate": 0.00017865390449021214, + "loss": 0.0402, "step": 125340 }, { - "epoch": 1.36, - "learning_rate": 9.662859367901874e-05, - "loss": 0.0335, + "epoch": 0.81, + "learning_rate": 0.00017864422313585522, + "loss": 0.0436, "step": 125350 }, { - "epoch": 1.36, - "learning_rate": 9.661236939450968e-05, - "loss": 0.0372, + "epoch": 0.81, + "learning_rate": 0.0001786345417814983, + "loss": 0.0434, "step": 125360 }, { - "epoch": 1.36, - "learning_rate": 9.659614511000063e-05, - "loss": 0.0306, + "epoch": 0.81, + "learning_rate": 0.00017862486042714132, + "loss": 0.04, "step": 125370 }, { - "epoch": 1.36, - "learning_rate": 9.657992082549158e-05, - "loss": 0.028, + "epoch": 0.81, + "learning_rate": 0.0001786151790727844, + "loss": 0.0415, "step": 125380 }, { - "epoch": 1.36, - "learning_rate": 9.656369654098253e-05, - "loss": 0.0305, + "epoch": 0.81, + "learning_rate": 0.00017860549771842748, + "loss": 0.0509, "step": 125390 }, { - "epoch": 1.36, - "learning_rate": 9.654747225647348e-05, - "loss": 0.0295, + "epoch": 0.81, + "learning_rate": 0.00017859581636407053, + "loss": 0.0459, "step": 125400 }, { - "epoch": 1.36, - "learning_rate": 9.653124797196442e-05, - "loss": 0.0344, + "epoch": 0.81, + "learning_rate": 0.00017858613500971361, + "loss": 0.0464, "step": 125410 }, { - "epoch": 1.36, - "learning_rate": 9.651502368745537e-05, - "loss": 0.034, + "epoch": 0.81, + "learning_rate": 0.0001785764536553567, + "loss": 0.0423, "step": 125420 }, { - "epoch": 1.36, - "learning_rate": 9.649879940294631e-05, - "loss": 0.037, + "epoch": 0.81, + "learning_rate": 0.00017856677230099977, + "loss": 0.0398, "step": 125430 }, { - "epoch": 1.36, - "learning_rate": 9.648257511843726e-05, - "loss": 0.0361, + "epoch": 0.81, + "learning_rate": 0.0001785570909466428, + "loss": 0.0365, "step": 125440 }, { - "epoch": 1.36, - "learning_rate": 9.646635083392821e-05, - "loss": 0.0278, + "epoch": 0.81, + "learning_rate": 0.00017854740959228588, + "loss": 0.0468, "step": 125450 }, { - "epoch": 1.36, - "learning_rate": 9.645012654941915e-05, - "loss": 0.0275, + "epoch": 0.81, + "learning_rate": 0.00017853772823792893, + "loss": 0.0423, "step": 125460 }, { - "epoch": 1.36, - "learning_rate": 9.64339022649101e-05, - "loss": 0.0283, + "epoch": 0.81, + "learning_rate": 0.000178528046883572, + "loss": 0.0511, "step": 125470 }, { - "epoch": 1.36, - "learning_rate": 9.641767798040105e-05, - "loss": 0.0374, + "epoch": 0.81, + "learning_rate": 0.0001785183655292151, + "loss": 0.0347, "step": 125480 }, { - "epoch": 1.36, - "learning_rate": 9.6401453695892e-05, - "loss": 0.0368, + "epoch": 0.81, + "learning_rate": 0.00017850868417485817, + "loss": 0.0416, "step": 125490 }, { - "epoch": 1.36, - "learning_rate": 9.638522941138294e-05, - "loss": 0.0299, + "epoch": 0.81, + "learning_rate": 0.00017849900282050122, + "loss": 0.0417, "step": 125500 }, { - "epoch": 1.36, - "learning_rate": 9.636900512687389e-05, - "loss": 0.033, + "epoch": 0.81, + "learning_rate": 0.00017848932146614428, + "loss": 0.0377, "step": 125510 }, { - "epoch": 1.36, - "learning_rate": 9.635278084236484e-05, - "loss": 0.0369, + "epoch": 0.81, + "learning_rate": 0.00017847964011178736, + "loss": 0.0468, "step": 125520 }, { - "epoch": 1.36, - "learning_rate": 9.633655655785579e-05, - "loss": 0.0328, + "epoch": 0.81, + "learning_rate": 0.0001784699587574304, + "loss": 0.0344, "step": 125530 }, { - "epoch": 1.36, - "learning_rate": 9.632033227334674e-05, - "loss": 0.0338, + "epoch": 0.81, + "learning_rate": 0.0001784602774030735, + "loss": 0.0398, "step": 125540 }, { - "epoch": 1.36, - "learning_rate": 9.63041079888377e-05, - "loss": 0.0308, + "epoch": 0.81, + "learning_rate": 0.00017845059604871657, + "loss": 0.0382, "step": 125550 }, { - "epoch": 1.36, - "learning_rate": 9.628788370432863e-05, - "loss": 0.0324, + "epoch": 0.81, + "learning_rate": 0.00017844091469435965, + "loss": 0.0548, "step": 125560 }, { - "epoch": 1.36, - "learning_rate": 9.627165941981958e-05, - "loss": 0.0311, + "epoch": 0.81, + "learning_rate": 0.0001784312333400027, + "loss": 0.0423, "step": 125570 }, { - "epoch": 1.36, - "learning_rate": 9.625543513531053e-05, - "loss": 0.0325, + "epoch": 0.81, + "learning_rate": 0.00017842155198564575, + "loss": 0.0403, "step": 125580 }, { - "epoch": 1.36, - "learning_rate": 9.623921085080148e-05, - "loss": 0.0307, + "epoch": 0.81, + "learning_rate": 0.00017841187063128883, + "loss": 0.0381, "step": 125590 }, { - "epoch": 1.36, - "learning_rate": 9.622298656629242e-05, - "loss": 0.0338, + "epoch": 0.81, + "learning_rate": 0.0001784021892769319, + "loss": 0.0379, "step": 125600 }, { - "epoch": 1.36, - "learning_rate": 9.620676228178337e-05, - "loss": 0.0341, + "epoch": 0.81, + "learning_rate": 0.00017839250792257497, + "loss": 0.0523, "step": 125610 }, { - "epoch": 1.36, - "learning_rate": 9.619053799727432e-05, - "loss": 0.0363, + "epoch": 0.81, + "learning_rate": 0.00017838282656821805, + "loss": 0.0426, "step": 125620 }, { - "epoch": 1.36, - "learning_rate": 9.617431371276527e-05, - "loss": 0.0316, + "epoch": 0.81, + "learning_rate": 0.00017837314521386113, + "loss": 0.0366, "step": 125630 }, { - "epoch": 1.36, - "learning_rate": 9.615808942825622e-05, - "loss": 0.0286, + "epoch": 0.81, + "learning_rate": 0.00017836346385950418, + "loss": 0.0448, "step": 125640 }, { - "epoch": 1.36, - "learning_rate": 9.614186514374716e-05, - "loss": 0.0337, + "epoch": 0.81, + "learning_rate": 0.00017835378250514723, + "loss": 0.0405, "step": 125650 }, { - "epoch": 1.36, - "learning_rate": 9.61256408592381e-05, - "loss": 0.0347, + "epoch": 0.81, + "learning_rate": 0.00017834410115079028, + "loss": 0.0473, "step": 125660 }, { - "epoch": 1.36, - "learning_rate": 9.610941657472906e-05, - "loss": 0.0269, + "epoch": 0.81, + "learning_rate": 0.00017833441979643336, + "loss": 0.0437, "step": 125670 }, { - "epoch": 1.36, - "learning_rate": 9.609319229022e-05, - "loss": 0.0398, + "epoch": 0.81, + "learning_rate": 0.00017832473844207644, + "loss": 0.042, "step": 125680 }, { - "epoch": 1.36, - "learning_rate": 9.607696800571094e-05, - "loss": 0.0329, + "epoch": 0.81, + "learning_rate": 0.00017831505708771952, + "loss": 0.0476, "step": 125690 }, { - "epoch": 1.36, - "learning_rate": 9.606074372120189e-05, - "loss": 0.0339, + "epoch": 0.81, + "learning_rate": 0.00017830537573336258, + "loss": 0.0426, "step": 125700 }, { - "epoch": 1.36, - "learning_rate": 9.604451943669284e-05, - "loss": 0.0275, + "epoch": 0.81, + "learning_rate": 0.00017829569437900566, + "loss": 0.0395, "step": 125710 }, { - "epoch": 1.36, - "learning_rate": 9.602829515218379e-05, - "loss": 0.0424, + "epoch": 0.81, + "learning_rate": 0.0001782860130246487, + "loss": 0.0485, "step": 125720 }, { - "epoch": 1.36, - "learning_rate": 9.601207086767474e-05, - "loss": 0.0329, + "epoch": 0.81, + "learning_rate": 0.00017827633167029176, + "loss": 0.0394, "step": 125730 }, { - "epoch": 1.36, - "learning_rate": 9.599584658316568e-05, - "loss": 0.0305, + "epoch": 0.81, + "learning_rate": 0.00017826665031593484, + "loss": 0.0453, "step": 125740 }, { - "epoch": 1.36, - "learning_rate": 9.597962229865663e-05, - "loss": 0.0264, + "epoch": 0.81, + "learning_rate": 0.00017825696896157792, + "loss": 0.0397, "step": 125750 }, { - "epoch": 1.36, - "learning_rate": 9.596339801414758e-05, - "loss": 0.0292, + "epoch": 0.81, + "learning_rate": 0.000178247287607221, + "loss": 0.0425, "step": 125760 }, { - "epoch": 1.36, - "learning_rate": 9.594717372963853e-05, - "loss": 0.0268, + "epoch": 0.81, + "learning_rate": 0.00017823760625286405, + "loss": 0.0426, "step": 125770 }, { - "epoch": 1.36, - "learning_rate": 9.593094944512946e-05, - "loss": 0.0319, + "epoch": 0.81, + "learning_rate": 0.00017822792489850713, + "loss": 0.0425, "step": 125780 }, { - "epoch": 1.36, - "learning_rate": 9.591472516062041e-05, - "loss": 0.0367, + "epoch": 0.81, + "learning_rate": 0.00017821824354415019, + "loss": 0.0471, "step": 125790 }, { - "epoch": 1.36, - "learning_rate": 9.589850087611136e-05, - "loss": 0.0314, + "epoch": 0.81, + "learning_rate": 0.00017820856218979324, + "loss": 0.0445, "step": 125800 }, { - "epoch": 1.36, - "learning_rate": 9.588227659160231e-05, - "loss": 0.0373, + "epoch": 0.81, + "learning_rate": 0.00017819888083543632, + "loss": 0.0416, "step": 125810 }, { - "epoch": 1.36, - "learning_rate": 9.586605230709326e-05, - "loss": 0.0342, + "epoch": 0.81, + "learning_rate": 0.0001781891994810794, + "loss": 0.0448, "step": 125820 }, { - "epoch": 1.36, - "learning_rate": 9.58498280225842e-05, - "loss": 0.0322, + "epoch": 0.81, + "learning_rate": 0.00017817951812672248, + "loss": 0.0356, "step": 125830 }, { - "epoch": 1.36, - "learning_rate": 9.583360373807515e-05, - "loss": 0.0292, + "epoch": 0.81, + "learning_rate": 0.00017816983677236553, + "loss": 0.0406, "step": 125840 }, { - "epoch": 1.36, - "learning_rate": 9.58173794535661e-05, - "loss": 0.0322, + "epoch": 0.81, + "learning_rate": 0.0001781601554180086, + "loss": 0.0399, "step": 125850 }, { - "epoch": 1.36, - "learning_rate": 9.580115516905705e-05, - "loss": 0.0324, + "epoch": 0.81, + "learning_rate": 0.00017815047406365164, + "loss": 0.0423, "step": 125860 }, { - "epoch": 1.36, - "learning_rate": 9.578493088454798e-05, - "loss": 0.0319, + "epoch": 0.81, + "learning_rate": 0.00017814079270929472, + "loss": 0.0316, "step": 125870 }, { - "epoch": 1.36, - "learning_rate": 9.576870660003893e-05, - "loss": 0.0311, + "epoch": 0.81, + "learning_rate": 0.0001781311113549378, + "loss": 0.0393, "step": 125880 }, { - "epoch": 1.36, - "learning_rate": 9.575248231552988e-05, - "loss": 0.034, + "epoch": 0.81, + "learning_rate": 0.00017812143000058088, + "loss": 0.0367, "step": 125890 }, { - "epoch": 1.36, - "learning_rate": 9.573625803102083e-05, - "loss": 0.0273, + "epoch": 0.81, + "learning_rate": 0.00017811174864622393, + "loss": 0.0407, "step": 125900 }, { - "epoch": 1.36, - "learning_rate": 9.572003374651178e-05, - "loss": 0.0313, + "epoch": 0.81, + "learning_rate": 0.000178102067291867, + "loss": 0.0402, "step": 125910 }, { - "epoch": 1.36, - "learning_rate": 9.570380946200272e-05, - "loss": 0.0331, + "epoch": 0.81, + "learning_rate": 0.0001780923859375101, + "loss": 0.0401, "step": 125920 }, { - "epoch": 1.36, - "learning_rate": 9.568758517749367e-05, - "loss": 0.0275, + "epoch": 0.81, + "learning_rate": 0.0001780827045831531, + "loss": 0.0376, "step": 125930 }, { - "epoch": 1.36, - "learning_rate": 9.567136089298462e-05, - "loss": 0.0357, + "epoch": 0.81, + "learning_rate": 0.0001780730232287962, + "loss": 0.0445, "step": 125940 }, { - "epoch": 1.36, - "learning_rate": 9.565513660847557e-05, - "loss": 0.0353, + "epoch": 0.81, + "learning_rate": 0.00017806334187443927, + "loss": 0.0395, "step": 125950 }, { - "epoch": 1.36, - "learning_rate": 9.56389123239665e-05, - "loss": 0.0335, + "epoch": 0.81, + "learning_rate": 0.00017805366052008235, + "loss": 0.0363, "step": 125960 }, { - "epoch": 1.36, - "learning_rate": 9.562268803945745e-05, - "loss": 0.0288, + "epoch": 0.81, + "learning_rate": 0.0001780439791657254, + "loss": 0.0429, "step": 125970 }, { - "epoch": 1.36, - "learning_rate": 9.56064637549484e-05, - "loss": 0.0314, + "epoch": 0.81, + "learning_rate": 0.00017803429781136849, + "loss": 0.0444, "step": 125980 }, { - "epoch": 1.36, - "learning_rate": 9.559023947043935e-05, - "loss": 0.0313, + "epoch": 0.81, + "learning_rate": 0.00017802461645701156, + "loss": 0.0455, "step": 125990 }, { - "epoch": 1.36, - "learning_rate": 9.55740151859303e-05, - "loss": 0.0292, + "epoch": 0.81, + "learning_rate": 0.0001780149351026546, + "loss": 0.0433, "step": 126000 }, { - "epoch": 1.36, - "eval_cer": 0.9210739282009962, - "eval_loss": 0.024977944791316986, - "eval_runtime": 118.9233, - "eval_samples_per_second": 16.818, - "eval_steps_per_second": 4.204, + "epoch": 0.81, + "eval_cer": 0.9197939215907807, + "eval_loss": 0.029015522450208664, + "eval_runtime": 119.846, + "eval_samples_per_second": 16.688, + "eval_steps_per_second": 4.172, "step": 126000 }, { - "epoch": 1.36, - "learning_rate": 9.555779090142124e-05, - "loss": 0.028, + "epoch": 0.81, + "learning_rate": 0.00017800525374829767, + "loss": 0.041, "step": 126010 }, { - "epoch": 1.36, - "learning_rate": 9.554156661691219e-05, - "loss": 0.0311, + "epoch": 0.81, + "learning_rate": 0.00017799557239394075, + "loss": 0.0422, "step": 126020 }, { - "epoch": 1.36, - "learning_rate": 9.552534233240314e-05, - "loss": 0.0339, + "epoch": 0.81, + "learning_rate": 0.00017798589103958383, + "loss": 0.0416, "step": 126030 }, { - "epoch": 1.36, - "learning_rate": 9.550911804789409e-05, - "loss": 0.0334, + "epoch": 0.81, + "learning_rate": 0.00017797620968522688, + "loss": 0.0384, "step": 126040 }, { - "epoch": 1.36, - "learning_rate": 9.549289376338502e-05, - "loss": 0.0304, + "epoch": 0.81, + "learning_rate": 0.00017796652833086996, + "loss": 0.0471, "step": 126050 }, { - "epoch": 1.36, - "learning_rate": 9.547666947887597e-05, - "loss": 0.0382, + "epoch": 0.81, + "learning_rate": 0.00017795684697651304, + "loss": 0.0389, "step": 126060 }, { - "epoch": 1.36, - "learning_rate": 9.546044519436692e-05, - "loss": 0.0377, + "epoch": 0.81, + "learning_rate": 0.00017794716562215607, + "loss": 0.0447, "step": 126070 }, { - "epoch": 1.36, - "learning_rate": 9.544422090985787e-05, - "loss": 0.0339, + "epoch": 0.81, + "learning_rate": 0.00017793748426779915, + "loss": 0.0411, "step": 126080 }, { - "epoch": 1.36, - "learning_rate": 9.542799662534882e-05, - "loss": 0.0346, + "epoch": 0.81, + "learning_rate": 0.00017792780291344223, + "loss": 0.0413, "step": 126090 }, { - "epoch": 1.36, - "learning_rate": 9.541177234083976e-05, - "loss": 0.0327, + "epoch": 0.81, + "learning_rate": 0.00017791812155908528, + "loss": 0.0375, "step": 126100 }, { - "epoch": 1.36, - "learning_rate": 9.539554805633071e-05, - "loss": 0.0364, + "epoch": 0.81, + "learning_rate": 0.00017790844020472836, + "loss": 0.0353, "step": 126110 }, { - "epoch": 1.36, - "learning_rate": 9.537932377182166e-05, - "loss": 0.028, + "epoch": 0.81, + "learning_rate": 0.00017789875885037144, + "loss": 0.039, "step": 126120 }, { - "epoch": 1.36, - "learning_rate": 9.536309948731261e-05, - "loss": 0.0373, + "epoch": 0.81, + "learning_rate": 0.00017788907749601452, + "loss": 0.0429, "step": 126130 }, { - "epoch": 1.36, - "learning_rate": 9.534687520280356e-05, - "loss": 0.0248, + "epoch": 0.81, + "learning_rate": 0.00017787939614165755, + "loss": 0.0418, "step": 126140 }, { - "epoch": 1.36, - "learning_rate": 9.53306509182945e-05, - "loss": 0.0365, + "epoch": 0.81, + "learning_rate": 0.00017786971478730062, + "loss": 0.0367, "step": 126150 }, { - "epoch": 1.36, - "learning_rate": 9.531442663378544e-05, - "loss": 0.0335, + "epoch": 0.81, + "learning_rate": 0.0001778600334329437, + "loss": 0.0382, "step": 126160 }, { - "epoch": 1.36, - "learning_rate": 9.52982023492764e-05, - "loss": 0.0303, + "epoch": 0.81, + "learning_rate": 0.00017785035207858676, + "loss": 0.041, "step": 126170 }, { - "epoch": 1.36, - "learning_rate": 9.528197806476734e-05, - "loss": 0.0288, + "epoch": 0.81, + "learning_rate": 0.00017784067072422984, + "loss": 0.0396, "step": 126180 }, { - "epoch": 1.36, - "learning_rate": 9.526575378025828e-05, - "loss": 0.0318, + "epoch": 0.81, + "learning_rate": 0.00017783098936987292, + "loss": 0.0366, "step": 126190 }, { - "epoch": 1.36, - "learning_rate": 9.524952949574923e-05, - "loss": 0.0293, + "epoch": 0.81, + "learning_rate": 0.000177821308015516, + "loss": 0.0409, "step": 126200 }, { - "epoch": 1.37, - "learning_rate": 9.523330521124018e-05, - "loss": 0.0267, + "epoch": 0.81, + "learning_rate": 0.00017781162666115902, + "loss": 0.0422, "step": 126210 }, { - "epoch": 1.37, - "learning_rate": 9.521708092673113e-05, - "loss": 0.0238, + "epoch": 0.81, + "learning_rate": 0.0001778019453068021, + "loss": 0.045, "step": 126220 }, { - "epoch": 1.37, - "learning_rate": 9.520085664222208e-05, - "loss": 0.0348, + "epoch": 0.81, + "learning_rate": 0.00017779226395244518, + "loss": 0.0449, "step": 126230 }, { - "epoch": 1.37, - "learning_rate": 9.518463235771302e-05, - "loss": 0.0343, + "epoch": 0.81, + "learning_rate": 0.00017778258259808823, + "loss": 0.0432, "step": 126240 }, { - "epoch": 1.37, - "learning_rate": 9.516840807320397e-05, - "loss": 0.0301, + "epoch": 0.81, + "learning_rate": 0.00017777290124373131, + "loss": 0.0409, "step": 126250 }, { - "epoch": 1.37, - "learning_rate": 9.515218378869492e-05, - "loss": 0.0348, + "epoch": 0.81, + "learning_rate": 0.0001777632198893744, + "loss": 0.0451, "step": 126260 }, { - "epoch": 1.37, - "learning_rate": 9.513595950418587e-05, - "loss": 0.0278, + "epoch": 0.81, + "learning_rate": 0.00017775353853501745, + "loss": 0.0413, "step": 126270 }, { - "epoch": 1.37, - "learning_rate": 9.51197352196768e-05, - "loss": 0.0333, + "epoch": 0.82, + "learning_rate": 0.0001777438571806605, + "loss": 0.041, "step": 126280 }, { - "epoch": 1.37, - "learning_rate": 9.510351093516775e-05, - "loss": 0.0263, + "epoch": 0.82, + "learning_rate": 0.00017773417582630358, + "loss": 0.0451, "step": 126290 }, { - "epoch": 1.37, - "learning_rate": 9.50872866506587e-05, - "loss": 0.0339, + "epoch": 0.82, + "learning_rate": 0.00017772449447194663, + "loss": 0.0415, "step": 126300 }, { - "epoch": 1.37, - "learning_rate": 9.507106236614965e-05, - "loss": 0.0266, + "epoch": 0.82, + "learning_rate": 0.0001777148131175897, + "loss": 0.0458, "step": 126310 }, { - "epoch": 1.37, - "learning_rate": 9.50548380816406e-05, - "loss": 0.039, + "epoch": 0.82, + "learning_rate": 0.0001777051317632328, + "loss": 0.038, "step": 126320 }, { - "epoch": 1.37, - "learning_rate": 9.503861379713154e-05, - "loss": 0.0313, + "epoch": 0.82, + "learning_rate": 0.00017769545040887587, + "loss": 0.0371, "step": 126330 }, { - "epoch": 1.37, - "learning_rate": 9.502238951262249e-05, - "loss": 0.028, + "epoch": 0.82, + "learning_rate": 0.00017768576905451892, + "loss": 0.0388, "step": 126340 }, { - "epoch": 1.37, - "learning_rate": 9.500616522811344e-05, - "loss": 0.0371, + "epoch": 0.82, + "learning_rate": 0.00017767608770016198, + "loss": 0.0419, "step": 126350 }, { - "epoch": 1.37, - "learning_rate": 9.498994094360439e-05, - "loss": 0.0368, + "epoch": 0.82, + "learning_rate": 0.00017766640634580506, + "loss": 0.0479, "step": 126360 }, { - "epoch": 1.37, - "learning_rate": 9.497371665909532e-05, - "loss": 0.0362, + "epoch": 0.82, + "learning_rate": 0.0001776567249914481, + "loss": 0.0361, "step": 126370 }, { - "epoch": 1.37, - "learning_rate": 9.495749237458627e-05, - "loss": 0.0344, + "epoch": 0.82, + "learning_rate": 0.0001776470436370912, + "loss": 0.0462, "step": 126380 }, { - "epoch": 1.37, - "learning_rate": 9.494126809007722e-05, - "loss": 0.0342, + "epoch": 0.82, + "learning_rate": 0.00017763736228273427, + "loss": 0.0452, "step": 126390 }, { - "epoch": 1.37, - "learning_rate": 9.492504380556817e-05, - "loss": 0.0315, + "epoch": 0.82, + "learning_rate": 0.00017762768092837735, + "loss": 0.0508, "step": 126400 }, { - "epoch": 1.37, - "learning_rate": 9.490881952105912e-05, - "loss": 0.0291, + "epoch": 0.82, + "learning_rate": 0.0001776179995740204, + "loss": 0.0408, "step": 126410 }, { - "epoch": 1.37, - "learning_rate": 9.489259523655006e-05, - "loss": 0.0338, + "epoch": 0.82, + "learning_rate": 0.00017760831821966345, + "loss": 0.0406, "step": 126420 }, { - "epoch": 1.37, - "learning_rate": 9.487637095204101e-05, - "loss": 0.0294, + "epoch": 0.82, + "learning_rate": 0.00017759863686530653, + "loss": 0.039, "step": 126430 }, { - "epoch": 1.37, - "learning_rate": 9.486014666753196e-05, - "loss": 0.027, + "epoch": 0.82, + "learning_rate": 0.00017758895551094959, + "loss": 0.0394, "step": 126440 }, { - "epoch": 1.37, - "learning_rate": 9.484392238302291e-05, - "loss": 0.0279, + "epoch": 0.82, + "learning_rate": 0.00017757927415659267, + "loss": 0.0464, "step": 126450 }, { - "epoch": 1.37, - "learning_rate": 9.482769809851384e-05, - "loss": 0.029, + "epoch": 0.82, + "learning_rate": 0.00017756959280223575, + "loss": 0.0538, "step": 126460 }, { - "epoch": 1.37, - "learning_rate": 9.481147381400479e-05, - "loss": 0.0289, + "epoch": 0.82, + "learning_rate": 0.0001775599114478788, + "loss": 0.039, "step": 126470 }, { - "epoch": 1.37, - "learning_rate": 9.479524952949574e-05, - "loss": 0.0364, + "epoch": 0.82, + "learning_rate": 0.00017755023009352188, + "loss": 0.0411, "step": 126480 }, { - "epoch": 1.37, - "learning_rate": 9.477902524498669e-05, - "loss": 0.0273, + "epoch": 0.82, + "learning_rate": 0.00017754054873916493, + "loss": 0.0392, "step": 126490 }, { - "epoch": 1.37, - "learning_rate": 9.476280096047764e-05, - "loss": 0.03, + "epoch": 0.82, + "learning_rate": 0.00017753086738480798, + "loss": 0.04, "step": 126500 }, { - "epoch": 1.37, - "learning_rate": 9.474657667596858e-05, - "loss": 0.0339, + "epoch": 0.82, + "learning_rate": 0.00017752118603045106, + "loss": 0.0443, "step": 126510 }, { - "epoch": 1.37, - "learning_rate": 9.473035239145953e-05, - "loss": 0.0344, + "epoch": 0.82, + "learning_rate": 0.00017751150467609414, + "loss": 0.0478, "step": 126520 }, { - "epoch": 1.37, - "learning_rate": 9.471412810695048e-05, - "loss": 0.0384, + "epoch": 0.82, + "learning_rate": 0.00017750182332173722, + "loss": 0.044, "step": 126530 }, { - "epoch": 1.37, - "learning_rate": 9.469790382244143e-05, - "loss": 0.0339, + "epoch": 0.82, + "learning_rate": 0.00017749214196738028, + "loss": 0.0419, "step": 126540 }, { - "epoch": 1.37, - "learning_rate": 9.468167953793236e-05, - "loss": 0.033, + "epoch": 0.82, + "learning_rate": 0.00017748246061302336, + "loss": 0.0403, "step": 126550 }, { - "epoch": 1.37, - "learning_rate": 9.466545525342331e-05, - "loss": 0.0293, + "epoch": 0.82, + "learning_rate": 0.0001774727792586664, + "loss": 0.0347, "step": 126560 }, { - "epoch": 1.37, - "learning_rate": 9.464923096891426e-05, - "loss": 0.029, + "epoch": 0.82, + "learning_rate": 0.00017746309790430946, + "loss": 0.0388, "step": 126570 }, { - "epoch": 1.37, - "learning_rate": 9.463300668440521e-05, - "loss": 0.034, + "epoch": 0.82, + "learning_rate": 0.00017745341654995254, + "loss": 0.0421, "step": 126580 }, { - "epoch": 1.37, - "learning_rate": 9.461678239989616e-05, - "loss": 0.0314, + "epoch": 0.82, + "learning_rate": 0.00017744373519559562, + "loss": 0.0411, "step": 126590 }, { - "epoch": 1.37, - "learning_rate": 9.46005581153871e-05, - "loss": 0.0298, + "epoch": 0.82, + "learning_rate": 0.0001774340538412387, + "loss": 0.0369, "step": 126600 }, { - "epoch": 1.37, - "learning_rate": 9.458433383087805e-05, - "loss": 0.0307, + "epoch": 0.82, + "learning_rate": 0.00017742437248688175, + "loss": 0.0381, "step": 126610 }, { - "epoch": 1.37, - "learning_rate": 9.4568109546369e-05, - "loss": 0.0298, + "epoch": 0.82, + "learning_rate": 0.00017741469113252483, + "loss": 0.0385, "step": 126620 }, { - "epoch": 1.37, - "learning_rate": 9.455188526185995e-05, - "loss": 0.0288, + "epoch": 0.82, + "learning_rate": 0.00017740500977816789, + "loss": 0.0419, "step": 126630 }, { - "epoch": 1.37, - "learning_rate": 9.453566097735088e-05, - "loss": 0.0321, + "epoch": 0.82, + "learning_rate": 0.00017739532842381094, + "loss": 0.0411, "step": 126640 }, { - "epoch": 1.37, - "learning_rate": 9.451943669284183e-05, - "loss": 0.0368, + "epoch": 0.82, + "learning_rate": 0.00017738564706945402, + "loss": 0.0495, "step": 126650 }, { - "epoch": 1.37, - "learning_rate": 9.450321240833278e-05, - "loss": 0.0359, + "epoch": 0.82, + "learning_rate": 0.0001773759657150971, + "loss": 0.0458, "step": 126660 }, { - "epoch": 1.37, - "learning_rate": 9.448698812382373e-05, - "loss": 0.0308, + "epoch": 0.82, + "learning_rate": 0.00017736628436074015, + "loss": 0.0382, "step": 126670 }, { - "epoch": 1.37, - "learning_rate": 9.447076383931468e-05, - "loss": 0.0305, + "epoch": 0.82, + "learning_rate": 0.00017735660300638323, + "loss": 0.0472, "step": 126680 }, { - "epoch": 1.37, - "learning_rate": 9.445453955480562e-05, - "loss": 0.0292, + "epoch": 0.82, + "learning_rate": 0.0001773469216520263, + "loss": 0.037, "step": 126690 }, { - "epoch": 1.37, - "learning_rate": 9.443831527029657e-05, - "loss": 0.0301, + "epoch": 0.82, + "learning_rate": 0.00017733724029766934, + "loss": 0.0417, "step": 126700 }, { - "epoch": 1.37, - "learning_rate": 9.442209098578752e-05, - "loss": 0.0322, + "epoch": 0.82, + "learning_rate": 0.00017732755894331242, + "loss": 0.0442, "step": 126710 }, { - "epoch": 1.37, - "learning_rate": 9.440586670127847e-05, - "loss": 0.0327, + "epoch": 0.82, + "learning_rate": 0.0001773178775889555, + "loss": 0.0461, "step": 126720 }, { - "epoch": 1.37, - "learning_rate": 9.43896424167694e-05, - "loss": 0.0276, + "epoch": 0.82, + "learning_rate": 0.00017730819623459858, + "loss": 0.043, "step": 126730 }, { - "epoch": 1.37, - "learning_rate": 9.437341813226036e-05, - "loss": 0.0331, + "epoch": 0.82, + "learning_rate": 0.00017729851488024163, + "loss": 0.0416, "step": 126740 }, { - "epoch": 1.37, - "learning_rate": 9.43571938477513e-05, - "loss": 0.0327, + "epoch": 0.82, + "learning_rate": 0.0001772888335258847, + "loss": 0.0514, "step": 126750 }, { - "epoch": 1.37, - "learning_rate": 9.434096956324225e-05, - "loss": 0.0286, + "epoch": 0.82, + "learning_rate": 0.0001772791521715278, + "loss": 0.0514, "step": 126760 }, { - "epoch": 1.37, - "learning_rate": 9.43247452787332e-05, - "loss": 0.0323, + "epoch": 0.82, + "learning_rate": 0.0001772694708171708, + "loss": 0.0449, "step": 126770 }, { - "epoch": 1.37, - "learning_rate": 9.430852099422414e-05, - "loss": 0.0329, + "epoch": 0.82, + "learning_rate": 0.0001772597894628139, + "loss": 0.0397, "step": 126780 }, { - "epoch": 1.37, - "learning_rate": 9.429229670971509e-05, - "loss": 0.0328, + "epoch": 0.82, + "learning_rate": 0.00017725010810845697, + "loss": 0.046, "step": 126790 }, { - "epoch": 1.37, - "learning_rate": 9.427607242520604e-05, - "loss": 0.028, + "epoch": 0.82, + "learning_rate": 0.00017724042675410005, + "loss": 0.0405, "step": 126800 }, { - "epoch": 1.37, - "learning_rate": 9.425984814069699e-05, - "loss": 0.0286, + "epoch": 0.82, + "learning_rate": 0.0001772307453997431, + "loss": 0.0456, "step": 126810 }, { - "epoch": 1.37, - "learning_rate": 9.424362385618793e-05, - "loss": 0.0386, + "epoch": 0.82, + "learning_rate": 0.00017722106404538618, + "loss": 0.0519, "step": 126820 }, { - "epoch": 1.37, - "learning_rate": 9.422739957167888e-05, - "loss": 0.0329, + "epoch": 0.82, + "learning_rate": 0.00017721138269102926, + "loss": 0.0399, "step": 126830 }, { - "epoch": 1.37, - "learning_rate": 9.421117528716983e-05, - "loss": 0.0335, + "epoch": 0.82, + "learning_rate": 0.0001772017013366723, + "loss": 0.0401, "step": 126840 }, { - "epoch": 1.37, - "learning_rate": 9.419495100266078e-05, - "loss": 0.0336, + "epoch": 0.82, + "learning_rate": 0.00017719201998231537, + "loss": 0.0455, "step": 126850 }, { - "epoch": 1.37, - "learning_rate": 9.417872671815173e-05, - "loss": 0.0289, + "epoch": 0.82, + "learning_rate": 0.00017718233862795845, + "loss": 0.0411, "step": 126860 }, { - "epoch": 1.37, - "learning_rate": 9.416250243364266e-05, - "loss": 0.0311, + "epoch": 0.82, + "learning_rate": 0.0001771726572736015, + "loss": 0.0432, "step": 126870 }, { - "epoch": 1.37, - "learning_rate": 9.414627814913361e-05, - "loss": 0.0299, + "epoch": 0.82, + "learning_rate": 0.00017716297591924458, + "loss": 0.0412, "step": 126880 }, { - "epoch": 1.37, - "learning_rate": 9.413005386462456e-05, - "loss": 0.0315, + "epoch": 0.82, + "learning_rate": 0.00017715329456488766, + "loss": 0.0459, "step": 126890 }, { - "epoch": 1.37, - "learning_rate": 9.411382958011551e-05, - "loss": 0.0304, + "epoch": 0.82, + "learning_rate": 0.00017714361321053074, + "loss": 0.0392, "step": 126900 }, { - "epoch": 1.37, - "learning_rate": 9.409760529560646e-05, - "loss": 0.0358, + "epoch": 0.82, + "learning_rate": 0.00017713393185617377, + "loss": 0.0407, "step": 126910 }, { - "epoch": 1.37, - "learning_rate": 9.40813810110974e-05, - "loss": 0.0348, + "epoch": 0.82, + "learning_rate": 0.00017712425050181685, + "loss": 0.0444, "step": 126920 }, { - "epoch": 1.37, - "learning_rate": 9.406515672658835e-05, - "loss": 0.0361, + "epoch": 0.82, + "learning_rate": 0.00017711456914745993, + "loss": 0.0394, "step": 126930 }, { - "epoch": 1.37, - "learning_rate": 9.40489324420793e-05, - "loss": 0.035, + "epoch": 0.82, + "learning_rate": 0.00017710488779310298, + "loss": 0.0364, "step": 126940 }, { - "epoch": 1.37, - "learning_rate": 9.403270815757025e-05, - "loss": 0.0317, + "epoch": 0.82, + "learning_rate": 0.00017709520643874606, + "loss": 0.0368, "step": 126950 }, { - "epoch": 1.37, - "learning_rate": 9.401648387306118e-05, - "loss": 0.028, + "epoch": 0.82, + "learning_rate": 0.00017708552508438914, + "loss": 0.0365, "step": 126960 }, { - "epoch": 1.37, - "learning_rate": 9.400025958855213e-05, - "loss": 0.0354, + "epoch": 0.82, + "learning_rate": 0.00017707584373003222, + "loss": 0.0384, "step": 126970 }, { - "epoch": 1.37, - "learning_rate": 9.398403530404308e-05, - "loss": 0.035, + "epoch": 0.82, + "learning_rate": 0.00017706616237567524, + "loss": 0.0408, "step": 126980 }, { - "epoch": 1.37, - "learning_rate": 9.396781101953403e-05, - "loss": 0.0318, + "epoch": 0.82, + "learning_rate": 0.00017705648102131832, + "loss": 0.0367, "step": 126990 }, { - "epoch": 1.37, - "learning_rate": 9.395158673502498e-05, - "loss": 0.0318, + "epoch": 0.82, + "learning_rate": 0.0001770467996669614, + "loss": 0.0386, "step": 127000 }, { - "epoch": 1.37, - "eval_cer": 0.9211613931487558, - "eval_loss": 0.0249780360609293, - "eval_runtime": 118.9676, - "eval_samples_per_second": 16.811, - "eval_steps_per_second": 4.203, + "epoch": 0.82, + "eval_cer": 0.9199466726923512, + "eval_loss": 0.028268195688724518, + "eval_runtime": 120.0387, + "eval_samples_per_second": 16.661, + "eval_steps_per_second": 4.165, "step": 127000 }, { - "epoch": 1.37, - "learning_rate": 9.393536245051592e-05, - "loss": 0.0343, + "epoch": 0.82, + "learning_rate": 0.00017703711831260446, + "loss": 0.0422, "step": 127010 }, { - "epoch": 1.37, - "learning_rate": 9.391913816600687e-05, - "loss": 0.0303, + "epoch": 0.82, + "learning_rate": 0.00017702743695824754, + "loss": 0.041, "step": 127020 }, { - "epoch": 1.37, - "learning_rate": 9.390291388149782e-05, - "loss": 0.0304, + "epoch": 0.82, + "learning_rate": 0.00017701775560389062, + "loss": 0.0395, "step": 127030 }, { - "epoch": 1.37, - "learning_rate": 9.388668959698877e-05, - "loss": 0.031, + "epoch": 0.82, + "learning_rate": 0.00017700807424953367, + "loss": 0.0428, "step": 127040 }, { - "epoch": 1.37, - "learning_rate": 9.38704653124797e-05, - "loss": 0.0341, + "epoch": 0.82, + "learning_rate": 0.00017699839289517672, + "loss": 0.0419, "step": 127050 }, { - "epoch": 1.37, - "learning_rate": 9.385424102797065e-05, - "loss": 0.0276, + "epoch": 0.82, + "learning_rate": 0.0001769887115408198, + "loss": 0.045, "step": 127060 }, { - "epoch": 1.37, - "learning_rate": 9.38380167434616e-05, - "loss": 0.0336, + "epoch": 0.82, + "learning_rate": 0.00017697903018646285, + "loss": 0.0441, "step": 127070 }, { - "epoch": 1.37, - "learning_rate": 9.382179245895255e-05, - "loss": 0.0306, + "epoch": 0.82, + "learning_rate": 0.00017696934883210593, + "loss": 0.039, "step": 127080 }, { - "epoch": 1.37, - "learning_rate": 9.38055681744435e-05, - "loss": 0.0427, + "epoch": 0.82, + "learning_rate": 0.00017695966747774901, + "loss": 0.0419, "step": 127090 }, { - "epoch": 1.37, - "learning_rate": 9.378934388993444e-05, - "loss": 0.0328, + "epoch": 0.82, + "learning_rate": 0.0001769499861233921, + "loss": 0.0339, "step": 127100 }, { - "epoch": 1.37, - "learning_rate": 9.377311960542539e-05, - "loss": 0.0354, + "epoch": 0.82, + "learning_rate": 0.00017694030476903515, + "loss": 0.0528, "step": 127110 }, { - "epoch": 1.37, - "learning_rate": 9.375689532091634e-05, - "loss": 0.0332, + "epoch": 0.82, + "learning_rate": 0.0001769306234146782, + "loss": 0.0467, "step": 127120 }, { - "epoch": 1.38, - "learning_rate": 9.374067103640729e-05, - "loss": 0.0319, + "epoch": 0.82, + "learning_rate": 0.00017692094206032128, + "loss": 0.0422, "step": 127130 }, { - "epoch": 1.38, - "learning_rate": 9.372444675189822e-05, - "loss": 0.029, + "epoch": 0.82, + "learning_rate": 0.00017691126070596433, + "loss": 0.0408, "step": 127140 }, { - "epoch": 1.38, - "learning_rate": 9.370822246738917e-05, - "loss": 0.0369, + "epoch": 0.82, + "learning_rate": 0.0001769015793516074, + "loss": 0.0477, "step": 127150 }, { - "epoch": 1.38, - "learning_rate": 9.369199818288012e-05, - "loss": 0.0359, + "epoch": 0.82, + "learning_rate": 0.0001768918979972505, + "loss": 0.0406, "step": 127160 }, { - "epoch": 1.38, - "learning_rate": 9.367577389837107e-05, - "loss": 0.03, + "epoch": 0.82, + "learning_rate": 0.00017688221664289357, + "loss": 0.0406, "step": 127170 }, { - "epoch": 1.38, - "learning_rate": 9.365954961386202e-05, - "loss": 0.0375, + "epoch": 0.82, + "learning_rate": 0.00017687253528853662, + "loss": 0.0431, "step": 127180 }, { - "epoch": 1.38, - "learning_rate": 9.364332532935296e-05, - "loss": 0.0254, + "epoch": 0.82, + "learning_rate": 0.00017686285393417968, + "loss": 0.0433, "step": 127190 }, { - "epoch": 1.38, - "learning_rate": 9.362710104484391e-05, - "loss": 0.0278, + "epoch": 0.82, + "learning_rate": 0.00017685317257982276, + "loss": 0.0435, "step": 127200 }, { - "epoch": 1.38, - "learning_rate": 9.361087676033486e-05, - "loss": 0.0286, + "epoch": 0.82, + "learning_rate": 0.0001768434912254658, + "loss": 0.0459, "step": 127210 }, { - "epoch": 1.38, - "learning_rate": 9.359465247582581e-05, - "loss": 0.032, + "epoch": 0.82, + "learning_rate": 0.0001768338098711089, + "loss": 0.0479, "step": 127220 }, { - "epoch": 1.38, - "learning_rate": 9.357842819131674e-05, - "loss": 0.0304, + "epoch": 0.82, + "learning_rate": 0.00017682412851675197, + "loss": 0.045, "step": 127230 }, { - "epoch": 1.38, - "learning_rate": 9.35622039068077e-05, - "loss": 0.0299, + "epoch": 0.82, + "learning_rate": 0.00017681444716239502, + "loss": 0.0353, "step": 127240 }, { - "epoch": 1.38, - "learning_rate": 9.354597962229864e-05, - "loss": 0.0313, + "epoch": 0.82, + "learning_rate": 0.0001768047658080381, + "loss": 0.051, "step": 127250 }, { - "epoch": 1.38, - "learning_rate": 9.35297553377896e-05, - "loss": 0.0344, + "epoch": 0.82, + "learning_rate": 0.00017679508445368115, + "loss": 0.0416, "step": 127260 }, { - "epoch": 1.38, - "learning_rate": 9.351353105328054e-05, - "loss": 0.0288, + "epoch": 0.82, + "learning_rate": 0.0001767854030993242, + "loss": 0.0445, "step": 127270 }, { - "epoch": 1.38, - "learning_rate": 9.349730676877148e-05, - "loss": 0.032, + "epoch": 0.82, + "learning_rate": 0.00017677572174496729, + "loss": 0.0381, "step": 127280 }, { - "epoch": 1.38, - "learning_rate": 9.348108248426243e-05, - "loss": 0.0328, + "epoch": 0.82, + "learning_rate": 0.00017676604039061037, + "loss": 0.0484, "step": 127290 }, { - "epoch": 1.38, - "learning_rate": 9.346485819975338e-05, - "loss": 0.0309, + "epoch": 0.82, + "learning_rate": 0.00017675635903625345, + "loss": 0.0425, "step": 127300 }, { - "epoch": 1.38, - "learning_rate": 9.344863391524433e-05, - "loss": 0.0349, + "epoch": 0.82, + "learning_rate": 0.0001767466776818965, + "loss": 0.0469, "step": 127310 }, { - "epoch": 1.38, - "learning_rate": 9.343240963073527e-05, - "loss": 0.0273, + "epoch": 0.82, + "learning_rate": 0.00017673699632753958, + "loss": 0.0387, "step": 127320 }, { - "epoch": 1.38, - "learning_rate": 9.341618534622622e-05, - "loss": 0.03, + "epoch": 0.82, + "learning_rate": 0.00017672731497318263, + "loss": 0.0447, "step": 127330 }, { - "epoch": 1.38, - "learning_rate": 9.339996106171717e-05, - "loss": 0.0328, + "epoch": 0.82, + "learning_rate": 0.00017671763361882568, + "loss": 0.0422, "step": 127340 }, { - "epoch": 1.38, - "learning_rate": 9.338373677720812e-05, - "loss": 0.0321, + "epoch": 0.82, + "learning_rate": 0.00017670795226446876, + "loss": 0.0605, "step": 127350 }, { - "epoch": 1.38, - "learning_rate": 9.336751249269906e-05, - "loss": 0.0297, + "epoch": 0.82, + "learning_rate": 0.00017669827091011184, + "loss": 0.0427, "step": 127360 }, { - "epoch": 1.38, - "learning_rate": 9.335128820819e-05, - "loss": 0.0294, + "epoch": 0.82, + "learning_rate": 0.00017668858955575492, + "loss": 0.0439, "step": 127370 }, { - "epoch": 1.38, - "learning_rate": 9.333506392368095e-05, - "loss": 0.0349, + "epoch": 0.82, + "learning_rate": 0.00017667890820139798, + "loss": 0.0366, "step": 127380 }, { - "epoch": 1.38, - "learning_rate": 9.33188396391719e-05, - "loss": 0.0302, + "epoch": 0.82, + "learning_rate": 0.00017666922684704106, + "loss": 0.0442, "step": 127390 }, { - "epoch": 1.38, - "learning_rate": 9.330261535466285e-05, - "loss": 0.0263, + "epoch": 0.82, + "learning_rate": 0.0001766595454926841, + "loss": 0.0502, "step": 127400 }, { - "epoch": 1.38, - "learning_rate": 9.328639107015379e-05, - "loss": 0.0294, + "epoch": 0.82, + "learning_rate": 0.00017664986413832716, + "loss": 0.0392, "step": 127410 }, { - "epoch": 1.38, - "learning_rate": 9.327016678564474e-05, - "loss": 0.0256, + "epoch": 0.82, + "learning_rate": 0.00017664018278397024, + "loss": 0.0474, "step": 127420 }, { - "epoch": 1.38, - "learning_rate": 9.325394250113569e-05, - "loss": 0.0349, + "epoch": 0.82, + "learning_rate": 0.00017663050142961332, + "loss": 0.0513, "step": 127430 }, { - "epoch": 1.38, - "learning_rate": 9.323771821662664e-05, - "loss": 0.0312, + "epoch": 0.82, + "learning_rate": 0.00017662082007525637, + "loss": 0.0382, "step": 127440 }, { - "epoch": 1.38, - "learning_rate": 9.322149393211759e-05, - "loss": 0.0309, + "epoch": 0.82, + "learning_rate": 0.00017661113872089945, + "loss": 0.0405, "step": 127450 }, { - "epoch": 1.38, - "learning_rate": 9.320526964760852e-05, - "loss": 0.0333, + "epoch": 0.82, + "learning_rate": 0.0001766014573665425, + "loss": 0.0391, "step": 127460 }, { - "epoch": 1.38, - "learning_rate": 9.318904536309947e-05, - "loss": 0.0293, + "epoch": 0.82, + "learning_rate": 0.00017659177601218556, + "loss": 0.0434, "step": 127470 }, { - "epoch": 1.38, - "learning_rate": 9.317282107859042e-05, - "loss": 0.0341, + "epoch": 0.82, + "learning_rate": 0.00017658209465782864, + "loss": 0.0446, "step": 127480 }, { - "epoch": 1.38, - "learning_rate": 9.315659679408137e-05, - "loss": 0.0345, + "epoch": 0.82, + "learning_rate": 0.00017657241330347172, + "loss": 0.0356, "step": 127490 }, { - "epoch": 1.38, - "learning_rate": 9.314037250957231e-05, - "loss": 0.0294, + "epoch": 0.82, + "learning_rate": 0.0001765627319491148, + "loss": 0.0395, "step": 127500 }, { - "epoch": 1.38, - "learning_rate": 9.312414822506326e-05, - "loss": 0.0338, + "epoch": 0.82, + "learning_rate": 0.00017655305059475785, + "loss": 0.0421, "step": 127510 }, { - "epoch": 1.38, - "learning_rate": 9.310792394055421e-05, - "loss": 0.0394, + "epoch": 0.82, + "learning_rate": 0.00017654336924040093, + "loss": 0.0395, "step": 127520 }, { - "epoch": 1.38, - "learning_rate": 9.309169965604516e-05, - "loss": 0.0289, + "epoch": 0.82, + "learning_rate": 0.00017653368788604398, + "loss": 0.0436, "step": 127530 }, { - "epoch": 1.38, - "learning_rate": 9.30754753715361e-05, - "loss": 0.0327, + "epoch": 0.82, + "learning_rate": 0.00017652400653168704, + "loss": 0.0451, "step": 127540 }, { - "epoch": 1.38, - "learning_rate": 9.305925108702704e-05, - "loss": 0.0346, + "epoch": 0.82, + "learning_rate": 0.00017651432517733012, + "loss": 0.0421, "step": 127550 }, { - "epoch": 1.38, - "learning_rate": 9.304302680251799e-05, - "loss": 0.0323, + "epoch": 0.82, + "learning_rate": 0.0001765046438229732, + "loss": 0.0394, "step": 127560 }, { - "epoch": 1.38, - "learning_rate": 9.302680251800894e-05, - "loss": 0.0303, + "epoch": 0.82, + "learning_rate": 0.00017649496246861627, + "loss": 0.0394, "step": 127570 }, { - "epoch": 1.38, - "learning_rate": 9.301057823349989e-05, - "loss": 0.0296, + "epoch": 0.82, + "learning_rate": 0.00017648528111425933, + "loss": 0.0413, "step": 127580 }, { - "epoch": 1.38, - "learning_rate": 9.299435394899084e-05, - "loss": 0.0301, + "epoch": 0.82, + "learning_rate": 0.0001764755997599024, + "loss": 0.0377, "step": 127590 }, { - "epoch": 1.38, - "learning_rate": 9.297812966448178e-05, - "loss": 0.0322, + "epoch": 0.82, + "learning_rate": 0.00017646591840554546, + "loss": 0.048, "step": 127600 }, { - "epoch": 1.38, - "learning_rate": 9.296190537997273e-05, - "loss": 0.0314, + "epoch": 0.82, + "learning_rate": 0.0001764562370511885, + "loss": 0.0425, "step": 127610 }, { - "epoch": 1.38, - "learning_rate": 9.294568109546368e-05, - "loss": 0.0311, + "epoch": 0.82, + "learning_rate": 0.0001764465556968316, + "loss": 0.0428, "step": 127620 }, { - "epoch": 1.38, - "learning_rate": 9.292945681095463e-05, - "loss": 0.0325, + "epoch": 0.82, + "learning_rate": 0.00017643687434247467, + "loss": 0.0404, "step": 127630 }, { - "epoch": 1.38, - "learning_rate": 9.291323252644556e-05, - "loss": 0.033, + "epoch": 0.82, + "learning_rate": 0.00017642719298811772, + "loss": 0.0465, "step": 127640 }, { - "epoch": 1.38, - "learning_rate": 9.289700824193651e-05, - "loss": 0.0305, + "epoch": 0.82, + "learning_rate": 0.0001764175116337608, + "loss": 0.0435, "step": 127650 }, { - "epoch": 1.38, - "learning_rate": 9.288078395742746e-05, - "loss": 0.0309, + "epoch": 0.82, + "learning_rate": 0.00017640783027940388, + "loss": 0.0424, "step": 127660 }, { - "epoch": 1.38, - "learning_rate": 9.286455967291841e-05, - "loss": 0.0307, + "epoch": 0.82, + "learning_rate": 0.0001763981489250469, + "loss": 0.0423, "step": 127670 }, { - "epoch": 1.38, - "learning_rate": 9.284833538840936e-05, - "loss": 0.0275, + "epoch": 0.82, + "learning_rate": 0.00017638846757069, + "loss": 0.0483, "step": 127680 }, { - "epoch": 1.38, - "learning_rate": 9.28321111039003e-05, - "loss": 0.0287, + "epoch": 0.82, + "learning_rate": 0.00017637878621633307, + "loss": 0.0465, "step": 127690 }, { - "epoch": 1.38, - "learning_rate": 9.281588681939125e-05, - "loss": 0.0317, + "epoch": 0.82, + "learning_rate": 0.00017636910486197615, + "loss": 0.0513, "step": 127700 }, { - "epoch": 1.38, - "learning_rate": 9.27996625348822e-05, - "loss": 0.0296, + "epoch": 0.82, + "learning_rate": 0.0001763594235076192, + "loss": 0.0442, "step": 127710 }, { - "epoch": 1.38, - "learning_rate": 9.278343825037315e-05, - "loss": 0.0337, + "epoch": 0.82, + "learning_rate": 0.00017634974215326228, + "loss": 0.0404, "step": 127720 }, { - "epoch": 1.38, - "learning_rate": 9.276721396586408e-05, - "loss": 0.0324, + "epoch": 0.82, + "learning_rate": 0.00017634006079890536, + "loss": 0.0453, "step": 127730 }, { - "epoch": 1.38, - "learning_rate": 9.275098968135503e-05, - "loss": 0.0392, + "epoch": 0.82, + "learning_rate": 0.0001763303794445484, + "loss": 0.0441, "step": 127740 }, { - "epoch": 1.38, - "learning_rate": 9.273476539684598e-05, - "loss": 0.0319, + "epoch": 0.82, + "learning_rate": 0.00017632069809019147, + "loss": 0.0381, "step": 127750 }, { - "epoch": 1.38, - "learning_rate": 9.271854111233693e-05, - "loss": 0.0312, + "epoch": 0.82, + "learning_rate": 0.00017631101673583455, + "loss": 0.0426, "step": 127760 }, { - "epoch": 1.38, - "learning_rate": 9.270231682782788e-05, - "loss": 0.025, + "epoch": 0.82, + "learning_rate": 0.00017630133538147763, + "loss": 0.0375, "step": 127770 }, { - "epoch": 1.38, - "learning_rate": 9.268609254331882e-05, - "loss": 0.0265, + "epoch": 0.82, + "learning_rate": 0.00017629165402712068, + "loss": 0.0441, "step": 127780 }, { - "epoch": 1.38, - "learning_rate": 9.266986825880977e-05, - "loss": 0.03, + "epoch": 0.82, + "learning_rate": 0.00017628197267276376, + "loss": 0.0416, "step": 127790 }, { - "epoch": 1.38, - "learning_rate": 9.265364397430072e-05, - "loss": 0.0348, + "epoch": 0.82, + "learning_rate": 0.00017627229131840684, + "loss": 0.0388, "step": 127800 }, { - "epoch": 1.38, - "learning_rate": 9.263741968979167e-05, - "loss": 0.0348, + "epoch": 0.82, + "learning_rate": 0.00017626260996404986, + "loss": 0.0484, "step": 127810 }, { - "epoch": 1.38, - "learning_rate": 9.26211954052826e-05, - "loss": 0.0275, + "epoch": 0.82, + "learning_rate": 0.00017625292860969294, + "loss": 0.048, "step": 127820 }, { - "epoch": 1.38, - "learning_rate": 9.260497112077356e-05, - "loss": 0.0314, + "epoch": 0.83, + "learning_rate": 0.00017624324725533602, + "loss": 0.0383, "step": 127830 }, { - "epoch": 1.38, - "learning_rate": 9.25887468362645e-05, - "loss": 0.0279, + "epoch": 0.83, + "learning_rate": 0.00017623356590097908, + "loss": 0.0385, "step": 127840 }, { - "epoch": 1.38, - "learning_rate": 9.257252255175545e-05, - "loss": 0.0314, + "epoch": 0.83, + "learning_rate": 0.00017622388454662216, + "loss": 0.042, "step": 127850 }, { - "epoch": 1.38, - "learning_rate": 9.25562982672464e-05, - "loss": 0.0285, + "epoch": 0.83, + "learning_rate": 0.00017621420319226524, + "loss": 0.0385, "step": 127860 }, { - "epoch": 1.38, - "learning_rate": 9.254007398273734e-05, - "loss": 0.0325, + "epoch": 0.83, + "learning_rate": 0.00017620452183790832, + "loss": 0.0397, "step": 127870 }, { - "epoch": 1.38, - "learning_rate": 9.252384969822829e-05, - "loss": 0.0349, + "epoch": 0.83, + "learning_rate": 0.00017619484048355134, + "loss": 0.0395, "step": 127880 }, { - "epoch": 1.38, - "learning_rate": 9.250762541371925e-05, - "loss": 0.0276, + "epoch": 0.83, + "learning_rate": 0.00017618515912919442, + "loss": 0.0447, "step": 127890 }, { - "epoch": 1.38, - "learning_rate": 9.24914011292102e-05, - "loss": 0.0354, + "epoch": 0.83, + "learning_rate": 0.0001761754777748375, + "loss": 0.0465, "step": 127900 }, { - "epoch": 1.38, - "learning_rate": 9.247517684470115e-05, - "loss": 0.0349, + "epoch": 0.83, + "learning_rate": 0.00017616579642048055, + "loss": 0.0433, "step": 127910 }, { - "epoch": 1.38, - "learning_rate": 9.245895256019209e-05, - "loss": 0.0327, + "epoch": 0.83, + "learning_rate": 0.00017615611506612363, + "loss": 0.0416, "step": 127920 }, { - "epoch": 1.38, - "learning_rate": 9.244272827568304e-05, - "loss": 0.0297, + "epoch": 0.83, + "learning_rate": 0.0001761464337117667, + "loss": 0.0389, "step": 127930 }, { - "epoch": 1.38, - "learning_rate": 9.242650399117399e-05, - "loss": 0.0285, + "epoch": 0.83, + "learning_rate": 0.0001761367523574098, + "loss": 0.038, "step": 127940 }, { - "epoch": 1.38, - "learning_rate": 9.241027970666494e-05, - "loss": 0.0285, + "epoch": 0.83, + "learning_rate": 0.00017612707100305282, + "loss": 0.0432, "step": 127950 }, { - "epoch": 1.38, - "learning_rate": 9.239405542215589e-05, - "loss": 0.0429, + "epoch": 0.83, + "learning_rate": 0.0001761173896486959, + "loss": 0.0416, "step": 127960 }, { - "epoch": 1.38, - "learning_rate": 9.237783113764682e-05, - "loss": 0.0328, + "epoch": 0.83, + "learning_rate": 0.00017610770829433898, + "loss": 0.0366, "step": 127970 }, { - "epoch": 1.38, - "learning_rate": 9.236160685313777e-05, - "loss": 0.0283, + "epoch": 0.83, + "learning_rate": 0.00017609802693998203, + "loss": 0.0428, "step": 127980 }, { - "epoch": 1.38, - "learning_rate": 9.234538256862872e-05, - "loss": 0.0341, + "epoch": 0.83, + "learning_rate": 0.0001760883455856251, + "loss": 0.0395, "step": 127990 }, { - "epoch": 1.38, - "learning_rate": 9.232915828411967e-05, - "loss": 0.0284, + "epoch": 0.83, + "learning_rate": 0.0001760786642312682, + "loss": 0.0407, "step": 128000 }, { - "epoch": 1.38, - "eval_cer": 0.9211083840895076, - "eval_loss": 0.025005817413330078, - "eval_runtime": 118.8317, - "eval_samples_per_second": 16.831, - "eval_steps_per_second": 4.208, + "epoch": 0.83, + "eval_cer": 0.9198951530900463, + "eval_loss": 0.028159523382782936, + "eval_runtime": 120.0077, + "eval_samples_per_second": 16.666, + "eval_steps_per_second": 4.166, "step": 128000 }, { - "epoch": 1.38, - "learning_rate": 9.231293399961061e-05, - "loss": 0.032, + "epoch": 0.83, + "learning_rate": 0.00017606898287691127, + "loss": 0.0419, "step": 128010 }, { - "epoch": 1.38, - "learning_rate": 9.229670971510156e-05, - "loss": 0.0315, + "epoch": 0.83, + "learning_rate": 0.0001760593015225543, + "loss": 0.0419, "step": 128020 }, { - "epoch": 1.38, - "learning_rate": 9.228048543059251e-05, - "loss": 0.0345, + "epoch": 0.83, + "learning_rate": 0.00017604962016819738, + "loss": 0.0392, "step": 128030 }, { - "epoch": 1.38, - "learning_rate": 9.226426114608346e-05, - "loss": 0.0295, + "epoch": 0.83, + "learning_rate": 0.00017603993881384043, + "loss": 0.0534, "step": 128040 }, { - "epoch": 1.38, - "learning_rate": 9.224803686157441e-05, - "loss": 0.0286, + "epoch": 0.83, + "learning_rate": 0.0001760302574594835, + "loss": 0.0363, "step": 128050 }, { - "epoch": 1.39, - "learning_rate": 9.223181257706535e-05, - "loss": 0.0325, + "epoch": 0.83, + "learning_rate": 0.0001760205761051266, + "loss": 0.0479, "step": 128060 }, { - "epoch": 1.39, - "learning_rate": 9.22155882925563e-05, - "loss": 0.0306, + "epoch": 0.83, + "learning_rate": 0.00017601089475076967, + "loss": 0.041, "step": 128070 }, { - "epoch": 1.39, - "learning_rate": 9.219936400804725e-05, - "loss": 0.0335, + "epoch": 0.83, + "learning_rate": 0.00017600121339641272, + "loss": 0.0438, "step": 128080 }, { - "epoch": 1.39, - "learning_rate": 9.21831397235382e-05, - "loss": 0.0317, + "epoch": 0.83, + "learning_rate": 0.00017599153204205577, + "loss": 0.0371, "step": 128090 }, { - "epoch": 1.39, - "learning_rate": 9.216691543902913e-05, - "loss": 0.0324, + "epoch": 0.83, + "learning_rate": 0.00017598185068769885, + "loss": 0.0415, "step": 128100 }, { - "epoch": 1.39, - "learning_rate": 9.215069115452008e-05, - "loss": 0.0294, + "epoch": 0.83, + "learning_rate": 0.0001759721693333419, + "loss": 0.0406, "step": 128110 }, { - "epoch": 1.39, - "learning_rate": 9.213446687001103e-05, - "loss": 0.0343, + "epoch": 0.83, + "learning_rate": 0.00017596248797898499, + "loss": 0.0466, "step": 128120 }, { - "epoch": 1.39, - "learning_rate": 9.211824258550198e-05, - "loss": 0.0359, + "epoch": 0.83, + "learning_rate": 0.00017595280662462807, + "loss": 0.0355, "step": 128130 }, { - "epoch": 1.39, - "learning_rate": 9.210201830099293e-05, - "loss": 0.0282, + "epoch": 0.83, + "learning_rate": 0.00017594312527027115, + "loss": 0.0436, "step": 128140 }, { - "epoch": 1.39, - "learning_rate": 9.208579401648387e-05, - "loss": 0.028, + "epoch": 0.83, + "learning_rate": 0.0001759334439159142, + "loss": 0.0417, "step": 128150 }, { - "epoch": 1.39, - "learning_rate": 9.206956973197482e-05, - "loss": 0.0273, + "epoch": 0.83, + "learning_rate": 0.00017592376256155725, + "loss": 0.039, "step": 128160 }, { - "epoch": 1.39, - "learning_rate": 9.205334544746577e-05, - "loss": 0.0258, + "epoch": 0.83, + "learning_rate": 0.00017591408120720033, + "loss": 0.0443, "step": 128170 }, { - "epoch": 1.39, - "learning_rate": 9.203712116295672e-05, - "loss": 0.0334, + "epoch": 0.83, + "learning_rate": 0.00017590439985284338, + "loss": 0.0416, "step": 128180 }, { - "epoch": 1.39, - "learning_rate": 9.202089687844765e-05, - "loss": 0.0398, + "epoch": 0.83, + "learning_rate": 0.00017589471849848646, + "loss": 0.041, "step": 128190 }, { - "epoch": 1.39, - "learning_rate": 9.20046725939386e-05, - "loss": 0.0311, + "epoch": 0.83, + "learning_rate": 0.00017588503714412954, + "loss": 0.0408, "step": 128200 }, { - "epoch": 1.39, - "learning_rate": 9.198844830942955e-05, - "loss": 0.0292, + "epoch": 0.83, + "learning_rate": 0.00017587535578977262, + "loss": 0.0445, "step": 128210 }, { - "epoch": 1.39, - "learning_rate": 9.19722240249205e-05, - "loss": 0.0309, + "epoch": 0.83, + "learning_rate": 0.00017586567443541568, + "loss": 0.0421, "step": 128220 }, { - "epoch": 1.39, - "learning_rate": 9.195599974041145e-05, - "loss": 0.0327, + "epoch": 0.83, + "learning_rate": 0.00017585599308105873, + "loss": 0.0461, "step": 128230 }, { - "epoch": 1.39, - "learning_rate": 9.193977545590239e-05, - "loss": 0.0293, + "epoch": 0.83, + "learning_rate": 0.00017584631172670178, + "loss": 0.0395, "step": 128240 }, { - "epoch": 1.39, - "learning_rate": 9.192355117139334e-05, - "loss": 0.0252, + "epoch": 0.83, + "learning_rate": 0.00017583663037234486, + "loss": 0.0454, "step": 128250 }, { - "epoch": 1.39, - "learning_rate": 9.190732688688429e-05, - "loss": 0.0321, + "epoch": 0.83, + "learning_rate": 0.00017582694901798794, + "loss": 0.0414, "step": 128260 }, { - "epoch": 1.39, - "learning_rate": 9.189110260237524e-05, - "loss": 0.029, + "epoch": 0.83, + "learning_rate": 0.00017581726766363102, + "loss": 0.0423, "step": 128270 }, { - "epoch": 1.39, - "learning_rate": 9.187487831786619e-05, - "loss": 0.0322, + "epoch": 0.83, + "learning_rate": 0.00017580758630927407, + "loss": 0.0423, "step": 128280 }, { - "epoch": 1.39, - "learning_rate": 9.185865403335712e-05, - "loss": 0.0284, + "epoch": 0.83, + "learning_rate": 0.00017579790495491715, + "loss": 0.0431, "step": 128290 }, { - "epoch": 1.39, - "learning_rate": 9.184242974884807e-05, - "loss": 0.0294, + "epoch": 0.83, + "learning_rate": 0.0001757882236005602, + "loss": 0.0347, "step": 128300 }, { - "epoch": 1.39, - "learning_rate": 9.182620546433902e-05, - "loss": 0.0324, + "epoch": 0.83, + "learning_rate": 0.00017577854224620326, + "loss": 0.0474, "step": 128310 }, { - "epoch": 1.39, - "learning_rate": 9.180998117982997e-05, - "loss": 0.0257, + "epoch": 0.83, + "learning_rate": 0.00017576886089184634, + "loss": 0.0453, "step": 128320 }, { - "epoch": 1.39, - "learning_rate": 9.179375689532091e-05, - "loss": 0.0303, + "epoch": 0.83, + "learning_rate": 0.00017575917953748942, + "loss": 0.0374, "step": 128330 }, { - "epoch": 1.39, - "learning_rate": 9.177753261081186e-05, - "loss": 0.0343, + "epoch": 0.83, + "learning_rate": 0.0001757494981831325, + "loss": 0.0409, "step": 128340 }, { - "epoch": 1.39, - "learning_rate": 9.176130832630281e-05, - "loss": 0.0236, + "epoch": 0.83, + "learning_rate": 0.00017573981682877555, + "loss": 0.038, "step": 128350 }, { - "epoch": 1.39, - "learning_rate": 9.174508404179376e-05, - "loss": 0.0353, + "epoch": 0.83, + "learning_rate": 0.00017573013547441863, + "loss": 0.0439, "step": 128360 }, { - "epoch": 1.39, - "learning_rate": 9.172885975728471e-05, - "loss": 0.0291, + "epoch": 0.83, + "learning_rate": 0.00017572045412006168, + "loss": 0.04, "step": 128370 }, { - "epoch": 1.39, - "learning_rate": 9.171263547277564e-05, - "loss": 0.0284, + "epoch": 0.83, + "learning_rate": 0.00017571077276570473, + "loss": 0.0437, "step": 128380 }, { - "epoch": 1.39, - "learning_rate": 9.169641118826659e-05, - "loss": 0.0307, + "epoch": 0.83, + "learning_rate": 0.00017570109141134781, + "loss": 0.045, "step": 128390 }, { - "epoch": 1.39, - "learning_rate": 9.168018690375754e-05, - "loss": 0.0306, + "epoch": 0.83, + "learning_rate": 0.0001756914100569909, + "loss": 0.0391, "step": 128400 }, { - "epoch": 1.39, - "learning_rate": 9.166396261924849e-05, - "loss": 0.0289, + "epoch": 0.83, + "learning_rate": 0.00017568172870263397, + "loss": 0.0347, "step": 128410 }, { - "epoch": 1.39, - "learning_rate": 9.164773833473943e-05, - "loss": 0.0325, + "epoch": 0.83, + "learning_rate": 0.00017567204734827703, + "loss": 0.0365, "step": 128420 }, { - "epoch": 1.39, - "learning_rate": 9.163151405023038e-05, - "loss": 0.0324, + "epoch": 0.83, + "learning_rate": 0.0001756623659939201, + "loss": 0.0465, "step": 128430 }, { - "epoch": 1.39, - "learning_rate": 9.161528976572133e-05, - "loss": 0.0274, + "epoch": 0.83, + "learning_rate": 0.00017565268463956316, + "loss": 0.0418, "step": 128440 }, { - "epoch": 1.39, - "learning_rate": 9.159906548121228e-05, - "loss": 0.0341, + "epoch": 0.83, + "learning_rate": 0.0001756430032852062, + "loss": 0.0368, "step": 128450 }, { - "epoch": 1.39, - "learning_rate": 9.158284119670323e-05, - "loss": 0.0401, + "epoch": 0.83, + "learning_rate": 0.0001756333219308493, + "loss": 0.0473, "step": 128460 }, { - "epoch": 1.39, - "learning_rate": 9.156661691219416e-05, - "loss": 0.0337, + "epoch": 0.83, + "learning_rate": 0.00017562364057649237, + "loss": 0.0415, "step": 128470 }, { - "epoch": 1.39, - "learning_rate": 9.155039262768511e-05, - "loss": 0.031, + "epoch": 0.83, + "learning_rate": 0.00017561395922213542, + "loss": 0.048, "step": 128480 }, { - "epoch": 1.39, - "learning_rate": 9.153416834317606e-05, - "loss": 0.0385, + "epoch": 0.83, + "learning_rate": 0.0001756042778677785, + "loss": 0.0483, "step": 128490 }, { - "epoch": 1.39, - "learning_rate": 9.151794405866701e-05, - "loss": 0.0303, + "epoch": 0.83, + "learning_rate": 0.00017559459651342158, + "loss": 0.0351, "step": 128500 }, { - "epoch": 1.39, - "learning_rate": 9.150171977415795e-05, - "loss": 0.0285, + "epoch": 0.83, + "learning_rate": 0.0001755849151590646, + "loss": 0.0359, "step": 128510 }, { - "epoch": 1.39, - "learning_rate": 9.14854954896489e-05, - "loss": 0.0362, + "epoch": 0.83, + "learning_rate": 0.0001755752338047077, + "loss": 0.0387, "step": 128520 }, { - "epoch": 1.39, - "learning_rate": 9.146927120513985e-05, - "loss": 0.036, + "epoch": 0.83, + "learning_rate": 0.00017556555245035077, + "loss": 0.0398, "step": 128530 }, { - "epoch": 1.39, - "learning_rate": 9.14530469206308e-05, - "loss": 0.0296, + "epoch": 0.83, + "learning_rate": 0.00017555587109599385, + "loss": 0.0434, "step": 128540 }, { - "epoch": 1.39, - "learning_rate": 9.143682263612175e-05, - "loss": 0.0336, + "epoch": 0.83, + "learning_rate": 0.0001755461897416369, + "loss": 0.0389, "step": 128550 }, { - "epoch": 1.39, - "learning_rate": 9.142059835161268e-05, - "loss": 0.0312, + "epoch": 0.83, + "learning_rate": 0.00017553650838727998, + "loss": 0.04, "step": 128560 }, { - "epoch": 1.39, - "learning_rate": 9.140437406710363e-05, - "loss": 0.0283, + "epoch": 0.83, + "learning_rate": 0.00017552682703292306, + "loss": 0.0417, "step": 128570 }, { - "epoch": 1.39, - "learning_rate": 9.138814978259458e-05, - "loss": 0.0359, + "epoch": 0.83, + "learning_rate": 0.0001755171456785661, + "loss": 0.045, "step": 128580 }, { - "epoch": 1.39, - "learning_rate": 9.137192549808553e-05, - "loss": 0.0317, + "epoch": 0.83, + "learning_rate": 0.00017550746432420917, + "loss": 0.0525, "step": 128590 }, { - "epoch": 1.39, - "learning_rate": 9.135570121357647e-05, - "loss": 0.0305, + "epoch": 0.83, + "learning_rate": 0.00017549778296985225, + "loss": 0.0429, "step": 128600 }, { - "epoch": 1.39, - "learning_rate": 9.133947692906742e-05, - "loss": 0.0289, + "epoch": 0.83, + "learning_rate": 0.00017548810161549533, + "loss": 0.0382, "step": 128610 }, { - "epoch": 1.39, - "learning_rate": 9.132325264455837e-05, - "loss": 0.0334, + "epoch": 0.83, + "learning_rate": 0.00017547842026113838, + "loss": 0.0427, "step": 128620 }, { - "epoch": 1.39, - "learning_rate": 9.130702836004932e-05, - "loss": 0.03, + "epoch": 0.83, + "learning_rate": 0.00017546873890678146, + "loss": 0.0413, "step": 128630 }, { - "epoch": 1.39, - "learning_rate": 9.129080407554027e-05, - "loss": 0.0339, + "epoch": 0.83, + "learning_rate": 0.00017545905755242454, + "loss": 0.0482, "step": 128640 }, { - "epoch": 1.39, - "learning_rate": 9.12745797910312e-05, - "loss": 0.0361, + "epoch": 0.83, + "learning_rate": 0.00017544937619806756, + "loss": 0.0372, "step": 128650 }, { - "epoch": 1.39, - "learning_rate": 9.125835550652216e-05, - "loss": 0.0314, + "epoch": 0.83, + "learning_rate": 0.00017543969484371064, + "loss": 0.0432, "step": 128660 }, { - "epoch": 1.39, - "learning_rate": 9.12421312220131e-05, - "loss": 0.034, + "epoch": 0.83, + "learning_rate": 0.00017543001348935372, + "loss": 0.0434, "step": 128670 }, { - "epoch": 1.39, - "learning_rate": 9.122590693750406e-05, - "loss": 0.0327, + "epoch": 0.83, + "learning_rate": 0.00017542033213499678, + "loss": 0.0446, "step": 128680 }, { - "epoch": 1.39, - "learning_rate": 9.120968265299499e-05, - "loss": 0.0289, + "epoch": 0.83, + "learning_rate": 0.00017541065078063986, + "loss": 0.0437, "step": 128690 }, { - "epoch": 1.39, - "learning_rate": 9.119345836848594e-05, - "loss": 0.0318, + "epoch": 0.83, + "learning_rate": 0.00017540096942628294, + "loss": 0.0425, "step": 128700 }, { - "epoch": 1.39, - "learning_rate": 9.117723408397689e-05, - "loss": 0.0317, + "epoch": 0.83, + "learning_rate": 0.00017539128807192602, + "loss": 0.0402, "step": 128710 }, { - "epoch": 1.39, - "learning_rate": 9.116100979946784e-05, - "loss": 0.0274, + "epoch": 0.83, + "learning_rate": 0.00017538160671756904, + "loss": 0.0434, "step": 128720 }, { - "epoch": 1.39, - "learning_rate": 9.114478551495879e-05, - "loss": 0.035, + "epoch": 0.83, + "learning_rate": 0.00017537192536321212, + "loss": 0.0432, "step": 128730 }, { - "epoch": 1.39, - "learning_rate": 9.112856123044973e-05, - "loss": 0.0299, + "epoch": 0.83, + "learning_rate": 0.0001753622440088552, + "loss": 0.0391, "step": 128740 }, { - "epoch": 1.39, - "learning_rate": 9.111233694594068e-05, - "loss": 0.0313, + "epoch": 0.83, + "learning_rate": 0.00017535256265449825, + "loss": 0.0513, "step": 128750 }, { - "epoch": 1.39, - "learning_rate": 9.109611266143163e-05, - "loss": 0.025, + "epoch": 0.83, + "learning_rate": 0.00017534288130014133, + "loss": 0.0407, "step": 128760 }, { - "epoch": 1.39, - "learning_rate": 9.107988837692258e-05, - "loss": 0.0282, + "epoch": 0.83, + "learning_rate": 0.0001753331999457844, + "loss": 0.0399, "step": 128770 }, { - "epoch": 1.39, - "learning_rate": 9.106366409241351e-05, - "loss": 0.031, + "epoch": 0.83, + "learning_rate": 0.0001753235185914275, + "loss": 0.0423, "step": 128780 }, { - "epoch": 1.39, - "learning_rate": 9.104743980790446e-05, - "loss": 0.025, + "epoch": 0.83, + "learning_rate": 0.00017531383723707052, + "loss": 0.04, "step": 128790 }, { - "epoch": 1.39, - "learning_rate": 9.103121552339541e-05, - "loss": 0.0311, + "epoch": 0.83, + "learning_rate": 0.0001753041558827136, + "loss": 0.0329, "step": 128800 }, { - "epoch": 1.39, - "learning_rate": 9.101499123888636e-05, - "loss": 0.0299, + "epoch": 0.83, + "learning_rate": 0.00017529447452835668, + "loss": 0.0418, "step": 128810 }, { - "epoch": 1.39, - "learning_rate": 9.099876695437731e-05, - "loss": 0.0306, + "epoch": 0.83, + "learning_rate": 0.00017528479317399973, + "loss": 0.0436, "step": 128820 }, { - "epoch": 1.39, - "learning_rate": 9.098254266986825e-05, - "loss": 0.0308, + "epoch": 0.83, + "learning_rate": 0.0001752751118196428, + "loss": 0.0481, "step": 128830 }, { - "epoch": 1.39, - "learning_rate": 9.09663183853592e-05, - "loss": 0.0303, + "epoch": 0.83, + "learning_rate": 0.0001752654304652859, + "loss": 0.0432, "step": 128840 }, { - "epoch": 1.39, - "learning_rate": 9.095009410085015e-05, - "loss": 0.0371, + "epoch": 0.83, + "learning_rate": 0.00017525574911092894, + "loss": 0.039, "step": 128850 }, { - "epoch": 1.39, - "learning_rate": 9.09338698163411e-05, - "loss": 0.0307, + "epoch": 0.83, + "learning_rate": 0.000175246067756572, + "loss": 0.0367, "step": 128860 }, { - "epoch": 1.39, - "learning_rate": 9.091764553183203e-05, - "loss": 0.0353, + "epoch": 0.83, + "learning_rate": 0.00017523638640221508, + "loss": 0.045, "step": 128870 }, { - "epoch": 1.39, - "learning_rate": 9.090142124732298e-05, - "loss": 0.0288, + "epoch": 0.83, + "learning_rate": 0.00017522670504785813, + "loss": 0.0413, "step": 128880 }, { - "epoch": 1.39, - "learning_rate": 9.088519696281393e-05, - "loss": 0.0299, + "epoch": 0.83, + "learning_rate": 0.0001752170236935012, + "loss": 0.0378, "step": 128890 }, { - "epoch": 1.39, - "learning_rate": 9.086897267830488e-05, - "loss": 0.0319, + "epoch": 0.83, + "learning_rate": 0.0001752073423391443, + "loss": 0.0395, "step": 128900 }, { - "epoch": 1.39, - "learning_rate": 9.085274839379583e-05, - "loss": 0.0303, + "epoch": 0.83, + "learning_rate": 0.00017519766098478737, + "loss": 0.0403, "step": 128910 }, { - "epoch": 1.39, - "learning_rate": 9.083652410928677e-05, - "loss": 0.032, + "epoch": 0.83, + "learning_rate": 0.00017518797963043042, + "loss": 0.0482, "step": 128920 }, { - "epoch": 1.39, - "learning_rate": 9.082029982477772e-05, - "loss": 0.0299, + "epoch": 0.83, + "learning_rate": 0.00017517829827607347, + "loss": 0.0403, "step": 128930 }, { - "epoch": 1.39, - "learning_rate": 9.080407554026867e-05, - "loss": 0.0369, + "epoch": 0.83, + "learning_rate": 0.00017516861692171655, + "loss": 0.0473, "step": 128940 }, { - "epoch": 1.39, - "learning_rate": 9.078785125575962e-05, - "loss": 0.0259, + "epoch": 0.83, + "learning_rate": 0.0001751589355673596, + "loss": 0.04, "step": 128950 }, { - "epoch": 1.39, - "learning_rate": 9.077162697125055e-05, - "loss": 0.0342, + "epoch": 0.83, + "learning_rate": 0.00017514925421300269, + "loss": 0.0416, "step": 128960 }, { - "epoch": 1.39, - "learning_rate": 9.07554026867415e-05, - "loss": 0.0348, + "epoch": 0.83, + "learning_rate": 0.00017513957285864577, + "loss": 0.0386, "step": 128970 }, { - "epoch": 1.4, - "learning_rate": 9.073917840223245e-05, - "loss": 0.0285, + "epoch": 0.83, + "learning_rate": 0.00017512989150428884, + "loss": 0.0403, "step": 128980 }, { - "epoch": 1.4, - "learning_rate": 9.07229541177234e-05, - "loss": 0.0313, + "epoch": 0.83, + "learning_rate": 0.0001751202101499319, + "loss": 0.0432, "step": 128990 }, { - "epoch": 1.4, - "learning_rate": 9.070672983321435e-05, - "loss": 0.0311, + "epoch": 0.83, + "learning_rate": 0.00017511052879557495, + "loss": 0.0466, "step": 129000 }, { - "epoch": 1.4, - "eval_cer": 0.9211428399780189, - "eval_loss": 0.02476543001830578, - "eval_runtime": 118.8769, - "eval_samples_per_second": 16.824, - "eval_steps_per_second": 4.206, + "epoch": 0.83, + "eval_cer": 0.9198589989831657, + "eval_loss": 0.02755168452858925, + "eval_runtime": 119.9933, + "eval_samples_per_second": 16.668, + "eval_steps_per_second": 4.167, "step": 129000 }, { - "epoch": 1.4, - "learning_rate": 9.069050554870529e-05, - "loss": 0.0339, + "epoch": 0.83, + "learning_rate": 0.00017510084744121803, + "loss": 0.0418, "step": 129010 }, { - "epoch": 1.4, - "learning_rate": 9.067428126419624e-05, - "loss": 0.0349, + "epoch": 0.83, + "learning_rate": 0.00017509116608686108, + "loss": 0.0393, "step": 129020 }, { - "epoch": 1.4, - "learning_rate": 9.065805697968719e-05, - "loss": 0.0334, + "epoch": 0.83, + "learning_rate": 0.00017508148473250416, + "loss": 0.0434, "step": 129030 }, { - "epoch": 1.4, - "learning_rate": 9.064183269517814e-05, - "loss": 0.0263, + "epoch": 0.83, + "learning_rate": 0.00017507180337814724, + "loss": 0.0441, "step": 129040 }, { - "epoch": 1.4, - "learning_rate": 9.062560841066909e-05, - "loss": 0.0325, + "epoch": 0.83, + "learning_rate": 0.0001750621220237903, + "loss": 0.0422, "step": 129050 }, { - "epoch": 1.4, - "learning_rate": 9.060938412616002e-05, - "loss": 0.0318, + "epoch": 0.83, + "learning_rate": 0.00017505244066943337, + "loss": 0.0391, "step": 129060 }, { - "epoch": 1.4, - "learning_rate": 9.059315984165097e-05, - "loss": 0.0297, + "epoch": 0.83, + "learning_rate": 0.00017504275931507643, + "loss": 0.0462, "step": 129070 }, { - "epoch": 1.4, - "learning_rate": 9.057693555714192e-05, - "loss": 0.0306, + "epoch": 0.83, + "learning_rate": 0.00017503307796071948, + "loss": 0.0385, "step": 129080 }, { - "epoch": 1.4, - "learning_rate": 9.056071127263287e-05, - "loss": 0.0313, + "epoch": 0.83, + "learning_rate": 0.00017502339660636256, + "loss": 0.0378, "step": 129090 }, { - "epoch": 1.4, - "learning_rate": 9.054448698812381e-05, - "loss": 0.0286, + "epoch": 0.83, + "learning_rate": 0.00017501371525200564, + "loss": 0.0351, "step": 129100 }, { - "epoch": 1.4, - "learning_rate": 9.052826270361476e-05, - "loss": 0.0349, + "epoch": 0.83, + "learning_rate": 0.00017500403389764872, + "loss": 0.0418, "step": 129110 }, { - "epoch": 1.4, - "learning_rate": 9.051203841910571e-05, - "loss": 0.0309, + "epoch": 0.83, + "learning_rate": 0.00017499435254329177, + "loss": 0.0412, "step": 129120 }, { - "epoch": 1.4, - "learning_rate": 9.049581413459666e-05, - "loss": 0.0301, + "epoch": 0.83, + "learning_rate": 0.00017498467118893485, + "loss": 0.0423, "step": 129130 }, { - "epoch": 1.4, - "learning_rate": 9.047958985008761e-05, - "loss": 0.0275, + "epoch": 0.83, + "learning_rate": 0.0001749749898345779, + "loss": 0.0368, "step": 129140 }, { - "epoch": 1.4, - "learning_rate": 9.046336556557855e-05, - "loss": 0.0312, + "epoch": 0.83, + "learning_rate": 0.00017496530848022096, + "loss": 0.0378, "step": 129150 }, { - "epoch": 1.4, - "learning_rate": 9.04471412810695e-05, - "loss": 0.0388, + "epoch": 0.83, + "learning_rate": 0.00017495562712586404, + "loss": 0.0469, "step": 129160 }, { - "epoch": 1.4, - "learning_rate": 9.043091699656044e-05, - "loss": 0.0323, + "epoch": 0.83, + "learning_rate": 0.00017494594577150712, + "loss": 0.0397, "step": 129170 }, { - "epoch": 1.4, - "learning_rate": 9.04146927120514e-05, - "loss": 0.0376, + "epoch": 0.83, + "learning_rate": 0.0001749362644171502, + "loss": 0.0386, "step": 129180 }, { - "epoch": 1.4, - "learning_rate": 9.039846842754233e-05, - "loss": 0.0357, + "epoch": 0.83, + "learning_rate": 0.00017492658306279325, + "loss": 0.0468, "step": 129190 }, { - "epoch": 1.4, - "learning_rate": 9.038224414303328e-05, - "loss": 0.0291, + "epoch": 0.83, + "learning_rate": 0.00017491690170843633, + "loss": 0.0411, "step": 129200 }, { - "epoch": 1.4, - "learning_rate": 9.036601985852423e-05, - "loss": 0.0282, + "epoch": 0.83, + "learning_rate": 0.00017490722035407938, + "loss": 0.045, "step": 129210 }, { - "epoch": 1.4, - "learning_rate": 9.034979557401518e-05, - "loss": 0.032, + "epoch": 0.83, + "learning_rate": 0.00017489753899972243, + "loss": 0.039, "step": 129220 }, { - "epoch": 1.4, - "learning_rate": 9.033357128950613e-05, - "loss": 0.0275, + "epoch": 0.83, + "learning_rate": 0.00017488785764536551, + "loss": 0.0414, "step": 129230 }, { - "epoch": 1.4, - "learning_rate": 9.031734700499707e-05, - "loss": 0.0314, + "epoch": 0.83, + "learning_rate": 0.0001748781762910086, + "loss": 0.0433, "step": 129240 }, { - "epoch": 1.4, - "learning_rate": 9.030112272048802e-05, - "loss": 0.0285, + "epoch": 0.83, + "learning_rate": 0.00017486849493665165, + "loss": 0.0534, "step": 129250 }, { - "epoch": 1.4, - "learning_rate": 9.028489843597897e-05, - "loss": 0.0331, + "epoch": 0.83, + "learning_rate": 0.00017485881358229473, + "loss": 0.0487, "step": 129260 }, { - "epoch": 1.4, - "learning_rate": 9.026867415146992e-05, - "loss": 0.0277, + "epoch": 0.83, + "learning_rate": 0.0001748491322279378, + "loss": 0.0456, "step": 129270 }, { - "epoch": 1.4, - "learning_rate": 9.025244986696085e-05, - "loss": 0.0346, + "epoch": 0.83, + "learning_rate": 0.00017483945087358083, + "loss": 0.0432, "step": 129280 }, { - "epoch": 1.4, - "learning_rate": 9.02362255824518e-05, - "loss": 0.0294, + "epoch": 0.83, + "learning_rate": 0.0001748297695192239, + "loss": 0.0385, "step": 129290 }, { - "epoch": 1.4, - "learning_rate": 9.022000129794275e-05, - "loss": 0.0346, + "epoch": 0.83, + "learning_rate": 0.000174820088164867, + "loss": 0.0461, "step": 129300 }, { - "epoch": 1.4, - "learning_rate": 9.02037770134337e-05, - "loss": 0.0323, + "epoch": 0.83, + "learning_rate": 0.00017481040681051007, + "loss": 0.041, "step": 129310 }, { - "epoch": 1.4, - "learning_rate": 9.018755272892465e-05, - "loss": 0.0351, + "epoch": 0.83, + "learning_rate": 0.00017480072545615312, + "loss": 0.0494, "step": 129320 }, { - "epoch": 1.4, - "learning_rate": 9.017132844441559e-05, - "loss": 0.0241, + "epoch": 0.83, + "learning_rate": 0.0001747910441017962, + "loss": 0.0425, "step": 129330 }, { - "epoch": 1.4, - "learning_rate": 9.015510415990654e-05, - "loss": 0.0295, + "epoch": 0.83, + "learning_rate": 0.00017478136274743928, + "loss": 0.0438, "step": 129340 }, { - "epoch": 1.4, - "learning_rate": 9.013887987539749e-05, - "loss": 0.0261, + "epoch": 0.83, + "learning_rate": 0.0001747716813930823, + "loss": 0.0415, "step": 129350 }, { - "epoch": 1.4, - "learning_rate": 9.012265559088844e-05, - "loss": 0.0292, + "epoch": 0.83, + "learning_rate": 0.0001747620000387254, + "loss": 0.039, "step": 129360 }, { - "epoch": 1.4, - "learning_rate": 9.010643130637937e-05, - "loss": 0.0306, + "epoch": 0.83, + "learning_rate": 0.00017475231868436847, + "loss": 0.0415, "step": 129370 }, { - "epoch": 1.4, - "learning_rate": 9.009020702187032e-05, - "loss": 0.0276, + "epoch": 0.84, + "learning_rate": 0.00017474263733001155, + "loss": 0.0437, "step": 129380 }, { - "epoch": 1.4, - "learning_rate": 9.007398273736127e-05, - "loss": 0.0251, + "epoch": 0.84, + "learning_rate": 0.0001747329559756546, + "loss": 0.0453, "step": 129390 }, { - "epoch": 1.4, - "learning_rate": 9.005775845285222e-05, - "loss": 0.0327, + "epoch": 0.84, + "learning_rate": 0.00017472327462129768, + "loss": 0.044, "step": 129400 }, { - "epoch": 1.4, - "learning_rate": 9.004153416834317e-05, - "loss": 0.0279, + "epoch": 0.84, + "learning_rate": 0.00017471359326694076, + "loss": 0.0434, "step": 129410 }, { - "epoch": 1.4, - "learning_rate": 9.002530988383411e-05, - "loss": 0.0317, + "epoch": 0.84, + "learning_rate": 0.0001747039119125838, + "loss": 0.0458, "step": 129420 }, { - "epoch": 1.4, - "learning_rate": 9.000908559932506e-05, - "loss": 0.0282, + "epoch": 0.84, + "learning_rate": 0.00017469423055822687, + "loss": 0.0415, "step": 129430 }, { - "epoch": 1.4, - "learning_rate": 8.999286131481601e-05, - "loss": 0.0304, + "epoch": 0.84, + "learning_rate": 0.00017468454920386995, + "loss": 0.0378, "step": 129440 }, { - "epoch": 1.4, - "learning_rate": 8.997663703030696e-05, - "loss": 0.0296, + "epoch": 0.84, + "learning_rate": 0.000174674867849513, + "loss": 0.0408, "step": 129450 }, { - "epoch": 1.4, - "learning_rate": 8.99604127457979e-05, - "loss": 0.0372, + "epoch": 0.84, + "learning_rate": 0.00017466518649515608, + "loss": 0.0467, "step": 129460 }, { - "epoch": 1.4, - "learning_rate": 8.994418846128884e-05, - "loss": 0.0325, + "epoch": 0.84, + "learning_rate": 0.00017465550514079916, + "loss": 0.038, "step": 129470 }, { - "epoch": 1.4, - "learning_rate": 8.992796417677979e-05, - "loss": 0.0294, + "epoch": 0.84, + "learning_rate": 0.00017464582378644224, + "loss": 0.0437, "step": 129480 }, { - "epoch": 1.4, - "learning_rate": 8.991173989227074e-05, - "loss": 0.0314, + "epoch": 0.84, + "learning_rate": 0.00017463614243208526, + "loss": 0.042, "step": 129490 }, { - "epoch": 1.4, - "learning_rate": 8.989551560776169e-05, - "loss": 0.0305, + "epoch": 0.84, + "learning_rate": 0.00017462646107772834, + "loss": 0.0351, "step": 129500 }, { - "epoch": 1.4, - "learning_rate": 8.987929132325263e-05, - "loss": 0.0326, + "epoch": 0.84, + "learning_rate": 0.00017461677972337142, + "loss": 0.0441, "step": 129510 }, { - "epoch": 1.4, - "learning_rate": 8.986306703874358e-05, - "loss": 0.0286, + "epoch": 0.84, + "learning_rate": 0.00017460709836901448, + "loss": 0.0413, "step": 129520 }, { - "epoch": 1.4, - "learning_rate": 8.984684275423453e-05, - "loss": 0.0303, + "epoch": 0.84, + "learning_rate": 0.00017459741701465756, + "loss": 0.0441, "step": 129530 }, { - "epoch": 1.4, - "learning_rate": 8.983061846972548e-05, - "loss": 0.0328, + "epoch": 0.84, + "learning_rate": 0.00017458773566030064, + "loss": 0.0414, "step": 129540 }, { - "epoch": 1.4, - "learning_rate": 8.981439418521641e-05, - "loss": 0.0335, + "epoch": 0.84, + "learning_rate": 0.00017457805430594372, + "loss": 0.0451, "step": 129550 }, { - "epoch": 1.4, - "learning_rate": 8.979816990070736e-05, - "loss": 0.0293, + "epoch": 0.84, + "learning_rate": 0.00017456837295158674, + "loss": 0.0456, "step": 129560 }, { - "epoch": 1.4, - "learning_rate": 8.978194561619831e-05, - "loss": 0.0315, + "epoch": 0.84, + "learning_rate": 0.00017455869159722982, + "loss": 0.0504, "step": 129570 }, { - "epoch": 1.4, - "learning_rate": 8.976572133168926e-05, - "loss": 0.0263, + "epoch": 0.84, + "learning_rate": 0.0001745490102428729, + "loss": 0.0426, "step": 129580 }, { - "epoch": 1.4, - "learning_rate": 8.974949704718021e-05, - "loss": 0.0392, + "epoch": 0.84, + "learning_rate": 0.00017453932888851595, + "loss": 0.0428, "step": 129590 }, { - "epoch": 1.4, - "learning_rate": 8.973327276267115e-05, - "loss": 0.0369, + "epoch": 0.84, + "learning_rate": 0.00017452964753415903, + "loss": 0.0394, "step": 129600 }, { - "epoch": 1.4, - "learning_rate": 8.97170484781621e-05, - "loss": 0.0327, + "epoch": 0.84, + "learning_rate": 0.0001745199661798021, + "loss": 0.0355, "step": 129610 }, { - "epoch": 1.4, - "learning_rate": 8.970082419365305e-05, - "loss": 0.0318, + "epoch": 0.84, + "learning_rate": 0.0001745102848254452, + "loss": 0.0436, "step": 129620 }, { - "epoch": 1.4, - "learning_rate": 8.9684599909144e-05, - "loss": 0.0302, + "epoch": 0.84, + "learning_rate": 0.00017450060347108822, + "loss": 0.0405, "step": 129630 }, { - "epoch": 1.4, - "learning_rate": 8.966837562463493e-05, - "loss": 0.0319, + "epoch": 0.84, + "learning_rate": 0.0001744909221167313, + "loss": 0.0402, "step": 129640 }, { - "epoch": 1.4, - "learning_rate": 8.965215134012588e-05, - "loss": 0.0285, + "epoch": 0.84, + "learning_rate": 0.00017448124076237435, + "loss": 0.0441, "step": 129650 }, { - "epoch": 1.4, - "learning_rate": 8.963592705561683e-05, - "loss": 0.0293, + "epoch": 0.84, + "learning_rate": 0.00017447155940801743, + "loss": 0.0404, "step": 129660 }, { - "epoch": 1.4, - "learning_rate": 8.961970277110778e-05, - "loss": 0.0311, + "epoch": 0.84, + "learning_rate": 0.0001744618780536605, + "loss": 0.0424, "step": 129670 }, { - "epoch": 1.4, - "learning_rate": 8.960347848659873e-05, - "loss": 0.0348, + "epoch": 0.84, + "learning_rate": 0.0001744521966993036, + "loss": 0.0457, "step": 129680 }, { - "epoch": 1.4, - "learning_rate": 8.958725420208967e-05, - "loss": 0.0303, + "epoch": 0.84, + "learning_rate": 0.00017444251534494664, + "loss": 0.0409, "step": 129690 }, { - "epoch": 1.4, - "learning_rate": 8.957102991758062e-05, - "loss": 0.0308, + "epoch": 0.84, + "learning_rate": 0.0001744328339905897, + "loss": 0.0508, "step": 129700 }, { - "epoch": 1.4, - "learning_rate": 8.955480563307157e-05, - "loss": 0.032, + "epoch": 0.84, + "learning_rate": 0.00017442315263623278, + "loss": 0.0407, "step": 129710 }, { - "epoch": 1.4, - "learning_rate": 8.953858134856252e-05, - "loss": 0.0296, + "epoch": 0.84, + "learning_rate": 0.00017441347128187583, + "loss": 0.0384, "step": 129720 }, { - "epoch": 1.4, - "learning_rate": 8.952235706405347e-05, - "loss": 0.029, + "epoch": 0.84, + "learning_rate": 0.0001744037899275189, + "loss": 0.0422, "step": 129730 }, { - "epoch": 1.4, - "learning_rate": 8.95061327795444e-05, - "loss": 0.0301, + "epoch": 0.84, + "learning_rate": 0.000174394108573162, + "loss": 0.0466, "step": 129740 }, { - "epoch": 1.4, - "learning_rate": 8.948990849503536e-05, - "loss": 0.028, + "epoch": 0.84, + "learning_rate": 0.00017438442721880507, + "loss": 0.0439, "step": 129750 }, { - "epoch": 1.4, - "learning_rate": 8.94736842105263e-05, - "loss": 0.0376, + "epoch": 0.84, + "learning_rate": 0.00017437474586444812, + "loss": 0.0451, "step": 129760 }, { - "epoch": 1.4, - "learning_rate": 8.945745992601725e-05, - "loss": 0.0382, + "epoch": 0.84, + "learning_rate": 0.00017436506451009117, + "loss": 0.0388, "step": 129770 }, { - "epoch": 1.4, - "learning_rate": 8.944123564150819e-05, - "loss": 0.0324, + "epoch": 0.84, + "learning_rate": 0.00017435538315573425, + "loss": 0.0399, "step": 129780 }, { - "epoch": 1.4, - "learning_rate": 8.942501135699914e-05, - "loss": 0.029, + "epoch": 0.84, + "learning_rate": 0.0001743457018013773, + "loss": 0.0484, "step": 129790 }, { - "epoch": 1.4, - "learning_rate": 8.940878707249009e-05, - "loss": 0.0299, + "epoch": 0.84, + "learning_rate": 0.00017433602044702038, + "loss": 0.0386, "step": 129800 }, { - "epoch": 1.4, - "learning_rate": 8.939256278798104e-05, - "loss": 0.0301, + "epoch": 0.84, + "learning_rate": 0.00017432633909266346, + "loss": 0.0395, "step": 129810 }, { - "epoch": 1.4, - "learning_rate": 8.937633850347199e-05, - "loss": 0.0314, + "epoch": 0.84, + "learning_rate": 0.00017431665773830654, + "loss": 0.0396, "step": 129820 }, { - "epoch": 1.4, - "learning_rate": 8.936011421896293e-05, - "loss": 0.0297, + "epoch": 0.84, + "learning_rate": 0.0001743069763839496, + "loss": 0.0438, "step": 129830 }, { - "epoch": 1.4, - "learning_rate": 8.934388993445388e-05, - "loss": 0.0322, + "epoch": 0.84, + "learning_rate": 0.00017429729502959265, + "loss": 0.0347, "step": 129840 }, { - "epoch": 1.4, - "learning_rate": 8.932766564994483e-05, - "loss": 0.0334, + "epoch": 0.84, + "learning_rate": 0.0001742876136752357, + "loss": 0.0432, "step": 129850 }, { - "epoch": 1.4, - "learning_rate": 8.931144136543578e-05, - "loss": 0.0313, + "epoch": 0.84, + "learning_rate": 0.00017427793232087878, + "loss": 0.0423, "step": 129860 }, { - "epoch": 1.4, - "learning_rate": 8.929521708092671e-05, - "loss": 0.0266, + "epoch": 0.84, + "learning_rate": 0.00017426825096652186, + "loss": 0.0407, "step": 129870 }, { - "epoch": 1.4, - "learning_rate": 8.927899279641766e-05, - "loss": 0.0312, + "epoch": 0.84, + "learning_rate": 0.00017425856961216494, + "loss": 0.04, "step": 129880 }, { - "epoch": 1.4, - "learning_rate": 8.926276851190861e-05, - "loss": 0.034, + "epoch": 0.84, + "learning_rate": 0.000174248888257808, + "loss": 0.0359, "step": 129890 }, { - "epoch": 1.41, - "learning_rate": 8.924654422739956e-05, - "loss": 0.0282, + "epoch": 0.84, + "learning_rate": 0.00017423920690345107, + "loss": 0.0375, "step": 129900 }, { - "epoch": 1.41, - "learning_rate": 8.923031994289051e-05, - "loss": 0.0338, + "epoch": 0.84, + "learning_rate": 0.00017422952554909413, + "loss": 0.042, "step": 129910 }, { - "epoch": 1.41, - "learning_rate": 8.921409565838145e-05, - "loss": 0.0329, + "epoch": 0.84, + "learning_rate": 0.00017421984419473718, + "loss": 0.0393, "step": 129920 }, { - "epoch": 1.41, - "learning_rate": 8.91978713738724e-05, - "loss": 0.0352, + "epoch": 0.84, + "learning_rate": 0.00017421016284038026, + "loss": 0.0406, "step": 129930 }, { - "epoch": 1.41, - "learning_rate": 8.918164708936335e-05, - "loss": 0.0263, + "epoch": 0.84, + "learning_rate": 0.00017420048148602334, + "loss": 0.0397, "step": 129940 }, { - "epoch": 1.41, - "learning_rate": 8.91654228048543e-05, - "loss": 0.0304, + "epoch": 0.84, + "learning_rate": 0.00017419080013166642, + "loss": 0.0428, "step": 129950 }, { - "epoch": 1.41, - "learning_rate": 8.914919852034523e-05, - "loss": 0.0293, + "epoch": 0.84, + "learning_rate": 0.00017418111877730947, + "loss": 0.038, "step": 129960 }, { - "epoch": 1.41, - "learning_rate": 8.913297423583618e-05, - "loss": 0.0301, + "epoch": 0.84, + "learning_rate": 0.00017417143742295255, + "loss": 0.0456, "step": 129970 }, { - "epoch": 1.41, - "learning_rate": 8.911674995132713e-05, - "loss": 0.028, + "epoch": 0.84, + "learning_rate": 0.0001741617560685956, + "loss": 0.0417, "step": 129980 }, { - "epoch": 1.41, - "learning_rate": 8.910052566681808e-05, - "loss": 0.0296, + "epoch": 0.84, + "learning_rate": 0.00017415207471423866, + "loss": 0.0365, "step": 129990 }, { - "epoch": 1.41, - "learning_rate": 8.908430138230903e-05, - "loss": 0.0323, + "epoch": 0.84, + "learning_rate": 0.00017414239335988174, + "loss": 0.048, "step": 130000 }, { - "epoch": 1.41, - "eval_cer": 0.9211189859013572, - "eval_loss": 0.024808140471577644, - "eval_runtime": 119.0125, - "eval_samples_per_second": 16.805, - "eval_steps_per_second": 4.201, + "epoch": 0.84, + "eval_cer": 0.9200705005084171, + "eval_loss": 0.027759570628404617, + "eval_runtime": 119.9767, + "eval_samples_per_second": 16.67, + "eval_steps_per_second": 4.167, "step": 130000 }, { - "epoch": 1.41, - "learning_rate": 8.906807709779997e-05, - "loss": 0.0291, + "epoch": 0.84, + "learning_rate": 0.00017413271200552482, + "loss": 0.0449, "step": 130010 }, { - "epoch": 1.41, - "learning_rate": 8.905185281329092e-05, - "loss": 0.0331, + "epoch": 0.84, + "learning_rate": 0.0001741230306511679, + "loss": 0.0449, "step": 130020 }, { - "epoch": 1.41, - "learning_rate": 8.903562852878187e-05, - "loss": 0.0275, + "epoch": 0.84, + "learning_rate": 0.00017411334929681095, + "loss": 0.0391, "step": 130030 }, { - "epoch": 1.41, - "learning_rate": 8.901940424427282e-05, - "loss": 0.0333, + "epoch": 0.84, + "learning_rate": 0.00017410366794245403, + "loss": 0.0437, "step": 130040 }, { - "epoch": 1.41, - "learning_rate": 8.900317995976375e-05, - "loss": 0.0282, + "epoch": 0.84, + "learning_rate": 0.00017409398658809705, + "loss": 0.0405, "step": 130050 }, { - "epoch": 1.41, - "learning_rate": 8.89869556752547e-05, - "loss": 0.028, + "epoch": 0.84, + "learning_rate": 0.00017408430523374013, + "loss": 0.0438, "step": 130060 }, { - "epoch": 1.41, - "learning_rate": 8.897073139074565e-05, - "loss": 0.0307, + "epoch": 0.84, + "learning_rate": 0.00017407462387938321, + "loss": 0.0419, "step": 130070 }, { - "epoch": 1.41, - "learning_rate": 8.89545071062366e-05, - "loss": 0.0323, + "epoch": 0.84, + "learning_rate": 0.0001740649425250263, + "loss": 0.0374, "step": 130080 }, { - "epoch": 1.41, - "learning_rate": 8.893828282172755e-05, - "loss": 0.0324, + "epoch": 0.84, + "learning_rate": 0.00017405526117066935, + "loss": 0.0395, "step": 130090 }, { - "epoch": 1.41, - "learning_rate": 8.892205853721849e-05, - "loss": 0.0374, + "epoch": 0.84, + "learning_rate": 0.00017404557981631243, + "loss": 0.039, "step": 130100 }, { - "epoch": 1.41, - "learning_rate": 8.890583425270944e-05, - "loss": 0.0336, + "epoch": 0.84, + "learning_rate": 0.0001740358984619555, + "loss": 0.0373, "step": 130110 }, { - "epoch": 1.41, - "learning_rate": 8.888960996820039e-05, - "loss": 0.0293, + "epoch": 0.84, + "learning_rate": 0.00017402621710759853, + "loss": 0.0426, "step": 130120 }, { - "epoch": 1.41, - "learning_rate": 8.887338568369134e-05, - "loss": 0.032, + "epoch": 0.84, + "learning_rate": 0.0001740165357532416, + "loss": 0.0419, "step": 130130 }, { - "epoch": 1.41, - "learning_rate": 8.885716139918227e-05, - "loss": 0.0301, + "epoch": 0.84, + "learning_rate": 0.0001740068543988847, + "loss": 0.0461, "step": 130140 }, { - "epoch": 1.41, - "learning_rate": 8.884093711467322e-05, - "loss": 0.0336, + "epoch": 0.84, + "learning_rate": 0.00017399717304452777, + "loss": 0.0405, "step": 130150 }, { - "epoch": 1.41, - "learning_rate": 8.882471283016417e-05, - "loss": 0.0275, + "epoch": 0.84, + "learning_rate": 0.00017398749169017082, + "loss": 0.0387, "step": 130160 }, { - "epoch": 1.41, - "learning_rate": 8.880848854565512e-05, - "loss": 0.029, + "epoch": 0.84, + "learning_rate": 0.0001739778103358139, + "loss": 0.038, "step": 130170 }, { - "epoch": 1.41, - "learning_rate": 8.879226426114607e-05, - "loss": 0.0307, + "epoch": 0.84, + "learning_rate": 0.00017396812898145698, + "loss": 0.0424, "step": 130180 }, { - "epoch": 1.41, - "learning_rate": 8.877603997663701e-05, - "loss": 0.0287, + "epoch": 0.84, + "learning_rate": 0.0001739584476271, + "loss": 0.0409, "step": 130190 }, { - "epoch": 1.41, - "learning_rate": 8.875981569212796e-05, - "loss": 0.0273, + "epoch": 0.84, + "learning_rate": 0.0001739487662727431, + "loss": 0.0448, "step": 130200 }, { - "epoch": 1.41, - "learning_rate": 8.874359140761891e-05, - "loss": 0.0373, + "epoch": 0.84, + "learning_rate": 0.00017393908491838617, + "loss": 0.0453, "step": 130210 }, { - "epoch": 1.41, - "learning_rate": 8.872736712310986e-05, - "loss": 0.0301, + "epoch": 0.84, + "learning_rate": 0.00017392940356402925, + "loss": 0.0398, "step": 130220 }, { - "epoch": 1.41, - "learning_rate": 8.87111428386008e-05, - "loss": 0.0292, + "epoch": 0.84, + "learning_rate": 0.0001739197222096723, + "loss": 0.0396, "step": 130230 }, { - "epoch": 1.41, - "learning_rate": 8.869491855409176e-05, - "loss": 0.0354, + "epoch": 0.84, + "learning_rate": 0.00017391004085531538, + "loss": 0.0413, "step": 130240 }, { - "epoch": 1.41, - "learning_rate": 8.867869426958271e-05, - "loss": 0.0323, + "epoch": 0.84, + "learning_rate": 0.00017390035950095846, + "loss": 0.0361, "step": 130250 }, { - "epoch": 1.41, - "learning_rate": 8.866246998507366e-05, - "loss": 0.0284, + "epoch": 0.84, + "learning_rate": 0.00017389067814660149, + "loss": 0.0472, "step": 130260 }, { - "epoch": 1.41, - "learning_rate": 8.864624570056461e-05, - "loss": 0.0347, + "epoch": 0.84, + "learning_rate": 0.00017388099679224457, + "loss": 0.0438, "step": 130270 }, { - "epoch": 1.41, - "learning_rate": 8.863002141605556e-05, - "loss": 0.032, + "epoch": 0.84, + "learning_rate": 0.00017387131543788765, + "loss": 0.0371, "step": 130280 }, { - "epoch": 1.41, - "learning_rate": 8.86137971315465e-05, - "loss": 0.0301, + "epoch": 0.84, + "learning_rate": 0.0001738616340835307, + "loss": 0.0377, "step": 130290 }, { - "epoch": 1.41, - "learning_rate": 8.859757284703744e-05, - "loss": 0.031, + "epoch": 0.84, + "learning_rate": 0.00017385195272917378, + "loss": 0.0426, "step": 130300 }, { - "epoch": 1.41, - "learning_rate": 8.85813485625284e-05, - "loss": 0.0306, + "epoch": 0.84, + "learning_rate": 0.00017384227137481686, + "loss": 0.0405, "step": 130310 }, { - "epoch": 1.41, - "learning_rate": 8.856512427801934e-05, - "loss": 0.0297, + "epoch": 0.84, + "learning_rate": 0.00017383259002045994, + "loss": 0.0428, "step": 130320 }, { - "epoch": 1.41, - "learning_rate": 8.854889999351028e-05, - "loss": 0.0377, + "epoch": 0.84, + "learning_rate": 0.00017382290866610296, + "loss": 0.0509, "step": 130330 }, { - "epoch": 1.41, - "learning_rate": 8.853267570900123e-05, - "loss": 0.0285, + "epoch": 0.84, + "learning_rate": 0.00017381322731174604, + "loss": 0.0366, "step": 130340 }, { - "epoch": 1.41, - "learning_rate": 8.851645142449218e-05, - "loss": 0.0316, + "epoch": 0.84, + "learning_rate": 0.00017380354595738912, + "loss": 0.0408, "step": 130350 }, { - "epoch": 1.41, - "learning_rate": 8.850022713998313e-05, - "loss": 0.0323, + "epoch": 0.84, + "learning_rate": 0.00017379386460303218, + "loss": 0.0382, "step": 130360 }, { - "epoch": 1.41, - "learning_rate": 8.848400285547408e-05, - "loss": 0.0274, + "epoch": 0.84, + "learning_rate": 0.00017378418324867526, + "loss": 0.0406, "step": 130370 }, { - "epoch": 1.41, - "learning_rate": 8.846777857096501e-05, - "loss": 0.0334, + "epoch": 0.84, + "learning_rate": 0.00017377450189431834, + "loss": 0.0385, "step": 130380 }, { - "epoch": 1.41, - "learning_rate": 8.845155428645596e-05, - "loss": 0.028, + "epoch": 0.84, + "learning_rate": 0.00017376482053996141, + "loss": 0.0459, "step": 130390 }, { - "epoch": 1.41, - "learning_rate": 8.843533000194691e-05, - "loss": 0.0274, + "epoch": 0.84, + "learning_rate": 0.00017375513918560444, + "loss": 0.0398, "step": 130400 }, { - "epoch": 1.41, - "learning_rate": 8.841910571743786e-05, - "loss": 0.0311, + "epoch": 0.84, + "learning_rate": 0.00017374545783124752, + "loss": 0.0427, "step": 130410 }, { - "epoch": 1.41, - "learning_rate": 8.840288143292881e-05, - "loss": 0.0259, + "epoch": 0.84, + "learning_rate": 0.0001737357764768906, + "loss": 0.0541, "step": 130420 }, { - "epoch": 1.41, - "learning_rate": 8.838665714841975e-05, - "loss": 0.0288, + "epoch": 0.84, + "learning_rate": 0.00017372609512253365, + "loss": 0.0397, "step": 130430 }, { - "epoch": 1.41, - "learning_rate": 8.83704328639107e-05, - "loss": 0.0273, + "epoch": 0.84, + "learning_rate": 0.00017371641376817673, + "loss": 0.051, "step": 130440 }, { - "epoch": 1.41, - "learning_rate": 8.835420857940165e-05, - "loss": 0.0331, + "epoch": 0.84, + "learning_rate": 0.0001737067324138198, + "loss": 0.0392, "step": 130450 }, { - "epoch": 1.41, - "learning_rate": 8.83379842948926e-05, - "loss": 0.0295, + "epoch": 0.84, + "learning_rate": 0.00017369705105946287, + "loss": 0.0375, "step": 130460 }, { - "epoch": 1.41, - "learning_rate": 8.832176001038354e-05, - "loss": 0.0306, + "epoch": 0.84, + "learning_rate": 0.00017368736970510592, + "loss": 0.0455, "step": 130470 }, { - "epoch": 1.41, - "learning_rate": 8.830553572587449e-05, - "loss": 0.0334, + "epoch": 0.84, + "learning_rate": 0.000173677688350749, + "loss": 0.0429, "step": 130480 }, { - "epoch": 1.41, - "learning_rate": 8.828931144136544e-05, - "loss": 0.0335, + "epoch": 0.84, + "learning_rate": 0.00017366800699639205, + "loss": 0.0397, "step": 130490 }, { - "epoch": 1.41, - "learning_rate": 8.827308715685638e-05, - "loss": 0.0273, + "epoch": 0.84, + "learning_rate": 0.00017365832564203513, + "loss": 0.0416, "step": 130500 }, { - "epoch": 1.41, - "learning_rate": 8.825686287234733e-05, - "loss": 0.0311, + "epoch": 0.84, + "learning_rate": 0.0001736486442876782, + "loss": 0.0454, "step": 130510 }, { - "epoch": 1.41, - "learning_rate": 8.824063858783827e-05, - "loss": 0.0289, + "epoch": 0.84, + "learning_rate": 0.0001736389629333213, + "loss": 0.0412, "step": 130520 }, { - "epoch": 1.41, - "learning_rate": 8.822441430332922e-05, - "loss": 0.0312, + "epoch": 0.84, + "learning_rate": 0.00017362928157896434, + "loss": 0.0391, "step": 130530 }, { - "epoch": 1.41, - "learning_rate": 8.820819001882017e-05, - "loss": 0.0292, + "epoch": 0.84, + "learning_rate": 0.0001736196002246074, + "loss": 0.0382, "step": 130540 }, { - "epoch": 1.41, - "learning_rate": 8.819196573431112e-05, - "loss": 0.0315, + "epoch": 0.84, + "learning_rate": 0.00017360991887025047, + "loss": 0.047, "step": 130550 }, { - "epoch": 1.41, - "learning_rate": 8.817574144980206e-05, - "loss": 0.0308, + "epoch": 0.84, + "learning_rate": 0.00017360023751589353, + "loss": 0.0474, "step": 130560 }, { - "epoch": 1.41, - "learning_rate": 8.8159517165293e-05, - "loss": 0.0289, + "epoch": 0.84, + "learning_rate": 0.0001735905561615366, + "loss": 0.0391, "step": 130570 }, { - "epoch": 1.41, - "learning_rate": 8.814329288078396e-05, - "loss": 0.0299, + "epoch": 0.84, + "learning_rate": 0.0001735808748071797, + "loss": 0.0408, "step": 130580 }, { - "epoch": 1.41, - "learning_rate": 8.81270685962749e-05, - "loss": 0.0255, + "epoch": 0.84, + "learning_rate": 0.00017357119345282277, + "loss": 0.0402, "step": 130590 }, { - "epoch": 1.41, - "learning_rate": 8.811084431176586e-05, - "loss": 0.0315, + "epoch": 0.84, + "learning_rate": 0.00017356151209846582, + "loss": 0.0432, "step": 130600 }, { - "epoch": 1.41, - "learning_rate": 8.809462002725679e-05, - "loss": 0.0319, + "epoch": 0.84, + "learning_rate": 0.00017355183074410887, + "loss": 0.0434, "step": 130610 }, { - "epoch": 1.41, - "learning_rate": 8.807839574274774e-05, - "loss": 0.0434, + "epoch": 0.84, + "learning_rate": 0.00017354214938975195, + "loss": 0.0424, "step": 130620 }, { - "epoch": 1.41, - "learning_rate": 8.806217145823869e-05, - "loss": 0.0297, + "epoch": 0.84, + "learning_rate": 0.000173532468035395, + "loss": 0.0418, "step": 130630 }, { - "epoch": 1.41, - "learning_rate": 8.804594717372964e-05, - "loss": 0.033, + "epoch": 0.84, + "learning_rate": 0.00017352278668103808, + "loss": 0.0479, "step": 130640 }, { - "epoch": 1.41, - "learning_rate": 8.802972288922058e-05, - "loss": 0.0317, + "epoch": 0.84, + "learning_rate": 0.00017351310532668116, + "loss": 0.0399, "step": 130650 }, { - "epoch": 1.41, - "learning_rate": 8.801349860471153e-05, - "loss": 0.0279, + "epoch": 0.84, + "learning_rate": 0.00017350342397232422, + "loss": 0.0488, "step": 130660 }, { - "epoch": 1.41, - "learning_rate": 8.799727432020248e-05, - "loss": 0.0294, + "epoch": 0.84, + "learning_rate": 0.0001734937426179673, + "loss": 0.0459, "step": 130670 }, { - "epoch": 1.41, - "learning_rate": 8.798105003569343e-05, - "loss": 0.0247, + "epoch": 0.84, + "learning_rate": 0.00017348406126361035, + "loss": 0.0429, "step": 130680 }, { - "epoch": 1.41, - "learning_rate": 8.796482575118438e-05, - "loss": 0.0319, + "epoch": 0.84, + "learning_rate": 0.0001734743799092534, + "loss": 0.0503, "step": 130690 }, { - "epoch": 1.41, - "learning_rate": 8.794860146667531e-05, - "loss": 0.0383, + "epoch": 0.84, + "learning_rate": 0.00017346469855489648, + "loss": 0.0488, "step": 130700 }, { - "epoch": 1.41, - "learning_rate": 8.793237718216626e-05, - "loss": 0.0308, + "epoch": 0.84, + "learning_rate": 0.00017345501720053956, + "loss": 0.042, "step": 130710 }, { - "epoch": 1.41, - "learning_rate": 8.791615289765721e-05, - "loss": 0.0297, + "epoch": 0.84, + "learning_rate": 0.00017344533584618264, + "loss": 0.0478, "step": 130720 }, { - "epoch": 1.41, - "learning_rate": 8.789992861314816e-05, - "loss": 0.0341, + "epoch": 0.84, + "learning_rate": 0.0001734356544918257, + "loss": 0.0448, "step": 130730 }, { - "epoch": 1.41, - "learning_rate": 8.78837043286391e-05, - "loss": 0.0296, + "epoch": 0.84, + "learning_rate": 0.00017342597313746877, + "loss": 0.0401, "step": 130740 }, { - "epoch": 1.41, - "learning_rate": 8.786748004413005e-05, - "loss": 0.03, + "epoch": 0.84, + "learning_rate": 0.00017341629178311183, + "loss": 0.0374, "step": 130750 }, { - "epoch": 1.41, - "learning_rate": 8.7851255759621e-05, - "loss": 0.0312, + "epoch": 0.84, + "learning_rate": 0.00017340661042875488, + "loss": 0.0432, "step": 130760 }, { - "epoch": 1.41, - "learning_rate": 8.783503147511195e-05, - "loss": 0.0321, + "epoch": 0.84, + "learning_rate": 0.00017339692907439796, + "loss": 0.0473, "step": 130770 }, { - "epoch": 1.41, - "learning_rate": 8.78188071906029e-05, - "loss": 0.0303, + "epoch": 0.84, + "learning_rate": 0.00017338724772004104, + "loss": 0.0414, "step": 130780 }, { - "epoch": 1.41, - "learning_rate": 8.780258290609383e-05, - "loss": 0.0356, + "epoch": 0.84, + "learning_rate": 0.00017337756636568412, + "loss": 0.0475, "step": 130790 }, { - "epoch": 1.41, - "learning_rate": 8.778635862158478e-05, - "loss": 0.0287, + "epoch": 0.84, + "learning_rate": 0.00017336788501132717, + "loss": 0.0431, "step": 130800 }, { - "epoch": 1.41, - "learning_rate": 8.777013433707573e-05, - "loss": 0.0283, + "epoch": 0.84, + "learning_rate": 0.00017335820365697025, + "loss": 0.0412, "step": 130810 }, { - "epoch": 1.41, - "learning_rate": 8.775391005256668e-05, - "loss": 0.0314, + "epoch": 0.84, + "learning_rate": 0.0001733485223026133, + "loss": 0.043, "step": 130820 }, { - "epoch": 1.42, - "learning_rate": 8.773768576805762e-05, - "loss": 0.0306, + "epoch": 0.84, + "learning_rate": 0.00017333884094825636, + "loss": 0.0398, "step": 130830 }, { - "epoch": 1.42, - "learning_rate": 8.772146148354857e-05, - "loss": 0.0318, + "epoch": 0.84, + "learning_rate": 0.00017332915959389944, + "loss": 0.0377, "step": 130840 }, { - "epoch": 1.42, - "learning_rate": 8.770523719903952e-05, - "loss": 0.0295, + "epoch": 0.84, + "learning_rate": 0.00017331947823954252, + "loss": 0.0456, "step": 130850 }, { - "epoch": 1.42, - "learning_rate": 8.768901291453047e-05, - "loss": 0.0298, + "epoch": 0.84, + "learning_rate": 0.00017330979688518557, + "loss": 0.0503, "step": 130860 }, { - "epoch": 1.42, - "learning_rate": 8.767278863002142e-05, - "loss": 0.0328, + "epoch": 0.84, + "learning_rate": 0.00017330011553082865, + "loss": 0.0369, "step": 130870 }, { - "epoch": 1.42, - "learning_rate": 8.765656434551235e-05, - "loss": 0.0377, + "epoch": 0.84, + "learning_rate": 0.00017329043417647173, + "loss": 0.0378, "step": 130880 }, { - "epoch": 1.42, - "learning_rate": 8.76403400610033e-05, - "loss": 0.0299, + "epoch": 0.84, + "learning_rate": 0.00017328075282211475, + "loss": 0.0399, "step": 130890 }, { - "epoch": 1.42, - "learning_rate": 8.762411577649425e-05, - "loss": 0.0262, + "epoch": 0.84, + "learning_rate": 0.00017327107146775783, + "loss": 0.0456, "step": 130900 }, { - "epoch": 1.42, - "learning_rate": 8.76078914919852e-05, - "loss": 0.0301, + "epoch": 0.84, + "learning_rate": 0.00017326139011340091, + "loss": 0.045, "step": 130910 }, { - "epoch": 1.42, - "learning_rate": 8.759166720747614e-05, - "loss": 0.0355, + "epoch": 0.84, + "learning_rate": 0.000173251708759044, + "loss": 0.0337, "step": 130920 }, { - "epoch": 1.42, - "learning_rate": 8.757544292296709e-05, - "loss": 0.0295, + "epoch": 0.85, + "learning_rate": 0.00017324202740468705, + "loss": 0.0427, "step": 130930 }, { - "epoch": 1.42, - "learning_rate": 8.755921863845804e-05, - "loss": 0.0369, + "epoch": 0.85, + "learning_rate": 0.00017323234605033013, + "loss": 0.0418, "step": 130940 }, { - "epoch": 1.42, - "learning_rate": 8.754299435394899e-05, - "loss": 0.0274, + "epoch": 0.85, + "learning_rate": 0.0001732226646959732, + "loss": 0.0379, "step": 130950 }, { - "epoch": 1.42, - "learning_rate": 8.752677006943994e-05, - "loss": 0.0324, + "epoch": 0.85, + "learning_rate": 0.00017321298334161623, + "loss": 0.0463, "step": 130960 }, { - "epoch": 1.42, - "learning_rate": 8.751054578493087e-05, - "loss": 0.0326, + "epoch": 0.85, + "learning_rate": 0.0001732033019872593, + "loss": 0.0456, "step": 130970 }, { - "epoch": 1.42, - "learning_rate": 8.749432150042182e-05, - "loss": 0.0299, + "epoch": 0.85, + "learning_rate": 0.0001731936206329024, + "loss": 0.0439, "step": 130980 }, { - "epoch": 1.42, - "learning_rate": 8.747809721591277e-05, - "loss": 0.0329, + "epoch": 0.85, + "learning_rate": 0.00017318393927854547, + "loss": 0.0475, "step": 130990 }, { - "epoch": 1.42, - "learning_rate": 8.746187293140372e-05, - "loss": 0.0253, + "epoch": 0.85, + "learning_rate": 0.00017317425792418852, + "loss": 0.046, "step": 131000 }, { - "epoch": 1.42, - "eval_cer": 0.9211322381661693, - "eval_loss": 0.02442746050655842, - "eval_runtime": 118.8813, - "eval_samples_per_second": 16.824, - "eval_steps_per_second": 4.206, + "epoch": 0.85, + "eval_cer": 0.9198933453847022, + "eval_loss": 0.027897853404283524, + "eval_runtime": 120.109, + "eval_samples_per_second": 16.652, + "eval_steps_per_second": 4.163, "step": 131000 }, { - "epoch": 1.42, - "learning_rate": 8.744564864689466e-05, - "loss": 0.0304, + "epoch": 0.85, + "learning_rate": 0.0001731645765698316, + "loss": 0.041, "step": 131010 }, { - "epoch": 1.42, - "learning_rate": 8.742942436238561e-05, - "loss": 0.0293, + "epoch": 0.85, + "learning_rate": 0.00017315489521547468, + "loss": 0.0381, "step": 131020 }, { - "epoch": 1.42, - "learning_rate": 8.741320007787656e-05, - "loss": 0.0365, + "epoch": 0.85, + "learning_rate": 0.0001731452138611177, + "loss": 0.0421, "step": 131030 }, { - "epoch": 1.42, - "learning_rate": 8.739697579336751e-05, - "loss": 0.034, + "epoch": 0.85, + "learning_rate": 0.0001731355325067608, + "loss": 0.0418, "step": 131040 }, { - "epoch": 1.42, - "learning_rate": 8.738075150885846e-05, - "loss": 0.0311, + "epoch": 0.85, + "learning_rate": 0.00017312585115240387, + "loss": 0.039, "step": 131050 }, { - "epoch": 1.42, - "learning_rate": 8.73645272243494e-05, - "loss": 0.0282, + "epoch": 0.85, + "learning_rate": 0.00017311616979804692, + "loss": 0.0444, "step": 131060 }, { - "epoch": 1.42, - "learning_rate": 8.734830293984035e-05, - "loss": 0.0294, + "epoch": 0.85, + "learning_rate": 0.00017310648844369, + "loss": 0.0419, "step": 131070 }, { - "epoch": 1.42, - "learning_rate": 8.73320786553313e-05, - "loss": 0.0299, + "epoch": 0.85, + "learning_rate": 0.00017309680708933308, + "loss": 0.0396, "step": 131080 }, { - "epoch": 1.42, - "learning_rate": 8.731585437082225e-05, - "loss": 0.0335, + "epoch": 0.85, + "learning_rate": 0.00017308712573497616, + "loss": 0.0399, "step": 131090 }, { - "epoch": 1.42, - "learning_rate": 8.729963008631318e-05, - "loss": 0.0234, + "epoch": 0.85, + "learning_rate": 0.00017307744438061919, + "loss": 0.0428, "step": 131100 }, { - "epoch": 1.42, - "learning_rate": 8.728340580180413e-05, - "loss": 0.0325, + "epoch": 0.85, + "learning_rate": 0.00017306776302626227, + "loss": 0.0487, "step": 131110 }, { - "epoch": 1.42, - "learning_rate": 8.726718151729508e-05, - "loss": 0.0323, + "epoch": 0.85, + "learning_rate": 0.00017305808167190535, + "loss": 0.042, "step": 131120 }, { - "epoch": 1.42, - "learning_rate": 8.725095723278603e-05, - "loss": 0.0395, + "epoch": 0.85, + "learning_rate": 0.0001730484003175484, + "loss": 0.0399, "step": 131130 }, { - "epoch": 1.42, - "learning_rate": 8.723473294827698e-05, - "loss": 0.0351, + "epoch": 0.85, + "learning_rate": 0.00017303871896319148, + "loss": 0.0366, "step": 131140 }, { - "epoch": 1.42, - "learning_rate": 8.721850866376792e-05, - "loss": 0.0365, + "epoch": 0.85, + "learning_rate": 0.00017302903760883456, + "loss": 0.0481, "step": 131150 }, { - "epoch": 1.42, - "learning_rate": 8.720228437925887e-05, - "loss": 0.0328, + "epoch": 0.85, + "learning_rate": 0.00017301935625447764, + "loss": 0.0384, "step": 131160 }, { - "epoch": 1.42, - "learning_rate": 8.718606009474982e-05, - "loss": 0.0281, + "epoch": 0.85, + "learning_rate": 0.00017300967490012066, + "loss": 0.0386, "step": 131170 }, { - "epoch": 1.42, - "learning_rate": 8.716983581024077e-05, - "loss": 0.027, + "epoch": 0.85, + "learning_rate": 0.00017299999354576374, + "loss": 0.0432, "step": 131180 }, { - "epoch": 1.42, - "learning_rate": 8.715361152573172e-05, - "loss": 0.0283, + "epoch": 0.85, + "learning_rate": 0.00017299031219140682, + "loss": 0.0446, "step": 131190 }, { - "epoch": 1.42, - "learning_rate": 8.713738724122265e-05, - "loss": 0.0335, + "epoch": 0.85, + "learning_rate": 0.00017298063083704988, + "loss": 0.04, "step": 131200 }, { - "epoch": 1.42, - "learning_rate": 8.71211629567136e-05, - "loss": 0.0327, + "epoch": 0.85, + "learning_rate": 0.00017297094948269295, + "loss": 0.0359, "step": 131210 }, { - "epoch": 1.42, - "learning_rate": 8.710493867220455e-05, - "loss": 0.0282, + "epoch": 0.85, + "learning_rate": 0.00017296126812833603, + "loss": 0.0455, "step": 131220 }, { - "epoch": 1.42, - "learning_rate": 8.70887143876955e-05, - "loss": 0.0355, + "epoch": 0.85, + "learning_rate": 0.0001729515867739791, + "loss": 0.0344, "step": 131230 }, { - "epoch": 1.42, - "learning_rate": 8.707249010318644e-05, - "loss": 0.0301, + "epoch": 0.85, + "learning_rate": 0.00017294190541962214, + "loss": 0.0465, "step": 131240 }, { - "epoch": 1.42, - "learning_rate": 8.705626581867739e-05, - "loss": 0.0288, + "epoch": 0.85, + "learning_rate": 0.00017293222406526522, + "loss": 0.0467, "step": 131250 }, { - "epoch": 1.42, - "learning_rate": 8.704004153416834e-05, - "loss": 0.0261, + "epoch": 0.85, + "learning_rate": 0.00017292254271090827, + "loss": 0.0398, "step": 131260 }, { - "epoch": 1.42, - "learning_rate": 8.702381724965929e-05, - "loss": 0.0274, + "epoch": 0.85, + "learning_rate": 0.00017291286135655135, + "loss": 0.0333, "step": 131270 }, { - "epoch": 1.42, - "learning_rate": 8.700759296515024e-05, - "loss": 0.0335, + "epoch": 0.85, + "learning_rate": 0.00017290318000219443, + "loss": 0.0384, "step": 131280 }, { - "epoch": 1.42, - "learning_rate": 8.699136868064117e-05, - "loss": 0.0267, + "epoch": 0.85, + "learning_rate": 0.0001728934986478375, + "loss": 0.0361, "step": 131290 }, { - "epoch": 1.42, - "learning_rate": 8.697514439613212e-05, - "loss": 0.0354, + "epoch": 0.85, + "learning_rate": 0.00017288381729348056, + "loss": 0.0386, "step": 131300 }, { - "epoch": 1.42, - "learning_rate": 8.695892011162307e-05, - "loss": 0.0343, + "epoch": 0.85, + "learning_rate": 0.00017287413593912362, + "loss": 0.0397, "step": 131310 }, { - "epoch": 1.42, - "learning_rate": 8.694269582711402e-05, - "loss": 0.0314, + "epoch": 0.85, + "learning_rate": 0.0001728644545847667, + "loss": 0.0443, "step": 131320 }, { - "epoch": 1.42, - "learning_rate": 8.692647154260496e-05, - "loss": 0.0281, + "epoch": 0.85, + "learning_rate": 0.00017285477323040975, + "loss": 0.0434, "step": 131330 }, { - "epoch": 1.42, - "learning_rate": 8.691024725809591e-05, - "loss": 0.0269, + "epoch": 0.85, + "learning_rate": 0.00017284509187605283, + "loss": 0.0414, "step": 131340 }, { - "epoch": 1.42, - "learning_rate": 8.689402297358686e-05, - "loss": 0.026, + "epoch": 0.85, + "learning_rate": 0.0001728354105216959, + "loss": 0.046, "step": 131350 }, { - "epoch": 1.42, - "learning_rate": 8.687779868907781e-05, - "loss": 0.0259, + "epoch": 0.85, + "learning_rate": 0.000172825729167339, + "loss": 0.0412, "step": 131360 }, { - "epoch": 1.42, - "learning_rate": 8.686157440456876e-05, - "loss": 0.0301, + "epoch": 0.85, + "learning_rate": 0.00017281604781298204, + "loss": 0.0448, "step": 131370 }, { - "epoch": 1.42, - "learning_rate": 8.68453501200597e-05, - "loss": 0.0296, + "epoch": 0.85, + "learning_rate": 0.0001728063664586251, + "loss": 0.0472, "step": 131380 }, { - "epoch": 1.42, - "learning_rate": 8.682912583555064e-05, - "loss": 0.0257, + "epoch": 0.85, + "learning_rate": 0.00017279668510426817, + "loss": 0.045, "step": 131390 }, { - "epoch": 1.42, - "learning_rate": 8.681290155104159e-05, - "loss": 0.0314, + "epoch": 0.85, + "learning_rate": 0.00017278700374991123, + "loss": 0.0403, "step": 131400 }, { - "epoch": 1.42, - "learning_rate": 8.679667726653254e-05, - "loss": 0.0273, + "epoch": 0.85, + "learning_rate": 0.0001727773223955543, + "loss": 0.045, "step": 131410 }, { - "epoch": 1.42, - "learning_rate": 8.678045298202348e-05, - "loss": 0.0334, + "epoch": 0.85, + "learning_rate": 0.0001727676410411974, + "loss": 0.0426, "step": 131420 }, { - "epoch": 1.42, - "learning_rate": 8.676422869751443e-05, - "loss": 0.029, + "epoch": 0.85, + "learning_rate": 0.00017275795968684044, + "loss": 0.044, "step": 131430 }, { - "epoch": 1.42, - "learning_rate": 8.674800441300538e-05, - "loss": 0.0448, + "epoch": 0.85, + "learning_rate": 0.00017274827833248352, + "loss": 0.0365, "step": 131440 }, { - "epoch": 1.42, - "learning_rate": 8.673178012849633e-05, - "loss": 0.0294, + "epoch": 0.85, + "learning_rate": 0.00017273859697812657, + "loss": 0.0409, "step": 131450 }, { - "epoch": 1.42, - "learning_rate": 8.671555584398728e-05, - "loss": 0.0287, + "epoch": 0.85, + "learning_rate": 0.00017272891562376962, + "loss": 0.0441, "step": 131460 }, { - "epoch": 1.42, - "learning_rate": 8.669933155947821e-05, - "loss": 0.0308, + "epoch": 0.85, + "learning_rate": 0.0001727192342694127, + "loss": 0.0408, "step": 131470 }, { - "epoch": 1.42, - "learning_rate": 8.668310727496916e-05, - "loss": 0.0326, + "epoch": 0.85, + "learning_rate": 0.00017270955291505578, + "loss": 0.038, "step": 131480 }, { - "epoch": 1.42, - "learning_rate": 8.666688299046011e-05, - "loss": 0.032, + "epoch": 0.85, + "learning_rate": 0.00017269987156069886, + "loss": 0.0431, "step": 131490 }, { - "epoch": 1.42, - "learning_rate": 8.665065870595106e-05, - "loss": 0.0335, + "epoch": 0.85, + "learning_rate": 0.00017269019020634192, + "loss": 0.0373, "step": 131500 }, { - "epoch": 1.42, - "learning_rate": 8.6634434421442e-05, - "loss": 0.0281, + "epoch": 0.85, + "learning_rate": 0.000172680508851985, + "loss": 0.0389, "step": 131510 }, { - "epoch": 1.42, - "learning_rate": 8.661821013693295e-05, - "loss": 0.0318, + "epoch": 0.85, + "learning_rate": 0.00017267082749762805, + "loss": 0.0445, "step": 131520 }, { - "epoch": 1.42, - "learning_rate": 8.66019858524239e-05, - "loss": 0.0256, + "epoch": 0.85, + "learning_rate": 0.0001726611461432711, + "loss": 0.0447, "step": 131530 }, { - "epoch": 1.42, - "learning_rate": 8.658576156791485e-05, - "loss": 0.0283, + "epoch": 0.85, + "learning_rate": 0.00017265146478891418, + "loss": 0.0466, "step": 131540 }, { - "epoch": 1.42, - "learning_rate": 8.65695372834058e-05, - "loss": 0.0279, + "epoch": 0.85, + "learning_rate": 0.00017264178343455726, + "loss": 0.0427, "step": 131550 }, { - "epoch": 1.42, - "learning_rate": 8.655331299889674e-05, - "loss": 0.0414, + "epoch": 0.85, + "learning_rate": 0.00017263210208020034, + "loss": 0.0388, "step": 131560 }, { - "epoch": 1.42, - "learning_rate": 8.653708871438769e-05, - "loss": 0.0261, + "epoch": 0.85, + "learning_rate": 0.0001726224207258434, + "loss": 0.0371, "step": 131570 }, { - "epoch": 1.42, - "learning_rate": 8.652086442987863e-05, - "loss": 0.0316, + "epoch": 0.85, + "learning_rate": 0.00017261273937148647, + "loss": 0.0322, "step": 131580 }, { - "epoch": 1.42, - "learning_rate": 8.650464014536958e-05, - "loss": 0.0293, + "epoch": 0.85, + "learning_rate": 0.00017260305801712953, + "loss": 0.0352, "step": 131590 }, { - "epoch": 1.42, - "learning_rate": 8.648841586086052e-05, - "loss": 0.0311, + "epoch": 0.85, + "learning_rate": 0.00017259337666277258, + "loss": 0.0396, "step": 131600 }, { - "epoch": 1.42, - "learning_rate": 8.647219157635147e-05, - "loss": 0.0325, + "epoch": 0.85, + "learning_rate": 0.00017258369530841566, + "loss": 0.0444, "step": 131610 }, { - "epoch": 1.42, - "learning_rate": 8.645596729184242e-05, - "loss": 0.0313, + "epoch": 0.85, + "learning_rate": 0.00017257401395405874, + "loss": 0.0396, "step": 131620 }, { - "epoch": 1.42, - "learning_rate": 8.643974300733337e-05, - "loss": 0.0311, + "epoch": 0.85, + "learning_rate": 0.0001725643325997018, + "loss": 0.0417, "step": 131630 }, { - "epoch": 1.42, - "learning_rate": 8.642351872282432e-05, - "loss": 0.035, + "epoch": 0.85, + "learning_rate": 0.00017255465124534487, + "loss": 0.0406, "step": 131640 }, { - "epoch": 1.42, - "learning_rate": 8.640729443831526e-05, - "loss": 0.0279, + "epoch": 0.85, + "learning_rate": 0.00017254496989098795, + "loss": 0.0377, "step": 131650 }, { - "epoch": 1.42, - "learning_rate": 8.63910701538062e-05, - "loss": 0.0362, + "epoch": 0.85, + "learning_rate": 0.00017253528853663098, + "loss": 0.0472, "step": 131660 }, { - "epoch": 1.42, - "learning_rate": 8.637484586929716e-05, - "loss": 0.0281, + "epoch": 0.85, + "learning_rate": 0.00017252560718227406, + "loss": 0.04, "step": 131670 }, { - "epoch": 1.42, - "learning_rate": 8.63586215847881e-05, - "loss": 0.0305, + "epoch": 0.85, + "learning_rate": 0.00017251592582791714, + "loss": 0.0448, "step": 131680 }, { - "epoch": 1.42, - "learning_rate": 8.634239730027904e-05, - "loss": 0.037, + "epoch": 0.85, + "learning_rate": 0.00017250624447356022, + "loss": 0.0369, "step": 131690 }, { - "epoch": 1.42, - "learning_rate": 8.632617301576999e-05, - "loss": 0.0385, + "epoch": 0.85, + "learning_rate": 0.00017249656311920327, + "loss": 0.0446, "step": 131700 }, { - "epoch": 1.42, - "learning_rate": 8.630994873126094e-05, - "loss": 0.0293, + "epoch": 0.85, + "learning_rate": 0.00017248688176484635, + "loss": 0.0417, "step": 131710 }, { - "epoch": 1.42, - "learning_rate": 8.629372444675189e-05, - "loss": 0.0319, + "epoch": 0.85, + "learning_rate": 0.00017247720041048943, + "loss": 0.0469, "step": 131720 }, { - "epoch": 1.42, - "learning_rate": 8.627750016224284e-05, - "loss": 0.0288, + "epoch": 0.85, + "learning_rate": 0.00017246751905613245, + "loss": 0.0384, "step": 131730 }, { - "epoch": 1.42, - "learning_rate": 8.626127587773378e-05, - "loss": 0.0304, + "epoch": 0.85, + "learning_rate": 0.00017245783770177553, + "loss": 0.041, "step": 131740 }, { - "epoch": 1.43, - "learning_rate": 8.624505159322473e-05, - "loss": 0.027, + "epoch": 0.85, + "learning_rate": 0.0001724481563474186, + "loss": 0.0448, "step": 131750 }, { - "epoch": 1.43, - "learning_rate": 8.622882730871568e-05, - "loss": 0.035, + "epoch": 0.85, + "learning_rate": 0.0001724384749930617, + "loss": 0.0387, "step": 131760 }, { - "epoch": 1.43, - "learning_rate": 8.621260302420663e-05, - "loss": 0.0291, + "epoch": 0.85, + "learning_rate": 0.00017242879363870475, + "loss": 0.0449, "step": 131770 }, { - "epoch": 1.43, - "learning_rate": 8.619637873969756e-05, - "loss": 0.0349, + "epoch": 0.85, + "learning_rate": 0.00017241911228434783, + "loss": 0.0413, "step": 131780 }, { - "epoch": 1.43, - "learning_rate": 8.618015445518851e-05, - "loss": 0.0274, + "epoch": 0.85, + "learning_rate": 0.0001724094309299909, + "loss": 0.038, "step": 131790 }, { - "epoch": 1.43, - "learning_rate": 8.616393017067946e-05, - "loss": 0.0278, + "epoch": 0.85, + "learning_rate": 0.00017239974957563393, + "loss": 0.0404, "step": 131800 }, { - "epoch": 1.43, - "learning_rate": 8.614770588617041e-05, - "loss": 0.0304, + "epoch": 0.85, + "learning_rate": 0.000172390068221277, + "loss": 0.0361, "step": 131810 }, { - "epoch": 1.43, - "learning_rate": 8.613148160166136e-05, - "loss": 0.0293, + "epoch": 0.85, + "learning_rate": 0.0001723803868669201, + "loss": 0.0392, "step": 131820 }, { - "epoch": 1.43, - "learning_rate": 8.61152573171523e-05, - "loss": 0.0323, + "epoch": 0.85, + "learning_rate": 0.00017237070551256314, + "loss": 0.0426, "step": 131830 }, { - "epoch": 1.43, - "learning_rate": 8.609903303264325e-05, - "loss": 0.028, + "epoch": 0.85, + "learning_rate": 0.00017236102415820622, + "loss": 0.0393, "step": 131840 }, { - "epoch": 1.43, - "learning_rate": 8.60828087481342e-05, - "loss": 0.0306, + "epoch": 0.85, + "learning_rate": 0.0001723513428038493, + "loss": 0.0512, "step": 131850 }, { - "epoch": 1.43, - "learning_rate": 8.606658446362515e-05, - "loss": 0.0281, + "epoch": 0.85, + "learning_rate": 0.00017234166144949238, + "loss": 0.0415, "step": 131860 }, { - "epoch": 1.43, - "learning_rate": 8.60503601791161e-05, - "loss": 0.0248, + "epoch": 0.85, + "learning_rate": 0.0001723319800951354, + "loss": 0.0415, "step": 131870 }, { - "epoch": 1.43, - "learning_rate": 8.603413589460703e-05, - "loss": 0.0294, + "epoch": 0.85, + "learning_rate": 0.0001723222987407785, + "loss": 0.0451, "step": 131880 }, { - "epoch": 1.43, - "learning_rate": 8.601791161009798e-05, - "loss": 0.0332, + "epoch": 0.85, + "learning_rate": 0.00017231261738642157, + "loss": 0.0403, "step": 131890 }, { - "epoch": 1.43, - "learning_rate": 8.600168732558893e-05, - "loss": 0.032, + "epoch": 0.85, + "learning_rate": 0.00017230293603206462, + "loss": 0.0385, "step": 131900 }, { - "epoch": 1.43, - "learning_rate": 8.598546304107988e-05, - "loss": 0.0266, + "epoch": 0.85, + "learning_rate": 0.0001722932546777077, + "loss": 0.0434, "step": 131910 }, { - "epoch": 1.43, - "learning_rate": 8.596923875657082e-05, - "loss": 0.0309, + "epoch": 0.85, + "learning_rate": 0.00017228357332335078, + "loss": 0.0441, "step": 131920 }, { - "epoch": 1.43, - "learning_rate": 8.595301447206177e-05, - "loss": 0.0315, + "epoch": 0.85, + "learning_rate": 0.00017227389196899386, + "loss": 0.0385, "step": 131930 }, { - "epoch": 1.43, - "learning_rate": 8.593679018755272e-05, - "loss": 0.0326, + "epoch": 0.85, + "learning_rate": 0.00017226421061463689, + "loss": 0.0405, "step": 131940 }, { - "epoch": 1.43, - "learning_rate": 8.592056590304367e-05, - "loss": 0.0314, + "epoch": 0.85, + "learning_rate": 0.00017225452926027997, + "loss": 0.0367, "step": 131950 }, { - "epoch": 1.43, - "learning_rate": 8.590434161853462e-05, - "loss": 0.0299, + "epoch": 0.85, + "learning_rate": 0.00017224484790592304, + "loss": 0.0424, "step": 131960 }, { - "epoch": 1.43, - "learning_rate": 8.588811733402555e-05, - "loss": 0.025, + "epoch": 0.85, + "learning_rate": 0.0001722351665515661, + "loss": 0.0378, "step": 131970 }, { - "epoch": 1.43, - "learning_rate": 8.58718930495165e-05, - "loss": 0.0274, + "epoch": 0.85, + "learning_rate": 0.00017222548519720918, + "loss": 0.0361, "step": 131980 }, { - "epoch": 1.43, - "learning_rate": 8.585566876500745e-05, - "loss": 0.0313, + "epoch": 0.85, + "learning_rate": 0.00017221580384285226, + "loss": 0.036, "step": 131990 }, { - "epoch": 1.43, - "learning_rate": 8.58394444804984e-05, - "loss": 0.0287, + "epoch": 0.85, + "learning_rate": 0.00017220612248849534, + "loss": 0.0431, "step": 132000 }, { - "epoch": 1.43, - "eval_cer": 0.9211481408839437, - "eval_loss": 0.024598222225904465, - "eval_runtime": 118.8469, - "eval_samples_per_second": 16.828, - "eval_steps_per_second": 4.207, + "epoch": 0.85, + "eval_cer": 0.9199023839114224, + "eval_loss": 0.02698080614209175, + "eval_runtime": 119.8592, + "eval_samples_per_second": 16.686, + "eval_steps_per_second": 4.172, "step": 132000 }, { - "epoch": 1.43, - "learning_rate": 8.582322019598934e-05, - "loss": 0.032, + "epoch": 0.85, + "learning_rate": 0.00017219644113413836, + "loss": 0.0361, "step": 132010 }, { - "epoch": 1.43, - "learning_rate": 8.580699591148029e-05, - "loss": 0.0299, + "epoch": 0.85, + "learning_rate": 0.00017218675977978144, + "loss": 0.042, "step": 132020 }, { - "epoch": 1.43, - "learning_rate": 8.579077162697124e-05, - "loss": 0.0335, + "epoch": 0.85, + "learning_rate": 0.0001721770784254245, + "loss": 0.0419, "step": 132030 }, { - "epoch": 1.43, - "learning_rate": 8.577454734246219e-05, - "loss": 0.0322, + "epoch": 0.85, + "learning_rate": 0.00017216739707106757, + "loss": 0.0405, "step": 132040 }, { - "epoch": 1.43, - "learning_rate": 8.575832305795314e-05, - "loss": 0.0276, + "epoch": 0.85, + "learning_rate": 0.00017215771571671065, + "loss": 0.0392, "step": 132050 }, { - "epoch": 1.43, - "learning_rate": 8.574209877344407e-05, - "loss": 0.0284, + "epoch": 0.85, + "learning_rate": 0.00017214803436235373, + "loss": 0.0426, "step": 132060 }, { - "epoch": 1.43, - "learning_rate": 8.572587448893502e-05, - "loss": 0.0268, + "epoch": 0.85, + "learning_rate": 0.0001721383530079968, + "loss": 0.0427, "step": 132070 }, { - "epoch": 1.43, - "learning_rate": 8.570965020442597e-05, - "loss": 0.0314, + "epoch": 0.85, + "learning_rate": 0.00017212867165363984, + "loss": 0.0444, "step": 132080 }, { - "epoch": 1.43, - "learning_rate": 8.569342591991692e-05, - "loss": 0.0325, + "epoch": 0.85, + "learning_rate": 0.00017211899029928292, + "loss": 0.035, "step": 132090 }, { - "epoch": 1.43, - "learning_rate": 8.567720163540786e-05, - "loss": 0.028, + "epoch": 0.85, + "learning_rate": 0.00017210930894492597, + "loss": 0.0454, "step": 132100 }, { - "epoch": 1.43, - "learning_rate": 8.566097735089881e-05, - "loss": 0.0296, + "epoch": 0.85, + "learning_rate": 0.00017209962759056905, + "loss": 0.046, "step": 132110 }, { - "epoch": 1.43, - "learning_rate": 8.564475306638976e-05, - "loss": 0.0319, + "epoch": 0.85, + "learning_rate": 0.00017208994623621213, + "loss": 0.0384, "step": 132120 }, { - "epoch": 1.43, - "learning_rate": 8.562852878188071e-05, - "loss": 0.0436, + "epoch": 0.85, + "learning_rate": 0.0001720802648818552, + "loss": 0.0372, "step": 132130 }, { - "epoch": 1.43, - "learning_rate": 8.561230449737166e-05, - "loss": 0.0377, + "epoch": 0.85, + "learning_rate": 0.00017207058352749826, + "loss": 0.0381, "step": 132140 }, { - "epoch": 1.43, - "learning_rate": 8.55960802128626e-05, - "loss": 0.0319, + "epoch": 0.85, + "learning_rate": 0.00017206090217314132, + "loss": 0.0474, "step": 132150 }, { - "epoch": 1.43, - "learning_rate": 8.557985592835355e-05, - "loss": 0.0291, + "epoch": 0.85, + "learning_rate": 0.0001720512208187844, + "loss": 0.0437, "step": 132160 }, { - "epoch": 1.43, - "learning_rate": 8.55636316438445e-05, - "loss": 0.0417, + "epoch": 0.85, + "learning_rate": 0.00017204153946442745, + "loss": 0.0409, "step": 132170 }, { - "epoch": 1.43, - "learning_rate": 8.554740735933544e-05, - "loss": 0.0278, + "epoch": 0.85, + "learning_rate": 0.00017203185811007053, + "loss": 0.0388, "step": 132180 }, { - "epoch": 1.43, - "learning_rate": 8.553118307482638e-05, - "loss": 0.028, + "epoch": 0.85, + "learning_rate": 0.0001720221767557136, + "loss": 0.0507, "step": 132190 }, { - "epoch": 1.43, - "learning_rate": 8.551495879031733e-05, - "loss": 0.0281, + "epoch": 0.85, + "learning_rate": 0.0001720124954013567, + "loss": 0.0459, "step": 132200 }, { - "epoch": 1.43, - "learning_rate": 8.549873450580828e-05, - "loss": 0.0269, + "epoch": 0.85, + "learning_rate": 0.00017200281404699974, + "loss": 0.0471, "step": 132210 }, { - "epoch": 1.43, - "learning_rate": 8.548251022129923e-05, - "loss": 0.0322, + "epoch": 0.85, + "learning_rate": 0.0001719931326926428, + "loss": 0.0393, "step": 132220 }, { - "epoch": 1.43, - "learning_rate": 8.546628593679018e-05, - "loss": 0.0301, + "epoch": 0.85, + "learning_rate": 0.00017198345133828585, + "loss": 0.0377, "step": 132230 }, { - "epoch": 1.43, - "learning_rate": 8.545006165228112e-05, - "loss": 0.0302, + "epoch": 0.85, + "learning_rate": 0.00017197376998392893, + "loss": 0.0418, "step": 132240 }, { - "epoch": 1.43, - "learning_rate": 8.543383736777207e-05, - "loss": 0.0301, + "epoch": 0.85, + "learning_rate": 0.000171964088629572, + "loss": 0.0477, "step": 132250 }, { - "epoch": 1.43, - "learning_rate": 8.541761308326302e-05, - "loss": 0.0282, + "epoch": 0.85, + "learning_rate": 0.00017195440727521509, + "loss": 0.0373, "step": 132260 }, { - "epoch": 1.43, - "learning_rate": 8.540138879875397e-05, - "loss": 0.0291, + "epoch": 0.85, + "learning_rate": 0.00017194472592085814, + "loss": 0.0484, "step": 132270 }, { - "epoch": 1.43, - "learning_rate": 8.53851645142449e-05, - "loss": 0.0324, + "epoch": 0.85, + "learning_rate": 0.00017193504456650122, + "loss": 0.0436, "step": 132280 }, { - "epoch": 1.43, - "learning_rate": 8.536894022973585e-05, - "loss": 0.0289, + "epoch": 0.85, + "learning_rate": 0.00017192536321214427, + "loss": 0.0416, "step": 132290 }, { - "epoch": 1.43, - "learning_rate": 8.53527159452268e-05, - "loss": 0.0293, + "epoch": 0.85, + "learning_rate": 0.00017191568185778732, + "loss": 0.0406, "step": 132300 }, { - "epoch": 1.43, - "learning_rate": 8.533649166071775e-05, - "loss": 0.0323, + "epoch": 0.85, + "learning_rate": 0.0001719060005034304, + "loss": 0.0418, "step": 132310 }, { - "epoch": 1.43, - "learning_rate": 8.53202673762087e-05, - "loss": 0.0331, + "epoch": 0.85, + "learning_rate": 0.00017189631914907348, + "loss": 0.0391, "step": 132320 }, { - "epoch": 1.43, - "learning_rate": 8.530404309169964e-05, - "loss": 0.0261, + "epoch": 0.85, + "learning_rate": 0.00017188663779471656, + "loss": 0.0356, "step": 132330 }, { - "epoch": 1.43, - "learning_rate": 8.528781880719059e-05, - "loss": 0.0316, + "epoch": 0.85, + "learning_rate": 0.00017187695644035962, + "loss": 0.0388, "step": 132340 }, { - "epoch": 1.43, - "learning_rate": 8.527159452268154e-05, - "loss": 0.0311, + "epoch": 0.85, + "learning_rate": 0.0001718672750860027, + "loss": 0.0425, "step": 132350 }, { - "epoch": 1.43, - "learning_rate": 8.525537023817249e-05, - "loss": 0.0273, + "epoch": 0.85, + "learning_rate": 0.00017185759373164575, + "loss": 0.0365, "step": 132360 }, { - "epoch": 1.43, - "learning_rate": 8.523914595366342e-05, - "loss": 0.0301, + "epoch": 0.85, + "learning_rate": 0.0001718479123772888, + "loss": 0.0433, "step": 132370 }, { - "epoch": 1.43, - "learning_rate": 8.522292166915437e-05, - "loss": 0.0356, + "epoch": 0.85, + "learning_rate": 0.00017183823102293188, + "loss": 0.0383, "step": 132380 }, { - "epoch": 1.43, - "learning_rate": 8.520669738464532e-05, - "loss": 0.0276, + "epoch": 0.85, + "learning_rate": 0.00017182854966857496, + "loss": 0.0511, "step": 132390 }, { - "epoch": 1.43, - "learning_rate": 8.519047310013627e-05, - "loss": 0.0278, + "epoch": 0.85, + "learning_rate": 0.00017181886831421804, + "loss": 0.041, "step": 132400 }, { - "epoch": 1.43, - "learning_rate": 8.517424881562722e-05, - "loss": 0.0285, + "epoch": 0.85, + "learning_rate": 0.0001718091869598611, + "loss": 0.0422, "step": 132410 }, { - "epoch": 1.43, - "learning_rate": 8.515802453111816e-05, - "loss": 0.0333, + "epoch": 0.85, + "learning_rate": 0.00017179950560550417, + "loss": 0.04, "step": 132420 }, { - "epoch": 1.43, - "learning_rate": 8.514180024660911e-05, - "loss": 0.0304, + "epoch": 0.85, + "learning_rate": 0.0001717898242511472, + "loss": 0.0455, "step": 132430 }, { - "epoch": 1.43, - "learning_rate": 8.512557596210006e-05, - "loss": 0.0322, + "epoch": 0.85, + "learning_rate": 0.00017178014289679028, + "loss": 0.0431, "step": 132440 }, { - "epoch": 1.43, - "learning_rate": 8.510935167759101e-05, - "loss": 0.0275, + "epoch": 0.85, + "learning_rate": 0.00017177046154243336, + "loss": 0.0329, "step": 132450 }, { - "epoch": 1.43, - "learning_rate": 8.509312739308194e-05, - "loss": 0.0333, + "epoch": 0.85, + "learning_rate": 0.00017176078018807644, + "loss": 0.0386, "step": 132460 }, { - "epoch": 1.43, - "learning_rate": 8.50769031085729e-05, - "loss": 0.0254, + "epoch": 0.85, + "learning_rate": 0.0001717510988337195, + "loss": 0.0463, "step": 132470 }, { - "epoch": 1.43, - "learning_rate": 8.506067882406384e-05, - "loss": 0.0296, + "epoch": 0.86, + "learning_rate": 0.00017174141747936257, + "loss": 0.0368, "step": 132480 }, { - "epoch": 1.43, - "learning_rate": 8.504445453955479e-05, - "loss": 0.0315, + "epoch": 0.86, + "learning_rate": 0.00017173173612500565, + "loss": 0.0441, "step": 132490 }, { - "epoch": 1.43, - "learning_rate": 8.502823025504574e-05, - "loss": 0.031, + "epoch": 0.86, + "learning_rate": 0.00017172205477064868, + "loss": 0.0394, "step": 132500 }, { - "epoch": 1.43, - "learning_rate": 8.501200597053668e-05, - "loss": 0.0316, + "epoch": 0.86, + "learning_rate": 0.00017171237341629176, + "loss": 0.0432, "step": 132510 }, { - "epoch": 1.43, - "learning_rate": 8.499578168602763e-05, - "loss": 0.0387, + "epoch": 0.86, + "learning_rate": 0.00017170269206193484, + "loss": 0.041, "step": 132520 }, { - "epoch": 1.43, - "learning_rate": 8.497955740151858e-05, - "loss": 0.0307, + "epoch": 0.86, + "learning_rate": 0.00017169301070757792, + "loss": 0.0408, "step": 132530 }, { - "epoch": 1.43, - "learning_rate": 8.496333311700953e-05, - "loss": 0.0375, + "epoch": 0.86, + "learning_rate": 0.00017168332935322097, + "loss": 0.0397, "step": 132540 }, { - "epoch": 1.43, - "learning_rate": 8.494710883250046e-05, - "loss": 0.0344, + "epoch": 0.86, + "learning_rate": 0.00017167364799886405, + "loss": 0.0359, "step": 132550 }, { - "epoch": 1.43, - "learning_rate": 8.493088454799141e-05, - "loss": 0.0355, + "epoch": 0.86, + "learning_rate": 0.00017166396664450713, + "loss": 0.0451, "step": 132560 }, { - "epoch": 1.43, - "learning_rate": 8.491466026348236e-05, - "loss": 0.0293, + "epoch": 0.86, + "learning_rate": 0.00017165428529015015, + "loss": 0.0445, "step": 132570 }, { - "epoch": 1.43, - "learning_rate": 8.489843597897333e-05, - "loss": 0.0373, + "epoch": 0.86, + "learning_rate": 0.00017164460393579323, + "loss": 0.0427, "step": 132580 }, { - "epoch": 1.43, - "learning_rate": 8.488221169446428e-05, - "loss": 0.0316, + "epoch": 0.86, + "learning_rate": 0.0001716349225814363, + "loss": 0.0343, "step": 132590 }, { - "epoch": 1.43, - "learning_rate": 8.486598740995523e-05, - "loss": 0.0304, + "epoch": 0.86, + "learning_rate": 0.0001716252412270794, + "loss": 0.0397, "step": 132600 }, { - "epoch": 1.43, - "learning_rate": 8.484976312544616e-05, - "loss": 0.0249, + "epoch": 0.86, + "learning_rate": 0.00017161555987272245, + "loss": 0.0436, "step": 132610 }, { - "epoch": 1.43, - "learning_rate": 8.483353884093711e-05, - "loss": 0.0325, + "epoch": 0.86, + "learning_rate": 0.00017160587851836553, + "loss": 0.0376, "step": 132620 }, { - "epoch": 1.43, - "learning_rate": 8.481731455642806e-05, - "loss": 0.0252, + "epoch": 0.86, + "learning_rate": 0.0001715961971640086, + "loss": 0.0425, "step": 132630 }, { - "epoch": 1.43, - "learning_rate": 8.480109027191901e-05, - "loss": 0.025, + "epoch": 0.86, + "learning_rate": 0.00017158651580965163, + "loss": 0.0398, "step": 132640 }, { - "epoch": 1.43, - "learning_rate": 8.478486598740996e-05, - "loss": 0.0281, + "epoch": 0.86, + "learning_rate": 0.0001715768344552947, + "loss": 0.0443, "step": 132650 }, { - "epoch": 1.43, - "learning_rate": 8.47686417029009e-05, - "loss": 0.0279, + "epoch": 0.86, + "learning_rate": 0.0001715671531009378, + "loss": 0.0422, "step": 132660 }, { - "epoch": 1.43, - "learning_rate": 8.475241741839185e-05, - "loss": 0.0367, + "epoch": 0.86, + "learning_rate": 0.00017155747174658084, + "loss": 0.0425, "step": 132670 }, { - "epoch": 1.44, - "learning_rate": 8.47361931338828e-05, - "loss": 0.0303, + "epoch": 0.86, + "learning_rate": 0.00017154779039222392, + "loss": 0.0397, "step": 132680 }, { - "epoch": 1.44, - "learning_rate": 8.471996884937375e-05, - "loss": 0.0352, + "epoch": 0.86, + "learning_rate": 0.000171538109037867, + "loss": 0.0432, "step": 132690 }, { - "epoch": 1.44, - "learning_rate": 8.470374456486468e-05, - "loss": 0.034, + "epoch": 0.86, + "learning_rate": 0.00017152842768351008, + "loss": 0.0389, "step": 132700 }, { - "epoch": 1.44, - "learning_rate": 8.468752028035563e-05, - "loss": 0.0333, + "epoch": 0.86, + "learning_rate": 0.0001715187463291531, + "loss": 0.0529, "step": 132710 }, { - "epoch": 1.44, - "learning_rate": 8.467129599584658e-05, - "loss": 0.0433, + "epoch": 0.86, + "learning_rate": 0.0001715090649747962, + "loss": 0.0457, "step": 132720 }, { - "epoch": 1.44, - "learning_rate": 8.465507171133753e-05, - "loss": 0.0293, + "epoch": 0.86, + "learning_rate": 0.00017149938362043927, + "loss": 0.0406, "step": 132730 }, { - "epoch": 1.44, - "learning_rate": 8.463884742682848e-05, - "loss": 0.0295, + "epoch": 0.86, + "learning_rate": 0.00017148970226608232, + "loss": 0.0377, "step": 132740 }, { - "epoch": 1.44, - "learning_rate": 8.462262314231942e-05, - "loss": 0.0309, + "epoch": 0.86, + "learning_rate": 0.0001714800209117254, + "loss": 0.0367, "step": 132750 }, { - "epoch": 1.44, - "learning_rate": 8.460639885781037e-05, - "loss": 0.0393, + "epoch": 0.86, + "learning_rate": 0.00017147033955736848, + "loss": 0.0487, "step": 132760 }, { - "epoch": 1.44, - "learning_rate": 8.459017457330132e-05, - "loss": 0.0336, + "epoch": 0.86, + "learning_rate": 0.00017146065820301156, + "loss": 0.0432, "step": 132770 }, { - "epoch": 1.44, - "learning_rate": 8.457395028879227e-05, - "loss": 0.0351, + "epoch": 0.86, + "learning_rate": 0.00017145097684865458, + "loss": 0.0406, "step": 132780 }, { - "epoch": 1.44, - "learning_rate": 8.45577260042832e-05, - "loss": 0.0324, + "epoch": 0.86, + "learning_rate": 0.00017144129549429766, + "loss": 0.0527, "step": 132790 }, { - "epoch": 1.44, - "learning_rate": 8.454150171977415e-05, - "loss": 0.0321, + "epoch": 0.86, + "learning_rate": 0.00017143161413994074, + "loss": 0.0396, "step": 132800 }, { - "epoch": 1.44, - "learning_rate": 8.45252774352651e-05, - "loss": 0.0293, + "epoch": 0.86, + "learning_rate": 0.0001714219327855838, + "loss": 0.0399, "step": 132810 }, { - "epoch": 1.44, - "learning_rate": 8.450905315075605e-05, - "loss": 0.0375, + "epoch": 0.86, + "learning_rate": 0.00017141225143122688, + "loss": 0.0404, "step": 132820 }, { - "epoch": 1.44, - "learning_rate": 8.4492828866247e-05, - "loss": 0.0282, + "epoch": 0.86, + "learning_rate": 0.00017140257007686996, + "loss": 0.0392, "step": 132830 }, { - "epoch": 1.44, - "learning_rate": 8.447660458173794e-05, - "loss": 0.0292, + "epoch": 0.86, + "learning_rate": 0.000171392888722513, + "loss": 0.0549, "step": 132840 }, { - "epoch": 1.44, - "learning_rate": 8.446038029722889e-05, - "loss": 0.0233, + "epoch": 0.86, + "learning_rate": 0.00017138320736815606, + "loss": 0.0434, "step": 132850 }, { - "epoch": 1.44, - "learning_rate": 8.444415601271984e-05, - "loss": 0.0268, + "epoch": 0.86, + "learning_rate": 0.00017137352601379914, + "loss": 0.0435, "step": 132860 }, { - "epoch": 1.44, - "learning_rate": 8.442793172821079e-05, - "loss": 0.0307, + "epoch": 0.86, + "learning_rate": 0.0001713638446594422, + "loss": 0.0373, "step": 132870 }, { - "epoch": 1.44, - "learning_rate": 8.441170744370173e-05, - "loss": 0.0352, + "epoch": 0.86, + "learning_rate": 0.00017135416330508527, + "loss": 0.0454, "step": 132880 }, { - "epoch": 1.44, - "learning_rate": 8.439548315919268e-05, - "loss": 0.0284, + "epoch": 0.86, + "learning_rate": 0.00017134448195072835, + "loss": 0.0418, "step": 132890 }, { - "epoch": 1.44, - "learning_rate": 8.437925887468363e-05, - "loss": 0.0309, + "epoch": 0.86, + "learning_rate": 0.00017133480059637143, + "loss": 0.0436, "step": 132900 }, { - "epoch": 1.44, - "learning_rate": 8.436303459017457e-05, - "loss": 0.0331, + "epoch": 0.86, + "learning_rate": 0.0001713251192420145, + "loss": 0.0432, "step": 132910 }, { - "epoch": 1.44, - "learning_rate": 8.434681030566552e-05, - "loss": 0.0308, + "epoch": 0.86, + "learning_rate": 0.00017131543788765754, + "loss": 0.0438, "step": 132920 }, { - "epoch": 1.44, - "learning_rate": 8.433058602115646e-05, - "loss": 0.0335, + "epoch": 0.86, + "learning_rate": 0.00017130575653330062, + "loss": 0.0447, "step": 132930 }, { - "epoch": 1.44, - "learning_rate": 8.431436173664741e-05, - "loss": 0.029, + "epoch": 0.86, + "learning_rate": 0.00017129607517894367, + "loss": 0.0453, "step": 132940 }, { - "epoch": 1.44, - "learning_rate": 8.429813745213836e-05, - "loss": 0.0269, + "epoch": 0.86, + "learning_rate": 0.00017128639382458675, + "loss": 0.043, "step": 132950 }, { - "epoch": 1.44, - "learning_rate": 8.428191316762931e-05, - "loss": 0.0313, + "epoch": 0.86, + "learning_rate": 0.00017127671247022983, + "loss": 0.0468, "step": 132960 }, { - "epoch": 1.44, - "learning_rate": 8.426568888312025e-05, - "loss": 0.0315, + "epoch": 0.86, + "learning_rate": 0.0001712670311158729, + "loss": 0.0397, "step": 132970 }, { - "epoch": 1.44, - "learning_rate": 8.42494645986112e-05, - "loss": 0.0354, + "epoch": 0.86, + "learning_rate": 0.00017125734976151596, + "loss": 0.0438, "step": 132980 }, { - "epoch": 1.44, - "learning_rate": 8.423324031410215e-05, - "loss": 0.0355, - "step": 132990 + "epoch": 0.86, + "learning_rate": 0.00017124766840715902, + "loss": 0.0447, + "step": 132990 }, { - "epoch": 1.44, - "learning_rate": 8.42170160295931e-05, - "loss": 0.0351, + "epoch": 0.86, + "learning_rate": 0.0001712379870528021, + "loss": 0.047, "step": 133000 }, { - "epoch": 1.44, - "eval_cer": 0.9211684610233222, - "eval_loss": 0.023968951776623726, - "eval_runtime": 118.7908, - "eval_samples_per_second": 16.836, - "eval_steps_per_second": 4.209, + "epoch": 0.86, + "eval_cer": 0.9198843068579822, + "eval_loss": 0.02717752754688263, + "eval_runtime": 119.8783, + "eval_samples_per_second": 16.684, + "eval_steps_per_second": 4.171, "step": 133000 }, { - "epoch": 1.44, - "learning_rate": 8.420079174508405e-05, - "loss": 0.0278, + "epoch": 0.86, + "learning_rate": 0.00017122830569844515, + "loss": 0.0351, "step": 133010 }, { - "epoch": 1.44, - "learning_rate": 8.418456746057498e-05, - "loss": 0.028, + "epoch": 0.86, + "learning_rate": 0.00017121862434408823, + "loss": 0.0372, "step": 133020 }, { - "epoch": 1.44, - "learning_rate": 8.416834317606593e-05, - "loss": 0.034, + "epoch": 0.86, + "learning_rate": 0.0001712089429897313, + "loss": 0.0383, "step": 133030 }, { - "epoch": 1.44, - "learning_rate": 8.415211889155688e-05, - "loss": 0.0316, + "epoch": 0.86, + "learning_rate": 0.00017119926163537436, + "loss": 0.0396, "step": 133040 }, { - "epoch": 1.44, - "learning_rate": 8.413589460704783e-05, - "loss": 0.0319, + "epoch": 0.86, + "learning_rate": 0.00017118958028101744, + "loss": 0.0387, "step": 133050 }, { - "epoch": 1.44, - "learning_rate": 8.411967032253877e-05, - "loss": 0.0349, + "epoch": 0.86, + "learning_rate": 0.0001711798989266605, + "loss": 0.0369, "step": 133060 }, { - "epoch": 1.44, - "learning_rate": 8.410344603802972e-05, - "loss": 0.029, + "epoch": 0.86, + "learning_rate": 0.00017117021757230355, + "loss": 0.037, "step": 133070 }, { - "epoch": 1.44, - "learning_rate": 8.408722175352067e-05, - "loss": 0.0301, + "epoch": 0.86, + "learning_rate": 0.00017116053621794663, + "loss": 0.0409, "step": 133080 }, { - "epoch": 1.44, - "learning_rate": 8.407099746901162e-05, - "loss": 0.0278, + "epoch": 0.86, + "learning_rate": 0.0001711508548635897, + "loss": 0.0414, "step": 133090 }, { - "epoch": 1.44, - "learning_rate": 8.405477318450257e-05, - "loss": 0.0287, + "epoch": 0.86, + "learning_rate": 0.00017114117350923279, + "loss": 0.04, "step": 133100 }, { - "epoch": 1.44, - "learning_rate": 8.40385488999935e-05, - "loss": 0.0302, + "epoch": 0.86, + "learning_rate": 0.00017113149215487584, + "loss": 0.0406, "step": 133110 }, { - "epoch": 1.44, - "learning_rate": 8.402232461548445e-05, - "loss": 0.0271, + "epoch": 0.86, + "learning_rate": 0.00017112181080051892, + "loss": 0.1446, "step": 133120 }, { - "epoch": 1.44, - "learning_rate": 8.40061003309754e-05, - "loss": 0.0265, + "epoch": 0.86, + "learning_rate": 0.00017111212944616197, + "loss": 0.0545, "step": 133130 }, { - "epoch": 1.44, - "learning_rate": 8.398987604646635e-05, - "loss": 0.0339, + "epoch": 0.86, + "learning_rate": 0.00017110244809180502, + "loss": 0.078, "step": 133140 }, { - "epoch": 1.44, - "learning_rate": 8.397365176195729e-05, - "loss": 0.029, + "epoch": 0.86, + "learning_rate": 0.0001710927667374481, + "loss": 0.0487, "step": 133150 }, { - "epoch": 1.44, - "learning_rate": 8.395742747744824e-05, - "loss": 0.029, + "epoch": 0.86, + "learning_rate": 0.00017108308538309118, + "loss": 0.0443, "step": 133160 }, { - "epoch": 1.44, - "learning_rate": 8.394120319293919e-05, - "loss": 0.0357, + "epoch": 0.86, + "learning_rate": 0.00017107340402873426, + "loss": 0.037, "step": 133170 }, { - "epoch": 1.44, - "learning_rate": 8.392497890843014e-05, - "loss": 0.028, + "epoch": 0.86, + "learning_rate": 0.00017106372267437732, + "loss": 0.0493, "step": 133180 }, { - "epoch": 1.44, - "learning_rate": 8.390875462392109e-05, - "loss": 0.0307, + "epoch": 0.86, + "learning_rate": 0.0001710540413200204, + "loss": 0.039, "step": 133190 }, { - "epoch": 1.44, - "learning_rate": 8.389253033941202e-05, - "loss": 0.0371, + "epoch": 0.86, + "learning_rate": 0.00017104435996566345, + "loss": 0.038, "step": 133200 }, { - "epoch": 1.44, - "learning_rate": 8.387630605490297e-05, - "loss": 0.0325, + "epoch": 0.86, + "learning_rate": 0.0001710346786113065, + "loss": 0.0395, "step": 133210 }, { - "epoch": 1.44, - "learning_rate": 8.386008177039392e-05, - "loss": 0.0297, + "epoch": 0.86, + "learning_rate": 0.00017102499725694958, + "loss": 0.0388, "step": 133220 }, { - "epoch": 1.44, - "learning_rate": 8.384385748588487e-05, - "loss": 0.0272, + "epoch": 0.86, + "learning_rate": 0.00017101531590259266, + "loss": 0.0379, "step": 133230 }, { - "epoch": 1.44, - "learning_rate": 8.382763320137581e-05, - "loss": 0.0321, + "epoch": 0.86, + "learning_rate": 0.0001710056345482357, + "loss": 0.0393, "step": 133240 }, { - "epoch": 1.44, - "learning_rate": 8.381140891686676e-05, - "loss": 0.0316, + "epoch": 0.86, + "learning_rate": 0.0001709959531938788, + "loss": 0.0392, "step": 133250 }, { - "epoch": 1.44, - "learning_rate": 8.379518463235771e-05, - "loss": 0.0279, + "epoch": 0.86, + "learning_rate": 0.00017098627183952187, + "loss": 0.045, "step": 133260 }, { - "epoch": 1.44, - "learning_rate": 8.377896034784866e-05, - "loss": 0.0295, + "epoch": 0.86, + "learning_rate": 0.0001709765904851649, + "loss": 0.0366, "step": 133270 }, { - "epoch": 1.44, - "learning_rate": 8.376273606333961e-05, - "loss": 0.0282, + "epoch": 0.86, + "learning_rate": 0.00017096690913080798, + "loss": 0.0471, "step": 133280 }, { - "epoch": 1.44, - "learning_rate": 8.374651177883054e-05, - "loss": 0.0278, + "epoch": 0.86, + "learning_rate": 0.00017095722777645106, + "loss": 0.0408, "step": 133290 }, { - "epoch": 1.44, - "learning_rate": 8.37302874943215e-05, - "loss": 0.0293, + "epoch": 0.86, + "learning_rate": 0.00017094754642209414, + "loss": 0.0447, "step": 133300 }, { - "epoch": 1.44, - "learning_rate": 8.371406320981244e-05, - "loss": 0.0319, + "epoch": 0.86, + "learning_rate": 0.0001709378650677372, + "loss": 0.0412, "step": 133310 }, { - "epoch": 1.44, - "learning_rate": 8.36978389253034e-05, - "loss": 0.0349, + "epoch": 0.86, + "learning_rate": 0.00017092818371338027, + "loss": 0.0457, "step": 133320 }, { - "epoch": 1.44, - "learning_rate": 8.368161464079434e-05, - "loss": 0.0316, + "epoch": 0.86, + "learning_rate": 0.00017091850235902335, + "loss": 0.0424, "step": 133330 }, { - "epoch": 1.44, - "learning_rate": 8.366539035628528e-05, - "loss": 0.0293, + "epoch": 0.86, + "learning_rate": 0.00017090882100466638, + "loss": 0.0463, "step": 133340 }, { - "epoch": 1.44, - "learning_rate": 8.364916607177623e-05, - "loss": 0.0336, + "epoch": 0.86, + "learning_rate": 0.00017089913965030946, + "loss": 0.0443, "step": 133350 }, { - "epoch": 1.44, - "learning_rate": 8.363294178726718e-05, - "loss": 0.0291, + "epoch": 0.86, + "learning_rate": 0.00017088945829595254, + "loss": 0.0365, "step": 133360 }, { - "epoch": 1.44, - "learning_rate": 8.361671750275813e-05, - "loss": 0.0315, + "epoch": 0.86, + "learning_rate": 0.00017087977694159561, + "loss": 0.0391, "step": 133370 }, { - "epoch": 1.44, - "learning_rate": 8.360049321824906e-05, - "loss": 0.0378, + "epoch": 0.86, + "learning_rate": 0.00017087009558723867, + "loss": 0.0374, "step": 133380 }, { - "epoch": 1.44, - "learning_rate": 8.358426893374001e-05, - "loss": 0.0297, + "epoch": 0.86, + "learning_rate": 0.00017086041423288175, + "loss": 0.0414, "step": 133390 }, { - "epoch": 1.44, - "learning_rate": 8.356804464923096e-05, - "loss": 0.0354, + "epoch": 0.86, + "learning_rate": 0.00017085073287852483, + "loss": 0.0419, "step": 133400 }, { - "epoch": 1.44, - "learning_rate": 8.355182036472191e-05, - "loss": 0.0288, + "epoch": 0.86, + "learning_rate": 0.00017084105152416785, + "loss": 0.0355, "step": 133410 }, { - "epoch": 1.44, - "learning_rate": 8.353559608021286e-05, - "loss": 0.0258, + "epoch": 0.86, + "learning_rate": 0.00017083137016981093, + "loss": 0.0361, "step": 133420 }, { - "epoch": 1.44, - "learning_rate": 8.35193717957038e-05, - "loss": 0.0331, + "epoch": 0.86, + "learning_rate": 0.000170821688815454, + "loss": 0.0384, "step": 133430 }, { - "epoch": 1.44, - "learning_rate": 8.350314751119475e-05, - "loss": 0.0313, + "epoch": 0.86, + "learning_rate": 0.00017081200746109707, + "loss": 0.0385, "step": 133440 }, { - "epoch": 1.44, - "learning_rate": 8.34869232266857e-05, - "loss": 0.0306, + "epoch": 0.86, + "learning_rate": 0.00017080232610674014, + "loss": 0.0405, "step": 133450 }, { - "epoch": 1.44, - "learning_rate": 8.347069894217665e-05, - "loss": 0.0258, + "epoch": 0.86, + "learning_rate": 0.00017079264475238322, + "loss": 0.0434, "step": 133460 }, { - "epoch": 1.44, - "learning_rate": 8.345447465766759e-05, - "loss": 0.0353, + "epoch": 0.86, + "learning_rate": 0.0001707829633980263, + "loss": 0.0365, "step": 133470 }, { - "epoch": 1.44, - "learning_rate": 8.343825037315854e-05, - "loss": 0.0279, + "epoch": 0.86, + "learning_rate": 0.00017077328204366933, + "loss": 0.0375, "step": 133480 }, { - "epoch": 1.44, - "learning_rate": 8.342202608864949e-05, - "loss": 0.0283, + "epoch": 0.86, + "learning_rate": 0.0001707636006893124, + "loss": 0.0396, "step": 133490 }, { - "epoch": 1.44, - "learning_rate": 8.340580180414044e-05, - "loss": 0.0249, + "epoch": 0.86, + "learning_rate": 0.0001707539193349555, + "loss": 0.0408, "step": 133500 }, { - "epoch": 1.44, - "learning_rate": 8.338957751963138e-05, - "loss": 0.0309, + "epoch": 0.86, + "learning_rate": 0.00017074423798059854, + "loss": 0.047, "step": 133510 }, { - "epoch": 1.44, - "learning_rate": 8.337335323512232e-05, - "loss": 0.0327, + "epoch": 0.86, + "learning_rate": 0.00017073455662624162, + "loss": 0.0408, "step": 133520 }, { - "epoch": 1.44, - "learning_rate": 8.335712895061327e-05, - "loss": 0.0373, + "epoch": 0.86, + "learning_rate": 0.0001707248752718847, + "loss": 0.043, "step": 133530 }, { - "epoch": 1.44, - "learning_rate": 8.334090466610422e-05, - "loss": 0.029, + "epoch": 0.86, + "learning_rate": 0.00017071519391752778, + "loss": 0.0476, "step": 133540 }, { - "epoch": 1.44, - "learning_rate": 8.332468038159517e-05, - "loss": 0.0324, + "epoch": 0.86, + "learning_rate": 0.0001707055125631708, + "loss": 0.0363, "step": 133550 }, { - "epoch": 1.44, - "learning_rate": 8.33084560970861e-05, - "loss": 0.0311, + "epoch": 0.86, + "learning_rate": 0.0001706958312088139, + "loss": 0.0408, "step": 133560 }, { - "epoch": 1.44, - "learning_rate": 8.329223181257706e-05, - "loss": 0.0282, + "epoch": 0.86, + "learning_rate": 0.00017068614985445697, + "loss": 0.0416, "step": 133570 }, { - "epoch": 1.44, - "learning_rate": 8.3276007528068e-05, - "loss": 0.0374, + "epoch": 0.86, + "learning_rate": 0.00017067646850010002, + "loss": 0.0413, "step": 133580 }, { - "epoch": 1.44, - "learning_rate": 8.325978324355896e-05, - "loss": 0.0331, + "epoch": 0.86, + "learning_rate": 0.0001706667871457431, + "loss": 0.0367, "step": 133590 }, { - "epoch": 1.45, - "learning_rate": 8.32435589590499e-05, - "loss": 0.0327, + "epoch": 0.86, + "learning_rate": 0.00017065710579138618, + "loss": 0.0411, "step": 133600 }, { - "epoch": 1.45, - "learning_rate": 8.322733467454084e-05, - "loss": 0.03, + "epoch": 0.86, + "learning_rate": 0.00017064742443702923, + "loss": 0.0382, "step": 133610 }, { - "epoch": 1.45, - "learning_rate": 8.321111039003179e-05, - "loss": 0.031, + "epoch": 0.86, + "learning_rate": 0.00017063774308267228, + "loss": 0.0362, "step": 133620 }, { - "epoch": 1.45, - "learning_rate": 8.319488610552274e-05, - "loss": 0.0322, + "epoch": 0.86, + "learning_rate": 0.00017062806172831536, + "loss": 0.0383, "step": 133630 }, { - "epoch": 1.45, - "learning_rate": 8.317866182101369e-05, - "loss": 0.0327, + "epoch": 0.86, + "learning_rate": 0.00017061838037395842, + "loss": 0.0432, "step": 133640 }, { - "epoch": 1.45, - "learning_rate": 8.316243753650463e-05, - "loss": 0.029, + "epoch": 0.86, + "learning_rate": 0.0001706086990196015, + "loss": 0.0375, "step": 133650 }, { - "epoch": 1.45, - "learning_rate": 8.314621325199558e-05, - "loss": 0.0319, + "epoch": 0.86, + "learning_rate": 0.00017059901766524458, + "loss": 0.0391, "step": 133660 }, { - "epoch": 1.45, - "learning_rate": 8.312998896748653e-05, - "loss": 0.0298, + "epoch": 0.86, + "learning_rate": 0.00017058933631088766, + "loss": 0.0377, "step": 133670 }, { - "epoch": 1.45, - "learning_rate": 8.311376468297748e-05, - "loss": 0.0309, + "epoch": 0.86, + "learning_rate": 0.0001705796549565307, + "loss": 0.0357, "step": 133680 }, { - "epoch": 1.45, - "learning_rate": 8.309754039846843e-05, - "loss": 0.0277, + "epoch": 0.86, + "learning_rate": 0.00017056997360217376, + "loss": 0.0409, "step": 133690 }, { - "epoch": 1.45, - "learning_rate": 8.308131611395936e-05, - "loss": 0.0305, + "epoch": 0.86, + "learning_rate": 0.00017056029224781684, + "loss": 0.0393, "step": 133700 }, { - "epoch": 1.45, - "learning_rate": 8.306509182945031e-05, - "loss": 0.0316, + "epoch": 0.86, + "learning_rate": 0.0001705506108934599, + "loss": 0.0381, "step": 133710 }, { - "epoch": 1.45, - "learning_rate": 8.304886754494126e-05, - "loss": 0.0333, + "epoch": 0.86, + "learning_rate": 0.00017054092953910297, + "loss": 0.0379, "step": 133720 }, { - "epoch": 1.45, - "learning_rate": 8.303264326043221e-05, - "loss": 0.0262, + "epoch": 0.86, + "learning_rate": 0.00017053124818474605, + "loss": 0.0422, "step": 133730 }, { - "epoch": 1.45, - "learning_rate": 8.301641897592315e-05, - "loss": 0.0305, + "epoch": 0.86, + "learning_rate": 0.00017052156683038913, + "loss": 0.0411, "step": 133740 }, { - "epoch": 1.45, - "learning_rate": 8.30001946914141e-05, - "loss": 0.025, + "epoch": 0.86, + "learning_rate": 0.00017051188547603219, + "loss": 0.0365, "step": 133750 }, { - "epoch": 1.45, - "learning_rate": 8.298397040690505e-05, - "loss": 0.0331, + "epoch": 0.86, + "learning_rate": 0.00017050220412167524, + "loss": 0.0412, "step": 133760 }, { - "epoch": 1.45, - "learning_rate": 8.2967746122396e-05, - "loss": 0.0312, + "epoch": 0.86, + "learning_rate": 0.00017049252276731832, + "loss": 0.0414, "step": 133770 }, { - "epoch": 1.45, - "learning_rate": 8.295152183788695e-05, - "loss": 0.0293, + "epoch": 0.86, + "learning_rate": 0.00017048284141296137, + "loss": 0.0434, "step": 133780 }, { - "epoch": 1.45, - "learning_rate": 8.293529755337788e-05, - "loss": 0.0313, + "epoch": 0.86, + "learning_rate": 0.00017047316005860445, + "loss": 0.0455, "step": 133790 }, { - "epoch": 1.45, - "learning_rate": 8.291907326886883e-05, - "loss": 0.0308, + "epoch": 0.86, + "learning_rate": 0.00017046347870424753, + "loss": 0.034, "step": 133800 }, { - "epoch": 1.45, - "learning_rate": 8.290284898435978e-05, - "loss": 0.0324, + "epoch": 0.86, + "learning_rate": 0.0001704537973498906, + "loss": 0.0409, "step": 133810 }, { - "epoch": 1.45, - "learning_rate": 8.288662469985073e-05, - "loss": 0.0323, + "epoch": 0.86, + "learning_rate": 0.00017044411599553366, + "loss": 0.0428, "step": 133820 }, { - "epoch": 1.45, - "learning_rate": 8.287040041534167e-05, - "loss": 0.0298, + "epoch": 0.86, + "learning_rate": 0.00017043443464117672, + "loss": 0.0428, "step": 133830 }, { - "epoch": 1.45, - "learning_rate": 8.285417613083262e-05, - "loss": 0.0257, + "epoch": 0.86, + "learning_rate": 0.00017042475328681977, + "loss": 0.0463, "step": 133840 }, { - "epoch": 1.45, - "learning_rate": 8.283795184632357e-05, - "loss": 0.0304, + "epoch": 0.86, + "learning_rate": 0.00017041507193246285, + "loss": 0.0384, "step": 133850 }, { - "epoch": 1.45, - "learning_rate": 8.282172756181452e-05, - "loss": 0.0356, + "epoch": 0.86, + "learning_rate": 0.00017040539057810593, + "loss": 0.042, "step": 133860 }, { - "epoch": 1.45, - "learning_rate": 8.280550327730547e-05, - "loss": 0.0357, + "epoch": 0.86, + "learning_rate": 0.000170395709223749, + "loss": 0.0408, "step": 133870 }, { - "epoch": 1.45, - "learning_rate": 8.27892789927964e-05, - "loss": 0.0306, + "epoch": 0.86, + "learning_rate": 0.00017038602786939206, + "loss": 0.0368, "step": 133880 }, { - "epoch": 1.45, - "learning_rate": 8.277305470828735e-05, - "loss": 0.0282, + "epoch": 0.86, + "learning_rate": 0.00017037634651503514, + "loss": 0.0407, "step": 133890 }, { - "epoch": 1.45, - "learning_rate": 8.27568304237783e-05, - "loss": 0.031, + "epoch": 0.86, + "learning_rate": 0.0001703666651606782, + "loss": 0.0359, "step": 133900 }, { - "epoch": 1.45, - "learning_rate": 8.274060613926925e-05, - "loss": 0.0311, + "epoch": 0.86, + "learning_rate": 0.00017035698380632125, + "loss": 0.0419, "step": 133910 }, { - "epoch": 1.45, - "learning_rate": 8.272438185476019e-05, - "loss": 0.0276, + "epoch": 0.86, + "learning_rate": 0.00017034730245196433, + "loss": 0.0419, "step": 133920 }, { - "epoch": 1.45, - "learning_rate": 8.270815757025114e-05, - "loss": 0.0266, + "epoch": 0.86, + "learning_rate": 0.0001703376210976074, + "loss": 0.0448, "step": 133930 }, { - "epoch": 1.45, - "learning_rate": 8.269193328574209e-05, - "loss": 0.0252, + "epoch": 0.86, + "learning_rate": 0.00017032793974325049, + "loss": 0.0417, "step": 133940 }, { - "epoch": 1.45, - "learning_rate": 8.267570900123304e-05, - "loss": 0.0288, + "epoch": 0.86, + "learning_rate": 0.00017031825838889354, + "loss": 0.044, "step": 133950 }, { - "epoch": 1.45, - "learning_rate": 8.265948471672399e-05, - "loss": 0.0302, + "epoch": 0.86, + "learning_rate": 0.00017030857703453662, + "loss": 0.0404, "step": 133960 }, { - "epoch": 1.45, - "learning_rate": 8.264326043221493e-05, - "loss": 0.0244, + "epoch": 0.86, + "learning_rate": 0.00017029889568017967, + "loss": 0.0329, "step": 133970 }, { - "epoch": 1.45, - "learning_rate": 8.262703614770588e-05, - "loss": 0.0351, + "epoch": 0.86, + "learning_rate": 0.00017028921432582272, + "loss": 0.0381, "step": 133980 }, { - "epoch": 1.45, - "learning_rate": 8.261081186319682e-05, - "loss": 0.0266, + "epoch": 0.86, + "learning_rate": 0.0001702795329714658, + "loss": 0.0415, "step": 133990 }, { - "epoch": 1.45, - "learning_rate": 8.259458757868777e-05, - "loss": 0.0363, + "epoch": 0.86, + "learning_rate": 0.00017026985161710888, + "loss": 0.0466, "step": 134000 }, { - "epoch": 1.45, - "eval_cer": 0.9211251702916028, - "eval_loss": 0.02382628433406353, - "eval_runtime": 118.8065, - "eval_samples_per_second": 16.834, - "eval_steps_per_second": 4.209, + "epoch": 0.86, + "eval_cer": 0.9199240763755507, + "eval_loss": 0.026646053418517113, + "eval_runtime": 120.1342, + "eval_samples_per_second": 16.648, + "eval_steps_per_second": 4.162, "step": 134000 }, { - "epoch": 1.45, - "learning_rate": 8.257836329417872e-05, - "loss": 0.0298, + "epoch": 0.86, + "learning_rate": 0.00017026017026275196, + "loss": 0.0371, "step": 134010 }, { - "epoch": 1.45, - "learning_rate": 8.256213900966966e-05, - "loss": 0.0338, + "epoch": 0.86, + "learning_rate": 0.00017025048890839502, + "loss": 0.039, "step": 134020 }, { - "epoch": 1.45, - "learning_rate": 8.254591472516061e-05, - "loss": 0.0295, + "epoch": 0.87, + "learning_rate": 0.0001702408075540381, + "loss": 0.0381, "step": 134030 }, { - "epoch": 1.45, - "learning_rate": 8.252969044065156e-05, - "loss": 0.0295, + "epoch": 0.87, + "learning_rate": 0.00017023112619968112, + "loss": 0.0404, "step": 134040 }, { - "epoch": 1.45, - "learning_rate": 8.251346615614251e-05, - "loss": 0.0303, + "epoch": 0.87, + "learning_rate": 0.0001702214448453242, + "loss": 0.0522, "step": 134050 }, { - "epoch": 1.45, - "learning_rate": 8.249724187163345e-05, - "loss": 0.0321, + "epoch": 0.87, + "learning_rate": 0.00017021176349096728, + "loss": 0.0418, "step": 134060 }, { - "epoch": 1.45, - "learning_rate": 8.24810175871244e-05, - "loss": 0.0256, + "epoch": 0.87, + "learning_rate": 0.00017020208213661036, + "loss": 0.0389, "step": 134070 }, { - "epoch": 1.45, - "learning_rate": 8.246479330261535e-05, - "loss": 0.0256, + "epoch": 0.87, + "learning_rate": 0.0001701924007822534, + "loss": 0.0409, "step": 134080 }, { - "epoch": 1.45, - "learning_rate": 8.24485690181063e-05, - "loss": 0.028, + "epoch": 0.87, + "learning_rate": 0.0001701827194278965, + "loss": 0.0446, "step": 134090 }, { - "epoch": 1.45, - "learning_rate": 8.243234473359725e-05, - "loss": 0.0271, + "epoch": 0.87, + "learning_rate": 0.00017017303807353957, + "loss": 0.045, "step": 134100 }, { - "epoch": 1.45, - "learning_rate": 8.241612044908818e-05, - "loss": 0.0283, + "epoch": 0.87, + "learning_rate": 0.0001701633567191826, + "loss": 0.0425, "step": 134110 }, { - "epoch": 1.45, - "learning_rate": 8.239989616457913e-05, - "loss": 0.0287, + "epoch": 0.87, + "learning_rate": 0.00017015367536482568, + "loss": 0.0339, "step": 134120 }, { - "epoch": 1.45, - "learning_rate": 8.238367188007008e-05, - "loss": 0.0284, + "epoch": 0.87, + "learning_rate": 0.00017014399401046876, + "loss": 0.0416, "step": 134130 }, { - "epoch": 1.45, - "learning_rate": 8.236744759556103e-05, - "loss": 0.0238, + "epoch": 0.87, + "learning_rate": 0.00017013431265611184, + "loss": 0.0425, "step": 134140 }, { - "epoch": 1.45, - "learning_rate": 8.235122331105197e-05, - "loss": 0.0307, + "epoch": 0.87, + "learning_rate": 0.0001701246313017549, + "loss": 0.0425, "step": 134150 }, { - "epoch": 1.45, - "learning_rate": 8.233499902654292e-05, - "loss": 0.0365, + "epoch": 0.87, + "learning_rate": 0.00017011494994739797, + "loss": 0.0432, "step": 134160 }, { - "epoch": 1.45, - "learning_rate": 8.231877474203387e-05, - "loss": 0.0281, + "epoch": 0.87, + "learning_rate": 0.00017010526859304105, + "loss": 0.0396, "step": 134170 }, { - "epoch": 1.45, - "learning_rate": 8.230255045752482e-05, - "loss": 0.0353, + "epoch": 0.87, + "learning_rate": 0.00017009558723868408, + "loss": 0.039, "step": 134180 }, { - "epoch": 1.45, - "learning_rate": 8.228632617301577e-05, - "loss": 0.0298, + "epoch": 0.87, + "learning_rate": 0.00017008590588432716, + "loss": 0.0431, "step": 134190 }, { - "epoch": 1.45, - "learning_rate": 8.22701018885067e-05, - "loss": 0.0399, + "epoch": 0.87, + "learning_rate": 0.00017007622452997023, + "loss": 0.0357, "step": 134200 }, { - "epoch": 1.45, - "learning_rate": 8.225387760399765e-05, - "loss": 0.0313, + "epoch": 0.87, + "learning_rate": 0.00017006654317561331, + "loss": 0.0366, "step": 134210 }, { - "epoch": 1.45, - "learning_rate": 8.22376533194886e-05, - "loss": 0.0361, + "epoch": 0.87, + "learning_rate": 0.00017005686182125637, + "loss": 0.038, "step": 134220 }, { - "epoch": 1.45, - "learning_rate": 8.222142903497955e-05, - "loss": 0.036, + "epoch": 0.87, + "learning_rate": 0.00017004718046689945, + "loss": 0.0457, "step": 134230 }, { - "epoch": 1.45, - "learning_rate": 8.220520475047049e-05, - "loss": 0.032, + "epoch": 0.87, + "learning_rate": 0.00017003749911254253, + "loss": 0.0403, "step": 134240 }, { - "epoch": 1.45, - "learning_rate": 8.218898046596144e-05, - "loss": 0.0279, + "epoch": 0.87, + "learning_rate": 0.00017002781775818555, + "loss": 0.0379, "step": 134250 }, { - "epoch": 1.45, - "learning_rate": 8.217275618145239e-05, - "loss": 0.0277, + "epoch": 0.87, + "learning_rate": 0.00017001813640382863, + "loss": 0.0442, "step": 134260 }, { - "epoch": 1.45, - "learning_rate": 8.215653189694334e-05, - "loss": 0.0299, + "epoch": 0.87, + "learning_rate": 0.0001700084550494717, + "loss": 0.0371, "step": 134270 }, { - "epoch": 1.45, - "learning_rate": 8.214030761243429e-05, - "loss": 0.0273, + "epoch": 0.87, + "learning_rate": 0.00016999877369511476, + "loss": 0.0424, "step": 134280 }, { - "epoch": 1.45, - "learning_rate": 8.212408332792522e-05, - "loss": 0.0272, + "epoch": 0.87, + "learning_rate": 0.00016998909234075784, + "loss": 0.0412, "step": 134290 }, { - "epoch": 1.45, - "learning_rate": 8.210785904341617e-05, - "loss": 0.0274, + "epoch": 0.87, + "learning_rate": 0.00016997941098640092, + "loss": 0.0436, "step": 134300 }, { - "epoch": 1.45, - "learning_rate": 8.209163475890712e-05, - "loss": 0.0358, + "epoch": 0.87, + "learning_rate": 0.00016996972963204395, + "loss": 0.0408, "step": 134310 }, { - "epoch": 1.45, - "learning_rate": 8.207541047439807e-05, - "loss": 0.0272, + "epoch": 0.87, + "learning_rate": 0.00016996004827768703, + "loss": 0.0509, "step": 134320 }, { - "epoch": 1.45, - "learning_rate": 8.205918618988901e-05, - "loss": 0.0343, + "epoch": 0.87, + "learning_rate": 0.0001699503669233301, + "loss": 0.0418, "step": 134330 }, { - "epoch": 1.45, - "learning_rate": 8.204296190537996e-05, - "loss": 0.0314, + "epoch": 0.87, + "learning_rate": 0.0001699406855689732, + "loss": 0.038, "step": 134340 }, { - "epoch": 1.45, - "learning_rate": 8.202673762087091e-05, - "loss": 0.0323, + "epoch": 0.87, + "learning_rate": 0.00016993100421461624, + "loss": 0.0437, "step": 134350 }, { - "epoch": 1.45, - "learning_rate": 8.201051333636186e-05, - "loss": 0.0354, + "epoch": 0.87, + "learning_rate": 0.00016992132286025932, + "loss": 0.0393, "step": 134360 }, { - "epoch": 1.45, - "learning_rate": 8.199428905185281e-05, - "loss": 0.0292, + "epoch": 0.87, + "learning_rate": 0.0001699116415059024, + "loss": 0.0333, "step": 134370 }, { - "epoch": 1.45, - "learning_rate": 8.197806476734374e-05, - "loss": 0.0368, + "epoch": 0.87, + "learning_rate": 0.00016990196015154543, + "loss": 0.0374, "step": 134380 }, { - "epoch": 1.45, - "learning_rate": 8.19618404828347e-05, - "loss": 0.031, + "epoch": 0.87, + "learning_rate": 0.0001698922787971885, + "loss": 0.046, "step": 134390 }, { - "epoch": 1.45, - "learning_rate": 8.194561619832564e-05, - "loss": 0.0305, + "epoch": 0.87, + "learning_rate": 0.0001698825974428316, + "loss": 0.0392, "step": 134400 }, { - "epoch": 1.45, - "learning_rate": 8.192939191381659e-05, - "loss": 0.0298, + "epoch": 0.87, + "learning_rate": 0.00016987291608847467, + "loss": 0.0361, "step": 134410 }, { - "epoch": 1.45, - "learning_rate": 8.191316762930753e-05, - "loss": 0.033, + "epoch": 0.87, + "learning_rate": 0.00016986323473411772, + "loss": 0.0423, "step": 134420 }, { - "epoch": 1.45, - "learning_rate": 8.189694334479848e-05, - "loss": 0.0325, + "epoch": 0.87, + "learning_rate": 0.0001698535533797608, + "loss": 0.0464, "step": 134430 }, { - "epoch": 1.45, - "learning_rate": 8.188071906028943e-05, - "loss": 0.0351, + "epoch": 0.87, + "learning_rate": 0.00016984387202540388, + "loss": 0.0369, "step": 134440 }, { - "epoch": 1.45, - "learning_rate": 8.186449477578038e-05, - "loss": 0.0273, + "epoch": 0.87, + "learning_rate": 0.0001698341906710469, + "loss": 0.0428, "step": 134450 }, { - "epoch": 1.45, - "learning_rate": 8.184827049127133e-05, - "loss": 0.036, + "epoch": 0.87, + "learning_rate": 0.00016982450931668998, + "loss": 0.0373, "step": 134460 }, { - "epoch": 1.45, - "learning_rate": 8.183204620676226e-05, - "loss": 0.0324, + "epoch": 0.87, + "learning_rate": 0.00016981482796233306, + "loss": 0.038, "step": 134470 }, { - "epoch": 1.45, - "learning_rate": 8.181582192225321e-05, - "loss": 0.0384, + "epoch": 0.87, + "learning_rate": 0.00016980514660797612, + "loss": 0.0328, "step": 134480 }, { - "epoch": 1.45, - "learning_rate": 8.179959763774416e-05, - "loss": 0.0296, + "epoch": 0.87, + "learning_rate": 0.0001697954652536192, + "loss": 0.047, "step": 134490 }, { - "epoch": 1.45, - "learning_rate": 8.178337335323511e-05, - "loss": 0.0264, + "epoch": 0.87, + "learning_rate": 0.00016978578389926228, + "loss": 0.0428, "step": 134500 }, { - "epoch": 1.45, - "learning_rate": 8.176714906872605e-05, - "loss": 0.0371, + "epoch": 0.87, + "learning_rate": 0.00016977610254490536, + "loss": 0.0401, "step": 134510 }, { - "epoch": 1.45, - "learning_rate": 8.1750924784217e-05, - "loss": 0.0291, + "epoch": 0.87, + "learning_rate": 0.00016976642119054838, + "loss": 0.0473, "step": 134520 }, { - "epoch": 1.46, - "learning_rate": 8.173470049970795e-05, - "loss": 0.0278, + "epoch": 0.87, + "learning_rate": 0.00016975673983619146, + "loss": 0.044, "step": 134530 }, { - "epoch": 1.46, - "learning_rate": 8.17184762151989e-05, - "loss": 0.0349, + "epoch": 0.87, + "learning_rate": 0.00016974705848183454, + "loss": 0.0341, "step": 134540 }, { - "epoch": 1.46, - "learning_rate": 8.170225193068985e-05, - "loss": 0.0318, + "epoch": 0.87, + "learning_rate": 0.0001697373771274776, + "loss": 0.0358, "step": 134550 }, { - "epoch": 1.46, - "learning_rate": 8.168602764618079e-05, - "loss": 0.0298, + "epoch": 0.87, + "learning_rate": 0.00016972769577312067, + "loss": 0.0365, "step": 134560 }, { - "epoch": 1.46, - "learning_rate": 8.166980336167174e-05, - "loss": 0.0304, + "epoch": 0.87, + "learning_rate": 0.00016971801441876375, + "loss": 0.0399, "step": 134570 }, { - "epoch": 1.46, - "learning_rate": 8.165357907716269e-05, - "loss": 0.0325, + "epoch": 0.87, + "learning_rate": 0.00016970833306440683, + "loss": 0.0428, "step": 134580 }, { - "epoch": 1.46, - "learning_rate": 8.163735479265363e-05, - "loss": 0.0368, + "epoch": 0.87, + "learning_rate": 0.00016969865171004986, + "loss": 0.0414, "step": 134590 }, { - "epoch": 1.46, - "learning_rate": 8.162113050814457e-05, - "loss": 0.034, + "epoch": 0.87, + "learning_rate": 0.00016968897035569294, + "loss": 0.0375, "step": 134600 }, { - "epoch": 1.46, - "learning_rate": 8.160490622363552e-05, - "loss": 0.0315, + "epoch": 0.87, + "learning_rate": 0.00016967928900133602, + "loss": 0.0377, "step": 134610 }, { - "epoch": 1.46, - "learning_rate": 8.158868193912647e-05, - "loss": 0.0257, + "epoch": 0.87, + "learning_rate": 0.00016966960764697907, + "loss": 0.0373, "step": 134620 }, { - "epoch": 1.46, - "learning_rate": 8.157245765461742e-05, - "loss": 0.0272, + "epoch": 0.87, + "learning_rate": 0.00016965992629262215, + "loss": 0.0388, "step": 134630 }, { - "epoch": 1.46, - "learning_rate": 8.155623337010837e-05, - "loss": 0.0301, + "epoch": 0.87, + "learning_rate": 0.00016965024493826523, + "loss": 0.0411, "step": 134640 }, { - "epoch": 1.46, - "learning_rate": 8.15400090855993e-05, - "loss": 0.034, + "epoch": 0.87, + "learning_rate": 0.00016964056358390828, + "loss": 0.0461, "step": 134650 }, { - "epoch": 1.46, - "learning_rate": 8.152378480109026e-05, - "loss": 0.0318, + "epoch": 0.87, + "learning_rate": 0.00016963088222955134, + "loss": 0.0369, "step": 134660 }, { - "epoch": 1.46, - "learning_rate": 8.15075605165812e-05, - "loss": 0.0282, + "epoch": 0.87, + "learning_rate": 0.00016962120087519442, + "loss": 0.0424, "step": 134670 }, { - "epoch": 1.46, - "learning_rate": 8.149133623207216e-05, - "loss": 0.0303, + "epoch": 0.87, + "learning_rate": 0.00016961151952083747, + "loss": 0.0382, "step": 134680 }, { - "epoch": 1.46, - "learning_rate": 8.147511194756309e-05, - "loss": 0.0313, + "epoch": 0.87, + "learning_rate": 0.00016960183816648055, + "loss": 0.0345, "step": 134690 }, { - "epoch": 1.46, - "learning_rate": 8.145888766305404e-05, - "loss": 0.0256, + "epoch": 0.87, + "learning_rate": 0.00016959215681212363, + "loss": 0.0433, "step": 134700 }, { - "epoch": 1.46, - "learning_rate": 8.144266337854499e-05, - "loss": 0.0336, + "epoch": 0.87, + "learning_rate": 0.0001695824754577667, + "loss": 0.0421, "step": 134710 }, { - "epoch": 1.46, - "learning_rate": 8.142643909403594e-05, - "loss": 0.0274, + "epoch": 0.87, + "learning_rate": 0.00016957279410340976, + "loss": 0.0404, "step": 134720 }, { - "epoch": 1.46, - "learning_rate": 8.141021480952689e-05, - "loss": 0.0328, + "epoch": 0.87, + "learning_rate": 0.0001695631127490528, + "loss": 0.0358, "step": 134730 }, { - "epoch": 1.46, - "learning_rate": 8.139399052501783e-05, - "loss": 0.0305, + "epoch": 0.87, + "learning_rate": 0.0001695534313946959, + "loss": 0.0367, "step": 134740 }, { - "epoch": 1.46, - "learning_rate": 8.137776624050878e-05, - "loss": 0.0342, + "epoch": 0.87, + "learning_rate": 0.00016954375004033895, + "loss": 0.0408, "step": 134750 }, { - "epoch": 1.46, - "learning_rate": 8.136154195599973e-05, - "loss": 0.0406, + "epoch": 0.87, + "learning_rate": 0.00016953406868598203, + "loss": 0.0453, "step": 134760 }, { - "epoch": 1.46, - "learning_rate": 8.134531767149068e-05, - "loss": 0.0314, + "epoch": 0.87, + "learning_rate": 0.0001695243873316251, + "loss": 0.0402, "step": 134770 }, { - "epoch": 1.46, - "learning_rate": 8.132909338698163e-05, - "loss": 0.0342, + "epoch": 0.87, + "learning_rate": 0.00016951470597726819, + "loss": 0.0435, "step": 134780 }, { - "epoch": 1.46, - "learning_rate": 8.131286910247256e-05, - "loss": 0.0315, + "epoch": 0.87, + "learning_rate": 0.00016950502462291124, + "loss": 0.0356, "step": 134790 }, { - "epoch": 1.46, - "learning_rate": 8.129664481796351e-05, - "loss": 0.0332, + "epoch": 0.87, + "learning_rate": 0.0001694953432685543, + "loss": 0.0415, "step": 134800 }, { - "epoch": 1.46, - "learning_rate": 8.128042053345446e-05, - "loss": 0.0337, + "epoch": 0.87, + "learning_rate": 0.00016948566191419737, + "loss": 0.0404, "step": 134810 }, { - "epoch": 1.46, - "learning_rate": 8.126419624894541e-05, - "loss": 0.0318, + "epoch": 0.87, + "learning_rate": 0.00016947598055984042, + "loss": 0.0393, "step": 134820 }, { - "epoch": 1.46, - "learning_rate": 8.124797196443635e-05, - "loss": 0.0379, + "epoch": 0.87, + "learning_rate": 0.0001694662992054835, + "loss": 0.0359, "step": 134830 }, { - "epoch": 1.46, - "learning_rate": 8.12317476799273e-05, - "loss": 0.0272, + "epoch": 0.87, + "learning_rate": 0.00016945661785112658, + "loss": 0.0406, "step": 134840 }, { - "epoch": 1.46, - "learning_rate": 8.121552339541825e-05, - "loss": 0.0296, + "epoch": 0.87, + "learning_rate": 0.00016944693649676964, + "loss": 0.0467, "step": 134850 }, { - "epoch": 1.46, - "learning_rate": 8.11992991109092e-05, - "loss": 0.0338, + "epoch": 0.87, + "learning_rate": 0.00016943725514241272, + "loss": 0.0435, "step": 134860 }, { - "epoch": 1.46, - "learning_rate": 8.118307482640015e-05, - "loss": 0.0359, + "epoch": 0.87, + "learning_rate": 0.00016942757378805577, + "loss": 0.0401, "step": 134870 }, { - "epoch": 1.46, - "learning_rate": 8.116685054189108e-05, - "loss": 0.0242, + "epoch": 0.87, + "learning_rate": 0.00016941789243369882, + "loss": 0.0374, "step": 134880 }, { - "epoch": 1.46, - "learning_rate": 8.115062625738203e-05, - "loss": 0.0344, + "epoch": 0.87, + "learning_rate": 0.0001694082110793419, + "loss": 0.0395, "step": 134890 }, { - "epoch": 1.46, - "learning_rate": 8.113440197287298e-05, - "loss": 0.0269, + "epoch": 0.87, + "learning_rate": 0.00016939852972498498, + "loss": 0.0451, "step": 134900 }, { - "epoch": 1.46, - "learning_rate": 8.111817768836393e-05, - "loss": 0.0294, + "epoch": 0.87, + "learning_rate": 0.00016938884837062806, + "loss": 0.0427, "step": 134910 }, { - "epoch": 1.46, - "learning_rate": 8.110195340385487e-05, - "loss": 0.0302, + "epoch": 0.87, + "learning_rate": 0.0001693791670162711, + "loss": 0.0402, "step": 134920 }, { - "epoch": 1.46, - "learning_rate": 8.108572911934583e-05, - "loss": 0.0296, + "epoch": 0.87, + "learning_rate": 0.0001693694856619142, + "loss": 0.0424, "step": 134930 }, { - "epoch": 1.46, - "learning_rate": 8.106950483483678e-05, - "loss": 0.0258, + "epoch": 0.87, + "learning_rate": 0.00016935980430755724, + "loss": 0.0395, "step": 134940 }, { - "epoch": 1.46, - "learning_rate": 8.105328055032773e-05, - "loss": 0.031, + "epoch": 0.87, + "learning_rate": 0.0001693501229532003, + "loss": 0.0439, "step": 134950 }, { - "epoch": 1.46, - "learning_rate": 8.103705626581868e-05, + "epoch": 0.87, + "learning_rate": 0.00016934044159884338, "loss": 0.0378, "step": 134960 }, { - "epoch": 1.46, - "learning_rate": 8.102083198130963e-05, - "loss": 0.0274, + "epoch": 0.87, + "learning_rate": 0.00016933076024448646, + "loss": 0.0408, "step": 134970 }, { - "epoch": 1.46, - "learning_rate": 8.100460769680057e-05, - "loss": 0.0326, + "epoch": 0.87, + "learning_rate": 0.00016932107889012954, + "loss": 0.0354, "step": 134980 }, { - "epoch": 1.46, - "learning_rate": 8.098838341229152e-05, - "loss": 0.0312, + "epoch": 0.87, + "learning_rate": 0.0001693113975357726, + "loss": 0.0418, "step": 134990 }, { - "epoch": 1.46, - "learning_rate": 8.097215912778247e-05, - "loss": 0.0264, + "epoch": 0.87, + "learning_rate": 0.00016930171618141567, + "loss": 0.04, "step": 135000 }, { - "epoch": 1.46, - "eval_cer": 0.9210960153090163, - "eval_loss": 0.023969639092683792, - "eval_runtime": 118.9677, - "eval_samples_per_second": 16.811, - "eval_steps_per_second": 4.203, + "epoch": 0.87, + "eval_cer": 0.919934922607615, + "eval_loss": 0.02674305997788906, + "eval_runtime": 119.9587, + "eval_samples_per_second": 16.672, + "eval_steps_per_second": 4.168, "step": 135000 }, { - "epoch": 1.46, - "learning_rate": 8.095593484327342e-05, - "loss": 0.0288, + "epoch": 0.87, + "learning_rate": 0.00016929203482705872, + "loss": 0.0434, "step": 135010 }, { - "epoch": 1.46, - "learning_rate": 8.093971055876435e-05, - "loss": 0.0303, + "epoch": 0.87, + "learning_rate": 0.00016928235347270177, + "loss": 0.0429, "step": 135020 }, { - "epoch": 1.46, - "learning_rate": 8.09234862742553e-05, - "loss": 0.0291, + "epoch": 0.87, + "learning_rate": 0.00016927267211834485, + "loss": 0.0424, "step": 135030 }, { - "epoch": 1.46, - "learning_rate": 8.090726198974625e-05, - "loss": 0.0326, + "epoch": 0.87, + "learning_rate": 0.00016926299076398793, + "loss": 0.0404, "step": 135040 }, { - "epoch": 1.46, - "learning_rate": 8.08910377052372e-05, - "loss": 0.0268, + "epoch": 0.87, + "learning_rate": 0.000169253309409631, + "loss": 0.0408, "step": 135050 }, { - "epoch": 1.46, - "learning_rate": 8.087481342072815e-05, - "loss": 0.0306, + "epoch": 0.87, + "learning_rate": 0.00016924362805527407, + "loss": 0.0387, "step": 135060 }, { - "epoch": 1.46, - "learning_rate": 8.085858913621909e-05, - "loss": 0.0301, + "epoch": 0.87, + "learning_rate": 0.00016923394670091715, + "loss": 0.0466, "step": 135070 }, { - "epoch": 1.46, - "learning_rate": 8.084236485171004e-05, - "loss": 0.0279, + "epoch": 0.87, + "learning_rate": 0.00016922426534656017, + "loss": 0.037, "step": 135080 }, { - "epoch": 1.46, - "learning_rate": 8.082614056720099e-05, - "loss": 0.0245, + "epoch": 0.87, + "learning_rate": 0.00016921458399220325, + "loss": 0.0455, "step": 135090 }, { - "epoch": 1.46, - "learning_rate": 8.080991628269194e-05, - "loss": 0.0304, + "epoch": 0.87, + "learning_rate": 0.00016920490263784633, + "loss": 0.0435, "step": 135100 }, { - "epoch": 1.46, - "learning_rate": 8.079369199818287e-05, - "loss": 0.03, + "epoch": 0.87, + "learning_rate": 0.0001691952212834894, + "loss": 0.0403, "step": 135110 }, { - "epoch": 1.46, - "learning_rate": 8.077746771367382e-05, - "loss": 0.0278, + "epoch": 0.87, + "learning_rate": 0.00016918553992913246, + "loss": 0.0375, "step": 135120 }, { - "epoch": 1.46, - "learning_rate": 8.076124342916477e-05, - "loss": 0.0257, + "epoch": 0.87, + "learning_rate": 0.00016917585857477554, + "loss": 0.0445, "step": 135130 }, { - "epoch": 1.46, - "learning_rate": 8.074501914465572e-05, - "loss": 0.0259, + "epoch": 0.87, + "learning_rate": 0.00016916617722041862, + "loss": 0.0394, "step": 135140 }, { - "epoch": 1.46, - "learning_rate": 8.072879486014667e-05, - "loss": 0.0324, + "epoch": 0.87, + "learning_rate": 0.00016915649586606165, + "loss": 0.0423, "step": 135150 }, { - "epoch": 1.46, - "learning_rate": 8.071257057563761e-05, - "loss": 0.0334, + "epoch": 0.87, + "learning_rate": 0.00016914681451170473, + "loss": 0.0373, "step": 135160 }, { - "epoch": 1.46, - "learning_rate": 8.069634629112856e-05, - "loss": 0.0314, + "epoch": 0.87, + "learning_rate": 0.0001691371331573478, + "loss": 0.0416, "step": 135170 }, { - "epoch": 1.46, - "learning_rate": 8.068012200661951e-05, - "loss": 0.0316, + "epoch": 0.87, + "learning_rate": 0.0001691274518029909, + "loss": 0.0405, "step": 135180 }, { - "epoch": 1.46, - "learning_rate": 8.066389772211046e-05, - "loss": 0.0279, + "epoch": 0.87, + "learning_rate": 0.00016911777044863394, + "loss": 0.0412, "step": 135190 }, { - "epoch": 1.46, - "learning_rate": 8.06476734376014e-05, - "loss": 0.0319, + "epoch": 0.87, + "learning_rate": 0.00016910808909427702, + "loss": 0.0438, "step": 135200 }, { - "epoch": 1.46, - "learning_rate": 8.063144915309234e-05, - "loss": 0.0281, + "epoch": 0.87, + "learning_rate": 0.0001690984077399201, + "loss": 0.0394, "step": 135210 }, { - "epoch": 1.46, - "learning_rate": 8.06152248685833e-05, - "loss": 0.0244, + "epoch": 0.87, + "learning_rate": 0.00016908872638556313, + "loss": 0.0426, "step": 135220 }, { - "epoch": 1.46, - "learning_rate": 8.059900058407424e-05, - "loss": 0.032, + "epoch": 0.87, + "learning_rate": 0.0001690790450312062, + "loss": 0.0414, "step": 135230 }, { - "epoch": 1.46, - "learning_rate": 8.05827762995652e-05, - "loss": 0.0289, + "epoch": 0.87, + "learning_rate": 0.00016906936367684929, + "loss": 0.0448, "step": 135240 }, { - "epoch": 1.46, - "learning_rate": 8.056655201505613e-05, - "loss": 0.0285, + "epoch": 0.87, + "learning_rate": 0.00016905968232249234, + "loss": 0.0435, "step": 135250 }, { - "epoch": 1.46, - "learning_rate": 8.055032773054708e-05, - "loss": 0.0355, + "epoch": 0.87, + "learning_rate": 0.00016905000096813542, + "loss": 0.0448, "step": 135260 }, { - "epoch": 1.46, - "learning_rate": 8.053410344603803e-05, - "loss": 0.0295, + "epoch": 0.87, + "learning_rate": 0.0001690403196137785, + "loss": 0.0443, "step": 135270 }, { - "epoch": 1.46, - "learning_rate": 8.051787916152898e-05, - "loss": 0.0358, + "epoch": 0.87, + "learning_rate": 0.00016903063825942158, + "loss": 0.0423, "step": 135280 }, { - "epoch": 1.46, - "learning_rate": 8.050165487701992e-05, - "loss": 0.0377, + "epoch": 0.87, + "learning_rate": 0.0001690209569050646, + "loss": 0.0403, "step": 135290 }, { - "epoch": 1.46, - "learning_rate": 8.048543059251087e-05, - "loss": 0.0295, + "epoch": 0.87, + "learning_rate": 0.00016901127555070768, + "loss": 0.0384, "step": 135300 }, { - "epoch": 1.46, - "learning_rate": 8.046920630800182e-05, - "loss": 0.0253, + "epoch": 0.87, + "learning_rate": 0.00016900159419635076, + "loss": 0.0372, "step": 135310 }, { - "epoch": 1.46, - "learning_rate": 8.045298202349276e-05, - "loss": 0.0293, + "epoch": 0.87, + "learning_rate": 0.00016899191284199382, + "loss": 0.0363, "step": 135320 }, { - "epoch": 1.46, - "learning_rate": 8.043675773898371e-05, - "loss": 0.031, + "epoch": 0.87, + "learning_rate": 0.0001689822314876369, + "loss": 0.0454, "step": 135330 }, { - "epoch": 1.46, - "learning_rate": 8.042053345447465e-05, - "loss": 0.0295, + "epoch": 0.87, + "learning_rate": 0.00016897255013327998, + "loss": 0.0395, "step": 135340 }, { - "epoch": 1.46, - "learning_rate": 8.04043091699656e-05, - "loss": 0.0356, + "epoch": 0.87, + "learning_rate": 0.00016896286877892306, + "loss": 0.0387, "step": 135350 }, { - "epoch": 1.46, - "learning_rate": 8.038808488545655e-05, - "loss": 0.0274, + "epoch": 0.87, + "learning_rate": 0.00016895318742456608, + "loss": 0.0383, "step": 135360 }, { - "epoch": 1.46, - "learning_rate": 8.03718606009475e-05, - "loss": 0.0282, + "epoch": 0.87, + "learning_rate": 0.00016894350607020916, + "loss": 0.0397, "step": 135370 }, { - "epoch": 1.46, - "learning_rate": 8.035563631643844e-05, - "loss": 0.0317, + "epoch": 0.87, + "learning_rate": 0.00016893382471585224, + "loss": 0.0421, "step": 135380 }, { - "epoch": 1.46, - "learning_rate": 8.033941203192939e-05, - "loss": 0.0261, + "epoch": 0.87, + "learning_rate": 0.0001689241433614953, + "loss": 0.0384, "step": 135390 }, { - "epoch": 1.46, - "learning_rate": 8.032318774742034e-05, - "loss": 0.0311, + "epoch": 0.87, + "learning_rate": 0.00016891446200713837, + "loss": 0.0462, "step": 135400 }, { - "epoch": 1.46, - "learning_rate": 8.030696346291129e-05, - "loss": 0.0285, + "epoch": 0.87, + "learning_rate": 0.00016890478065278145, + "loss": 0.0388, "step": 135410 }, { - "epoch": 1.46, - "learning_rate": 8.029073917840224e-05, - "loss": 0.0298, + "epoch": 0.87, + "learning_rate": 0.0001688950992984245, + "loss": 0.0444, "step": 135420 }, { - "epoch": 1.46, - "learning_rate": 8.027451489389317e-05, - "loss": 0.0294, + "epoch": 0.87, + "learning_rate": 0.00016888541794406756, + "loss": 0.0394, "step": 135430 }, { - "epoch": 1.46, - "learning_rate": 8.025829060938412e-05, - "loss": 0.0275, + "epoch": 0.87, + "learning_rate": 0.00016887573658971064, + "loss": 0.0386, "step": 135440 }, { - "epoch": 1.47, - "learning_rate": 8.024206632487507e-05, - "loss": 0.025, + "epoch": 0.87, + "learning_rate": 0.0001688660552353537, + "loss": 0.0482, "step": 135450 }, { - "epoch": 1.47, - "learning_rate": 8.022584204036602e-05, - "loss": 0.0264, + "epoch": 0.87, + "learning_rate": 0.00016885637388099677, + "loss": 0.0459, "step": 135460 }, { - "epoch": 1.47, - "learning_rate": 8.020961775585697e-05, - "loss": 0.0351, + "epoch": 0.87, + "learning_rate": 0.00016884669252663985, + "loss": 0.0397, "step": 135470 }, { - "epoch": 1.47, - "learning_rate": 8.019339347134791e-05, - "loss": 0.0275, + "epoch": 0.87, + "learning_rate": 0.00016883701117228293, + "loss": 0.0385, "step": 135480 }, { - "epoch": 1.47, - "learning_rate": 8.017716918683886e-05, - "loss": 0.0343, + "epoch": 0.87, + "learning_rate": 0.00016882732981792598, + "loss": 0.0449, "step": 135490 }, { - "epoch": 1.47, - "learning_rate": 8.01609449023298e-05, - "loss": 0.0283, + "epoch": 0.87, + "learning_rate": 0.00016881764846356904, + "loss": 0.0396, "step": 135500 }, { - "epoch": 1.47, - "learning_rate": 8.014472061782076e-05, - "loss": 0.0348, + "epoch": 0.87, + "learning_rate": 0.00016880796710921212, + "loss": 0.046, "step": 135510 }, { - "epoch": 1.47, - "learning_rate": 8.012849633331169e-05, - "loss": 0.0332, + "epoch": 0.87, + "learning_rate": 0.00016879828575485517, + "loss": 0.0439, "step": 135520 }, { - "epoch": 1.47, - "learning_rate": 8.011227204880264e-05, - "loss": 0.0298, + "epoch": 0.87, + "learning_rate": 0.00016878860440049825, + "loss": 0.0361, "step": 135530 }, { - "epoch": 1.47, - "learning_rate": 8.009604776429359e-05, - "loss": 0.0305, + "epoch": 0.87, + "learning_rate": 0.00016877892304614133, + "loss": 0.0482, "step": 135540 }, { - "epoch": 1.47, - "learning_rate": 8.007982347978454e-05, - "loss": 0.0281, + "epoch": 0.87, + "learning_rate": 0.0001687692416917844, + "loss": 0.0468, "step": 135550 }, { - "epoch": 1.47, - "learning_rate": 8.006359919527549e-05, - "loss": 0.0265, + "epoch": 0.87, + "learning_rate": 0.00016875956033742746, + "loss": 0.0435, "step": 135560 }, { - "epoch": 1.47, - "learning_rate": 8.004737491076643e-05, - "loss": 0.0297, + "epoch": 0.87, + "learning_rate": 0.0001687498789830705, + "loss": 0.0401, "step": 135570 }, { - "epoch": 1.47, - "learning_rate": 8.003115062625738e-05, - "loss": 0.0315, + "epoch": 0.88, + "learning_rate": 0.0001687401976287136, + "loss": 0.0443, "step": 135580 }, { - "epoch": 1.47, - "learning_rate": 8.001492634174833e-05, - "loss": 0.0292, + "epoch": 0.88, + "learning_rate": 0.00016873051627435665, + "loss": 0.0393, "step": 135590 }, { - "epoch": 1.47, - "learning_rate": 7.999870205723928e-05, - "loss": 0.0346, + "epoch": 0.88, + "learning_rate": 0.00016872083491999973, + "loss": 0.0389, "step": 135600 }, { - "epoch": 1.47, - "learning_rate": 7.998247777273021e-05, - "loss": 0.0347, + "epoch": 0.88, + "learning_rate": 0.0001687111535656428, + "loss": 0.0399, "step": 135610 }, { - "epoch": 1.47, - "learning_rate": 7.996625348822116e-05, - "loss": 0.0311, + "epoch": 0.88, + "learning_rate": 0.00016870147221128586, + "loss": 0.0436, "step": 135620 }, { - "epoch": 1.47, - "learning_rate": 7.995002920371211e-05, - "loss": 0.0325, + "epoch": 0.88, + "learning_rate": 0.00016869179085692894, + "loss": 0.04, "step": 135630 }, { - "epoch": 1.47, - "learning_rate": 7.993380491920306e-05, - "loss": 0.0326, + "epoch": 0.88, + "learning_rate": 0.000168682109502572, + "loss": 0.0352, "step": 135640 }, { - "epoch": 1.47, - "learning_rate": 7.991758063469401e-05, - "loss": 0.0288, + "epoch": 0.88, + "learning_rate": 0.00016867242814821504, + "loss": 0.0458, "step": 135650 }, { - "epoch": 1.47, - "learning_rate": 7.990135635018495e-05, - "loss": 0.0272, + "epoch": 0.88, + "learning_rate": 0.00016866274679385812, + "loss": 0.0359, "step": 135660 }, { - "epoch": 1.47, - "learning_rate": 7.98851320656759e-05, - "loss": 0.0268, + "epoch": 0.88, + "learning_rate": 0.0001686530654395012, + "loss": 0.039, "step": 135670 }, { - "epoch": 1.47, - "learning_rate": 7.986890778116685e-05, - "loss": 0.0334, + "epoch": 0.88, + "learning_rate": 0.00016864338408514428, + "loss": 0.0426, "step": 135680 }, { - "epoch": 1.47, - "learning_rate": 7.98526834966578e-05, - "loss": 0.0316, + "epoch": 0.88, + "learning_rate": 0.00016863370273078733, + "loss": 0.0511, "step": 135690 }, { - "epoch": 1.47, - "learning_rate": 7.983645921214873e-05, - "loss": 0.0307, + "epoch": 0.88, + "learning_rate": 0.00016862402137643041, + "loss": 0.0388, "step": 135700 }, { - "epoch": 1.47, - "learning_rate": 7.982023492763968e-05, - "loss": 0.0294, + "epoch": 0.88, + "learning_rate": 0.00016861434002207347, + "loss": 0.0405, "step": 135710 }, { - "epoch": 1.47, - "learning_rate": 7.980401064313063e-05, - "loss": 0.0258, + "epoch": 0.88, + "learning_rate": 0.00016860465866771652, + "loss": 0.0406, "step": 135720 }, { - "epoch": 1.47, - "learning_rate": 7.978778635862158e-05, - "loss": 0.0312, + "epoch": 0.88, + "learning_rate": 0.0001685949773133596, + "loss": 0.038, "step": 135730 }, { - "epoch": 1.47, - "learning_rate": 7.977156207411253e-05, - "loss": 0.0341, + "epoch": 0.88, + "learning_rate": 0.00016858529595900268, + "loss": 0.0448, "step": 135740 }, { - "epoch": 1.47, - "learning_rate": 7.975533778960347e-05, - "loss": 0.0337, + "epoch": 0.88, + "learning_rate": 0.00016857561460464576, + "loss": 0.0395, "step": 135750 }, { - "epoch": 1.47, - "learning_rate": 7.973911350509442e-05, - "loss": 0.0306, + "epoch": 0.88, + "learning_rate": 0.0001685659332502888, + "loss": 0.0424, "step": 135760 }, { - "epoch": 1.47, - "learning_rate": 7.972288922058537e-05, - "loss": 0.0333, + "epoch": 0.88, + "learning_rate": 0.0001685562518959319, + "loss": 0.0407, "step": 135770 }, { - "epoch": 1.47, - "learning_rate": 7.970666493607632e-05, - "loss": 0.031, + "epoch": 0.88, + "learning_rate": 0.00016854657054157494, + "loss": 0.0392, "step": 135780 }, { - "epoch": 1.47, - "learning_rate": 7.969044065156725e-05, - "loss": 0.0251, + "epoch": 0.88, + "learning_rate": 0.000168536889187218, + "loss": 0.0398, "step": 135790 }, { - "epoch": 1.47, - "learning_rate": 7.96742163670582e-05, - "loss": 0.0248, + "epoch": 0.88, + "learning_rate": 0.00016852720783286108, + "loss": 0.0382, "step": 135800 }, { - "epoch": 1.47, - "learning_rate": 7.965799208254915e-05, - "loss": 0.0257, + "epoch": 0.88, + "learning_rate": 0.00016851752647850416, + "loss": 0.039, "step": 135810 }, { - "epoch": 1.47, - "learning_rate": 7.96417677980401e-05, - "loss": 0.0263, + "epoch": 0.88, + "learning_rate": 0.0001685078451241472, + "loss": 0.0412, "step": 135820 }, { - "epoch": 1.47, - "learning_rate": 7.962554351353105e-05, - "loss": 0.0297, + "epoch": 0.88, + "learning_rate": 0.0001684981637697903, + "loss": 0.0371, "step": 135830 }, { - "epoch": 1.47, - "learning_rate": 7.960931922902199e-05, - "loss": 0.0265, + "epoch": 0.88, + "learning_rate": 0.00016848848241543337, + "loss": 0.0331, "step": 135840 }, { - "epoch": 1.47, - "learning_rate": 7.959309494451294e-05, - "loss": 0.0307, + "epoch": 0.88, + "learning_rate": 0.0001684788010610764, + "loss": 0.0376, "step": 135850 }, { - "epoch": 1.47, - "learning_rate": 7.957687066000389e-05, - "loss": 0.0337, + "epoch": 0.88, + "learning_rate": 0.00016846911970671947, + "loss": 0.0447, "step": 135860 }, { - "epoch": 1.47, - "learning_rate": 7.956064637549484e-05, - "loss": 0.0253, + "epoch": 0.88, + "learning_rate": 0.00016845943835236255, + "loss": 0.0497, "step": 135870 }, { - "epoch": 1.47, - "learning_rate": 7.954442209098578e-05, - "loss": 0.0313, + "epoch": 0.88, + "learning_rate": 0.00016844975699800563, + "loss": 0.0442, "step": 135880 }, { - "epoch": 1.47, - "learning_rate": 7.952819780647673e-05, - "loss": 0.0277, + "epoch": 0.88, + "learning_rate": 0.0001684400756436487, + "loss": 0.0432, "step": 135890 }, { - "epoch": 1.47, - "learning_rate": 7.951197352196768e-05, - "loss": 0.026, + "epoch": 0.88, + "learning_rate": 0.00016843039428929177, + "loss": 0.04, "step": 135900 }, { - "epoch": 1.47, - "learning_rate": 7.949574923745863e-05, - "loss": 0.0305, + "epoch": 0.88, + "learning_rate": 0.00016842071293493485, + "loss": 0.0409, "step": 135910 }, { - "epoch": 1.47, - "learning_rate": 7.947952495294957e-05, - "loss": 0.0314, + "epoch": 0.88, + "learning_rate": 0.00016841103158057787, + "loss": 0.0418, "step": 135920 }, { - "epoch": 1.47, - "learning_rate": 7.946330066844051e-05, - "loss": 0.0285, + "epoch": 0.88, + "learning_rate": 0.00016840135022622095, + "loss": 0.0456, "step": 135930 }, { - "epoch": 1.47, - "learning_rate": 7.944707638393146e-05, - "loss": 0.027, + "epoch": 0.88, + "learning_rate": 0.00016839166887186403, + "loss": 0.0404, "step": 135940 }, { - "epoch": 1.47, - "learning_rate": 7.943085209942241e-05, - "loss": 0.0271, + "epoch": 0.88, + "learning_rate": 0.0001683819875175071, + "loss": 0.0373, "step": 135950 }, { - "epoch": 1.47, - "learning_rate": 7.941462781491336e-05, - "loss": 0.0299, + "epoch": 0.88, + "learning_rate": 0.00016837230616315016, + "loss": 0.0403, "step": 135960 }, { - "epoch": 1.47, - "learning_rate": 7.93984035304043e-05, - "loss": 0.0342, + "epoch": 0.88, + "learning_rate": 0.00016836262480879324, + "loss": 0.0405, "step": 135970 }, { - "epoch": 1.47, - "learning_rate": 7.938217924589525e-05, - "loss": 0.0261, + "epoch": 0.88, + "learning_rate": 0.00016835294345443632, + "loss": 0.0383, "step": 135980 }, { - "epoch": 1.47, - "learning_rate": 7.93659549613862e-05, - "loss": 0.0244, + "epoch": 0.88, + "learning_rate": 0.00016834326210007935, + "loss": 0.044, "step": 135990 }, { - "epoch": 1.47, - "learning_rate": 7.934973067687715e-05, - "loss": 0.0304, + "epoch": 0.88, + "learning_rate": 0.00016833358074572243, + "loss": 0.038, "step": 136000 }, { - "epoch": 1.47, - "eval_cer": 0.9210933648560539, - "eval_loss": 0.02423330768942833, - "eval_runtime": 118.7126, - "eval_samples_per_second": 16.847, - "eval_steps_per_second": 4.212, + "epoch": 0.88, + "eval_cer": 0.9199123262908147, + "eval_loss": 0.027130674570798874, + "eval_runtime": 119.9831, + "eval_samples_per_second": 16.669, + "eval_steps_per_second": 4.167, "step": 136000 }, { - "epoch": 1.47, - "learning_rate": 7.93335063923681e-05, - "loss": 0.0255, + "epoch": 0.88, + "learning_rate": 0.0001683238993913655, + "loss": 0.0399, "step": 136010 }, { - "epoch": 1.47, - "learning_rate": 7.931728210785903e-05, - "loss": 0.0374, + "epoch": 0.88, + "learning_rate": 0.00016831421803700856, + "loss": 0.0379, "step": 136020 }, { - "epoch": 1.47, - "learning_rate": 7.930105782334998e-05, - "loss": 0.0334, + "epoch": 0.88, + "learning_rate": 0.00016830453668265164, + "loss": 0.0385, "step": 136030 }, { - "epoch": 1.47, - "learning_rate": 7.928483353884093e-05, - "loss": 0.0249, + "epoch": 0.88, + "learning_rate": 0.00016829485532829472, + "loss": 0.0377, "step": 136040 }, { - "epoch": 1.47, - "learning_rate": 7.926860925433188e-05, - "loss": 0.0339, + "epoch": 0.88, + "learning_rate": 0.0001682851739739378, + "loss": 0.0445, "step": 136050 }, { - "epoch": 1.47, - "learning_rate": 7.925238496982282e-05, - "loss": 0.0269, + "epoch": 0.88, + "learning_rate": 0.00016827549261958083, + "loss": 0.0462, "step": 136060 }, { - "epoch": 1.47, - "learning_rate": 7.923616068531377e-05, - "loss": 0.0331, + "epoch": 0.88, + "learning_rate": 0.0001682658112652239, + "loss": 0.0374, "step": 136070 }, { - "epoch": 1.47, - "learning_rate": 7.921993640080472e-05, - "loss": 0.0269, + "epoch": 0.88, + "learning_rate": 0.00016825612991086699, + "loss": 0.0408, "step": 136080 }, { - "epoch": 1.47, - "learning_rate": 7.920371211629567e-05, - "loss": 0.0288, + "epoch": 0.88, + "learning_rate": 0.00016824644855651004, + "loss": 0.0418, "step": 136090 }, { - "epoch": 1.47, - "learning_rate": 7.918748783178662e-05, - "loss": 0.0281, + "epoch": 0.88, + "learning_rate": 0.00016823676720215312, + "loss": 0.0412, "step": 136100 }, { - "epoch": 1.47, - "learning_rate": 7.917126354727755e-05, - "loss": 0.0307, + "epoch": 0.88, + "learning_rate": 0.0001682270858477962, + "loss": 0.043, "step": 136110 }, { - "epoch": 1.47, - "learning_rate": 7.91550392627685e-05, - "loss": 0.0288, + "epoch": 0.88, + "learning_rate": 0.00016821740449343928, + "loss": 0.0484, "step": 136120 }, { - "epoch": 1.47, - "learning_rate": 7.913881497825945e-05, - "loss": 0.0299, + "epoch": 0.88, + "learning_rate": 0.0001682077231390823, + "loss": 0.0367, "step": 136130 }, { - "epoch": 1.47, - "learning_rate": 7.91225906937504e-05, - "loss": 0.0321, + "epoch": 0.88, + "learning_rate": 0.00016819804178472538, + "loss": 0.043, "step": 136140 }, { - "epoch": 1.47, - "learning_rate": 7.910636640924135e-05, - "loss": 0.0312, + "epoch": 0.88, + "learning_rate": 0.00016818836043036846, + "loss": 0.0397, "step": 136150 }, { - "epoch": 1.47, - "learning_rate": 7.909014212473229e-05, - "loss": 0.0251, + "epoch": 0.88, + "learning_rate": 0.00016817867907601152, + "loss": 0.0389, "step": 136160 }, { - "epoch": 1.47, - "learning_rate": 7.907391784022324e-05, - "loss": 0.0285, + "epoch": 0.88, + "learning_rate": 0.0001681689977216546, + "loss": 0.0409, "step": 136170 }, { - "epoch": 1.47, - "learning_rate": 7.905769355571419e-05, - "loss": 0.0255, + "epoch": 0.88, + "learning_rate": 0.00016815931636729768, + "loss": 0.0402, "step": 136180 }, { - "epoch": 1.47, - "learning_rate": 7.904146927120514e-05, - "loss": 0.0256, + "epoch": 0.88, + "learning_rate": 0.00016814963501294076, + "loss": 0.044, "step": 136190 }, { - "epoch": 1.47, - "learning_rate": 7.902524498669607e-05, - "loss": 0.0279, + "epoch": 0.88, + "learning_rate": 0.00016813995365858378, + "loss": 0.0404, "step": 136200 }, { - "epoch": 1.47, - "learning_rate": 7.900902070218702e-05, - "loss": 0.0265, + "epoch": 0.88, + "learning_rate": 0.00016813027230422686, + "loss": 0.0429, "step": 136210 }, { - "epoch": 1.47, - "learning_rate": 7.899279641767797e-05, - "loss": 0.0289, + "epoch": 0.88, + "learning_rate": 0.0001681205909498699, + "loss": 0.0429, "step": 136220 }, { - "epoch": 1.47, - "learning_rate": 7.897657213316892e-05, - "loss": 0.0291, + "epoch": 0.88, + "learning_rate": 0.000168110909595513, + "loss": 0.0448, "step": 136230 }, { - "epoch": 1.47, - "learning_rate": 7.896034784865987e-05, - "loss": 0.0279, + "epoch": 0.88, + "learning_rate": 0.00016810122824115607, + "loss": 0.0433, "step": 136240 }, { - "epoch": 1.47, - "learning_rate": 7.894412356415081e-05, - "loss": 0.0319, + "epoch": 0.88, + "learning_rate": 0.00016809154688679915, + "loss": 0.0375, "step": 136250 }, { - "epoch": 1.47, - "learning_rate": 7.892789927964176e-05, - "loss": 0.0232, + "epoch": 0.88, + "learning_rate": 0.0001680818655324422, + "loss": 0.0381, "step": 136260 }, { - "epoch": 1.47, - "learning_rate": 7.891167499513271e-05, - "loss": 0.0345, + "epoch": 0.88, + "learning_rate": 0.00016807218417808526, + "loss": 0.0346, "step": 136270 }, { - "epoch": 1.47, - "learning_rate": 7.889545071062366e-05, - "loss": 0.0308, + "epoch": 0.88, + "learning_rate": 0.00016806250282372834, + "loss": 0.0438, "step": 136280 }, { - "epoch": 1.47, - "learning_rate": 7.88792264261146e-05, - "loss": 0.0312, + "epoch": 0.88, + "learning_rate": 0.0001680528214693714, + "loss": 0.039, "step": 136290 }, { - "epoch": 1.47, - "learning_rate": 7.886300214160554e-05, - "loss": 0.0276, + "epoch": 0.88, + "learning_rate": 0.00016804314011501447, + "loss": 0.0401, "step": 136300 }, { - "epoch": 1.47, - "learning_rate": 7.88467778570965e-05, - "loss": 0.0315, + "epoch": 0.88, + "learning_rate": 0.00016803345876065755, + "loss": 0.0415, "step": 136310 }, { - "epoch": 1.47, - "learning_rate": 7.883055357258744e-05, - "loss": 0.0264, + "epoch": 0.88, + "learning_rate": 0.00016802377740630063, + "loss": 0.0429, "step": 136320 }, { - "epoch": 1.47, - "learning_rate": 7.88143292880784e-05, - "loss": 0.03, + "epoch": 0.88, + "learning_rate": 0.00016801409605194368, + "loss": 0.0389, "step": 136330 }, { - "epoch": 1.47, - "learning_rate": 7.879810500356933e-05, - "loss": 0.0316, + "epoch": 0.88, + "learning_rate": 0.00016800441469758674, + "loss": 0.0394, "step": 136340 }, { - "epoch": 1.47, - "learning_rate": 7.878188071906028e-05, - "loss": 0.0261, + "epoch": 0.88, + "learning_rate": 0.00016799473334322982, + "loss": 0.0397, "step": 136350 }, { - "epoch": 1.47, - "learning_rate": 7.876565643455123e-05, - "loss": 0.0328, + "epoch": 0.88, + "learning_rate": 0.00016798505198887287, + "loss": 0.0424, "step": 136360 }, { - "epoch": 1.47, - "learning_rate": 7.874943215004218e-05, - "loss": 0.0323, + "epoch": 0.88, + "learning_rate": 0.00016797537063451595, + "loss": 0.0353, "step": 136370 }, { - "epoch": 1.48, - "learning_rate": 7.873320786553312e-05, - "loss": 0.0313, + "epoch": 0.88, + "learning_rate": 0.00016796568928015903, + "loss": 0.0415, "step": 136380 }, { - "epoch": 1.48, - "learning_rate": 7.871698358102407e-05, - "loss": 0.0287, + "epoch": 0.88, + "learning_rate": 0.0001679560079258021, + "loss": 0.0382, "step": 136390 }, { - "epoch": 1.48, - "learning_rate": 7.870075929651501e-05, - "loss": 0.0394, + "epoch": 0.88, + "learning_rate": 0.00016794632657144516, + "loss": 0.0379, "step": 136400 }, { - "epoch": 1.48, - "learning_rate": 7.868453501200596e-05, - "loss": 0.0313, + "epoch": 0.88, + "learning_rate": 0.0001679366452170882, + "loss": 0.0424, "step": 136410 }, { - "epoch": 1.48, - "learning_rate": 7.866831072749691e-05, - "loss": 0.028, + "epoch": 0.88, + "learning_rate": 0.00016792696386273127, + "loss": 0.0384, "step": 136420 }, { - "epoch": 1.48, - "learning_rate": 7.865208644298785e-05, - "loss": 0.0374, + "epoch": 0.88, + "learning_rate": 0.00016791728250837434, + "loss": 0.0411, "step": 136430 }, { - "epoch": 1.48, - "learning_rate": 7.86358621584788e-05, - "loss": 0.03, + "epoch": 0.88, + "learning_rate": 0.00016790760115401742, + "loss": 0.0404, "step": 136440 }, { - "epoch": 1.48, - "learning_rate": 7.861963787396975e-05, - "loss": 0.0264, + "epoch": 0.88, + "learning_rate": 0.0001678979197996605, + "loss": 0.0388, "step": 136450 }, { - "epoch": 1.48, - "learning_rate": 7.86034135894607e-05, - "loss": 0.0298, + "epoch": 0.88, + "learning_rate": 0.00016788823844530356, + "loss": 0.0438, "step": 136460 }, { - "epoch": 1.48, - "learning_rate": 7.858718930495164e-05, - "loss": 0.0275, + "epoch": 0.88, + "learning_rate": 0.00016787855709094664, + "loss": 0.0406, "step": 136470 }, { - "epoch": 1.48, - "learning_rate": 7.857096502044259e-05, - "loss": 0.0376, + "epoch": 0.88, + "learning_rate": 0.0001678688757365897, + "loss": 0.0392, "step": 136480 }, { - "epoch": 1.48, - "learning_rate": 7.855474073593354e-05, - "loss": 0.0267, + "epoch": 0.88, + "learning_rate": 0.00016785919438223274, + "loss": 0.0435, "step": 136490 }, { - "epoch": 1.48, - "learning_rate": 7.853851645142449e-05, - "loss": 0.0289, + "epoch": 0.88, + "learning_rate": 0.00016784951302787582, + "loss": 0.0392, "step": 136500 }, { - "epoch": 1.48, - "learning_rate": 7.852229216691544e-05, - "loss": 0.0273, + "epoch": 0.88, + "learning_rate": 0.0001678398316735189, + "loss": 0.0373, "step": 136510 }, { - "epoch": 1.48, - "learning_rate": 7.850606788240637e-05, - "loss": 0.0305, + "epoch": 0.88, + "learning_rate": 0.00016783015031916198, + "loss": 0.0363, "step": 136520 }, { - "epoch": 1.48, - "learning_rate": 7.848984359789732e-05, - "loss": 0.0341, + "epoch": 0.88, + "learning_rate": 0.00016782046896480503, + "loss": 0.037, "step": 136530 }, { - "epoch": 1.48, - "learning_rate": 7.847361931338827e-05, - "loss": 0.022, + "epoch": 0.88, + "learning_rate": 0.00016781078761044811, + "loss": 0.0377, "step": 136540 }, { - "epoch": 1.48, - "learning_rate": 7.845739502887922e-05, - "loss": 0.0312, + "epoch": 0.88, + "learning_rate": 0.00016780110625609117, + "loss": 0.0524, "step": 136550 }, { - "epoch": 1.48, - "learning_rate": 7.844117074437016e-05, - "loss": 0.0279, + "epoch": 0.88, + "learning_rate": 0.00016779142490173422, + "loss": 0.0329, "step": 136560 }, { - "epoch": 1.48, - "learning_rate": 7.84249464598611e-05, - "loss": 0.0264, + "epoch": 0.88, + "learning_rate": 0.0001677817435473773, + "loss": 0.0415, "step": 136570 }, { - "epoch": 1.48, - "learning_rate": 7.840872217535206e-05, - "loss": 0.0266, + "epoch": 0.88, + "learning_rate": 0.00016777206219302038, + "loss": 0.0436, "step": 136580 }, { - "epoch": 1.48, - "learning_rate": 7.8392497890843e-05, - "loss": 0.0281, + "epoch": 0.88, + "learning_rate": 0.00016776238083866346, + "loss": 0.0403, "step": 136590 }, { - "epoch": 1.48, - "learning_rate": 7.837627360633396e-05, - "loss": 0.0288, + "epoch": 0.88, + "learning_rate": 0.0001677526994843065, + "loss": 0.0435, "step": 136600 }, { - "epoch": 1.48, - "learning_rate": 7.836004932182489e-05, - "loss": 0.0372, + "epoch": 0.88, + "learning_rate": 0.0001677430181299496, + "loss": 0.0451, "step": 136610 }, { - "epoch": 1.48, - "learning_rate": 7.834382503731584e-05, - "loss": 0.0385, + "epoch": 0.88, + "learning_rate": 0.00016773333677559262, + "loss": 0.0425, "step": 136620 }, { - "epoch": 1.48, - "learning_rate": 7.832760075280679e-05, - "loss": 0.0282, + "epoch": 0.88, + "learning_rate": 0.0001677236554212357, + "loss": 0.0485, "step": 136630 }, { - "epoch": 1.48, - "learning_rate": 7.831137646829774e-05, - "loss": 0.0287, + "epoch": 0.88, + "learning_rate": 0.00016771397406687878, + "loss": 0.0437, "step": 136640 }, { - "epoch": 1.48, - "learning_rate": 7.829515218378868e-05, - "loss": 0.0298, + "epoch": 0.88, + "learning_rate": 0.00016770429271252186, + "loss": 0.0404, "step": 136650 }, { - "epoch": 1.48, - "learning_rate": 7.827892789927963e-05, - "loss": 0.031, + "epoch": 0.88, + "learning_rate": 0.0001676946113581649, + "loss": 0.0405, "step": 136660 }, { - "epoch": 1.48, - "learning_rate": 7.826270361477058e-05, - "loss": 0.028, + "epoch": 0.88, + "learning_rate": 0.000167684930003808, + "loss": 0.0383, "step": 136670 }, { - "epoch": 1.48, - "learning_rate": 7.824647933026153e-05, - "loss": 0.0312, + "epoch": 0.88, + "learning_rate": 0.00016767524864945107, + "loss": 0.0454, "step": 136680 }, { - "epoch": 1.48, - "learning_rate": 7.823025504575248e-05, - "loss": 0.03, + "epoch": 0.88, + "learning_rate": 0.0001676655672950941, + "loss": 0.0427, "step": 136690 }, { - "epoch": 1.48, - "learning_rate": 7.821403076124341e-05, - "loss": 0.0308, + "epoch": 0.88, + "learning_rate": 0.00016765588594073717, + "loss": 0.036, "step": 136700 }, { - "epoch": 1.48, - "learning_rate": 7.819780647673436e-05, - "loss": 0.0324, + "epoch": 0.88, + "learning_rate": 0.00016764620458638025, + "loss": 0.04, "step": 136710 }, { - "epoch": 1.48, - "learning_rate": 7.818158219222531e-05, - "loss": 0.0342, + "epoch": 0.88, + "learning_rate": 0.00016763652323202333, + "loss": 0.0407, "step": 136720 }, { - "epoch": 1.48, - "learning_rate": 7.816535790771626e-05, - "loss": 0.0308, + "epoch": 0.88, + "learning_rate": 0.00016762684187766639, + "loss": 0.0351, "step": 136730 }, { - "epoch": 1.48, - "learning_rate": 7.81491336232072e-05, - "loss": 0.0295, + "epoch": 0.88, + "learning_rate": 0.00016761716052330947, + "loss": 0.0424, "step": 136740 }, { - "epoch": 1.48, - "learning_rate": 7.813290933869815e-05, - "loss": 0.0361, + "epoch": 0.88, + "learning_rate": 0.00016760747916895255, + "loss": 0.0412, "step": 136750 }, { - "epoch": 1.48, - "learning_rate": 7.81166850541891e-05, - "loss": 0.0271, + "epoch": 0.88, + "learning_rate": 0.00016759779781459557, + "loss": 0.0379, "step": 136760 }, { - "epoch": 1.48, - "learning_rate": 7.810046076968005e-05, - "loss": 0.0294, + "epoch": 0.88, + "learning_rate": 0.00016758811646023865, + "loss": 0.0352, "step": 136770 }, { - "epoch": 1.48, - "learning_rate": 7.8084236485171e-05, - "loss": 0.0269, + "epoch": 0.88, + "learning_rate": 0.00016757843510588173, + "loss": 0.0389, "step": 136780 }, { - "epoch": 1.48, - "learning_rate": 7.806801220066193e-05, - "loss": 0.0272, + "epoch": 0.88, + "learning_rate": 0.0001675687537515248, + "loss": 0.0429, "step": 136790 }, { - "epoch": 1.48, - "learning_rate": 7.805178791615288e-05, - "loss": 0.0348, + "epoch": 0.88, + "learning_rate": 0.00016755907239716786, + "loss": 0.0388, "step": 136800 }, { - "epoch": 1.48, - "learning_rate": 7.803556363164383e-05, - "loss": 0.035, + "epoch": 0.88, + "learning_rate": 0.00016754939104281094, + "loss": 0.0428, "step": 136810 }, { - "epoch": 1.48, - "learning_rate": 7.801933934713478e-05, - "loss": 0.0272, + "epoch": 0.88, + "learning_rate": 0.00016753970968845402, + "loss": 0.0347, "step": 136820 }, { - "epoch": 1.48, - "learning_rate": 7.800311506262572e-05, - "loss": 0.0278, + "epoch": 0.88, + "learning_rate": 0.00016753002833409705, + "loss": 0.0418, "step": 136830 }, { - "epoch": 1.48, - "learning_rate": 7.798689077811667e-05, - "loss": 0.0273, + "epoch": 0.88, + "learning_rate": 0.00016752034697974013, + "loss": 0.0407, "step": 136840 }, { - "epoch": 1.48, - "learning_rate": 7.797066649360762e-05, - "loss": 0.0264, + "epoch": 0.88, + "learning_rate": 0.0001675106656253832, + "loss": 0.0488, "step": 136850 }, { - "epoch": 1.48, - "learning_rate": 7.795444220909857e-05, - "loss": 0.0292, + "epoch": 0.88, + "learning_rate": 0.00016750098427102626, + "loss": 0.0409, "step": 136860 }, { - "epoch": 1.48, - "learning_rate": 7.793821792458952e-05, - "loss": 0.0394, + "epoch": 0.88, + "learning_rate": 0.00016749130291666934, + "loss": 0.0492, "step": 136870 }, { - "epoch": 1.48, - "learning_rate": 7.792199364008045e-05, - "loss": 0.0318, + "epoch": 0.88, + "learning_rate": 0.00016748162156231242, + "loss": 0.0358, "step": 136880 }, { - "epoch": 1.48, - "learning_rate": 7.79057693555714e-05, - "loss": 0.0257, + "epoch": 0.88, + "learning_rate": 0.0001674719402079555, + "loss": 0.0415, "step": 136890 }, { - "epoch": 1.48, - "learning_rate": 7.788954507106235e-05, - "loss": 0.0274, + "epoch": 0.88, + "learning_rate": 0.00016746225885359853, + "loss": 0.045, "step": 136900 }, { - "epoch": 1.48, - "learning_rate": 7.78733207865533e-05, - "loss": 0.0318, + "epoch": 0.88, + "learning_rate": 0.0001674525774992416, + "loss": 0.0388, "step": 136910 }, { - "epoch": 1.48, - "learning_rate": 7.785709650204425e-05, - "loss": 0.0358, + "epoch": 0.88, + "learning_rate": 0.00016744289614488469, + "loss": 0.0451, "step": 136920 }, { - "epoch": 1.48, - "learning_rate": 7.784087221753519e-05, - "loss": 0.027, + "epoch": 0.88, + "learning_rate": 0.00016743321479052774, + "loss": 0.0385, "step": 136930 }, { - "epoch": 1.48, - "learning_rate": 7.782464793302614e-05, - "loss": 0.0307, + "epoch": 0.88, + "learning_rate": 0.00016742353343617082, + "loss": 0.0412, "step": 136940 }, { - "epoch": 1.48, - "learning_rate": 7.780842364851709e-05, - "loss": 0.0289, + "epoch": 0.88, + "learning_rate": 0.0001674138520818139, + "loss": 0.0449, "step": 136950 }, { - "epoch": 1.48, - "learning_rate": 7.779219936400804e-05, - "loss": 0.0265, + "epoch": 0.88, + "learning_rate": 0.00016740417072745698, + "loss": 0.036, "step": 136960 }, { - "epoch": 1.48, - "learning_rate": 7.777597507949898e-05, - "loss": 0.0332, + "epoch": 0.88, + "learning_rate": 0.0001673944893731, + "loss": 0.042, "step": 136970 }, { - "epoch": 1.48, - "learning_rate": 7.775975079498993e-05, - "loss": 0.0305, + "epoch": 0.88, + "learning_rate": 0.00016738480801874308, + "loss": 0.0446, "step": 136980 }, { - "epoch": 1.48, - "learning_rate": 7.774352651048088e-05, - "loss": 0.0301, + "epoch": 0.88, + "learning_rate": 0.00016737512666438616, + "loss": 0.0458, "step": 136990 }, { - "epoch": 1.48, - "learning_rate": 7.772730222597182e-05, - "loss": 0.0325, + "epoch": 0.88, + "learning_rate": 0.00016736544531002922, + "loss": 0.0382, "step": 137000 }, { - "epoch": 1.48, - "eval_cer": 0.9211613931487558, - "eval_loss": 0.02359270490705967, - "eval_runtime": 119.0419, - "eval_samples_per_second": 16.801, - "eval_steps_per_second": 4.2, + "epoch": 0.88, + "eval_cer": 0.9199159417015027, + "eval_loss": 0.0271102674305439, + "eval_runtime": 119.9795, + "eval_samples_per_second": 16.67, + "eval_steps_per_second": 4.167, "step": 137000 }, { - "epoch": 1.48, - "learning_rate": 7.771107794146277e-05, - "loss": 0.028, + "epoch": 0.88, + "learning_rate": 0.0001673557639556723, + "loss": 0.0446, "step": 137010 }, { - "epoch": 1.48, - "learning_rate": 7.769485365695371e-05, - "loss": 0.0296, + "epoch": 0.88, + "learning_rate": 0.00016734608260131538, + "loss": 0.0432, "step": 137020 }, { - "epoch": 1.48, - "learning_rate": 7.767862937244466e-05, - "loss": 0.0324, + "epoch": 0.88, + "learning_rate": 0.00016733640124695843, + "loss": 0.0405, "step": 137030 }, { - "epoch": 1.48, - "learning_rate": 7.766240508793561e-05, - "loss": 0.0277, + "epoch": 0.88, + "learning_rate": 0.00016732671989260148, + "loss": 0.0381, "step": 137040 }, { - "epoch": 1.48, - "learning_rate": 7.764618080342656e-05, - "loss": 0.0323, + "epoch": 0.88, + "learning_rate": 0.00016731703853824456, + "loss": 0.0382, "step": 137050 }, { - "epoch": 1.48, - "learning_rate": 7.76299565189175e-05, - "loss": 0.0304, + "epoch": 0.88, + "learning_rate": 0.0001673073571838876, + "loss": 0.0377, "step": 137060 }, { - "epoch": 1.48, - "learning_rate": 7.761373223440845e-05, - "loss": 0.0274, + "epoch": 0.88, + "learning_rate": 0.0001672976758295307, + "loss": 0.0429, "step": 137070 }, { - "epoch": 1.48, - "learning_rate": 7.75975079498994e-05, - "loss": 0.0306, + "epoch": 0.88, + "learning_rate": 0.00016728799447517377, + "loss": 0.0386, "step": 137080 }, { - "epoch": 1.48, - "learning_rate": 7.758128366539035e-05, - "loss": 0.0232, + "epoch": 0.88, + "learning_rate": 0.00016727831312081685, + "loss": 0.0366, "step": 137090 }, { - "epoch": 1.48, - "learning_rate": 7.75650593808813e-05, - "loss": 0.0274, + "epoch": 0.88, + "learning_rate": 0.0001672686317664599, + "loss": 0.0383, "step": 137100 }, { - "epoch": 1.48, - "learning_rate": 7.754883509637223e-05, - "loss": 0.0372, + "epoch": 0.88, + "learning_rate": 0.00016725895041210296, + "loss": 0.0412, "step": 137110 }, { - "epoch": 1.48, - "learning_rate": 7.753261081186318e-05, - "loss": 0.0327, + "epoch": 0.89, + "learning_rate": 0.00016724926905774604, + "loss": 0.0381, "step": 137120 }, { - "epoch": 1.48, - "learning_rate": 7.751638652735413e-05, - "loss": 0.0262, + "epoch": 0.89, + "learning_rate": 0.0001672395877033891, + "loss": 0.0364, "step": 137130 }, { - "epoch": 1.48, - "learning_rate": 7.750016224284508e-05, - "loss": 0.0294, + "epoch": 0.89, + "learning_rate": 0.00016722990634903217, + "loss": 0.0416, "step": 137140 }, { - "epoch": 1.48, - "learning_rate": 7.748393795833602e-05, - "loss": 0.0329, + "epoch": 0.89, + "learning_rate": 0.00016722022499467525, + "loss": 0.0404, "step": 137150 }, { - "epoch": 1.48, - "learning_rate": 7.746771367382697e-05, - "loss": 0.0342, + "epoch": 0.89, + "learning_rate": 0.00016721054364031833, + "loss": 0.0445, "step": 137160 }, { - "epoch": 1.48, - "learning_rate": 7.745148938931792e-05, - "loss": 0.0266, + "epoch": 0.89, + "learning_rate": 0.00016720086228596138, + "loss": 0.0388, "step": 137170 }, { - "epoch": 1.48, - "learning_rate": 7.743526510480887e-05, - "loss": 0.0268, + "epoch": 0.89, + "learning_rate": 0.00016719118093160443, + "loss": 0.0425, "step": 137180 }, { - "epoch": 1.48, - "learning_rate": 7.741904082029982e-05, - "loss": 0.0308, + "epoch": 0.89, + "learning_rate": 0.00016718149957724751, + "loss": 0.0415, "step": 137190 }, { - "epoch": 1.48, - "learning_rate": 7.740281653579075e-05, - "loss": 0.0267, + "epoch": 0.89, + "learning_rate": 0.00016717181822289057, + "loss": 0.0363, "step": 137200 }, { - "epoch": 1.48, - "learning_rate": 7.73865922512817e-05, - "loss": 0.0276, + "epoch": 0.89, + "learning_rate": 0.00016716213686853365, + "loss": 0.0437, "step": 137210 }, { - "epoch": 1.48, - "learning_rate": 7.737036796677265e-05, - "loss": 0.0282, + "epoch": 0.89, + "learning_rate": 0.00016715245551417673, + "loss": 0.0371, "step": 137220 }, { - "epoch": 1.48, - "learning_rate": 7.73541436822636e-05, - "loss": 0.0268, + "epoch": 0.89, + "learning_rate": 0.00016714277415981978, + "loss": 0.039, "step": 137230 }, { - "epoch": 1.48, - "learning_rate": 7.733791939775454e-05, - "loss": 0.0265, + "epoch": 0.89, + "learning_rate": 0.00016713309280546286, + "loss": 0.0382, "step": 137240 }, { - "epoch": 1.48, - "learning_rate": 7.732169511324549e-05, - "loss": 0.0265, + "epoch": 0.89, + "learning_rate": 0.0001671234114511059, + "loss": 0.0392, "step": 137250 }, { - "epoch": 1.48, - "learning_rate": 7.730547082873644e-05, - "loss": 0.0301, + "epoch": 0.89, + "learning_rate": 0.00016711373009674896, + "loss": 0.0437, "step": 137260 }, { - "epoch": 1.48, - "learning_rate": 7.728924654422739e-05, - "loss": 0.0276, + "epoch": 0.89, + "learning_rate": 0.00016710404874239204, + "loss": 0.0413, "step": 137270 }, { - "epoch": 1.48, - "learning_rate": 7.727302225971835e-05, - "loss": 0.0331, + "epoch": 0.89, + "learning_rate": 0.00016709436738803512, + "loss": 0.039, "step": 137280 }, { - "epoch": 1.48, - "learning_rate": 7.72567979752093e-05, - "loss": 0.0306, + "epoch": 0.89, + "learning_rate": 0.0001670846860336782, + "loss": 0.0386, "step": 137290 }, { - "epoch": 1.49, - "learning_rate": 7.724057369070024e-05, - "loss": 0.0277, + "epoch": 0.89, + "learning_rate": 0.00016707500467932126, + "loss": 0.0472, "step": 137300 }, { - "epoch": 1.49, - "learning_rate": 7.722434940619119e-05, - "loss": 0.0295, + "epoch": 0.89, + "learning_rate": 0.00016706532332496434, + "loss": 0.0437, "step": 137310 }, { - "epoch": 1.49, - "learning_rate": 7.720812512168214e-05, - "loss": 0.0298, + "epoch": 0.89, + "learning_rate": 0.0001670556419706074, + "loss": 0.0389, "step": 137320 }, { - "epoch": 1.49, - "learning_rate": 7.719190083717309e-05, - "loss": 0.0287, + "epoch": 0.89, + "learning_rate": 0.00016704596061625044, + "loss": 0.0415, "step": 137330 }, { - "epoch": 1.49, - "learning_rate": 7.717567655266402e-05, - "loss": 0.0287, + "epoch": 0.89, + "learning_rate": 0.00016703627926189352, + "loss": 0.043, "step": 137340 }, { - "epoch": 1.49, - "learning_rate": 7.715945226815497e-05, - "loss": 0.0299, + "epoch": 0.89, + "learning_rate": 0.0001670265979075366, + "loss": 0.0405, "step": 137350 }, { - "epoch": 1.49, - "learning_rate": 7.714322798364592e-05, - "loss": 0.0321, + "epoch": 0.89, + "learning_rate": 0.00016701691655317968, + "loss": 0.0385, "step": 137360 }, { - "epoch": 1.49, - "learning_rate": 7.712700369913687e-05, - "loss": 0.0275, + "epoch": 0.89, + "learning_rate": 0.00016700723519882273, + "loss": 0.0466, "step": 137370 }, { - "epoch": 1.49, - "learning_rate": 7.711077941462782e-05, - "loss": 0.0284, + "epoch": 0.89, + "learning_rate": 0.00016699755384446581, + "loss": 0.0359, "step": 137380 }, { - "epoch": 1.49, - "learning_rate": 7.709455513011876e-05, - "loss": 0.0291, + "epoch": 0.89, + "learning_rate": 0.00016698787249010887, + "loss": 0.0421, "step": 137390 }, { - "epoch": 1.49, - "learning_rate": 7.707833084560971e-05, - "loss": 0.0242, + "epoch": 0.89, + "learning_rate": 0.00016697819113575192, + "loss": 0.0451, "step": 137400 }, { - "epoch": 1.49, - "learning_rate": 7.706210656110066e-05, - "loss": 0.0327, + "epoch": 0.89, + "learning_rate": 0.000166968509781395, + "loss": 0.0391, "step": 137410 }, { - "epoch": 1.49, - "learning_rate": 7.704588227659161e-05, - "loss": 0.0339, + "epoch": 0.89, + "learning_rate": 0.00016695882842703808, + "loss": 0.0415, "step": 137420 }, { - "epoch": 1.49, - "learning_rate": 7.702965799208254e-05, - "loss": 0.0293, + "epoch": 0.89, + "learning_rate": 0.00016694914707268113, + "loss": 0.0432, "step": 137430 }, { - "epoch": 1.49, - "learning_rate": 7.701343370757349e-05, - "loss": 0.0286, + "epoch": 0.89, + "learning_rate": 0.0001669394657183242, + "loss": 0.038, "step": 137440 }, { - "epoch": 1.49, - "learning_rate": 7.699720942306444e-05, - "loss": 0.0281, + "epoch": 0.89, + "learning_rate": 0.0001669297843639673, + "loss": 0.0393, "step": 137450 }, { - "epoch": 1.49, - "learning_rate": 7.698098513855539e-05, - "loss": 0.0296, + "epoch": 0.89, + "learning_rate": 0.00016692010300961032, + "loss": 0.0416, "step": 137460 }, { - "epoch": 1.49, - "learning_rate": 7.696476085404634e-05, - "loss": 0.0307, + "epoch": 0.89, + "learning_rate": 0.0001669104216552534, + "loss": 0.0454, "step": 137470 }, { - "epoch": 1.49, - "learning_rate": 7.694853656953728e-05, - "loss": 0.0298, + "epoch": 0.89, + "learning_rate": 0.00016690074030089648, + "loss": 0.0421, "step": 137480 }, { - "epoch": 1.49, - "learning_rate": 7.693231228502823e-05, - "loss": 0.0295, + "epoch": 0.89, + "learning_rate": 0.00016689105894653956, + "loss": 0.0342, "step": 137490 }, { - "epoch": 1.49, - "learning_rate": 7.691608800051918e-05, - "loss": 0.029, + "epoch": 0.89, + "learning_rate": 0.0001668813775921826, + "loss": 0.0387, "step": 137500 }, { - "epoch": 1.49, - "learning_rate": 7.689986371601013e-05, - "loss": 0.0329, + "epoch": 0.89, + "learning_rate": 0.0001668716962378257, + "loss": 0.0391, "step": 137510 }, { - "epoch": 1.49, - "learning_rate": 7.688363943150106e-05, - "loss": 0.0315, + "epoch": 0.89, + "learning_rate": 0.00016686201488346877, + "loss": 0.0366, "step": 137520 }, { - "epoch": 1.49, - "learning_rate": 7.686741514699201e-05, - "loss": 0.0276, + "epoch": 0.89, + "learning_rate": 0.0001668523335291118, + "loss": 0.0351, "step": 137530 }, { - "epoch": 1.49, - "learning_rate": 7.685119086248296e-05, - "loss": 0.0299, + "epoch": 0.89, + "learning_rate": 0.00016684265217475487, + "loss": 0.0409, "step": 137540 }, { - "epoch": 1.49, - "learning_rate": 7.683496657797391e-05, - "loss": 0.029, + "epoch": 0.89, + "learning_rate": 0.00016683297082039795, + "loss": 0.0387, "step": 137550 }, { - "epoch": 1.49, - "learning_rate": 7.681874229346486e-05, - "loss": 0.0275, + "epoch": 0.89, + "learning_rate": 0.00016682328946604103, + "loss": 0.0415, "step": 137560 }, { - "epoch": 1.49, - "learning_rate": 7.68025180089558e-05, - "loss": 0.0347, + "epoch": 0.89, + "learning_rate": 0.00016681360811168409, + "loss": 0.0354, "step": 137570 }, { - "epoch": 1.49, - "learning_rate": 7.678629372444675e-05, - "loss": 0.0322, + "epoch": 0.89, + "learning_rate": 0.00016680392675732717, + "loss": 0.0381, "step": 137580 }, { - "epoch": 1.49, - "learning_rate": 7.67700694399377e-05, - "loss": 0.0254, + "epoch": 0.89, + "learning_rate": 0.00016679424540297025, + "loss": 0.0429, "step": 137590 }, { - "epoch": 1.49, - "learning_rate": 7.675384515542865e-05, - "loss": 0.0308, + "epoch": 0.89, + "learning_rate": 0.00016678456404861327, + "loss": 0.037, "step": 137600 }, { - "epoch": 1.49, - "learning_rate": 7.67376208709196e-05, - "loss": 0.0375, + "epoch": 0.89, + "learning_rate": 0.00016677488269425635, + "loss": 0.0387, "step": 137610 }, { - "epoch": 1.49, - "learning_rate": 7.672139658641053e-05, - "loss": 0.0311, + "epoch": 0.89, + "learning_rate": 0.00016676520133989943, + "loss": 0.0383, "step": 137620 }, { - "epoch": 1.49, - "learning_rate": 7.670517230190148e-05, - "loss": 0.0325, + "epoch": 0.89, + "learning_rate": 0.00016675551998554248, + "loss": 0.0394, "step": 137630 }, { - "epoch": 1.49, - "learning_rate": 7.668894801739243e-05, - "loss": 0.0265, + "epoch": 0.89, + "learning_rate": 0.00016674583863118556, + "loss": 0.0399, "step": 137640 }, { - "epoch": 1.49, - "learning_rate": 7.667272373288338e-05, - "loss": 0.0329, + "epoch": 0.89, + "learning_rate": 0.00016673615727682864, + "loss": 0.043, "step": 137650 }, { - "epoch": 1.49, - "learning_rate": 7.665649944837432e-05, - "loss": 0.0297, + "epoch": 0.89, + "learning_rate": 0.00016672647592247172, + "loss": 0.035, "step": 137660 }, { - "epoch": 1.49, - "learning_rate": 7.664027516386527e-05, - "loss": 0.0325, + "epoch": 0.89, + "learning_rate": 0.00016671679456811475, + "loss": 0.0404, "step": 137670 }, { - "epoch": 1.49, - "learning_rate": 7.662405087935622e-05, - "loss": 0.0293, + "epoch": 0.89, + "learning_rate": 0.00016670711321375783, + "loss": 0.0455, "step": 137680 }, { - "epoch": 1.49, - "learning_rate": 7.660782659484717e-05, - "loss": 0.0252, + "epoch": 0.89, + "learning_rate": 0.0001666974318594009, + "loss": 0.036, "step": 137690 }, { - "epoch": 1.49, - "learning_rate": 7.659160231033812e-05, - "loss": 0.0269, + "epoch": 0.89, + "learning_rate": 0.00016668775050504396, + "loss": 0.0459, "step": 137700 }, { - "epoch": 1.49, - "learning_rate": 7.657537802582906e-05, - "loss": 0.0242, + "epoch": 0.89, + "learning_rate": 0.00016667806915068704, + "loss": 0.0404, "step": 137710 }, { - "epoch": 1.49, - "learning_rate": 7.655915374132e-05, - "loss": 0.0303, + "epoch": 0.89, + "learning_rate": 0.00016666838779633012, + "loss": 0.0348, "step": 137720 }, { - "epoch": 1.49, - "learning_rate": 7.654292945681095e-05, - "loss": 0.0259, + "epoch": 0.89, + "learning_rate": 0.0001666587064419732, + "loss": 0.0387, "step": 137730 }, { - "epoch": 1.49, - "learning_rate": 7.65267051723019e-05, - "loss": 0.0246, + "epoch": 0.89, + "learning_rate": 0.00016664902508761623, + "loss": 0.0346, "step": 137740 }, { - "epoch": 1.49, - "learning_rate": 7.651048088779284e-05, - "loss": 0.0288, + "epoch": 0.89, + "learning_rate": 0.0001666393437332593, + "loss": 0.0396, "step": 137750 }, { - "epoch": 1.49, - "learning_rate": 7.649425660328379e-05, - "loss": 0.0315, + "epoch": 0.89, + "learning_rate": 0.00016662966237890239, + "loss": 0.0461, "step": 137760 }, { - "epoch": 1.49, - "learning_rate": 7.647803231877474e-05, - "loss": 0.034, + "epoch": 0.89, + "learning_rate": 0.00016661998102454544, + "loss": 0.0379, "step": 137770 }, { - "epoch": 1.49, - "learning_rate": 7.646180803426569e-05, - "loss": 0.0293, + "epoch": 0.89, + "learning_rate": 0.00016661029967018852, + "loss": 0.0368, "step": 137780 }, { - "epoch": 1.49, - "learning_rate": 7.644558374975664e-05, - "loss": 0.0289, + "epoch": 0.89, + "learning_rate": 0.0001666006183158316, + "loss": 0.0383, "step": 137790 }, { - "epoch": 1.49, - "learning_rate": 7.642935946524758e-05, - "loss": 0.0331, + "epoch": 0.89, + "learning_rate": 0.00016659093696147465, + "loss": 0.0353, "step": 137800 }, { - "epoch": 1.49, - "learning_rate": 7.641313518073853e-05, - "loss": 0.0295, + "epoch": 0.89, + "learning_rate": 0.0001665812556071177, + "loss": 0.0411, "step": 137810 }, { - "epoch": 1.49, - "learning_rate": 7.639691089622948e-05, - "loss": 0.0287, + "epoch": 0.89, + "learning_rate": 0.00016657157425276078, + "loss": 0.0394, "step": 137820 }, { - "epoch": 1.49, - "learning_rate": 7.638068661172043e-05, - "loss": 0.035, + "epoch": 0.89, + "learning_rate": 0.00016656189289840384, + "loss": 0.0347, "step": 137830 }, { - "epoch": 1.49, - "learning_rate": 7.636446232721136e-05, - "loss": 0.0285, + "epoch": 0.89, + "learning_rate": 0.00016655221154404692, + "loss": 0.039, "step": 137840 }, { - "epoch": 1.49, - "learning_rate": 7.634823804270231e-05, - "loss": 0.0327, + "epoch": 0.89, + "learning_rate": 0.00016654253018969, + "loss": 0.0401, "step": 137850 }, { - "epoch": 1.49, - "learning_rate": 7.633201375819326e-05, - "loss": 0.0334, + "epoch": 0.89, + "learning_rate": 0.00016653284883533307, + "loss": 0.0426, "step": 137860 }, { - "epoch": 1.49, - "learning_rate": 7.631578947368421e-05, - "loss": 0.0284, + "epoch": 0.89, + "learning_rate": 0.00016652316748097613, + "loss": 0.0383, "step": 137870 }, { - "epoch": 1.49, - "learning_rate": 7.629956518917516e-05, - "loss": 0.0241, + "epoch": 0.89, + "learning_rate": 0.00016651348612661918, + "loss": 0.0395, "step": 137880 }, { - "epoch": 1.49, - "learning_rate": 7.62833409046661e-05, - "loss": 0.0243, + "epoch": 0.89, + "learning_rate": 0.00016650380477226226, + "loss": 0.0435, "step": 137890 }, { - "epoch": 1.49, - "learning_rate": 7.626711662015705e-05, - "loss": 0.0308, + "epoch": 0.89, + "learning_rate": 0.0001664941234179053, + "loss": 0.0399, "step": 137900 }, { - "epoch": 1.49, - "learning_rate": 7.6250892335648e-05, - "loss": 0.0316, + "epoch": 0.89, + "learning_rate": 0.0001664844420635484, + "loss": 0.0382, "step": 137910 }, { - "epoch": 1.49, - "learning_rate": 7.623466805113895e-05, - "loss": 0.0306, + "epoch": 0.89, + "learning_rate": 0.00016647476070919147, + "loss": 0.0431, "step": 137920 }, { - "epoch": 1.49, - "learning_rate": 7.621844376662988e-05, - "loss": 0.0303, + "epoch": 0.89, + "learning_rate": 0.00016646507935483455, + "loss": 0.0431, "step": 137930 }, { - "epoch": 1.49, - "learning_rate": 7.620221948212083e-05, - "loss": 0.0281, + "epoch": 0.89, + "learning_rate": 0.0001664553980004776, + "loss": 0.0458, "step": 137940 }, { - "epoch": 1.49, - "learning_rate": 7.618599519761178e-05, - "loss": 0.0326, + "epoch": 0.89, + "learning_rate": 0.00016644571664612066, + "loss": 0.0355, "step": 137950 }, { - "epoch": 1.49, - "learning_rate": 7.616977091310273e-05, - "loss": 0.0306, + "epoch": 0.89, + "learning_rate": 0.00016643603529176374, + "loss": 0.0413, "step": 137960 }, { - "epoch": 1.49, - "learning_rate": 7.615354662859368e-05, - "loss": 0.0278, + "epoch": 0.89, + "learning_rate": 0.0001664263539374068, + "loss": 0.0501, "step": 137970 }, { - "epoch": 1.49, - "learning_rate": 7.613732234408462e-05, - "loss": 0.0238, + "epoch": 0.89, + "learning_rate": 0.00016641667258304987, + "loss": 0.0418, "step": 137980 }, { - "epoch": 1.49, - "learning_rate": 7.612109805957557e-05, - "loss": 0.0262, + "epoch": 0.89, + "learning_rate": 0.00016640699122869295, + "loss": 0.038, "step": 137990 }, { - "epoch": 1.49, - "learning_rate": 7.610487377506652e-05, - "loss": 0.033, + "epoch": 0.89, + "learning_rate": 0.00016639730987433603, + "loss": 0.0422, "step": 138000 }, { - "epoch": 1.49, - "eval_cer": 0.9211269372602444, - "eval_loss": 0.02387210540473461, - "eval_runtime": 118.905, - "eval_samples_per_second": 16.82, - "eval_steps_per_second": 4.205, + "epoch": 0.89, + "eval_cer": 0.9199258840808948, + "eval_loss": 0.026540521532297134, + "eval_runtime": 119.7003, + "eval_samples_per_second": 16.708, + "eval_steps_per_second": 4.177, "step": 138000 }, { - "epoch": 1.49, - "learning_rate": 7.608864949055747e-05, - "loss": 0.0231, + "epoch": 0.89, + "learning_rate": 0.00016638762851997908, + "loss": 0.0394, "step": 138010 }, { - "epoch": 1.49, - "learning_rate": 7.60724252060484e-05, - "loss": 0.0335, + "epoch": 0.89, + "learning_rate": 0.00016637794716562213, + "loss": 0.0431, "step": 138020 }, { - "epoch": 1.49, - "learning_rate": 7.605620092153935e-05, - "loss": 0.0286, + "epoch": 0.89, + "learning_rate": 0.0001663682658112652, + "loss": 0.0419, "step": 138030 }, { - "epoch": 1.49, - "learning_rate": 7.60399766370303e-05, - "loss": 0.0291, + "epoch": 0.89, + "learning_rate": 0.00016635858445690827, + "loss": 0.0418, "step": 138040 }, { - "epoch": 1.49, - "learning_rate": 7.602375235252125e-05, - "loss": 0.0311, + "epoch": 0.89, + "learning_rate": 0.00016634890310255135, + "loss": 0.0443, "step": 138050 }, { - "epoch": 1.49, - "learning_rate": 7.60075280680122e-05, - "loss": 0.0311, + "epoch": 0.89, + "learning_rate": 0.00016633922174819443, + "loss": 0.0432, "step": 138060 }, { - "epoch": 1.49, - "learning_rate": 7.599130378350314e-05, - "loss": 0.0296, + "epoch": 0.89, + "learning_rate": 0.00016632954039383748, + "loss": 0.0379, "step": 138070 }, { - "epoch": 1.49, - "learning_rate": 7.597507949899409e-05, - "loss": 0.0258, + "epoch": 0.89, + "learning_rate": 0.00016631985903948056, + "loss": 0.0426, "step": 138080 }, { - "epoch": 1.49, - "learning_rate": 7.595885521448504e-05, - "loss": 0.0263, + "epoch": 0.89, + "learning_rate": 0.0001663101776851236, + "loss": 0.0437, "step": 138090 }, { - "epoch": 1.49, - "learning_rate": 7.594263092997599e-05, - "loss": 0.0307, + "epoch": 0.89, + "learning_rate": 0.00016630049633076666, + "loss": 0.0422, "step": 138100 }, { - "epoch": 1.49, - "learning_rate": 7.592640664546692e-05, - "loss": 0.0253, + "epoch": 0.89, + "learning_rate": 0.00016629081497640974, + "loss": 0.0465, "step": 138110 }, { - "epoch": 1.49, - "learning_rate": 7.591018236095787e-05, - "loss": 0.0295, + "epoch": 0.89, + "learning_rate": 0.00016628113362205282, + "loss": 0.0387, "step": 138120 }, { - "epoch": 1.49, - "learning_rate": 7.589395807644882e-05, - "loss": 0.0287, + "epoch": 0.89, + "learning_rate": 0.0001662714522676959, + "loss": 0.0374, "step": 138130 }, { - "epoch": 1.49, - "learning_rate": 7.587773379193977e-05, - "loss": 0.0327, + "epoch": 0.89, + "learning_rate": 0.00016626177091333896, + "loss": 0.0405, "step": 138140 }, { - "epoch": 1.49, - "learning_rate": 7.586150950743072e-05, - "loss": 0.0333, + "epoch": 0.89, + "learning_rate": 0.00016625208955898204, + "loss": 0.0429, "step": 138150 }, { - "epoch": 1.49, - "learning_rate": 7.584528522292166e-05, - "loss": 0.0294, + "epoch": 0.89, + "learning_rate": 0.0001662424082046251, + "loss": 0.0401, "step": 138160 }, { - "epoch": 1.49, - "learning_rate": 7.582906093841261e-05, - "loss": 0.0264, + "epoch": 0.89, + "learning_rate": 0.00016623272685026814, + "loss": 0.04, "step": 138170 }, { - "epoch": 1.49, - "learning_rate": 7.581283665390356e-05, - "loss": 0.032, + "epoch": 0.89, + "learning_rate": 0.00016622304549591122, + "loss": 0.042, "step": 138180 }, { - "epoch": 1.49, - "learning_rate": 7.579661236939451e-05, - "loss": 0.0314, + "epoch": 0.89, + "learning_rate": 0.0001662133641415543, + "loss": 0.0473, "step": 138190 }, { - "epoch": 1.49, - "learning_rate": 7.578038808488544e-05, - "loss": 0.0281, + "epoch": 0.89, + "learning_rate": 0.00016620368278719738, + "loss": 0.0393, "step": 138200 }, { - "epoch": 1.49, - "learning_rate": 7.57641638003764e-05, - "loss": 0.0336, + "epoch": 0.89, + "learning_rate": 0.00016619400143284043, + "loss": 0.0462, "step": 138210 }, { - "epoch": 1.49, - "learning_rate": 7.574793951586734e-05, - "loss": 0.0263, + "epoch": 0.89, + "learning_rate": 0.0001661843200784835, + "loss": 0.0405, "step": 138220 }, { - "epoch": 1.5, - "learning_rate": 7.57317152313583e-05, - "loss": 0.0216, + "epoch": 0.89, + "learning_rate": 0.00016617463872412654, + "loss": 0.0426, "step": 138230 }, { - "epoch": 1.5, - "learning_rate": 7.571549094684924e-05, - "loss": 0.0256, + "epoch": 0.89, + "learning_rate": 0.00016616495736976962, + "loss": 0.0348, "step": 138240 }, { - "epoch": 1.5, - "learning_rate": 7.569926666234018e-05, - "loss": 0.0261, + "epoch": 0.89, + "learning_rate": 0.0001661552760154127, + "loss": 0.0437, "step": 138250 }, { - "epoch": 1.5, - "learning_rate": 7.568304237783113e-05, - "loss": 0.0347, + "epoch": 0.89, + "learning_rate": 0.00016614559466105578, + "loss": 0.044, "step": 138260 }, { - "epoch": 1.5, - "learning_rate": 7.566681809332208e-05, - "loss": 0.0294, + "epoch": 0.89, + "learning_rate": 0.00016613591330669883, + "loss": 0.0377, "step": 138270 }, { - "epoch": 1.5, - "learning_rate": 7.565059380881303e-05, - "loss": 0.0309, + "epoch": 0.89, + "learning_rate": 0.0001661262319523419, + "loss": 0.0375, "step": 138280 }, { - "epoch": 1.5, - "learning_rate": 7.563436952430398e-05, - "loss": 0.0339, + "epoch": 0.89, + "learning_rate": 0.000166116550597985, + "loss": 0.0355, "step": 138290 }, { - "epoch": 1.5, - "learning_rate": 7.561814523979492e-05, - "loss": 0.0287, + "epoch": 0.89, + "learning_rate": 0.00016610686924362802, + "loss": 0.05, "step": 138300 }, { - "epoch": 1.5, - "learning_rate": 7.560192095528587e-05, - "loss": 0.0359, + "epoch": 0.89, + "learning_rate": 0.0001660971878892711, + "loss": 0.0409, "step": 138310 }, { - "epoch": 1.5, - "learning_rate": 7.558569667077682e-05, - "loss": 0.0267, + "epoch": 0.89, + "learning_rate": 0.00016608750653491418, + "loss": 0.0388, "step": 138320 }, { - "epoch": 1.5, - "learning_rate": 7.556947238626776e-05, - "loss": 0.0314, + "epoch": 0.89, + "learning_rate": 0.00016607782518055726, + "loss": 0.0354, "step": 138330 }, { - "epoch": 1.5, - "learning_rate": 7.55532481017587e-05, - "loss": 0.0295, + "epoch": 0.89, + "learning_rate": 0.0001660681438262003, + "loss": 0.0403, "step": 138340 }, { - "epoch": 1.5, - "learning_rate": 7.553702381724965e-05, - "loss": 0.0312, + "epoch": 0.89, + "learning_rate": 0.0001660584624718434, + "loss": 0.0403, "step": 138350 }, { - "epoch": 1.5, - "learning_rate": 7.55207995327406e-05, - "loss": 0.0287, + "epoch": 0.89, + "learning_rate": 0.00016604878111748647, + "loss": 0.0448, "step": 138360 }, { - "epoch": 1.5, - "learning_rate": 7.550457524823155e-05, - "loss": 0.0257, + "epoch": 0.89, + "learning_rate": 0.0001660390997631295, + "loss": 0.0425, "step": 138370 }, { - "epoch": 1.5, - "learning_rate": 7.54883509637225e-05, - "loss": 0.0273, + "epoch": 0.89, + "learning_rate": 0.00016602941840877257, + "loss": 0.0419, "step": 138380 }, { - "epoch": 1.5, - "learning_rate": 7.547212667921344e-05, - "loss": 0.0306, + "epoch": 0.89, + "learning_rate": 0.00016601973705441565, + "loss": 0.0388, "step": 138390 }, { - "epoch": 1.5, - "learning_rate": 7.545590239470439e-05, - "loss": 0.0283, + "epoch": 0.89, + "learning_rate": 0.00016601005570005873, + "loss": 0.0378, "step": 138400 }, { - "epoch": 1.5, - "learning_rate": 7.543967811019534e-05, - "loss": 0.0298, + "epoch": 0.89, + "learning_rate": 0.00016600037434570179, + "loss": 0.0437, "step": 138410 }, { - "epoch": 1.5, - "learning_rate": 7.542345382568629e-05, - "loss": 0.0338, + "epoch": 0.89, + "learning_rate": 0.00016599069299134487, + "loss": 0.0417, "step": 138420 }, { - "epoch": 1.5, - "learning_rate": 7.540722954117722e-05, - "loss": 0.0237, + "epoch": 0.89, + "learning_rate": 0.00016598101163698795, + "loss": 0.038, "step": 138430 }, { - "epoch": 1.5, - "learning_rate": 7.539100525666817e-05, - "loss": 0.028, + "epoch": 0.89, + "learning_rate": 0.00016597133028263097, + "loss": 0.035, "step": 138440 }, { - "epoch": 1.5, - "learning_rate": 7.537478097215912e-05, - "loss": 0.0327, + "epoch": 0.89, + "learning_rate": 0.00016596164892827405, + "loss": 0.0518, "step": 138450 }, { - "epoch": 1.5, - "learning_rate": 7.535855668765007e-05, - "loss": 0.035, + "epoch": 0.89, + "learning_rate": 0.00016595196757391713, + "loss": 0.0446, "step": 138460 }, { - "epoch": 1.5, - "learning_rate": 7.534233240314102e-05, - "loss": 0.0328, + "epoch": 0.89, + "learning_rate": 0.00016594228621956018, + "loss": 0.0471, "step": 138470 }, { - "epoch": 1.5, - "learning_rate": 7.532610811863196e-05, - "loss": 0.0302, + "epoch": 0.89, + "learning_rate": 0.00016593260486520326, + "loss": 0.0398, "step": 138480 }, { - "epoch": 1.5, - "learning_rate": 7.530988383412291e-05, - "loss": 0.0334, + "epoch": 0.89, + "learning_rate": 0.00016592292351084634, + "loss": 0.0455, "step": 138490 }, { - "epoch": 1.5, - "learning_rate": 7.529365954961386e-05, - "loss": 0.0295, + "epoch": 0.89, + "learning_rate": 0.00016591324215648942, + "loss": 0.0391, "step": 138500 }, { - "epoch": 1.5, - "learning_rate": 7.52774352651048e-05, - "loss": 0.029, + "epoch": 0.89, + "learning_rate": 0.00016590356080213245, + "loss": 0.0357, "step": 138510 }, { - "epoch": 1.5, - "learning_rate": 7.526121098059574e-05, - "loss": 0.0348, + "epoch": 0.89, + "learning_rate": 0.00016589387944777553, + "loss": 0.0417, "step": 138520 }, { - "epoch": 1.5, - "learning_rate": 7.524498669608669e-05, - "loss": 0.0293, + "epoch": 0.89, + "learning_rate": 0.0001658841980934186, + "loss": 0.036, "step": 138530 }, { - "epoch": 1.5, - "learning_rate": 7.522876241157764e-05, - "loss": 0.0285, + "epoch": 0.89, + "learning_rate": 0.00016587451673906166, + "loss": 0.0357, "step": 138540 }, { - "epoch": 1.5, - "learning_rate": 7.521253812706859e-05, - "loss": 0.0353, + "epoch": 0.89, + "learning_rate": 0.00016586483538470474, + "loss": 0.0478, "step": 138550 }, { - "epoch": 1.5, - "learning_rate": 7.519631384255954e-05, - "loss": 0.0273, + "epoch": 0.89, + "learning_rate": 0.00016585515403034782, + "loss": 0.0355, "step": 138560 }, { - "epoch": 1.5, - "learning_rate": 7.518008955805048e-05, - "loss": 0.0272, + "epoch": 0.89, + "learning_rate": 0.0001658454726759909, + "loss": 0.0449, "step": 138570 }, { - "epoch": 1.5, - "learning_rate": 7.516386527354143e-05, - "loss": 0.0278, + "epoch": 0.89, + "learning_rate": 0.00016583579132163393, + "loss": 0.0395, "step": 138580 }, { - "epoch": 1.5, - "learning_rate": 7.514764098903238e-05, - "loss": 0.0303, + "epoch": 0.89, + "learning_rate": 0.000165826109967277, + "loss": 0.0418, "step": 138590 }, { - "epoch": 1.5, - "learning_rate": 7.513141670452333e-05, - "loss": 0.0281, + "epoch": 0.89, + "learning_rate": 0.00016581642861292008, + "loss": 0.0424, "step": 138600 }, { - "epoch": 1.5, - "learning_rate": 7.511519242001426e-05, - "loss": 0.0249, + "epoch": 0.89, + "learning_rate": 0.00016580674725856314, + "loss": 0.0367, "step": 138610 }, { - "epoch": 1.5, - "learning_rate": 7.509896813550521e-05, - "loss": 0.0329, + "epoch": 0.89, + "learning_rate": 0.00016579706590420622, + "loss": 0.039, "step": 138620 }, { - "epoch": 1.5, - "learning_rate": 7.508274385099616e-05, - "loss": 0.0292, + "epoch": 0.89, + "learning_rate": 0.0001657873845498493, + "loss": 0.0468, "step": 138630 }, { - "epoch": 1.5, - "learning_rate": 7.506651956648711e-05, - "loss": 0.0334, + "epoch": 0.89, + "learning_rate": 0.00016577770319549235, + "loss": 0.0457, "step": 138640 }, { - "epoch": 1.5, - "learning_rate": 7.505029528197806e-05, - "loss": 0.0284, + "epoch": 0.89, + "learning_rate": 0.0001657680218411354, + "loss": 0.0355, "step": 138650 }, { - "epoch": 1.5, - "learning_rate": 7.5034070997469e-05, - "loss": 0.0277, + "epoch": 0.89, + "learning_rate": 0.00016575834048677848, + "loss": 0.04, "step": 138660 }, { - "epoch": 1.5, - "learning_rate": 7.501784671295995e-05, - "loss": 0.0348, + "epoch": 0.9, + "learning_rate": 0.00016574865913242153, + "loss": 0.0446, "step": 138670 }, { - "epoch": 1.5, - "learning_rate": 7.50016224284509e-05, - "loss": 0.0292, + "epoch": 0.9, + "learning_rate": 0.00016573897777806461, + "loss": 0.0436, "step": 138680 }, { - "epoch": 1.5, - "learning_rate": 7.498539814394185e-05, - "loss": 0.0325, + "epoch": 0.9, + "learning_rate": 0.0001657292964237077, + "loss": 0.0391, "step": 138690 }, { - "epoch": 1.5, - "learning_rate": 7.496917385943278e-05, - "loss": 0.0334, + "epoch": 0.9, + "learning_rate": 0.00016571961506935077, + "loss": 0.0417, "step": 138700 }, { - "epoch": 1.5, - "learning_rate": 7.495294957492373e-05, - "loss": 0.0276, + "epoch": 0.9, + "learning_rate": 0.00016570993371499383, + "loss": 0.0373, "step": 138710 }, { - "epoch": 1.5, - "learning_rate": 7.493672529041468e-05, - "loss": 0.031, + "epoch": 0.9, + "learning_rate": 0.00016570025236063688, + "loss": 0.0413, "step": 138720 }, { - "epoch": 1.5, - "learning_rate": 7.492050100590563e-05, - "loss": 0.0304, + "epoch": 0.9, + "learning_rate": 0.00016569057100627996, + "loss": 0.0427, "step": 138730 }, { - "epoch": 1.5, - "learning_rate": 7.490427672139658e-05, - "loss": 0.0309, + "epoch": 0.9, + "learning_rate": 0.000165680889651923, + "loss": 0.0366, "step": 138740 }, { - "epoch": 1.5, - "learning_rate": 7.488805243688752e-05, - "loss": 0.0315, + "epoch": 0.9, + "learning_rate": 0.0001656712082975661, + "loss": 0.0426, "step": 138750 }, { - "epoch": 1.5, - "learning_rate": 7.487182815237847e-05, - "loss": 0.0254, + "epoch": 0.9, + "learning_rate": 0.00016566152694320917, + "loss": 0.0421, "step": 138760 }, { - "epoch": 1.5, - "learning_rate": 7.485560386786942e-05, - "loss": 0.0282, + "epoch": 0.9, + "learning_rate": 0.00016565184558885225, + "loss": 0.0366, "step": 138770 }, { - "epoch": 1.5, - "learning_rate": 7.483937958336037e-05, + "epoch": 0.9, + "learning_rate": 0.0001656421642344953, "loss": 0.0351, "step": 138780 }, { - "epoch": 1.5, - "learning_rate": 7.48231552988513e-05, - "loss": 0.0296, + "epoch": 0.9, + "learning_rate": 0.00016563248288013836, + "loss": 0.0438, "step": 138790 }, { - "epoch": 1.5, - "learning_rate": 7.480693101434226e-05, - "loss": 0.0287, + "epoch": 0.9, + "learning_rate": 0.00016562280152578144, + "loss": 0.0406, "step": 138800 }, { - "epoch": 1.5, - "learning_rate": 7.47907067298332e-05, - "loss": 0.0285, + "epoch": 0.9, + "learning_rate": 0.0001656131201714245, + "loss": 0.0408, "step": 138810 }, { - "epoch": 1.5, - "learning_rate": 7.477448244532415e-05, - "loss": 0.0325, + "epoch": 0.9, + "learning_rate": 0.00016560343881706757, + "loss": 0.0423, "step": 138820 }, { - "epoch": 1.5, - "learning_rate": 7.47582581608151e-05, - "loss": 0.0295, + "epoch": 0.9, + "learning_rate": 0.00016559375746271065, + "loss": 0.0376, "step": 138830 }, { - "epoch": 1.5, - "learning_rate": 7.474203387630604e-05, - "loss": 0.0323, + "epoch": 0.9, + "learning_rate": 0.0001655840761083537, + "loss": 0.0486, "step": 138840 }, { - "epoch": 1.5, - "learning_rate": 7.472580959179699e-05, - "loss": 0.0231, + "epoch": 0.9, + "learning_rate": 0.00016557439475399678, + "loss": 0.0391, "step": 138850 }, { - "epoch": 1.5, - "learning_rate": 7.470958530728794e-05, - "loss": 0.0298, + "epoch": 0.9, + "learning_rate": 0.00016556471339963983, + "loss": 0.0406, "step": 138860 }, { - "epoch": 1.5, - "learning_rate": 7.469336102277889e-05, - "loss": 0.0313, + "epoch": 0.9, + "learning_rate": 0.0001655550320452829, + "loss": 0.0512, "step": 138870 }, { - "epoch": 1.5, - "learning_rate": 7.467713673826983e-05, - "loss": 0.0289, + "epoch": 0.9, + "learning_rate": 0.00016554535069092597, + "loss": 0.0444, "step": 138880 }, { - "epoch": 1.5, - "learning_rate": 7.466091245376078e-05, - "loss": 0.0306, + "epoch": 0.9, + "learning_rate": 0.00016553566933656905, + "loss": 0.0407, "step": 138890 }, { - "epoch": 1.5, - "learning_rate": 7.464468816925173e-05, - "loss": 0.029, + "epoch": 0.9, + "learning_rate": 0.00016552598798221213, + "loss": 0.0394, "step": 138900 }, { - "epoch": 1.5, - "learning_rate": 7.462846388474268e-05, - "loss": 0.0283, + "epoch": 0.9, + "learning_rate": 0.00016551630662785518, + "loss": 0.038, "step": 138910 }, { - "epoch": 1.5, - "learning_rate": 7.461223960023363e-05, - "loss": 0.03, + "epoch": 0.9, + "learning_rate": 0.00016550662527349826, + "loss": 0.0522, "step": 138920 }, { - "epoch": 1.5, - "learning_rate": 7.459601531572456e-05, - "loss": 0.0324, + "epoch": 0.9, + "learning_rate": 0.0001654969439191413, + "loss": 0.0376, "step": 138930 }, { - "epoch": 1.5, - "learning_rate": 7.457979103121551e-05, - "loss": 0.0301, + "epoch": 0.9, + "learning_rate": 0.00016548726256478436, + "loss": 0.0389, "step": 138940 }, { - "epoch": 1.5, - "learning_rate": 7.456356674670646e-05, - "loss": 0.0268, + "epoch": 0.9, + "learning_rate": 0.00016547758121042744, + "loss": 0.0415, "step": 138950 }, { - "epoch": 1.5, - "learning_rate": 7.454734246219741e-05, - "loss": 0.0364, + "epoch": 0.9, + "learning_rate": 0.00016546789985607052, + "loss": 0.0414, "step": 138960 }, { - "epoch": 1.5, - "learning_rate": 7.453111817768835e-05, - "loss": 0.0331, + "epoch": 0.9, + "learning_rate": 0.0001654582185017136, + "loss": 0.0423, "step": 138970 }, { - "epoch": 1.5, - "learning_rate": 7.45148938931793e-05, - "loss": 0.0246, + "epoch": 0.9, + "learning_rate": 0.00016544853714735666, + "loss": 0.0422, "step": 138980 }, { - "epoch": 1.5, - "learning_rate": 7.449866960867025e-05, - "loss": 0.0232, + "epoch": 0.9, + "learning_rate": 0.00016543885579299974, + "loss": 0.0373, "step": 138990 }, { - "epoch": 1.5, - "learning_rate": 7.44824453241612e-05, - "loss": 0.03, + "epoch": 0.9, + "learning_rate": 0.0001654291744386428, + "loss": 0.0464, "step": 139000 }, { - "epoch": 1.5, - "eval_cer": 0.9210686272950714, - "eval_loss": 0.023618407547473907, - "eval_runtime": 119.0121, - "eval_samples_per_second": 16.805, - "eval_steps_per_second": 4.201, + "epoch": 0.9, + "eval_cer": 0.9199593266297593, + "eval_loss": 0.026463398709893227, + "eval_runtime": 120.0017, + "eval_samples_per_second": 16.666, + "eval_steps_per_second": 4.167, "step": 139000 }, { - "epoch": 1.5, - "learning_rate": 7.446622103965215e-05, - "loss": 0.0246, + "epoch": 0.9, + "learning_rate": 0.00016541949308428584, + "loss": 0.0513, "step": 139010 }, { - "epoch": 1.5, - "learning_rate": 7.444999675514308e-05, - "loss": 0.0301, + "epoch": 0.9, + "learning_rate": 0.00016540981172992892, + "loss": 0.0376, "step": 139020 }, { - "epoch": 1.5, - "learning_rate": 7.443377247063403e-05, - "loss": 0.0289, + "epoch": 0.9, + "learning_rate": 0.000165400130375572, + "loss": 0.0459, "step": 139030 }, { - "epoch": 1.5, - "learning_rate": 7.4417548186125e-05, - "loss": 0.0295, + "epoch": 0.9, + "learning_rate": 0.00016539044902121505, + "loss": 0.0433, "step": 139040 }, { - "epoch": 1.5, - "learning_rate": 7.440132390161593e-05, - "loss": 0.0305, + "epoch": 0.9, + "learning_rate": 0.00016538076766685813, + "loss": 0.0399, "step": 139050 }, { - "epoch": 1.5, - "learning_rate": 7.438509961710688e-05, - "loss": 0.0276, + "epoch": 0.9, + "learning_rate": 0.0001653710863125012, + "loss": 0.0367, "step": 139060 }, { - "epoch": 1.5, - "learning_rate": 7.436887533259783e-05, - "loss": 0.0266, + "epoch": 0.9, + "learning_rate": 0.00016536140495814424, + "loss": 0.0391, "step": 139070 }, { - "epoch": 1.5, - "learning_rate": 7.435265104808878e-05, - "loss": 0.0322, + "epoch": 0.9, + "learning_rate": 0.00016535172360378732, + "loss": 0.0349, "step": 139080 }, { - "epoch": 1.5, - "learning_rate": 7.433642676357972e-05, - "loss": 0.031, + "epoch": 0.9, + "learning_rate": 0.0001653420422494304, + "loss": 0.0395, "step": 139090 }, { - "epoch": 1.5, - "learning_rate": 7.432020247907067e-05, - "loss": 0.0324, + "epoch": 0.9, + "learning_rate": 0.00016533236089507348, + "loss": 0.0373, "step": 139100 }, { - "epoch": 1.5, - "learning_rate": 7.430397819456162e-05, - "loss": 0.0271, + "epoch": 0.9, + "learning_rate": 0.00016532267954071653, + "loss": 0.0402, "step": 139110 }, { - "epoch": 1.5, - "learning_rate": 7.428775391005257e-05, - "loss": 0.0286, + "epoch": 0.9, + "learning_rate": 0.0001653129981863596, + "loss": 0.0334, "step": 139120 }, { - "epoch": 1.5, - "learning_rate": 7.427152962554352e-05, - "loss": 0.031, + "epoch": 0.9, + "learning_rate": 0.0001653033168320027, + "loss": 0.0364, "step": 139130 }, { - "epoch": 1.5, - "learning_rate": 7.425530534103445e-05, - "loss": 0.029, + "epoch": 0.9, + "learning_rate": 0.00016529363547764572, + "loss": 0.0368, "step": 139140 }, { - "epoch": 1.51, - "learning_rate": 7.42390810565254e-05, - "loss": 0.028, + "epoch": 0.9, + "learning_rate": 0.0001652839541232888, + "loss": 0.038, "step": 139150 }, { - "epoch": 1.51, - "learning_rate": 7.422285677201635e-05, - "loss": 0.0236, + "epoch": 0.9, + "learning_rate": 0.00016527427276893188, + "loss": 0.0306, "step": 139160 }, { - "epoch": 1.51, - "learning_rate": 7.42066324875073e-05, - "loss": 0.0302, + "epoch": 0.9, + "learning_rate": 0.00016526459141457496, + "loss": 0.0424, "step": 139170 }, { - "epoch": 1.51, - "learning_rate": 7.419040820299824e-05, - "loss": 0.0249, + "epoch": 0.9, + "learning_rate": 0.000165254910060218, + "loss": 0.0373, "step": 139180 }, { - "epoch": 1.51, - "learning_rate": 7.417418391848919e-05, - "loss": 0.0264, + "epoch": 0.9, + "learning_rate": 0.0001652452287058611, + "loss": 0.0351, "step": 139190 }, { - "epoch": 1.51, - "learning_rate": 7.415795963398014e-05, - "loss": 0.0288, + "epoch": 0.9, + "learning_rate": 0.00016523554735150417, + "loss": 0.0427, "step": 139200 }, { - "epoch": 1.51, - "learning_rate": 7.414173534947109e-05, - "loss": 0.0277, + "epoch": 0.9, + "learning_rate": 0.0001652258659971472, + "loss": 0.0519, "step": 139210 }, { - "epoch": 1.51, - "learning_rate": 7.412551106496204e-05, - "loss": 0.0374, + "epoch": 0.9, + "learning_rate": 0.00016521618464279027, + "loss": 0.0424, "step": 139220 }, { - "epoch": 1.51, - "learning_rate": 7.410928678045297e-05, - "loss": 0.0249, + "epoch": 0.9, + "learning_rate": 0.00016520650328843335, + "loss": 0.0409, "step": 139230 }, { - "epoch": 1.51, - "learning_rate": 7.409306249594392e-05, - "loss": 0.0262, + "epoch": 0.9, + "learning_rate": 0.0001651968219340764, + "loss": 0.0391, "step": 139240 }, { - "epoch": 1.51, - "learning_rate": 7.407683821143487e-05, - "loss": 0.0309, + "epoch": 0.9, + "learning_rate": 0.00016518714057971949, + "loss": 0.0387, "step": 139250 }, { - "epoch": 1.51, - "learning_rate": 7.406061392692582e-05, - "loss": 0.0294, + "epoch": 0.9, + "learning_rate": 0.00016517745922536256, + "loss": 0.0444, "step": 139260 }, { - "epoch": 1.51, - "learning_rate": 7.404438964241676e-05, - "loss": 0.0326, + "epoch": 0.9, + "learning_rate": 0.00016516777787100564, + "loss": 0.0406, "step": 139270 }, { - "epoch": 1.51, - "learning_rate": 7.402816535790771e-05, - "loss": 0.0311, + "epoch": 0.9, + "learning_rate": 0.00016515809651664867, + "loss": 0.0344, "step": 139280 }, { - "epoch": 1.51, - "learning_rate": 7.401194107339866e-05, - "loss": 0.0332, + "epoch": 0.9, + "learning_rate": 0.00016514841516229175, + "loss": 0.0364, "step": 139290 }, { - "epoch": 1.51, - "learning_rate": 7.399571678888961e-05, - "loss": 0.0274, + "epoch": 0.9, + "learning_rate": 0.00016513873380793483, + "loss": 0.0383, "step": 139300 }, { - "epoch": 1.51, - "learning_rate": 7.397949250438056e-05, - "loss": 0.0347, + "epoch": 0.9, + "learning_rate": 0.00016512905245357788, + "loss": 0.0383, "step": 139310 }, { - "epoch": 1.51, - "learning_rate": 7.39632682198715e-05, - "loss": 0.0271, + "epoch": 0.9, + "learning_rate": 0.00016511937109922096, + "loss": 0.0351, "step": 139320 }, { - "epoch": 1.51, - "learning_rate": 7.394704393536244e-05, - "loss": 0.027, + "epoch": 0.9, + "learning_rate": 0.00016510968974486404, + "loss": 0.0406, "step": 139330 }, { - "epoch": 1.51, - "learning_rate": 7.39308196508534e-05, - "loss": 0.0271, + "epoch": 0.9, + "learning_rate": 0.00016510000839050712, + "loss": 0.0403, "step": 139340 }, { - "epoch": 1.51, - "learning_rate": 7.391459536634434e-05, - "loss": 0.0276, + "epoch": 0.9, + "learning_rate": 0.00016509032703615015, + "loss": 0.0403, "step": 139350 }, { - "epoch": 1.51, - "learning_rate": 7.389837108183529e-05, - "loss": 0.026, + "epoch": 0.9, + "learning_rate": 0.00016508064568179323, + "loss": 0.0374, "step": 139360 }, { - "epoch": 1.51, - "learning_rate": 7.388214679732623e-05, - "loss": 0.0263, + "epoch": 0.9, + "learning_rate": 0.0001650709643274363, + "loss": 0.0383, "step": 139370 }, { - "epoch": 1.51, - "learning_rate": 7.386592251281718e-05, - "loss": 0.0311, + "epoch": 0.9, + "learning_rate": 0.00016506128297307936, + "loss": 0.0354, "step": 139380 }, { - "epoch": 1.51, - "learning_rate": 7.384969822830813e-05, - "loss": 0.0272, + "epoch": 0.9, + "learning_rate": 0.00016505160161872244, + "loss": 0.041, "step": 139390 }, { - "epoch": 1.51, - "learning_rate": 7.383347394379908e-05, - "loss": 0.0263, + "epoch": 0.9, + "learning_rate": 0.00016504192026436552, + "loss": 0.0387, "step": 139400 }, { - "epoch": 1.51, - "learning_rate": 7.381724965929001e-05, - "loss": 0.0291, + "epoch": 0.9, + "learning_rate": 0.00016503223891000857, + "loss": 0.0319, "step": 139410 }, { - "epoch": 1.51, - "learning_rate": 7.380102537478096e-05, - "loss": 0.0235, + "epoch": 0.9, + "learning_rate": 0.00016502255755565162, + "loss": 0.0434, "step": 139420 }, { - "epoch": 1.51, - "learning_rate": 7.378480109027191e-05, - "loss": 0.04, + "epoch": 0.9, + "learning_rate": 0.0001650128762012947, + "loss": 0.0382, "step": 139430 }, { - "epoch": 1.51, - "learning_rate": 7.376857680576286e-05, - "loss": 0.0301, + "epoch": 0.9, + "learning_rate": 0.00016500319484693776, + "loss": 0.0405, "step": 139440 }, { - "epoch": 1.51, - "learning_rate": 7.375235252125381e-05, - "loss": 0.0341, + "epoch": 0.9, + "learning_rate": 0.00016499351349258084, + "loss": 0.0354, "step": 139450 }, { - "epoch": 1.51, - "learning_rate": 7.373612823674475e-05, - "loss": 0.0318, + "epoch": 0.9, + "learning_rate": 0.00016498383213822392, + "loss": 0.0454, "step": 139460 }, { - "epoch": 1.51, - "learning_rate": 7.37199039522357e-05, - "loss": 0.0333, + "epoch": 0.9, + "learning_rate": 0.000164974150783867, + "loss": 0.0429, "step": 139470 }, { - "epoch": 1.51, - "learning_rate": 7.370367966772665e-05, - "loss": 0.0316, + "epoch": 0.9, + "learning_rate": 0.00016496446942951005, + "loss": 0.0434, "step": 139480 }, { - "epoch": 1.51, - "learning_rate": 7.36874553832176e-05, - "loss": 0.0376, + "epoch": 0.9, + "learning_rate": 0.0001649547880751531, + "loss": 0.0389, "step": 139490 }, { - "epoch": 1.51, - "learning_rate": 7.367123109870854e-05, - "loss": 0.0254, + "epoch": 0.9, + "learning_rate": 0.00016494510672079618, + "loss": 0.0436, "step": 139500 }, { - "epoch": 1.51, - "learning_rate": 7.365500681419949e-05, - "loss": 0.0393, + "epoch": 0.9, + "learning_rate": 0.00016493542536643923, + "loss": 0.0375, "step": 139510 }, { - "epoch": 1.51, - "learning_rate": 7.363878252969044e-05, - "loss": 0.0259, + "epoch": 0.9, + "learning_rate": 0.00016492574401208231, + "loss": 0.0385, "step": 139520 }, { - "epoch": 1.51, - "learning_rate": 7.362255824518139e-05, - "loss": 0.0332, + "epoch": 0.9, + "learning_rate": 0.0001649160626577254, + "loss": 0.0492, "step": 139530 }, { - "epoch": 1.51, - "learning_rate": 7.360633396067233e-05, - "loss": 0.0219, + "epoch": 0.9, + "learning_rate": 0.00016490638130336847, + "loss": 0.0357, "step": 139540 }, { - "epoch": 1.51, - "learning_rate": 7.359010967616327e-05, - "loss": 0.0289, + "epoch": 0.9, + "learning_rate": 0.00016489669994901153, + "loss": 0.0365, "step": 139550 }, { - "epoch": 1.51, - "learning_rate": 7.357388539165422e-05, - "loss": 0.0291, + "epoch": 0.9, + "learning_rate": 0.00016488701859465458, + "loss": 0.0448, "step": 139560 }, { - "epoch": 1.51, - "learning_rate": 7.355766110714517e-05, - "loss": 0.0296, + "epoch": 0.9, + "learning_rate": 0.00016487733724029766, + "loss": 0.0379, "step": 139570 }, { - "epoch": 1.51, - "learning_rate": 7.354143682263612e-05, - "loss": 0.0329, + "epoch": 0.9, + "learning_rate": 0.0001648676558859407, + "loss": 0.036, "step": 139580 }, { - "epoch": 1.51, - "learning_rate": 7.352521253812706e-05, - "loss": 0.03, + "epoch": 0.9, + "learning_rate": 0.0001648579745315838, + "loss": 0.0388, "step": 139590 }, { - "epoch": 1.51, - "learning_rate": 7.3508988253618e-05, - "loss": 0.0269, + "epoch": 0.9, + "learning_rate": 0.00016484829317722687, + "loss": 0.0486, "step": 139600 }, { - "epoch": 1.51, - "learning_rate": 7.349276396910896e-05, - "loss": 0.0326, + "epoch": 0.9, + "learning_rate": 0.00016483861182286992, + "loss": 0.0347, "step": 139610 }, { - "epoch": 1.51, - "learning_rate": 7.34765396845999e-05, - "loss": 0.0317, + "epoch": 0.9, + "learning_rate": 0.000164828930468513, + "loss": 0.0335, "step": 139620 }, { - "epoch": 1.51, - "learning_rate": 7.346031540009086e-05, - "loss": 0.0265, + "epoch": 0.9, + "learning_rate": 0.00016481924911415606, + "loss": 0.041, "step": 139630 }, { - "epoch": 1.51, - "learning_rate": 7.344409111558179e-05, - "loss": 0.0291, + "epoch": 0.9, + "learning_rate": 0.0001648095677597991, + "loss": 0.0334, "step": 139640 }, { - "epoch": 1.51, - "learning_rate": 7.342786683107274e-05, - "loss": 0.0293, + "epoch": 0.9, + "learning_rate": 0.0001647998864054422, + "loss": 0.0494, "step": 139650 }, { - "epoch": 1.51, - "learning_rate": 7.341164254656369e-05, - "loss": 0.0292, + "epoch": 0.9, + "learning_rate": 0.00016479020505108527, + "loss": 0.0455, "step": 139660 }, { - "epoch": 1.51, - "learning_rate": 7.339541826205464e-05, - "loss": 0.028, + "epoch": 0.9, + "learning_rate": 0.00016478052369672835, + "loss": 0.034, "step": 139670 }, { - "epoch": 1.51, - "learning_rate": 7.337919397754558e-05, - "loss": 0.0294, + "epoch": 0.9, + "learning_rate": 0.0001647708423423714, + "loss": 0.0378, "step": 139680 }, { - "epoch": 1.51, - "learning_rate": 7.336296969303653e-05, - "loss": 0.0301, + "epoch": 0.9, + "learning_rate": 0.00016476116098801448, + "loss": 0.0422, "step": 139690 }, { - "epoch": 1.51, - "learning_rate": 7.334674540852748e-05, - "loss": 0.0286, + "epoch": 0.9, + "learning_rate": 0.00016475147963365753, + "loss": 0.0385, "step": 139700 }, { - "epoch": 1.51, - "learning_rate": 7.333052112401843e-05, - "loss": 0.0286, + "epoch": 0.9, + "learning_rate": 0.00016474179827930059, + "loss": 0.0412, "step": 139710 }, { - "epoch": 1.51, - "learning_rate": 7.331429683950938e-05, - "loss": 0.0363, + "epoch": 0.9, + "learning_rate": 0.00016473211692494367, + "loss": 0.0365, "step": 139720 }, { - "epoch": 1.51, - "learning_rate": 7.329807255500031e-05, - "loss": 0.0276, + "epoch": 0.9, + "learning_rate": 0.00016472243557058675, + "loss": 0.034, "step": 139730 }, { - "epoch": 1.51, - "learning_rate": 7.328184827049126e-05, - "loss": 0.0341, + "epoch": 0.9, + "learning_rate": 0.00016471275421622983, + "loss": 0.0368, "step": 139740 }, { - "epoch": 1.51, - "learning_rate": 7.326562398598221e-05, - "loss": 0.0307, + "epoch": 0.9, + "learning_rate": 0.00016470307286187288, + "loss": 0.0343, "step": 139750 }, { - "epoch": 1.51, - "learning_rate": 7.324939970147316e-05, - "loss": 0.0342, + "epoch": 0.9, + "learning_rate": 0.00016469339150751596, + "loss": 0.0388, "step": 139760 }, { - "epoch": 1.51, - "learning_rate": 7.32331754169641e-05, - "loss": 0.0256, + "epoch": 0.9, + "learning_rate": 0.000164683710153159, + "loss": 0.0499, "step": 139770 }, { - "epoch": 1.51, - "learning_rate": 7.321695113245505e-05, - "loss": 0.025, + "epoch": 0.9, + "learning_rate": 0.00016467402879880206, + "loss": 0.0396, "step": 139780 }, { - "epoch": 1.51, - "learning_rate": 7.3200726847946e-05, - "loss": 0.0319, + "epoch": 0.9, + "learning_rate": 0.00016466434744444514, + "loss": 0.0423, "step": 139790 }, { - "epoch": 1.51, - "learning_rate": 7.318450256343695e-05, - "loss": 0.0298, + "epoch": 0.9, + "learning_rate": 0.00016465466609008822, + "loss": 0.0412, "step": 139800 }, { - "epoch": 1.51, - "learning_rate": 7.31682782789279e-05, - "loss": 0.0303, + "epoch": 0.9, + "learning_rate": 0.00016464498473573128, + "loss": 0.0418, "step": 139810 }, { - "epoch": 1.51, - "learning_rate": 7.315205399441883e-05, - "loss": 0.0305, + "epoch": 0.9, + "learning_rate": 0.00016463530338137436, + "loss": 0.04, "step": 139820 }, { - "epoch": 1.51, - "learning_rate": 7.313582970990978e-05, - "loss": 0.0281, + "epoch": 0.9, + "learning_rate": 0.00016462562202701744, + "loss": 0.0367, "step": 139830 }, { - "epoch": 1.51, - "learning_rate": 7.311960542540073e-05, - "loss": 0.0254, + "epoch": 0.9, + "learning_rate": 0.00016461594067266046, + "loss": 0.042, "step": 139840 }, { - "epoch": 1.51, - "learning_rate": 7.310338114089168e-05, - "loss": 0.0565, + "epoch": 0.9, + "learning_rate": 0.00016460625931830354, + "loss": 0.0402, "step": 139850 }, { - "epoch": 1.51, - "learning_rate": 7.308715685638262e-05, - "loss": 0.0253, + "epoch": 0.9, + "learning_rate": 0.00016459657796394662, + "loss": 0.0433, "step": 139860 }, { - "epoch": 1.51, - "learning_rate": 7.307093257187357e-05, - "loss": 0.0356, + "epoch": 0.9, + "learning_rate": 0.0001645868966095897, + "loss": 0.0346, "step": 139870 }, { - "epoch": 1.51, - "learning_rate": 7.305470828736452e-05, - "loss": 0.0316, + "epoch": 0.9, + "learning_rate": 0.00016457721525523275, + "loss": 0.0394, "step": 139880 }, { - "epoch": 1.51, - "learning_rate": 7.303848400285547e-05, - "loss": 0.029, + "epoch": 0.9, + "learning_rate": 0.00016456753390087583, + "loss": 0.0377, "step": 139890 }, { - "epoch": 1.51, - "learning_rate": 7.302225971834642e-05, - "loss": 0.0325, + "epoch": 0.9, + "learning_rate": 0.0001645578525465189, + "loss": 0.0339, "step": 139900 }, { - "epoch": 1.51, - "learning_rate": 7.300603543383735e-05, - "loss": 0.0352, + "epoch": 0.9, + "learning_rate": 0.00016454817119216194, + "loss": 0.0372, "step": 139910 }, { - "epoch": 1.51, - "learning_rate": 7.29898111493283e-05, - "loss": 0.0267, + "epoch": 0.9, + "learning_rate": 0.00016453848983780502, + "loss": 0.0351, "step": 139920 }, { - "epoch": 1.51, - "learning_rate": 7.297358686481925e-05, - "loss": 0.0419, + "epoch": 0.9, + "learning_rate": 0.0001645288084834481, + "loss": 0.0408, "step": 139930 }, { - "epoch": 1.51, - "learning_rate": 7.29573625803102e-05, - "loss": 0.0242, + "epoch": 0.9, + "learning_rate": 0.00016451912712909118, + "loss": 0.041, "step": 139940 }, { - "epoch": 1.51, - "learning_rate": 7.294113829580114e-05, - "loss": 0.0322, + "epoch": 0.9, + "learning_rate": 0.00016450944577473423, + "loss": 0.0504, "step": 139950 }, { - "epoch": 1.51, - "learning_rate": 7.292491401129209e-05, - "loss": 0.0257, + "epoch": 0.9, + "learning_rate": 0.0001644997644203773, + "loss": 0.0447, "step": 139960 }, { - "epoch": 1.51, - "learning_rate": 7.290868972678304e-05, - "loss": 0.0339, + "epoch": 0.9, + "learning_rate": 0.0001644900830660204, + "loss": 0.0451, "step": 139970 }, { - "epoch": 1.51, - "learning_rate": 7.289246544227399e-05, - "loss": 0.0253, + "epoch": 0.9, + "learning_rate": 0.00016448040171166342, + "loss": 0.0405, "step": 139980 }, { - "epoch": 1.51, - "learning_rate": 7.287624115776494e-05, - "loss": 0.0299, + "epoch": 0.9, + "learning_rate": 0.0001644707203573065, + "loss": 0.0367, "step": 139990 }, { - "epoch": 1.51, - "learning_rate": 7.286001687325588e-05, - "loss": 0.0256, + "epoch": 0.9, + "learning_rate": 0.00016446103900294958, + "loss": 0.0372, "step": 140000 }, { - "epoch": 1.51, - "eval_cer": 0.9211419564936981, - "eval_loss": 0.023512214422225952, - "eval_runtime": 118.9538, - "eval_samples_per_second": 16.813, - "eval_steps_per_second": 4.203, + "epoch": 0.9, + "eval_cer": 0.9199656535984635, + "eval_loss": 0.027039654552936554, + "eval_runtime": 119.7354, + "eval_samples_per_second": 16.703, + "eval_steps_per_second": 4.176, "step": 140000 }, { - "epoch": 1.51, - "learning_rate": 7.284379258874682e-05, - "loss": 0.0287, + "epoch": 0.9, + "learning_rate": 0.00016445135764859263, + "loss": 0.0391, "step": 140010 }, { - "epoch": 1.51, - "learning_rate": 7.282756830423777e-05, - "loss": 0.0254, + "epoch": 0.9, + "learning_rate": 0.0001644416762942357, + "loss": 0.0405, "step": 140020 }, { - "epoch": 1.51, - "learning_rate": 7.281134401972872e-05, - "loss": 0.0311, + "epoch": 0.9, + "learning_rate": 0.0001644319949398788, + "loss": 0.0441, "step": 140030 }, { - "epoch": 1.51, - "learning_rate": 7.279511973521966e-05, - "loss": 0.0289, + "epoch": 0.9, + "learning_rate": 0.00016442231358552187, + "loss": 0.0399, "step": 140040 }, { - "epoch": 1.51, - "learning_rate": 7.277889545071061e-05, - "loss": 0.0266, + "epoch": 0.9, + "learning_rate": 0.0001644126322311649, + "loss": 0.0372, "step": 140050 }, { - "epoch": 1.51, - "learning_rate": 7.276267116620156e-05, - "loss": 0.028, + "epoch": 0.9, + "learning_rate": 0.00016440295087680797, + "loss": 0.0386, "step": 140060 }, { - "epoch": 1.52, - "learning_rate": 7.274644688169251e-05, - "loss": 0.0315, + "epoch": 0.9, + "learning_rate": 0.00016439326952245105, + "loss": 0.0398, "step": 140070 }, { - "epoch": 1.52, - "learning_rate": 7.273022259718346e-05, - "loss": 0.0274, + "epoch": 0.9, + "learning_rate": 0.0001643835881680941, + "loss": 0.0358, "step": 140080 }, { - "epoch": 1.52, - "learning_rate": 7.27139983126744e-05, - "loss": 0.0294, + "epoch": 0.9, + "learning_rate": 0.00016437390681373718, + "loss": 0.0388, "step": 140090 }, { - "epoch": 1.52, - "learning_rate": 7.269777402816535e-05, - "loss": 0.0302, + "epoch": 0.9, + "learning_rate": 0.00016436422545938026, + "loss": 0.0381, "step": 140100 }, { - "epoch": 1.52, - "learning_rate": 7.26815497436563e-05, - "loss": 0.0315, + "epoch": 0.9, + "learning_rate": 0.00016435454410502334, + "loss": 0.0417, "step": 140110 }, { - "epoch": 1.52, - "learning_rate": 7.266532545914725e-05, - "loss": 0.0294, + "epoch": 0.9, + "learning_rate": 0.00016434486275066637, + "loss": 0.0428, "step": 140120 }, { - "epoch": 1.52, - "learning_rate": 7.26491011746382e-05, - "loss": 0.0302, + "epoch": 0.9, + "learning_rate": 0.00016433518139630945, + "loss": 0.0348, "step": 140130 }, { - "epoch": 1.52, - "learning_rate": 7.263287689012913e-05, - "loss": 0.0261, + "epoch": 0.9, + "learning_rate": 0.00016432550004195253, + "loss": 0.0335, "step": 140140 }, { - "epoch": 1.52, - "learning_rate": 7.261665260562008e-05, - "loss": 0.0326, + "epoch": 0.9, + "learning_rate": 0.00016431581868759558, + "loss": 0.0435, "step": 140150 }, { - "epoch": 1.52, - "learning_rate": 7.260042832111103e-05, - "loss": 0.0307, + "epoch": 0.9, + "learning_rate": 0.00016430613733323866, + "loss": 0.0394, "step": 140160 }, { - "epoch": 1.52, - "learning_rate": 7.258420403660198e-05, - "loss": 0.034, + "epoch": 0.9, + "learning_rate": 0.00016429645597888174, + "loss": 0.0455, "step": 140170 }, { - "epoch": 1.52, - "learning_rate": 7.256797975209292e-05, - "loss": 0.026, + "epoch": 0.9, + "learning_rate": 0.00016428677462452482, + "loss": 0.0372, "step": 140180 }, { - "epoch": 1.52, - "learning_rate": 7.255175546758387e-05, - "loss": 0.032, + "epoch": 0.9, + "learning_rate": 0.00016427709327016785, + "loss": 0.0365, "step": 140190 }, { - "epoch": 1.52, - "learning_rate": 7.253553118307482e-05, - "loss": 0.0275, + "epoch": 0.9, + "learning_rate": 0.00016426741191581093, + "loss": 0.039, "step": 140200 }, { - "epoch": 1.52, - "learning_rate": 7.251930689856577e-05, - "loss": 0.0324, + "epoch": 0.9, + "learning_rate": 0.00016425773056145398, + "loss": 0.041, "step": 140210 }, { - "epoch": 1.52, - "learning_rate": 7.250308261405672e-05, - "loss": 0.0292, + "epoch": 0.91, + "learning_rate": 0.00016424804920709706, + "loss": 0.0348, "step": 140220 }, { - "epoch": 1.52, - "learning_rate": 7.248685832954767e-05, - "loss": 0.0295, + "epoch": 0.91, + "learning_rate": 0.00016423836785274014, + "loss": 0.0384, "step": 140230 }, { - "epoch": 1.52, - "learning_rate": 7.247063404503862e-05, - "loss": 0.0266, + "epoch": 0.91, + "learning_rate": 0.00016422868649838322, + "loss": 0.0394, "step": 140240 }, { - "epoch": 1.52, - "learning_rate": 7.245440976052955e-05, - "loss": 0.0294, + "epoch": 0.91, + "learning_rate": 0.00016421900514402627, + "loss": 0.0394, "step": 140250 }, { - "epoch": 1.52, - "learning_rate": 7.24381854760205e-05, - "loss": 0.0292, + "epoch": 0.91, + "learning_rate": 0.00016420932378966932, + "loss": 0.042, "step": 140260 }, { - "epoch": 1.52, - "learning_rate": 7.242196119151145e-05, - "loss": 0.0315, + "epoch": 0.91, + "learning_rate": 0.0001641996424353124, + "loss": 0.0399, "step": 140270 }, { - "epoch": 1.52, - "learning_rate": 7.24057369070024e-05, - "loss": 0.0296, + "epoch": 0.91, + "learning_rate": 0.00016418996108095546, + "loss": 0.0433, "step": 140280 }, { - "epoch": 1.52, - "learning_rate": 7.238951262249335e-05, - "loss": 0.028, + "epoch": 0.91, + "learning_rate": 0.00016418027972659854, + "loss": 0.0421, "step": 140290 }, { - "epoch": 1.52, - "learning_rate": 7.237328833798429e-05, - "loss": 0.0314, + "epoch": 0.91, + "learning_rate": 0.00016417059837224162, + "loss": 0.0371, "step": 140300 }, { - "epoch": 1.52, - "learning_rate": 7.235706405347524e-05, - "loss": 0.0289, + "epoch": 0.91, + "learning_rate": 0.0001641609170178847, + "loss": 0.0382, "step": 140310 }, { - "epoch": 1.52, - "learning_rate": 7.234083976896619e-05, - "loss": 0.0291, + "epoch": 0.91, + "learning_rate": 0.00016415123566352775, + "loss": 0.0345, "step": 140320 }, { - "epoch": 1.52, - "learning_rate": 7.232461548445714e-05, - "loss": 0.0298, + "epoch": 0.91, + "learning_rate": 0.0001641415543091708, + "loss": 0.0381, "step": 140330 }, { - "epoch": 1.52, - "learning_rate": 7.230839119994807e-05, - "loss": 0.0256, + "epoch": 0.91, + "learning_rate": 0.00016413187295481388, + "loss": 0.0347, "step": 140340 }, { - "epoch": 1.52, - "learning_rate": 7.229216691543902e-05, - "loss": 0.0248, + "epoch": 0.91, + "learning_rate": 0.00016412219160045693, + "loss": 0.0356, "step": 140350 }, { - "epoch": 1.52, - "learning_rate": 7.227594263092997e-05, - "loss": 0.0275, + "epoch": 0.91, + "learning_rate": 0.00016411251024610001, + "loss": 0.0433, "step": 140360 }, { - "epoch": 1.52, - "learning_rate": 7.225971834642092e-05, - "loss": 0.03, + "epoch": 0.91, + "learning_rate": 0.0001641028288917431, + "loss": 0.0404, "step": 140370 }, { - "epoch": 1.52, - "learning_rate": 7.224349406191187e-05, - "loss": 0.028, + "epoch": 0.91, + "learning_rate": 0.00016409314753738617, + "loss": 0.0403, "step": 140380 }, { - "epoch": 1.52, - "learning_rate": 7.222726977740281e-05, - "loss": 0.0364, + "epoch": 0.91, + "learning_rate": 0.00016408346618302923, + "loss": 0.0419, "step": 140390 }, { - "epoch": 1.52, - "learning_rate": 7.221104549289376e-05, - "loss": 0.0259, + "epoch": 0.91, + "learning_rate": 0.00016407378482867228, + "loss": 0.0398, "step": 140400 }, { - "epoch": 1.52, - "learning_rate": 7.219482120838471e-05, - "loss": 0.0262, + "epoch": 0.91, + "learning_rate": 0.00016406410347431533, + "loss": 0.0423, "step": 140410 }, { - "epoch": 1.52, - "learning_rate": 7.217859692387566e-05, - "loss": 0.0275, + "epoch": 0.91, + "learning_rate": 0.0001640544221199584, + "loss": 0.0393, "step": 140420 }, { - "epoch": 1.52, - "learning_rate": 7.216237263936661e-05, - "loss": 0.0272, + "epoch": 0.91, + "learning_rate": 0.0001640447407656015, + "loss": 0.0383, "step": 140430 }, { - "epoch": 1.52, - "learning_rate": 7.214614835485754e-05, - "loss": 0.0325, + "epoch": 0.91, + "learning_rate": 0.00016403505941124457, + "loss": 0.0364, "step": 140440 }, { - "epoch": 1.52, - "learning_rate": 7.212992407034849e-05, - "loss": 0.033, + "epoch": 0.91, + "learning_rate": 0.00016402537805688762, + "loss": 0.0392, "step": 140450 }, { - "epoch": 1.52, - "learning_rate": 7.211369978583944e-05, - "loss": 0.0302, + "epoch": 0.91, + "learning_rate": 0.0001640156967025307, + "loss": 0.0403, "step": 140460 }, { - "epoch": 1.52, - "learning_rate": 7.209747550133039e-05, - "loss": 0.0357, + "epoch": 0.91, + "learning_rate": 0.00016400601534817376, + "loss": 0.0404, "step": 140470 }, { - "epoch": 1.52, - "learning_rate": 7.208125121682133e-05, - "loss": 0.0304, + "epoch": 0.91, + "learning_rate": 0.0001639963339938168, + "loss": 0.038, "step": 140480 }, { - "epoch": 1.52, - "learning_rate": 7.206502693231228e-05, - "loss": 0.0312, + "epoch": 0.91, + "learning_rate": 0.0001639866526394599, + "loss": 0.0427, "step": 140490 }, { - "epoch": 1.52, - "learning_rate": 7.204880264780323e-05, - "loss": 0.0302, + "epoch": 0.91, + "learning_rate": 0.00016397697128510297, + "loss": 0.0407, "step": 140500 }, { - "epoch": 1.52, - "learning_rate": 7.203257836329418e-05, - "loss": 0.0307, + "epoch": 0.91, + "learning_rate": 0.00016396728993074605, + "loss": 0.0416, "step": 140510 }, { - "epoch": 1.52, - "learning_rate": 7.201635407878513e-05, - "loss": 0.0313, + "epoch": 0.91, + "learning_rate": 0.0001639576085763891, + "loss": 0.0385, "step": 140520 }, { - "epoch": 1.52, - "learning_rate": 7.200012979427606e-05, - "loss": 0.0272, + "epoch": 0.91, + "learning_rate": 0.00016394792722203218, + "loss": 0.0392, "step": 140530 }, { - "epoch": 1.52, - "learning_rate": 7.198390550976701e-05, - "loss": 0.0321, + "epoch": 0.91, + "learning_rate": 0.00016393824586767523, + "loss": 0.0389, "step": 140540 }, { - "epoch": 1.52, - "learning_rate": 7.196768122525796e-05, - "loss": 0.0367, + "epoch": 0.91, + "learning_rate": 0.00016392856451331829, + "loss": 0.0402, "step": 140550 }, { - "epoch": 1.52, - "learning_rate": 7.195145694074891e-05, - "loss": 0.0271, + "epoch": 0.91, + "learning_rate": 0.00016391888315896137, + "loss": 0.0401, "step": 140560 }, { - "epoch": 1.52, - "learning_rate": 7.193523265623985e-05, - "loss": 0.0297, + "epoch": 0.91, + "learning_rate": 0.00016390920180460445, + "loss": 0.0355, "step": 140570 }, { - "epoch": 1.52, - "learning_rate": 7.19190083717308e-05, - "loss": 0.0288, + "epoch": 0.91, + "learning_rate": 0.00016389952045024753, + "loss": 0.0398, "step": 140580 }, { - "epoch": 1.52, - "learning_rate": 7.190278408722175e-05, - "loss": 0.0325, + "epoch": 0.91, + "learning_rate": 0.00016388983909589058, + "loss": 0.0339, "step": 140590 }, { - "epoch": 1.52, - "learning_rate": 7.18865598027127e-05, - "loss": 0.0293, + "epoch": 0.91, + "learning_rate": 0.00016388015774153366, + "loss": 0.0413, "step": 140600 }, { - "epoch": 1.52, - "learning_rate": 7.187033551820365e-05, - "loss": 0.0282, + "epoch": 0.91, + "learning_rate": 0.00016387047638717668, + "loss": 0.0455, "step": 140610 }, { - "epoch": 1.52, - "learning_rate": 7.185411123369458e-05, - "loss": 0.029, + "epoch": 0.91, + "learning_rate": 0.00016386079503281976, + "loss": 0.0361, "step": 140620 }, { - "epoch": 1.52, - "learning_rate": 7.183788694918553e-05, - "loss": 0.028, - "step": 140630 + "epoch": 0.91, + "learning_rate": 0.00016385111367846284, + "loss": 0.046, + "step": 140630 }, { - "epoch": 1.52, - "learning_rate": 7.182166266467648e-05, - "loss": 0.028, + "epoch": 0.91, + "learning_rate": 0.00016384143232410592, + "loss": 0.0408, "step": 140640 }, { - "epoch": 1.52, - "learning_rate": 7.180543838016743e-05, - "loss": 0.0356, + "epoch": 0.91, + "learning_rate": 0.00016383175096974898, + "loss": 0.0424, "step": 140650 }, { - "epoch": 1.52, - "learning_rate": 7.178921409565837e-05, - "loss": 0.0286, + "epoch": 0.91, + "learning_rate": 0.00016382206961539206, + "loss": 0.0339, "step": 140660 }, { - "epoch": 1.52, - "learning_rate": 7.177298981114932e-05, - "loss": 0.0291, + "epoch": 0.91, + "learning_rate": 0.00016381238826103514, + "loss": 0.0346, "step": 140670 }, { - "epoch": 1.52, - "learning_rate": 7.175676552664027e-05, - "loss": 0.0322, + "epoch": 0.91, + "learning_rate": 0.00016380270690667816, + "loss": 0.0387, "step": 140680 }, { - "epoch": 1.52, - "learning_rate": 7.174054124213122e-05, - "loss": 0.0296, + "epoch": 0.91, + "learning_rate": 0.00016379302555232124, + "loss": 0.0429, "step": 140690 }, { - "epoch": 1.52, - "learning_rate": 7.172431695762217e-05, - "loss": 0.0292, + "epoch": 0.91, + "learning_rate": 0.00016378334419796432, + "loss": 0.0408, "step": 140700 }, { - "epoch": 1.52, - "learning_rate": 7.17080926731131e-05, - "loss": 0.0297, + "epoch": 0.91, + "learning_rate": 0.0001637736628436074, + "loss": 0.0425, "step": 140710 }, { - "epoch": 1.52, - "learning_rate": 7.169186838860406e-05, - "loss": 0.0301, + "epoch": 0.91, + "learning_rate": 0.00016376398148925045, + "loss": 0.0438, "step": 140720 }, { - "epoch": 1.52, - "learning_rate": 7.1675644104095e-05, - "loss": 0.0314, + "epoch": 0.91, + "learning_rate": 0.00016375430013489353, + "loss": 0.0411, "step": 140730 }, { - "epoch": 1.52, - "learning_rate": 7.165941981958595e-05, - "loss": 0.0319, + "epoch": 0.91, + "learning_rate": 0.0001637446187805366, + "loss": 0.038, "step": 140740 }, { - "epoch": 1.52, - "learning_rate": 7.164319553507689e-05, - "loss": 0.0283, + "epoch": 0.91, + "learning_rate": 0.00016373493742617964, + "loss": 0.044, "step": 140750 }, { - "epoch": 1.52, - "learning_rate": 7.162697125056784e-05, - "loss": 0.0301, + "epoch": 0.91, + "learning_rate": 0.00016372525607182272, + "loss": 0.0361, "step": 140760 }, { - "epoch": 1.52, - "learning_rate": 7.161074696605879e-05, - "loss": 0.0237, + "epoch": 0.91, + "learning_rate": 0.0001637155747174658, + "loss": 0.0422, "step": 140770 }, { - "epoch": 1.52, - "learning_rate": 7.159452268154974e-05, - "loss": 0.0315, + "epoch": 0.91, + "learning_rate": 0.00016370589336310888, + "loss": 0.039, "step": 140780 }, { - "epoch": 1.52, - "learning_rate": 7.157829839704069e-05, - "loss": 0.0311, + "epoch": 0.91, + "learning_rate": 0.00016369621200875193, + "loss": 0.0425, "step": 140790 }, { - "epoch": 1.52, - "learning_rate": 7.156207411253163e-05, - "loss": 0.0268, + "epoch": 0.91, + "learning_rate": 0.000163686530654395, + "loss": 0.0383, "step": 140800 }, { - "epoch": 1.52, - "learning_rate": 7.154584982802258e-05, - "loss": 0.0288, + "epoch": 0.91, + "learning_rate": 0.0001636768493000381, + "loss": 0.0391, "step": 140810 }, { - "epoch": 1.52, - "learning_rate": 7.152962554351353e-05, - "loss": 0.0292, + "epoch": 0.91, + "learning_rate": 0.00016366716794568112, + "loss": 0.0358, "step": 140820 }, { - "epoch": 1.52, - "learning_rate": 7.151340125900448e-05, - "loss": 0.034, + "epoch": 0.91, + "learning_rate": 0.0001636574865913242, + "loss": 0.0391, "step": 140830 }, { - "epoch": 1.52, - "learning_rate": 7.149717697449541e-05, - "loss": 0.0295, + "epoch": 0.91, + "learning_rate": 0.00016364780523696727, + "loss": 0.0474, "step": 140840 }, { - "epoch": 1.52, - "learning_rate": 7.148095268998636e-05, - "loss": 0.0293, + "epoch": 0.91, + "learning_rate": 0.00016363812388261033, + "loss": 0.0406, "step": 140850 }, { - "epoch": 1.52, - "learning_rate": 7.146472840547731e-05, - "loss": 0.0296, + "epoch": 0.91, + "learning_rate": 0.0001636284425282534, + "loss": 0.0379, "step": 140860 }, { - "epoch": 1.52, - "learning_rate": 7.144850412096826e-05, - "loss": 0.0299, + "epoch": 0.91, + "learning_rate": 0.0001636187611738965, + "loss": 0.0398, "step": 140870 }, { - "epoch": 1.52, - "learning_rate": 7.143227983645921e-05, - "loss": 0.0294, + "epoch": 0.91, + "learning_rate": 0.00016360907981953957, + "loss": 0.0345, "step": 140880 }, { - "epoch": 1.52, - "learning_rate": 7.141605555195015e-05, - "loss": 0.0264, + "epoch": 0.91, + "learning_rate": 0.0001635993984651826, + "loss": 0.0348, "step": 140890 }, { - "epoch": 1.52, - "learning_rate": 7.13998312674411e-05, - "loss": 0.0293, + "epoch": 0.91, + "learning_rate": 0.00016358971711082567, + "loss": 0.0368, "step": 140900 }, { - "epoch": 1.52, - "learning_rate": 7.138360698293205e-05, - "loss": 0.0288, + "epoch": 0.91, + "learning_rate": 0.00016358003575646875, + "loss": 0.0464, "step": 140910 }, { - "epoch": 1.52, - "learning_rate": 7.1367382698423e-05, - "loss": 0.026, + "epoch": 0.91, + "learning_rate": 0.0001635703544021118, + "loss": 0.0372, "step": 140920 }, { - "epoch": 1.52, - "learning_rate": 7.135115841391393e-05, - "loss": 0.0294, + "epoch": 0.91, + "learning_rate": 0.00016356067304775488, + "loss": 0.0369, "step": 140930 }, { - "epoch": 1.52, - "learning_rate": 7.133493412940488e-05, - "loss": 0.0302, + "epoch": 0.91, + "learning_rate": 0.00016355099169339796, + "loss": 0.0455, "step": 140940 }, { - "epoch": 1.52, - "learning_rate": 7.131870984489583e-05, - "loss": 0.0323, + "epoch": 0.91, + "learning_rate": 0.00016354131033904104, + "loss": 0.0395, "step": 140950 }, { - "epoch": 1.52, - "learning_rate": 7.130248556038678e-05, - "loss": 0.0309, + "epoch": 0.91, + "learning_rate": 0.00016353162898468407, + "loss": 0.0417, "step": 140960 }, { - "epoch": 1.52, - "learning_rate": 7.128626127587773e-05, - "loss": 0.0264, + "epoch": 0.91, + "learning_rate": 0.00016352194763032715, + "loss": 0.0537, "step": 140970 }, { - "epoch": 1.52, - "learning_rate": 7.127003699136867e-05, - "loss": 0.0291, + "epoch": 0.91, + "learning_rate": 0.00016351226627597023, + "loss": 0.039, "step": 140980 }, { - "epoch": 1.52, - "learning_rate": 7.125381270685962e-05, - "loss": 0.0296, + "epoch": 0.91, + "learning_rate": 0.00016350258492161328, + "loss": 0.0389, "step": 140990 }, { - "epoch": 1.53, - "learning_rate": 7.123758842235057e-05, - "loss": 0.0312, + "epoch": 0.91, + "learning_rate": 0.00016349290356725636, + "loss": 0.0381, "step": 141000 }, { - "epoch": 1.53, - "eval_cer": 0.9211083840895076, - "eval_loss": 0.02374228648841381, - "eval_runtime": 118.8254, - "eval_samples_per_second": 16.831, - "eval_steps_per_second": 4.208, + "epoch": 0.91, + "eval_cer": 0.9199078070274546, + "eval_loss": 0.026563717052340508, + "eval_runtime": 120.0005, + "eval_samples_per_second": 16.667, + "eval_steps_per_second": 4.167, "step": 141000 }, { - "epoch": 1.53, - "learning_rate": 7.122136413784152e-05, - "loss": 0.0212, + "epoch": 0.91, + "learning_rate": 0.00016348322221289944, + "loss": 0.0438, "step": 141010 }, { - "epoch": 1.53, - "learning_rate": 7.120513985333245e-05, - "loss": 0.0304, + "epoch": 0.91, + "learning_rate": 0.0001634735408585425, + "loss": 0.038, "step": 141020 }, { - "epoch": 1.53, - "learning_rate": 7.11889155688234e-05, - "loss": 0.0315, + "epoch": 0.91, + "learning_rate": 0.00016346385950418555, + "loss": 0.0431, "step": 141030 }, { - "epoch": 1.53, - "learning_rate": 7.117269128431435e-05, - "loss": 0.0323, + "epoch": 0.91, + "learning_rate": 0.00016345417814982863, + "loss": 0.0427, "step": 141040 }, { - "epoch": 1.53, - "learning_rate": 7.11564669998053e-05, - "loss": 0.0239, + "epoch": 0.91, + "learning_rate": 0.00016344449679547168, + "loss": 0.0396, "step": 141050 }, { - "epoch": 1.53, - "learning_rate": 7.114024271529625e-05, - "loss": 0.0271, + "epoch": 0.91, + "learning_rate": 0.00016343481544111476, + "loss": 0.0437, "step": 141060 }, { - "epoch": 1.53, - "learning_rate": 7.112401843078719e-05, - "loss": 0.0321, + "epoch": 0.91, + "learning_rate": 0.00016342513408675784, + "loss": 0.0415, "step": 141070 }, { - "epoch": 1.53, - "learning_rate": 7.110779414627814e-05, - "loss": 0.028, + "epoch": 0.91, + "learning_rate": 0.00016341545273240092, + "loss": 0.0381, "step": 141080 }, { - "epoch": 1.53, - "learning_rate": 7.109156986176909e-05, - "loss": 0.0355, + "epoch": 0.91, + "learning_rate": 0.00016340577137804397, + "loss": 0.0416, "step": 141090 }, { - "epoch": 1.53, - "learning_rate": 7.107534557726004e-05, - "loss": 0.03, + "epoch": 0.91, + "learning_rate": 0.00016339609002368702, + "loss": 0.0392, "step": 141100 }, { - "epoch": 1.53, - "learning_rate": 7.105912129275097e-05, - "loss": 0.0316, + "epoch": 0.91, + "learning_rate": 0.0001633864086693301, + "loss": 0.045, "step": 141110 }, { - "epoch": 1.53, - "learning_rate": 7.104289700824192e-05, - "loss": 0.0284, + "epoch": 0.91, + "learning_rate": 0.00016337672731497316, + "loss": 0.0398, "step": 141120 }, { - "epoch": 1.53, - "learning_rate": 7.102667272373287e-05, - "loss": 0.0234, + "epoch": 0.91, + "learning_rate": 0.00016336704596061624, + "loss": 0.037, "step": 141130 }, { - "epoch": 1.53, - "learning_rate": 7.101044843922382e-05, - "loss": 0.0269, + "epoch": 0.91, + "learning_rate": 0.00016335736460625932, + "loss": 0.0347, "step": 141140 }, { - "epoch": 1.53, - "learning_rate": 7.099422415471477e-05, - "loss": 0.0332, + "epoch": 0.91, + "learning_rate": 0.0001633476832519024, + "loss": 0.0374, "step": 141150 }, { - "epoch": 1.53, - "learning_rate": 7.097799987020571e-05, - "loss": 0.0303, + "epoch": 0.91, + "learning_rate": 0.00016333800189754545, + "loss": 0.0415, "step": 141160 }, { - "epoch": 1.53, - "learning_rate": 7.096177558569666e-05, - "loss": 0.0238, + "epoch": 0.91, + "learning_rate": 0.0001633283205431885, + "loss": 0.0399, "step": 141170 }, { - "epoch": 1.53, - "learning_rate": 7.094555130118761e-05, - "loss": 0.0359, + "epoch": 0.91, + "learning_rate": 0.00016331863918883158, + "loss": 0.0461, "step": 141180 }, { - "epoch": 1.53, - "learning_rate": 7.092932701667856e-05, - "loss": 0.0259, + "epoch": 0.91, + "learning_rate": 0.00016330895783447463, + "loss": 0.0406, "step": 141190 }, { - "epoch": 1.53, - "learning_rate": 7.091310273216951e-05, - "loss": 0.0303, + "epoch": 0.91, + "learning_rate": 0.0001632992764801177, + "loss": 0.0341, "step": 141200 }, { - "epoch": 1.53, - "learning_rate": 7.089687844766045e-05, - "loss": 0.0316, + "epoch": 0.91, + "learning_rate": 0.0001632895951257608, + "loss": 0.0394, "step": 141210 }, { - "epoch": 1.53, - "learning_rate": 7.08806541631514e-05, - "loss": 0.032, + "epoch": 0.91, + "learning_rate": 0.00016327991377140385, + "loss": 0.0418, "step": 141220 }, { - "epoch": 1.53, - "learning_rate": 7.086442987864234e-05, - "loss": 0.0254, + "epoch": 0.91, + "learning_rate": 0.0001632702324170469, + "loss": 0.0387, "step": 141230 }, { - "epoch": 1.53, - "learning_rate": 7.08482055941333e-05, - "loss": 0.0309, + "epoch": 0.91, + "learning_rate": 0.00016326055106268998, + "loss": 0.0372, "step": 141240 }, { - "epoch": 1.53, - "learning_rate": 7.083198130962423e-05, - "loss": 0.0303, + "epoch": 0.91, + "learning_rate": 0.00016325086970833303, + "loss": 0.0377, "step": 141250 }, { - "epoch": 1.53, - "learning_rate": 7.081575702511518e-05, - "loss": 0.024, + "epoch": 0.91, + "learning_rate": 0.0001632411883539761, + "loss": 0.0427, "step": 141260 }, { - "epoch": 1.53, - "learning_rate": 7.079953274060613e-05, - "loss": 0.0273, + "epoch": 0.91, + "learning_rate": 0.0001632315069996192, + "loss": 0.0427, "step": 141270 }, { - "epoch": 1.53, - "learning_rate": 7.078330845609708e-05, + "epoch": 0.91, + "learning_rate": 0.00016322182564526227, "loss": 0.0416, "step": 141280 }, { - "epoch": 1.53, - "learning_rate": 7.076708417158803e-05, - "loss": 0.025, + "epoch": 0.91, + "learning_rate": 0.00016321214429090532, + "loss": 0.0356, "step": 141290 }, { - "epoch": 1.53, - "learning_rate": 7.075085988707897e-05, - "loss": 0.0271, + "epoch": 0.91, + "learning_rate": 0.00016320246293654838, + "loss": 0.0369, "step": 141300 }, { - "epoch": 1.53, - "learning_rate": 7.073463560256992e-05, - "loss": 0.0326, + "epoch": 0.91, + "learning_rate": 0.00016319278158219146, + "loss": 0.0396, "step": 141310 }, { - "epoch": 1.53, - "learning_rate": 7.071841131806087e-05, - "loss": 0.029, + "epoch": 0.91, + "learning_rate": 0.0001631831002278345, + "loss": 0.0404, "step": 141320 }, { - "epoch": 1.53, - "learning_rate": 7.070218703355182e-05, - "loss": 0.0234, + "epoch": 0.91, + "learning_rate": 0.0001631734188734776, + "loss": 0.0374, "step": 141330 }, { - "epoch": 1.53, - "learning_rate": 7.068596274904275e-05, - "loss": 0.0258, + "epoch": 0.91, + "learning_rate": 0.00016316373751912067, + "loss": 0.0425, "step": 141340 }, { - "epoch": 1.53, - "learning_rate": 7.06697384645337e-05, - "loss": 0.027, + "epoch": 0.91, + "learning_rate": 0.00016315405616476375, + "loss": 0.034, "step": 141350 }, { - "epoch": 1.53, - "learning_rate": 7.065351418002465e-05, - "loss": 0.0291, + "epoch": 0.91, + "learning_rate": 0.0001631443748104068, + "loss": 0.0394, "step": 141360 }, { - "epoch": 1.53, - "learning_rate": 7.06372898955156e-05, - "loss": 0.0246, + "epoch": 0.91, + "learning_rate": 0.00016313469345604985, + "loss": 0.0387, "step": 141370 }, { - "epoch": 1.53, - "learning_rate": 7.062106561100655e-05, - "loss": 0.0303, + "epoch": 0.91, + "learning_rate": 0.00016312501210169293, + "loss": 0.0419, "step": 141380 }, { - "epoch": 1.53, - "learning_rate": 7.06048413264975e-05, - "loss": 0.0295, + "epoch": 0.91, + "learning_rate": 0.00016311533074733599, + "loss": 0.0367, "step": 141390 }, { - "epoch": 1.53, - "learning_rate": 7.058861704198845e-05, - "loss": 0.0268, + "epoch": 0.91, + "learning_rate": 0.00016310564939297907, + "loss": 0.0332, "step": 141400 }, { - "epoch": 1.53, - "learning_rate": 7.057239275747939e-05, - "loss": 0.0376, + "epoch": 0.91, + "learning_rate": 0.00016309596803862215, + "loss": 0.0353, "step": 141410 }, { - "epoch": 1.53, - "learning_rate": 7.055616847297034e-05, - "loss": 0.0275, + "epoch": 0.91, + "learning_rate": 0.0001630862866842652, + "loss": 0.0333, "step": 141420 }, { - "epoch": 1.53, - "learning_rate": 7.053994418846129e-05, - "loss": 0.0294, + "epoch": 0.91, + "learning_rate": 0.00016307660532990828, + "loss": 0.0349, "step": 141430 }, { - "epoch": 1.53, - "learning_rate": 7.052371990395224e-05, - "loss": 0.0237, + "epoch": 0.91, + "learning_rate": 0.00016306692397555133, + "loss": 0.0367, "step": 141440 }, { - "epoch": 1.53, - "learning_rate": 7.050749561944319e-05, - "loss": 0.0314, + "epoch": 0.91, + "learning_rate": 0.00016305724262119438, + "loss": 0.0377, "step": 141450 }, { - "epoch": 1.53, - "learning_rate": 7.049127133493412e-05, - "loss": 0.0322, + "epoch": 0.91, + "learning_rate": 0.00016304756126683746, + "loss": 0.0355, "step": 141460 }, { - "epoch": 1.53, - "learning_rate": 7.047504705042507e-05, - "loss": 0.0288, + "epoch": 0.91, + "learning_rate": 0.00016303787991248054, + "loss": 0.0399, "step": 141470 }, { - "epoch": 1.53, - "learning_rate": 7.045882276591602e-05, - "loss": 0.0301, + "epoch": 0.91, + "learning_rate": 0.00016302819855812362, + "loss": 0.0387, "step": 141480 }, { - "epoch": 1.53, - "learning_rate": 7.044259848140697e-05, - "loss": 0.0315, + "epoch": 0.91, + "learning_rate": 0.00016301851720376668, + "loss": 0.038, "step": 141490 }, { - "epoch": 1.53, - "learning_rate": 7.042637419689792e-05, - "loss": 0.0281, + "epoch": 0.91, + "learning_rate": 0.00016300883584940975, + "loss": 0.0348, "step": 141500 }, { - "epoch": 1.53, - "learning_rate": 7.041014991238886e-05, - "loss": 0.0309, + "epoch": 0.91, + "learning_rate": 0.0001629991544950528, + "loss": 0.0396, "step": 141510 }, { - "epoch": 1.53, - "learning_rate": 7.03939256278798e-05, - "loss": 0.0329, + "epoch": 0.91, + "learning_rate": 0.00016298947314069586, + "loss": 0.0415, "step": 141520 }, { - "epoch": 1.53, - "learning_rate": 7.037770134337076e-05, - "loss": 0.0271, + "epoch": 0.91, + "learning_rate": 0.00016297979178633894, + "loss": 0.0394, "step": 141530 }, { - "epoch": 1.53, - "learning_rate": 7.03614770588617e-05, - "loss": 0.0264, + "epoch": 0.91, + "learning_rate": 0.00016297011043198202, + "loss": 0.0399, "step": 141540 }, { - "epoch": 1.53, - "learning_rate": 7.034525277435264e-05, - "loss": 0.0312, + "epoch": 0.91, + "learning_rate": 0.0001629604290776251, + "loss": 0.0307, "step": 141550 }, { - "epoch": 1.53, - "learning_rate": 7.032902848984359e-05, - "loss": 0.0344, + "epoch": 0.91, + "learning_rate": 0.00016295074772326815, + "loss": 0.0358, "step": 141560 }, { - "epoch": 1.53, - "learning_rate": 7.031280420533454e-05, - "loss": 0.027, + "epoch": 0.91, + "learning_rate": 0.00016294106636891123, + "loss": 0.038, "step": 141570 }, { - "epoch": 1.53, - "learning_rate": 7.029657992082549e-05, - "loss": 0.0289, + "epoch": 0.91, + "learning_rate": 0.00016293138501455428, + "loss": 0.0418, "step": 141580 }, { - "epoch": 1.53, - "learning_rate": 7.028035563631644e-05, - "loss": 0.0265, + "epoch": 0.91, + "learning_rate": 0.00016292170366019734, + "loss": 0.0385, "step": 141590 }, { - "epoch": 1.53, - "learning_rate": 7.026413135180738e-05, - "loss": 0.0333, + "epoch": 0.91, + "learning_rate": 0.00016291202230584042, + "loss": 0.0441, "step": 141600 }, { - "epoch": 1.53, - "learning_rate": 7.024790706729833e-05, - "loss": 0.0264, + "epoch": 0.91, + "learning_rate": 0.0001629023409514835, + "loss": 0.0434, "step": 141610 }, { - "epoch": 1.53, - "learning_rate": 7.023168278278928e-05, - "loss": 0.036, + "epoch": 0.91, + "learning_rate": 0.00016289265959712655, + "loss": 0.0445, "step": 141620 }, { - "epoch": 1.53, - "learning_rate": 7.021545849828023e-05, - "loss": 0.0305, + "epoch": 0.91, + "learning_rate": 0.00016288297824276963, + "loss": 0.0381, "step": 141630 }, { - "epoch": 1.53, - "learning_rate": 7.019923421377116e-05, - "loss": 0.0349, + "epoch": 0.91, + "learning_rate": 0.0001628732968884127, + "loss": 0.0397, "step": 141640 }, { - "epoch": 1.53, - "learning_rate": 7.018300992926211e-05, - "loss": 0.0342, + "epoch": 0.91, + "learning_rate": 0.00016286361553405573, + "loss": 0.0336, "step": 141650 }, { - "epoch": 1.53, - "learning_rate": 7.016678564475306e-05, - "loss": 0.0299, + "epoch": 0.91, + "learning_rate": 0.00016285393417969881, + "loss": 0.0452, "step": 141660 }, { - "epoch": 1.53, - "learning_rate": 7.015056136024401e-05, - "loss": 0.0335, + "epoch": 0.91, + "learning_rate": 0.0001628442528253419, + "loss": 0.0362, "step": 141670 }, { - "epoch": 1.53, - "learning_rate": 7.013433707573496e-05, - "loss": 0.026, + "epoch": 0.91, + "learning_rate": 0.00016283457147098497, + "loss": 0.0425, "step": 141680 }, { - "epoch": 1.53, - "learning_rate": 7.01181127912259e-05, - "loss": 0.0288, + "epoch": 0.91, + "learning_rate": 0.00016282489011662803, + "loss": 0.0343, "step": 141690 }, { - "epoch": 1.53, - "learning_rate": 7.010188850671685e-05, - "loss": 0.0282, + "epoch": 0.91, + "learning_rate": 0.0001628152087622711, + "loss": 0.0384, "step": 141700 }, { - "epoch": 1.53, - "learning_rate": 7.00856642222078e-05, - "loss": 0.0307, + "epoch": 0.91, + "learning_rate": 0.0001628055274079142, + "loss": 0.0467, "step": 141710 }, { - "epoch": 1.53, - "learning_rate": 7.006943993769875e-05, - "loss": 0.029, + "epoch": 0.91, + "learning_rate": 0.0001627958460535572, + "loss": 0.0356, "step": 141720 }, { - "epoch": 1.53, - "learning_rate": 7.005321565318968e-05, - "loss": 0.0312, + "epoch": 0.91, + "learning_rate": 0.0001627861646992003, + "loss": 0.0431, "step": 141730 }, { - "epoch": 1.53, - "learning_rate": 7.003699136868063e-05, - "loss": 0.0212, + "epoch": 0.91, + "learning_rate": 0.00016277648334484337, + "loss": 0.0349, "step": 141740 }, { - "epoch": 1.53, - "learning_rate": 7.002076708417158e-05, - "loss": 0.0264, + "epoch": 0.91, + "learning_rate": 0.00016276680199048645, + "loss": 0.0369, "step": 141750 }, { - "epoch": 1.53, - "learning_rate": 7.000454279966253e-05, - "loss": 0.0228, + "epoch": 0.91, + "learning_rate": 0.0001627571206361295, + "loss": 0.0384, "step": 141760 }, { - "epoch": 1.53, - "learning_rate": 6.998831851515348e-05, - "loss": 0.0249, + "epoch": 0.92, + "learning_rate": 0.00016274743928177258, + "loss": 0.0401, "step": 141770 }, { - "epoch": 1.53, - "learning_rate": 6.997209423064442e-05, - "loss": 0.0289, + "epoch": 0.92, + "learning_rate": 0.00016273775792741566, + "loss": 0.0354, "step": 141780 }, { - "epoch": 1.53, - "learning_rate": 6.995586994613537e-05, - "loss": 0.0249, + "epoch": 0.92, + "learning_rate": 0.0001627280765730587, + "loss": 0.0329, "step": 141790 }, { - "epoch": 1.53, - "learning_rate": 6.993964566162632e-05, - "loss": 0.0284, + "epoch": 0.92, + "learning_rate": 0.00016271839521870177, + "loss": 0.0382, "step": 141800 }, { - "epoch": 1.53, - "learning_rate": 6.992342137711727e-05, - "loss": 0.0286, + "epoch": 0.92, + "learning_rate": 0.00016270871386434485, + "loss": 0.0361, "step": 141810 }, { - "epoch": 1.53, - "learning_rate": 6.99071970926082e-05, - "loss": 0.0261, + "epoch": 0.92, + "learning_rate": 0.0001626990325099879, + "loss": 0.0496, "step": 141820 }, { - "epoch": 1.53, - "learning_rate": 6.989097280809915e-05, - "loss": 0.0311, + "epoch": 0.92, + "learning_rate": 0.00016268935115563098, + "loss": 0.0359, "step": 141830 }, { - "epoch": 1.53, - "learning_rate": 6.98747485235901e-05, - "loss": 0.033, + "epoch": 0.92, + "learning_rate": 0.00016267966980127406, + "loss": 0.0396, "step": 141840 }, { - "epoch": 1.53, - "learning_rate": 6.985852423908105e-05, - "loss": 0.0216, + "epoch": 0.92, + "learning_rate": 0.00016266998844691714, + "loss": 0.0405, "step": 141850 }, { - "epoch": 1.53, - "learning_rate": 6.9842299954572e-05, - "loss": 0.0269, + "epoch": 0.92, + "learning_rate": 0.00016266030709256017, + "loss": 0.0394, "step": 141860 }, { - "epoch": 1.53, - "learning_rate": 6.982607567006294e-05, - "loss": 0.0264, + "epoch": 0.92, + "learning_rate": 0.00016265062573820325, + "loss": 0.0364, "step": 141870 }, { - "epoch": 1.53, - "learning_rate": 6.980985138555389e-05, - "loss": 0.0298, + "epoch": 0.92, + "learning_rate": 0.00016264094438384633, + "loss": 0.0407, "step": 141880 }, { - "epoch": 1.53, - "learning_rate": 6.979362710104484e-05, - "loss": 0.0292, + "epoch": 0.92, + "learning_rate": 0.00016263126302948938, + "loss": 0.0397, "step": 141890 }, { - "epoch": 1.53, - "learning_rate": 6.977740281653579e-05, - "loss": 0.0284, + "epoch": 0.92, + "learning_rate": 0.00016262158167513246, + "loss": 0.0388, "step": 141900 }, { - "epoch": 1.53, - "learning_rate": 6.976117853202673e-05, - "loss": 0.0263, + "epoch": 0.92, + "learning_rate": 0.00016261190032077554, + "loss": 0.0343, "step": 141910 }, { - "epoch": 1.54, - "learning_rate": 6.974495424751768e-05, - "loss": 0.0334, + "epoch": 0.92, + "learning_rate": 0.00016260221896641862, + "loss": 0.0391, "step": 141920 }, { - "epoch": 1.54, - "learning_rate": 6.972872996300863e-05, - "loss": 0.0301, + "epoch": 0.92, + "learning_rate": 0.00016259253761206164, + "loss": 0.0351, "step": 141930 }, { - "epoch": 1.54, - "learning_rate": 6.971250567849958e-05, - "loss": 0.0327, + "epoch": 0.92, + "learning_rate": 0.00016258285625770472, + "loss": 0.0348, "step": 141940 }, { - "epoch": 1.54, - "learning_rate": 6.969628139399052e-05, - "loss": 0.0318, + "epoch": 0.92, + "learning_rate": 0.0001625731749033478, + "loss": 0.0346, "step": 141950 }, { - "epoch": 1.54, - "learning_rate": 6.968005710948146e-05, - "loss": 0.0301, + "epoch": 0.92, + "learning_rate": 0.00016256349354899086, + "loss": 0.0347, "step": 141960 }, { - "epoch": 1.54, - "learning_rate": 6.966383282497241e-05, - "loss": 0.027, + "epoch": 0.92, + "learning_rate": 0.00016255381219463394, + "loss": 0.0423, "step": 141970 }, { - "epoch": 1.54, - "learning_rate": 6.964760854046336e-05, - "loss": 0.0271, + "epoch": 0.92, + "learning_rate": 0.00016254413084027702, + "loss": 0.0419, "step": 141980 }, { - "epoch": 1.54, - "learning_rate": 6.963138425595431e-05, - "loss": 0.0309, + "epoch": 0.92, + "learning_rate": 0.00016253444948592007, + "loss": 0.0436, "step": 141990 }, { - "epoch": 1.54, - "learning_rate": 6.961515997144525e-05, - "loss": 0.0302, + "epoch": 0.92, + "learning_rate": 0.00016252476813156312, + "loss": 0.0359, "step": 142000 }, { - "epoch": 1.54, - "eval_cer": 0.9211039666679035, - "eval_loss": 0.023659221827983856, - "eval_runtime": 118.9512, - "eval_samples_per_second": 16.814, - "eval_steps_per_second": 4.203, + "epoch": 0.92, + "eval_cer": 0.9198490566037736, + "eval_loss": 0.02665277197957039, + "eval_runtime": 119.7024, + "eval_samples_per_second": 16.708, + "eval_steps_per_second": 4.177, "step": 142000 }, { - "epoch": 1.54, - "learning_rate": 6.95989356869362e-05, - "loss": 0.027, + "epoch": 0.92, + "learning_rate": 0.0001625150867772062, + "loss": 0.0376, "step": 142010 }, { - "epoch": 1.54, - "learning_rate": 6.958271140242715e-05, - "loss": 0.0347, + "epoch": 0.92, + "learning_rate": 0.00016250540542284925, + "loss": 0.0415, "step": 142020 }, { - "epoch": 1.54, - "learning_rate": 6.95664871179181e-05, - "loss": 0.0289, + "epoch": 0.92, + "learning_rate": 0.00016249572406849233, + "loss": 0.0412, "step": 142030 }, { - "epoch": 1.54, - "learning_rate": 6.955026283340905e-05, - "loss": 0.0309, + "epoch": 0.92, + "learning_rate": 0.0001624860427141354, + "loss": 0.0476, "step": 142040 }, { - "epoch": 1.54, - "learning_rate": 6.953403854889998e-05, - "loss": 0.028, + "epoch": 0.92, + "learning_rate": 0.0001624763613597785, + "loss": 0.0404, "step": 142050 }, { - "epoch": 1.54, - "learning_rate": 6.951781426439093e-05, - "loss": 0.0295, + "epoch": 0.92, + "learning_rate": 0.00016246668000542155, + "loss": 0.0462, "step": 142060 }, { - "epoch": 1.54, - "learning_rate": 6.950158997988188e-05, - "loss": 0.0288, + "epoch": 0.92, + "learning_rate": 0.0001624569986510646, + "loss": 0.0399, "step": 142070 }, { - "epoch": 1.54, - "learning_rate": 6.948536569537283e-05, - "loss": 0.0315, + "epoch": 0.92, + "learning_rate": 0.00016244731729670768, + "loss": 0.0426, "step": 142080 }, { - "epoch": 1.54, - "learning_rate": 6.946914141086377e-05, - "loss": 0.0276, + "epoch": 0.92, + "learning_rate": 0.00016243763594235073, + "loss": 0.0353, "step": 142090 }, { - "epoch": 1.54, - "learning_rate": 6.945291712635472e-05, - "loss": 0.0297, + "epoch": 0.92, + "learning_rate": 0.0001624279545879938, + "loss": 0.0417, "step": 142100 }, { - "epoch": 1.54, - "learning_rate": 6.943669284184567e-05, - "loss": 0.0292, + "epoch": 0.92, + "learning_rate": 0.0001624182732336369, + "loss": 0.0419, "step": 142110 }, { - "epoch": 1.54, - "learning_rate": 6.942046855733662e-05, - "loss": 0.0283, + "epoch": 0.92, + "learning_rate": 0.00016240859187927997, + "loss": 0.0377, "step": 142120 }, { - "epoch": 1.54, - "learning_rate": 6.940424427282757e-05, - "loss": 0.0336, + "epoch": 0.92, + "learning_rate": 0.00016239891052492302, + "loss": 0.037, "step": 142130 }, { - "epoch": 1.54, - "learning_rate": 6.93880199883185e-05, - "loss": 0.0284, + "epoch": 0.92, + "learning_rate": 0.00016238922917056608, + "loss": 0.041, "step": 142140 }, { - "epoch": 1.54, - "learning_rate": 6.937179570380945e-05, - "loss": 0.0257, + "epoch": 0.92, + "learning_rate": 0.00016237954781620916, + "loss": 0.0401, "step": 142150 }, { - "epoch": 1.54, - "learning_rate": 6.93555714193004e-05, - "loss": 0.0316, + "epoch": 0.92, + "learning_rate": 0.0001623698664618522, + "loss": 0.0425, "step": 142160 }, { - "epoch": 1.54, - "learning_rate": 6.933934713479135e-05, - "loss": 0.0258, + "epoch": 0.92, + "learning_rate": 0.0001623601851074953, + "loss": 0.0383, "step": 142170 }, { - "epoch": 1.54, - "learning_rate": 6.932312285028229e-05, - "loss": 0.0238, + "epoch": 0.92, + "learning_rate": 0.00016235050375313837, + "loss": 0.0438, "step": 142180 }, { - "epoch": 1.54, - "learning_rate": 6.930689856577324e-05, - "loss": 0.032, + "epoch": 0.92, + "learning_rate": 0.00016234082239878142, + "loss": 0.038, "step": 142190 }, { - "epoch": 1.54, - "learning_rate": 6.929067428126419e-05, - "loss": 0.0267, + "epoch": 0.92, + "learning_rate": 0.0001623311410444245, + "loss": 0.0413, "step": 142200 }, { - "epoch": 1.54, - "learning_rate": 6.927444999675514e-05, - "loss": 0.0322, + "epoch": 0.92, + "learning_rate": 0.00016232145969006755, + "loss": 0.0314, "step": 142210 }, { - "epoch": 1.54, - "learning_rate": 6.925822571224609e-05, - "loss": 0.0286, + "epoch": 0.92, + "learning_rate": 0.0001623117783357106, + "loss": 0.0441, "step": 142220 }, { - "epoch": 1.54, - "learning_rate": 6.924200142773702e-05, - "loss": 0.0276, + "epoch": 0.92, + "learning_rate": 0.00016230209698135369, + "loss": 0.0409, "step": 142230 }, { - "epoch": 1.54, - "learning_rate": 6.922577714322797e-05, - "loss": 0.0247, + "epoch": 0.92, + "learning_rate": 0.00016229241562699677, + "loss": 0.0369, "step": 142240 }, { - "epoch": 1.54, - "learning_rate": 6.920955285871892e-05, - "loss": 0.0321, + "epoch": 0.92, + "learning_rate": 0.00016228273427263984, + "loss": 0.0365, "step": 142250 }, { - "epoch": 1.54, - "learning_rate": 6.919332857420987e-05, - "loss": 0.0273, + "epoch": 0.92, + "learning_rate": 0.0001622730529182829, + "loss": 0.0419, "step": 142260 }, { - "epoch": 1.54, - "learning_rate": 6.917710428970082e-05, - "loss": 0.0309, + "epoch": 0.92, + "learning_rate": 0.00016226337156392598, + "loss": 0.0382, "step": 142270 }, { - "epoch": 1.54, - "learning_rate": 6.916088000519176e-05, - "loss": 0.0347, + "epoch": 0.92, + "learning_rate": 0.00016225369020956903, + "loss": 0.0383, "step": 142280 }, { - "epoch": 1.54, - "learning_rate": 6.914465572068271e-05, - "loss": 0.0257, + "epoch": 0.92, + "learning_rate": 0.00016224400885521208, + "loss": 0.042, "step": 142290 }, { - "epoch": 1.54, - "learning_rate": 6.912843143617366e-05, - "loss": 0.031, + "epoch": 0.92, + "learning_rate": 0.00016223432750085516, + "loss": 0.0407, "step": 142300 }, { - "epoch": 1.54, - "learning_rate": 6.911220715166461e-05, - "loss": 0.0283, + "epoch": 0.92, + "learning_rate": 0.00016222464614649824, + "loss": 0.0428, "step": 142310 }, { - "epoch": 1.54, - "learning_rate": 6.909598286715554e-05, - "loss": 0.0238, + "epoch": 0.92, + "learning_rate": 0.00016221496479214132, + "loss": 0.0449, "step": 142320 }, { - "epoch": 1.54, - "learning_rate": 6.90797585826465e-05, - "loss": 0.0342, + "epoch": 0.92, + "learning_rate": 0.00016220528343778437, + "loss": 0.0442, "step": 142330 }, { - "epoch": 1.54, - "learning_rate": 6.906353429813744e-05, - "loss": 0.0295, + "epoch": 0.92, + "learning_rate": 0.00016219560208342745, + "loss": 0.0321, "step": 142340 }, { - "epoch": 1.54, - "learning_rate": 6.90473100136284e-05, - "loss": 0.0318, + "epoch": 0.92, + "learning_rate": 0.0001621859207290705, + "loss": 0.0393, "step": 142350 }, { - "epoch": 1.54, - "learning_rate": 6.903108572911934e-05, - "loss": 0.0257, + "epoch": 0.92, + "learning_rate": 0.00016217623937471356, + "loss": 0.0392, "step": 142360 }, { - "epoch": 1.54, - "learning_rate": 6.901486144461028e-05, - "loss": 0.0315, + "epoch": 0.92, + "learning_rate": 0.00016216655802035664, + "loss": 0.0379, "step": 142370 }, { - "epoch": 1.54, - "learning_rate": 6.899863716010123e-05, - "loss": 0.0273, + "epoch": 0.92, + "learning_rate": 0.00016215687666599972, + "loss": 0.04, "step": 142380 }, { - "epoch": 1.54, - "learning_rate": 6.898241287559218e-05, - "loss": 0.0296, + "epoch": 0.92, + "learning_rate": 0.0001621471953116428, + "loss": 0.0429, "step": 142390 }, { - "epoch": 1.54, - "learning_rate": 6.896618859108313e-05, - "loss": 0.0277, + "epoch": 0.92, + "learning_rate": 0.00016213751395728585, + "loss": 0.0362, "step": 142400 }, { - "epoch": 1.54, - "learning_rate": 6.894996430657407e-05, - "loss": 0.0311, + "epoch": 0.92, + "learning_rate": 0.00016212783260292893, + "loss": 0.0364, "step": 142410 }, { - "epoch": 1.54, - "learning_rate": 6.893374002206501e-05, - "loss": 0.0225, + "epoch": 0.92, + "learning_rate": 0.00016211815124857196, + "loss": 0.0349, "step": 142420 }, { - "epoch": 1.54, - "learning_rate": 6.891751573755596e-05, - "loss": 0.0308, + "epoch": 0.92, + "learning_rate": 0.00016210846989421504, + "loss": 0.0455, "step": 142430 }, { - "epoch": 1.54, - "learning_rate": 6.890129145304691e-05, - "loss": 0.0326, + "epoch": 0.92, + "learning_rate": 0.00016209878853985812, + "loss": 0.0393, "step": 142440 }, { - "epoch": 1.54, - "learning_rate": 6.888506716853786e-05, - "loss": 0.0265, + "epoch": 0.92, + "learning_rate": 0.0001620891071855012, + "loss": 0.0398, "step": 142450 }, { - "epoch": 1.54, - "learning_rate": 6.88688428840288e-05, - "loss": 0.0306, + "epoch": 0.92, + "learning_rate": 0.00016207942583114425, + "loss": 0.0397, "step": 142460 }, { - "epoch": 1.54, - "learning_rate": 6.885261859951975e-05, - "loss": 0.0286, + "epoch": 0.92, + "learning_rate": 0.00016206974447678733, + "loss": 0.0444, "step": 142470 }, { - "epoch": 1.54, - "learning_rate": 6.88363943150107e-05, - "loss": 0.0313, + "epoch": 0.92, + "learning_rate": 0.0001620600631224304, + "loss": 0.036, "step": 142480 }, { - "epoch": 1.54, - "learning_rate": 6.882017003050165e-05, - "loss": 0.0265, + "epoch": 0.92, + "learning_rate": 0.00016205038176807343, + "loss": 0.0432, "step": 142490 }, { - "epoch": 1.54, - "learning_rate": 6.880394574599259e-05, - "loss": 0.0277, + "epoch": 0.92, + "learning_rate": 0.00016204070041371651, + "loss": 0.0408, "step": 142500 }, { - "epoch": 1.54, - "learning_rate": 6.878772146148354e-05, - "loss": 0.0247, + "epoch": 0.92, + "learning_rate": 0.0001620310190593596, + "loss": 0.0394, "step": 142510 }, { - "epoch": 1.54, - "learning_rate": 6.877149717697449e-05, - "loss": 0.0303, + "epoch": 0.92, + "learning_rate": 0.00016202133770500267, + "loss": 0.0405, "step": 142520 }, { - "epoch": 1.54, - "learning_rate": 6.875527289246544e-05, - "loss": 0.0262, + "epoch": 0.92, + "learning_rate": 0.00016201165635064573, + "loss": 0.0427, "step": 142530 }, { - "epoch": 1.54, - "learning_rate": 6.873904860795639e-05, - "loss": 0.03, + "epoch": 0.92, + "learning_rate": 0.0001620019749962888, + "loss": 0.0431, "step": 142540 }, { - "epoch": 1.54, - "learning_rate": 6.872282432344732e-05, - "loss": 0.0284, + "epoch": 0.92, + "learning_rate": 0.00016199229364193189, + "loss": 0.046, "step": 142550 }, { - "epoch": 1.54, - "learning_rate": 6.870660003893828e-05, - "loss": 0.0324, + "epoch": 0.92, + "learning_rate": 0.0001619826122875749, + "loss": 0.0399, "step": 142560 }, { - "epoch": 1.54, - "learning_rate": 6.869037575442923e-05, - "loss": 0.0325, + "epoch": 0.92, + "learning_rate": 0.000161972930933218, + "loss": 0.0423, "step": 142570 }, { - "epoch": 1.54, - "learning_rate": 6.867415146992017e-05, - "loss": 0.0294, + "epoch": 0.92, + "learning_rate": 0.00016196324957886107, + "loss": 0.0438, "step": 142580 }, { - "epoch": 1.54, - "learning_rate": 6.865792718541112e-05, - "loss": 0.0282, + "epoch": 0.92, + "learning_rate": 0.00016195356822450415, + "loss": 0.0382, "step": 142590 }, { - "epoch": 1.54, - "learning_rate": 6.864170290090207e-05, - "loss": 0.0287, + "epoch": 0.92, + "learning_rate": 0.0001619438868701472, + "loss": 0.0414, "step": 142600 }, { - "epoch": 1.54, - "learning_rate": 6.862547861639302e-05, - "loss": 0.0262, + "epoch": 0.92, + "learning_rate": 0.00016193420551579028, + "loss": 0.0441, "step": 142610 }, { - "epoch": 1.54, - "learning_rate": 6.860925433188396e-05, - "loss": 0.0398, + "epoch": 0.92, + "learning_rate": 0.00016192452416143336, + "loss": 0.0392, "step": 142620 }, { - "epoch": 1.54, - "learning_rate": 6.85930300473749e-05, - "loss": 0.0388, + "epoch": 0.92, + "learning_rate": 0.0001619148428070764, + "loss": 0.0503, "step": 142630 }, { - "epoch": 1.54, - "learning_rate": 6.857680576286586e-05, - "loss": 0.0295, + "epoch": 0.92, + "learning_rate": 0.00016190516145271947, + "loss": 0.0441, "step": 142640 }, { - "epoch": 1.54, - "learning_rate": 6.85605814783568e-05, - "loss": 0.0273, + "epoch": 0.92, + "learning_rate": 0.00016189548009836255, + "loss": 0.0426, "step": 142650 }, { - "epoch": 1.54, - "learning_rate": 6.854435719384776e-05, - "loss": 0.0253, + "epoch": 0.92, + "learning_rate": 0.0001618857987440056, + "loss": 0.0556, "step": 142660 }, { - "epoch": 1.54, - "learning_rate": 6.852813290933869e-05, - "loss": 0.0345, + "epoch": 0.92, + "learning_rate": 0.00016187611738964868, + "loss": 0.043, "step": 142670 }, { - "epoch": 1.54, - "learning_rate": 6.851190862482964e-05, - "loss": 0.0322, + "epoch": 0.92, + "learning_rate": 0.00016186643603529176, + "loss": 0.0408, "step": 142680 }, { - "epoch": 1.54, - "learning_rate": 6.849568434032059e-05, - "loss": 0.0282, + "epoch": 0.92, + "learning_rate": 0.00016185675468093484, + "loss": 0.0395, "step": 142690 }, { - "epoch": 1.54, - "learning_rate": 6.847946005581154e-05, - "loss": 0.029, + "epoch": 0.92, + "learning_rate": 0.00016184707332657787, + "loss": 0.0377, "step": 142700 }, { - "epoch": 1.54, - "learning_rate": 6.846323577130248e-05, - "loss": 0.0261, + "epoch": 0.92, + "learning_rate": 0.00016183739197222095, + "loss": 0.0443, "step": 142710 }, { - "epoch": 1.54, - "learning_rate": 6.844701148679343e-05, - "loss": 0.0319, + "epoch": 0.92, + "learning_rate": 0.00016182771061786403, + "loss": 0.0464, "step": 142720 }, { - "epoch": 1.54, - "learning_rate": 6.843078720228438e-05, - "loss": 0.0277, + "epoch": 0.92, + "learning_rate": 0.00016181802926350708, + "loss": 0.0402, "step": 142730 }, { - "epoch": 1.54, - "learning_rate": 6.841456291777533e-05, - "loss": 0.0323, + "epoch": 0.92, + "learning_rate": 0.00016180834790915016, + "loss": 0.0448, "step": 142740 }, { - "epoch": 1.54, - "learning_rate": 6.839833863326628e-05, - "loss": 0.0315, + "epoch": 0.92, + "learning_rate": 0.00016179866655479324, + "loss": 0.0362, "step": 142750 }, { - "epoch": 1.54, - "learning_rate": 6.838211434875721e-05, - "loss": 0.0284, + "epoch": 0.92, + "learning_rate": 0.00016178898520043632, + "loss": 0.0369, "step": 142760 }, { - "epoch": 1.54, - "learning_rate": 6.836589006424816e-05, - "loss": 0.0342, + "epoch": 0.92, + "learning_rate": 0.00016177930384607934, + "loss": 0.0371, "step": 142770 }, { - "epoch": 1.54, - "learning_rate": 6.834966577973911e-05, - "loss": 0.0299, + "epoch": 0.92, + "learning_rate": 0.00016176962249172242, + "loss": 0.0391, "step": 142780 }, { - "epoch": 1.54, - "learning_rate": 6.833344149523006e-05, - "loss": 0.0302, + "epoch": 0.92, + "learning_rate": 0.0001617599411373655, + "loss": 0.0348, "step": 142790 }, { - "epoch": 1.54, - "learning_rate": 6.8317217210721e-05, - "loss": 0.0279, + "epoch": 0.92, + "learning_rate": 0.00016175025978300856, + "loss": 0.0362, "step": 142800 }, { - "epoch": 1.54, - "learning_rate": 6.830099292621195e-05, - "loss": 0.031, + "epoch": 0.92, + "learning_rate": 0.00016174057842865164, + "loss": 0.0419, "step": 142810 }, { - "epoch": 1.54, - "learning_rate": 6.82847686417029e-05, - "loss": 0.0353, + "epoch": 0.92, + "learning_rate": 0.00016173089707429472, + "loss": 0.0346, "step": 142820 }, { - "epoch": 1.54, - "learning_rate": 6.826854435719385e-05, - "loss": 0.0295, + "epoch": 0.92, + "learning_rate": 0.00016172121571993777, + "loss": 0.0406, "step": 142830 }, { - "epoch": 1.54, - "learning_rate": 6.82523200726848e-05, - "loss": 0.0308, + "epoch": 0.92, + "learning_rate": 0.00016171153436558082, + "loss": 0.041, "step": 142840 }, { - "epoch": 1.55, - "learning_rate": 6.823609578817573e-05, - "loss": 0.0295, + "epoch": 0.92, + "learning_rate": 0.0001617018530112239, + "loss": 0.036, "step": 142850 }, { - "epoch": 1.55, - "learning_rate": 6.821987150366668e-05, - "loss": 0.0276, + "epoch": 0.92, + "learning_rate": 0.00016169217165686695, + "loss": 0.0447, "step": 142860 }, { - "epoch": 1.55, - "learning_rate": 6.820364721915763e-05, - "loss": 0.0241, + "epoch": 0.92, + "learning_rate": 0.00016168249030251003, + "loss": 0.0337, "step": 142870 }, { - "epoch": 1.55, - "learning_rate": 6.818742293464858e-05, - "loss": 0.0272, + "epoch": 0.92, + "learning_rate": 0.0001616728089481531, + "loss": 0.0296, "step": 142880 }, { - "epoch": 1.55, - "learning_rate": 6.817119865013952e-05, - "loss": 0.0276, + "epoch": 0.92, + "learning_rate": 0.0001616631275937962, + "loss": 0.0374, "step": 142890 }, { - "epoch": 1.55, - "learning_rate": 6.815497436563047e-05, - "loss": 0.0288, + "epoch": 0.92, + "learning_rate": 0.00016165344623943925, + "loss": 0.0399, "step": 142900 }, { - "epoch": 1.55, - "learning_rate": 6.813875008112142e-05, - "loss": 0.034, + "epoch": 0.92, + "learning_rate": 0.0001616437648850823, + "loss": 0.0385, "step": 142910 }, { - "epoch": 1.55, - "learning_rate": 6.812252579661237e-05, - "loss": 0.0303, + "epoch": 0.92, + "learning_rate": 0.00016163408353072538, + "loss": 0.0396, "step": 142920 }, { - "epoch": 1.55, - "learning_rate": 6.810630151210332e-05, - "loss": 0.0248, + "epoch": 0.92, + "learning_rate": 0.00016162440217636843, + "loss": 0.0379, "step": 142930 }, { - "epoch": 1.55, - "learning_rate": 6.809007722759425e-05, - "loss": 0.0297, + "epoch": 0.92, + "learning_rate": 0.0001616147208220115, + "loss": 0.0378, "step": 142940 }, { - "epoch": 1.55, - "learning_rate": 6.80738529430852e-05, - "loss": 0.0282, + "epoch": 0.92, + "learning_rate": 0.0001616050394676546, + "loss": 0.035, "step": 142950 }, { - "epoch": 1.55, - "learning_rate": 6.805762865857615e-05, - "loss": 0.0268, + "epoch": 0.92, + "learning_rate": 0.00016159535811329767, + "loss": 0.0365, "step": 142960 }, { - "epoch": 1.55, - "learning_rate": 6.80414043740671e-05, - "loss": 0.0254, + "epoch": 0.92, + "learning_rate": 0.00016158567675894072, + "loss": 0.0483, "step": 142970 }, { - "epoch": 1.55, - "learning_rate": 6.802518008955804e-05, - "loss": 0.0276, + "epoch": 0.92, + "learning_rate": 0.00016157599540458378, + "loss": 0.0472, "step": 142980 }, { - "epoch": 1.55, - "learning_rate": 6.800895580504899e-05, - "loss": 0.0277, + "epoch": 0.92, + "learning_rate": 0.00016156631405022685, + "loss": 0.0386, "step": 142990 }, { - "epoch": 1.55, - "learning_rate": 6.799273152053994e-05, - "loss": 0.0227, + "epoch": 0.92, + "learning_rate": 0.0001615566326958699, + "loss": 0.0368, "step": 143000 }, { - "epoch": 1.55, - "eval_cer": 0.9211843637410967, - "eval_loss": 0.023230884224176407, - "eval_runtime": 119.0392, - "eval_samples_per_second": 16.801, - "eval_steps_per_second": 4.2, + "epoch": 0.92, + "eval_cer": 0.9198716529205739, + "eval_loss": 0.027006572112441063, + "eval_runtime": 120.0134, + "eval_samples_per_second": 16.665, + "eval_steps_per_second": 4.166, "step": 143000 }, { - "epoch": 1.55, - "learning_rate": 6.797650723603089e-05, - "loss": 0.0245, + "epoch": 0.92, + "learning_rate": 0.000161546951341513, + "loss": 0.0397, "step": 143010 }, { - "epoch": 1.55, - "learning_rate": 6.796028295152184e-05, - "loss": 0.0273, + "epoch": 0.92, + "learning_rate": 0.00016153726998715607, + "loss": 0.0348, "step": 143020 }, { - "epoch": 1.55, - "learning_rate": 6.794405866701277e-05, - "loss": 0.0268, + "epoch": 0.92, + "learning_rate": 0.00016152758863279912, + "loss": 0.0433, "step": 143030 }, { - "epoch": 1.55, - "learning_rate": 6.792783438250372e-05, - "loss": 0.0275, + "epoch": 0.92, + "learning_rate": 0.0001615179072784422, + "loss": 0.0365, "step": 143040 }, { - "epoch": 1.55, - "learning_rate": 6.791161009799467e-05, - "loss": 0.03, + "epoch": 0.92, + "learning_rate": 0.00016150822592408525, + "loss": 0.0396, "step": 143050 }, { - "epoch": 1.55, - "learning_rate": 6.789538581348562e-05, - "loss": 0.0273, + "epoch": 0.92, + "learning_rate": 0.0001614985445697283, + "loss": 0.0414, "step": 143060 }, { - "epoch": 1.55, - "learning_rate": 6.787916152897656e-05, - "loss": 0.03, + "epoch": 0.92, + "learning_rate": 0.00016148886321537138, + "loss": 0.0454, "step": 143070 }, { - "epoch": 1.55, - "learning_rate": 6.786293724446751e-05, - "loss": 0.0276, + "epoch": 0.92, + "learning_rate": 0.00016147918186101446, + "loss": 0.0419, "step": 143080 }, { - "epoch": 1.55, - "learning_rate": 6.784671295995846e-05, - "loss": 0.029, + "epoch": 0.92, + "learning_rate": 0.00016146950050665754, + "loss": 0.0407, "step": 143090 }, { - "epoch": 1.55, - "learning_rate": 6.783048867544941e-05, - "loss": 0.028, + "epoch": 0.92, + "learning_rate": 0.0001614598191523006, + "loss": 0.0374, "step": 143100 }, { - "epoch": 1.55, - "learning_rate": 6.781426439094036e-05, - "loss": 0.0276, + "epoch": 0.92, + "learning_rate": 0.00016145013779794368, + "loss": 0.0508, "step": 143110 }, { - "epoch": 1.55, - "learning_rate": 6.77980401064313e-05, - "loss": 0.0288, + "epoch": 0.92, + "learning_rate": 0.00016144045644358673, + "loss": 0.0552, "step": 143120 }, { - "epoch": 1.55, - "learning_rate": 6.778181582192225e-05, - "loss": 0.025, + "epoch": 0.92, + "learning_rate": 0.00016143077508922978, + "loss": 0.04, "step": 143130 }, { - "epoch": 1.55, - "learning_rate": 6.77655915374132e-05, - "loss": 0.0251, + "epoch": 0.92, + "learning_rate": 0.00016142109373487286, + "loss": 0.0369, "step": 143140 }, { - "epoch": 1.55, - "learning_rate": 6.774936725290414e-05, - "loss": 0.0287, + "epoch": 0.92, + "learning_rate": 0.00016141141238051594, + "loss": 0.0418, "step": 143150 }, { - "epoch": 1.55, - "learning_rate": 6.773314296839508e-05, - "loss": 0.0299, + "epoch": 0.92, + "learning_rate": 0.00016140173102615902, + "loss": 0.0399, "step": 143160 }, { - "epoch": 1.55, - "learning_rate": 6.771691868388603e-05, - "loss": 0.0258, + "epoch": 0.92, + "learning_rate": 0.00016139204967180207, + "loss": 0.0367, "step": 143170 }, { - "epoch": 1.55, - "learning_rate": 6.770069439937698e-05, - "loss": 0.0388, + "epoch": 0.92, + "learning_rate": 0.00016138236831744515, + "loss": 0.0384, "step": 143180 }, { - "epoch": 1.55, - "learning_rate": 6.768447011486793e-05, - "loss": 0.0278, + "epoch": 0.92, + "learning_rate": 0.0001613726869630882, + "loss": 0.0348, "step": 143190 }, { - "epoch": 1.55, - "learning_rate": 6.766824583035888e-05, - "loss": 0.0258, + "epoch": 0.92, + "learning_rate": 0.00016136300560873126, + "loss": 0.0413, "step": 143200 }, { - "epoch": 1.55, - "learning_rate": 6.765202154584982e-05, - "loss": 0.03, + "epoch": 0.92, + "learning_rate": 0.00016135332425437434, + "loss": 0.0456, "step": 143210 }, { - "epoch": 1.55, - "learning_rate": 6.763579726134077e-05, - "loss": 0.0274, + "epoch": 0.92, + "learning_rate": 0.00016134364290001742, + "loss": 0.0381, "step": 143220 }, { - "epoch": 1.55, - "learning_rate": 6.761957297683172e-05, - "loss": 0.0276, + "epoch": 0.92, + "learning_rate": 0.00016133396154566047, + "loss": 0.0351, "step": 143230 }, { - "epoch": 1.55, - "learning_rate": 6.760334869232267e-05, - "loss": 0.0255, + "epoch": 0.92, + "learning_rate": 0.00016132428019130355, + "loss": 0.0382, "step": 143240 }, { - "epoch": 1.55, - "learning_rate": 6.75871244078136e-05, - "loss": 0.0269, + "epoch": 0.92, + "learning_rate": 0.00016131459883694663, + "loss": 0.0405, "step": 143250 }, { - "epoch": 1.55, - "learning_rate": 6.757090012330455e-05, - "loss": 0.0265, + "epoch": 0.92, + "learning_rate": 0.00016130491748258966, + "loss": 0.0371, "step": 143260 }, { - "epoch": 1.55, - "learning_rate": 6.75546758387955e-05, - "loss": 0.0327, + "epoch": 0.92, + "learning_rate": 0.00016129523612823274, + "loss": 0.0342, "step": 143270 }, { - "epoch": 1.55, - "learning_rate": 6.753845155428645e-05, - "loss": 0.0245, + "epoch": 0.92, + "learning_rate": 0.00016128555477387582, + "loss": 0.042, "step": 143280 }, { - "epoch": 1.55, - "learning_rate": 6.75222272697774e-05, - "loss": 0.0268, + "epoch": 0.92, + "learning_rate": 0.0001612758734195189, + "loss": 0.0431, "step": 143290 }, { - "epoch": 1.55, - "learning_rate": 6.750600298526834e-05, - "loss": 0.0291, + "epoch": 0.92, + "learning_rate": 0.00016126619206516195, + "loss": 0.0401, "step": 143300 }, { - "epoch": 1.55, - "learning_rate": 6.748977870075929e-05, - "loss": 0.0291, + "epoch": 0.92, + "learning_rate": 0.00016125651071080503, + "loss": 0.0442, "step": 143310 }, { - "epoch": 1.55, - "learning_rate": 6.747355441625024e-05, - "loss": 0.0294, + "epoch": 0.93, + "learning_rate": 0.0001612468293564481, + "loss": 0.0428, "step": 143320 }, { - "epoch": 1.55, - "learning_rate": 6.745733013174119e-05, - "loss": 0.0292, + "epoch": 0.93, + "learning_rate": 0.00016123714800209113, + "loss": 0.0359, "step": 143330 }, { - "epoch": 1.55, - "learning_rate": 6.744110584723214e-05, - "loss": 0.025, + "epoch": 0.93, + "learning_rate": 0.00016122746664773421, + "loss": 0.0344, "step": 143340 }, { - "epoch": 1.55, - "learning_rate": 6.742488156272307e-05, - "loss": 0.0298, + "epoch": 0.93, + "learning_rate": 0.0001612177852933773, + "loss": 0.0512, "step": 143350 }, { - "epoch": 1.55, - "learning_rate": 6.740865727821402e-05, - "loss": 0.0241, + "epoch": 0.93, + "learning_rate": 0.00016120810393902037, + "loss": 0.0353, "step": 143360 }, { - "epoch": 1.55, - "learning_rate": 6.739243299370497e-05, - "loss": 0.0286, + "epoch": 0.93, + "learning_rate": 0.00016119842258466343, + "loss": 0.0436, "step": 143370 }, { - "epoch": 1.55, - "learning_rate": 6.737620870919592e-05, - "loss": 0.0257, + "epoch": 0.93, + "learning_rate": 0.0001611887412303065, + "loss": 0.0404, "step": 143380 }, { - "epoch": 1.55, - "learning_rate": 6.735998442468686e-05, - "loss": 0.0268, + "epoch": 0.93, + "learning_rate": 0.00016117905987594959, + "loss": 0.0407, "step": 143390 }, { - "epoch": 1.55, - "learning_rate": 6.734376014017781e-05, - "loss": 0.0311, + "epoch": 0.93, + "learning_rate": 0.0001611693785215926, + "loss": 0.0398, "step": 143400 }, { - "epoch": 1.55, - "learning_rate": 6.732753585566876e-05, - "loss": 0.0298, + "epoch": 0.93, + "learning_rate": 0.0001611596971672357, + "loss": 0.0436, "step": 143410 }, { - "epoch": 1.55, - "learning_rate": 6.731131157115971e-05, - "loss": 0.0294, + "epoch": 0.93, + "learning_rate": 0.00016115001581287877, + "loss": 0.037, "step": 143420 }, { - "epoch": 1.55, - "learning_rate": 6.729508728665066e-05, - "loss": 0.0282, + "epoch": 0.93, + "learning_rate": 0.00016114033445852182, + "loss": 0.0399, "step": 143430 }, { - "epoch": 1.55, - "learning_rate": 6.72788630021416e-05, - "loss": 0.0282, + "epoch": 0.93, + "learning_rate": 0.0001611306531041649, + "loss": 0.0351, "step": 143440 }, { - "epoch": 1.55, - "learning_rate": 6.726263871763254e-05, - "loss": 0.0268, + "epoch": 0.93, + "learning_rate": 0.00016112097174980798, + "loss": 0.0434, "step": 143450 }, { - "epoch": 1.55, - "learning_rate": 6.724641443312349e-05, - "loss": 0.0227, + "epoch": 0.93, + "learning_rate": 0.00016111129039545106, + "loss": 0.037, "step": 143460 }, { - "epoch": 1.55, - "learning_rate": 6.723019014861444e-05, - "loss": 0.025, + "epoch": 0.93, + "learning_rate": 0.0001611016090410941, + "loss": 0.0389, "step": 143470 }, { - "epoch": 1.55, - "learning_rate": 6.721396586410538e-05, - "loss": 0.0263, + "epoch": 0.93, + "learning_rate": 0.00016109192768673717, + "loss": 0.0377, "step": 143480 }, { - "epoch": 1.55, - "learning_rate": 6.719774157959633e-05, - "loss": 0.0251, + "epoch": 0.93, + "learning_rate": 0.00016108224633238025, + "loss": 0.0402, "step": 143490 }, { - "epoch": 1.55, - "learning_rate": 6.718151729508728e-05, - "loss": 0.0395, + "epoch": 0.93, + "learning_rate": 0.0001610725649780233, + "loss": 0.0384, "step": 143500 }, { - "epoch": 1.55, - "learning_rate": 6.716529301057823e-05, - "loss": 0.0247, + "epoch": 0.93, + "learning_rate": 0.00016106288362366638, + "loss": 0.0392, "step": 143510 }, { - "epoch": 1.55, - "learning_rate": 6.714906872606918e-05, - "loss": 0.0306, + "epoch": 0.93, + "learning_rate": 0.00016105320226930946, + "loss": 0.0375, "step": 143520 }, { - "epoch": 1.55, - "learning_rate": 6.713284444156011e-05, - "loss": 0.0259, + "epoch": 0.93, + "learning_rate": 0.00016104352091495254, + "loss": 0.0389, "step": 143530 }, { - "epoch": 1.55, - "learning_rate": 6.711662015705106e-05, - "loss": 0.0256, + "epoch": 0.93, + "learning_rate": 0.00016103383956059557, + "loss": 0.043, "step": 143540 }, { - "epoch": 1.55, - "learning_rate": 6.710039587254201e-05, - "loss": 0.0317, + "epoch": 0.93, + "learning_rate": 0.00016102415820623865, + "loss": 0.0403, "step": 143550 }, { - "epoch": 1.55, - "learning_rate": 6.708417158803296e-05, - "loss": 0.0271, + "epoch": 0.93, + "learning_rate": 0.00016101447685188173, + "loss": 0.0367, "step": 143560 }, { - "epoch": 1.55, - "learning_rate": 6.70679473035239e-05, - "loss": 0.0263, + "epoch": 0.93, + "learning_rate": 0.00016100479549752478, + "loss": 0.0363, "step": 143570 }, { - "epoch": 1.55, - "learning_rate": 6.705172301901485e-05, - "loss": 0.0283, + "epoch": 0.93, + "learning_rate": 0.00016099511414316786, + "loss": 0.0425, "step": 143580 }, { - "epoch": 1.55, - "learning_rate": 6.70354987345058e-05, - "loss": 0.0279, + "epoch": 0.93, + "learning_rate": 0.00016098543278881094, + "loss": 0.0399, "step": 143590 }, { - "epoch": 1.55, - "learning_rate": 6.701927444999675e-05, - "loss": 0.0293, + "epoch": 0.93, + "learning_rate": 0.000160975751434454, + "loss": 0.0478, "step": 143600 }, { - "epoch": 1.55, - "learning_rate": 6.70030501654877e-05, - "loss": 0.0326, + "epoch": 0.93, + "learning_rate": 0.00016096607008009704, + "loss": 0.0388, "step": 143610 }, { - "epoch": 1.55, - "learning_rate": 6.698682588097864e-05, - "loss": 0.0234, + "epoch": 0.93, + "learning_rate": 0.00016095638872574012, + "loss": 0.0382, "step": 143620 }, { - "epoch": 1.55, - "learning_rate": 6.697060159646958e-05, - "loss": 0.0239, + "epoch": 0.93, + "learning_rate": 0.00016094670737138318, + "loss": 0.042, "step": 143630 }, { - "epoch": 1.55, - "learning_rate": 6.695437731196053e-05, - "loss": 0.0294, + "epoch": 0.93, + "learning_rate": 0.00016093702601702626, + "loss": 0.0418, "step": 143640 }, { - "epoch": 1.55, - "learning_rate": 6.693815302745148e-05, - "loss": 0.0255, + "epoch": 0.93, + "learning_rate": 0.00016092734466266934, + "loss": 0.0413, "step": 143650 }, { - "epoch": 1.55, - "learning_rate": 6.692192874294242e-05, - "loss": 0.0267, + "epoch": 0.93, + "learning_rate": 0.00016091766330831241, + "loss": 0.0444, "step": 143660 }, { - "epoch": 1.55, - "learning_rate": 6.690570445843337e-05, - "loss": 0.0322, + "epoch": 0.93, + "learning_rate": 0.00016090798195395547, + "loss": 0.039, "step": 143670 }, { - "epoch": 1.55, - "learning_rate": 6.688948017392432e-05, - "loss": 0.0309, + "epoch": 0.93, + "learning_rate": 0.00016089830059959852, + "loss": 0.0518, "step": 143680 }, { - "epoch": 1.55, - "learning_rate": 6.687325588941527e-05, - "loss": 0.0237, + "epoch": 0.93, + "learning_rate": 0.0001608886192452416, + "loss": 0.0332, "step": 143690 }, { - "epoch": 1.55, - "learning_rate": 6.685703160490622e-05, - "loss": 0.0276, + "epoch": 0.93, + "learning_rate": 0.00016087893789088465, + "loss": 0.0358, "step": 143700 }, { - "epoch": 1.55, - "learning_rate": 6.684080732039716e-05, - "loss": 0.0314, + "epoch": 0.93, + "learning_rate": 0.00016086925653652773, + "loss": 0.0397, "step": 143710 }, { - "epoch": 1.55, - "learning_rate": 6.68245830358881e-05, - "loss": 0.0304, + "epoch": 0.93, + "learning_rate": 0.0001608595751821708, + "loss": 0.0398, "step": 143720 }, { - "epoch": 1.55, - "learning_rate": 6.680835875137907e-05, - "loss": 0.0296, + "epoch": 0.93, + "learning_rate": 0.0001608498938278139, + "loss": 0.0357, "step": 143730 }, { - "epoch": 1.55, - "learning_rate": 6.679213446687e-05, - "loss": 0.0307, + "epoch": 0.93, + "learning_rate": 0.00016084021247345694, + "loss": 0.0418, "step": 143740 }, { - "epoch": 1.55, - "learning_rate": 6.677591018236095e-05, - "loss": 0.0281, + "epoch": 0.93, + "learning_rate": 0.0001608305311191, + "loss": 0.0383, "step": 143750 }, { - "epoch": 1.55, - "learning_rate": 6.67596858978519e-05, - "loss": 0.0262, + "epoch": 0.93, + "learning_rate": 0.00016082084976474308, + "loss": 0.0452, "step": 143760 }, { - "epoch": 1.56, - "learning_rate": 6.674346161334285e-05, - "loss": 0.0316, + "epoch": 0.93, + "learning_rate": 0.00016081116841038613, + "loss": 0.0369, "step": 143770 }, { - "epoch": 1.56, - "learning_rate": 6.672723732883379e-05, - "loss": 0.0289, + "epoch": 0.93, + "learning_rate": 0.0001608014870560292, + "loss": 0.037, "step": 143780 }, { - "epoch": 1.56, - "learning_rate": 6.671101304432474e-05, - "loss": 0.0256, + "epoch": 0.93, + "learning_rate": 0.0001607918057016723, + "loss": 0.0373, "step": 143790 }, { - "epoch": 1.56, - "learning_rate": 6.669478875981569e-05, - "loss": 0.0353, + "epoch": 0.93, + "learning_rate": 0.00016078212434731534, + "loss": 0.0418, "step": 143800 }, { - "epoch": 1.56, - "learning_rate": 6.667856447530664e-05, - "loss": 0.0283, + "epoch": 0.93, + "learning_rate": 0.00016077244299295842, + "loss": 0.0365, "step": 143810 }, { - "epoch": 1.56, - "learning_rate": 6.666234019079759e-05, - "loss": 0.0289, + "epoch": 0.93, + "learning_rate": 0.00016076276163860147, + "loss": 0.035, "step": 143820 }, { - "epoch": 1.56, - "learning_rate": 6.664611590628853e-05, - "loss": 0.0305, + "epoch": 0.93, + "learning_rate": 0.00016075308028424453, + "loss": 0.0432, "step": 143830 }, { - "epoch": 1.56, - "learning_rate": 6.662989162177948e-05, - "loss": 0.0326, + "epoch": 0.93, + "learning_rate": 0.0001607433989298876, + "loss": 0.0406, "step": 143840 }, { - "epoch": 1.56, - "learning_rate": 6.661366733727043e-05, - "loss": 0.0353, + "epoch": 0.93, + "learning_rate": 0.0001607337175755307, + "loss": 0.0457, "step": 143850 }, { - "epoch": 1.56, - "learning_rate": 6.659744305276138e-05, - "loss": 0.0263, + "epoch": 0.93, + "learning_rate": 0.00016072403622117377, + "loss": 0.0332, "step": 143860 }, { - "epoch": 1.56, - "learning_rate": 6.658121876825231e-05, - "loss": 0.0297, + "epoch": 0.93, + "learning_rate": 0.00016071435486681682, + "loss": 0.0391, "step": 143870 }, { - "epoch": 1.56, - "learning_rate": 6.656499448374326e-05, - "loss": 0.0332, + "epoch": 0.93, + "learning_rate": 0.0001607046735124599, + "loss": 0.0382, "step": 143880 }, { - "epoch": 1.56, - "learning_rate": 6.654877019923421e-05, - "loss": 0.0243, + "epoch": 0.93, + "learning_rate": 0.00016069499215810295, + "loss": 0.0327, "step": 143890 }, { - "epoch": 1.56, - "learning_rate": 6.653254591472516e-05, - "loss": 0.0292, + "epoch": 0.93, + "learning_rate": 0.000160685310803746, + "loss": 0.0404, "step": 143900 }, { - "epoch": 1.56, - "learning_rate": 6.651632163021611e-05, - "loss": 0.025, + "epoch": 0.93, + "learning_rate": 0.00016067562944938908, + "loss": 0.0359, "step": 143910 }, { - "epoch": 1.56, - "learning_rate": 6.650009734570705e-05, - "loss": 0.0299, + "epoch": 0.93, + "learning_rate": 0.00016066594809503216, + "loss": 0.0426, "step": 143920 }, { - "epoch": 1.56, - "learning_rate": 6.6483873061198e-05, - "loss": 0.0297, + "epoch": 0.93, + "learning_rate": 0.00016065626674067524, + "loss": 0.0376, "step": 143930 }, { - "epoch": 1.56, - "learning_rate": 6.646764877668895e-05, - "loss": 0.0269, + "epoch": 0.93, + "learning_rate": 0.0001606465853863183, + "loss": 0.0376, "step": 143940 }, { - "epoch": 1.56, - "learning_rate": 6.64514244921799e-05, - "loss": 0.0297, + "epoch": 0.93, + "learning_rate": 0.00016063690403196138, + "loss": 0.0394, "step": 143950 }, { - "epoch": 1.56, - "learning_rate": 6.643520020767083e-05, - "loss": 0.03, + "epoch": 0.93, + "learning_rate": 0.00016062722267760443, + "loss": 0.0343, "step": 143960 }, { - "epoch": 1.56, - "learning_rate": 6.641897592316178e-05, - "loss": 0.0305, + "epoch": 0.93, + "learning_rate": 0.00016061754132324748, + "loss": 0.0381, "step": 143970 }, { - "epoch": 1.56, - "learning_rate": 6.640275163865273e-05, - "loss": 0.0319, + "epoch": 0.93, + "learning_rate": 0.00016060785996889056, + "loss": 0.0397, "step": 143980 }, { - "epoch": 1.56, - "learning_rate": 6.638652735414368e-05, - "loss": 0.0258, + "epoch": 0.93, + "learning_rate": 0.00016059817861453364, + "loss": 0.0359, "step": 143990 }, { - "epoch": 1.56, - "learning_rate": 6.637030306963463e-05, - "loss": 0.0261, + "epoch": 0.93, + "learning_rate": 0.0001605884972601767, + "loss": 0.0365, "step": 144000 }, { - "epoch": 1.56, - "eval_cer": 0.9210889474344499, - "eval_loss": 0.02324651926755905, - "eval_runtime": 119.1065, - "eval_samples_per_second": 16.792, - "eval_steps_per_second": 4.198, + "epoch": 0.93, + "eval_cer": 0.9198861145633261, + "eval_loss": 0.02664892189204693, + "eval_runtime": 119.7778, + "eval_samples_per_second": 16.698, + "eval_steps_per_second": 4.174, "step": 144000 }, { - "epoch": 1.56, - "learning_rate": 6.635407878512557e-05, - "loss": 0.0232, + "epoch": 0.93, + "learning_rate": 0.00016057881590581977, + "loss": 0.0456, "step": 144010 }, { - "epoch": 1.56, - "learning_rate": 6.633785450061652e-05, - "loss": 0.0308, + "epoch": 0.93, + "learning_rate": 0.00016056913455146285, + "loss": 0.0338, "step": 144020 }, { - "epoch": 1.56, - "learning_rate": 6.632163021610747e-05, - "loss": 0.0279, + "epoch": 0.93, + "learning_rate": 0.00016055945319710588, + "loss": 0.0327, "step": 144030 }, { - "epoch": 1.56, - "learning_rate": 6.630540593159842e-05, - "loss": 0.0292, + "epoch": 0.93, + "learning_rate": 0.00016054977184274896, + "loss": 0.0383, "step": 144040 }, { - "epoch": 1.56, - "learning_rate": 6.628918164708935e-05, - "loss": 0.0296, + "epoch": 0.93, + "learning_rate": 0.00016054009048839204, + "loss": 0.0402, "step": 144050 }, { - "epoch": 1.56, - "learning_rate": 6.62729573625803e-05, - "loss": 0.0305, + "epoch": 0.93, + "learning_rate": 0.00016053040913403512, + "loss": 0.0422, "step": 144060 }, { - "epoch": 1.56, - "learning_rate": 6.625673307807125e-05, - "loss": 0.029, + "epoch": 0.93, + "learning_rate": 0.00016052072777967817, + "loss": 0.036, "step": 144070 }, { - "epoch": 1.56, - "learning_rate": 6.62405087935622e-05, - "loss": 0.0272, + "epoch": 0.93, + "learning_rate": 0.00016051104642532125, + "loss": 0.0485, "step": 144080 }, { - "epoch": 1.56, - "learning_rate": 6.622428450905315e-05, - "loss": 0.0267, + "epoch": 0.93, + "learning_rate": 0.00016050136507096433, + "loss": 0.0416, "step": 144090 }, { - "epoch": 1.56, - "learning_rate": 6.620806022454409e-05, - "loss": 0.0283, + "epoch": 0.93, + "learning_rate": 0.00016049168371660736, + "loss": 0.0364, "step": 144100 }, { - "epoch": 1.56, - "learning_rate": 6.619183594003504e-05, - "loss": 0.0238, + "epoch": 0.93, + "learning_rate": 0.00016048200236225044, + "loss": 0.0387, "step": 144110 }, { - "epoch": 1.56, - "learning_rate": 6.617561165552599e-05, - "loss": 0.0326, + "epoch": 0.93, + "learning_rate": 0.00016047232100789352, + "loss": 0.0454, "step": 144120 }, { - "epoch": 1.56, - "learning_rate": 6.615938737101694e-05, - "loss": 0.0337, + "epoch": 0.93, + "learning_rate": 0.0001604626396535366, + "loss": 0.0461, "step": 144130 }, { - "epoch": 1.56, - "learning_rate": 6.614316308650787e-05, - "loss": 0.0306, + "epoch": 0.93, + "learning_rate": 0.00016045295829917965, + "loss": 0.0389, "step": 144140 }, { - "epoch": 1.56, - "learning_rate": 6.612693880199882e-05, - "loss": 0.0261, + "epoch": 0.93, + "learning_rate": 0.00016044327694482273, + "loss": 0.0452, "step": 144150 }, { - "epoch": 1.56, - "learning_rate": 6.611071451748977e-05, - "loss": 0.0309, + "epoch": 0.93, + "learning_rate": 0.0001604335955904658, + "loss": 0.0482, "step": 144160 }, { - "epoch": 1.56, - "learning_rate": 6.609449023298072e-05, - "loss": 0.0265, + "epoch": 0.93, + "learning_rate": 0.00016042391423610883, + "loss": 0.0384, "step": 144170 }, { - "epoch": 1.56, - "learning_rate": 6.607826594847167e-05, - "loss": 0.0319, + "epoch": 0.93, + "learning_rate": 0.00016041423288175191, + "loss": 0.0374, "step": 144180 }, { - "epoch": 1.56, - "learning_rate": 6.606204166396261e-05, - "loss": 0.0274, + "epoch": 0.93, + "learning_rate": 0.000160404551527395, + "loss": 0.0389, "step": 144190 }, { - "epoch": 1.56, - "learning_rate": 6.604581737945356e-05, - "loss": 0.0327, + "epoch": 0.93, + "learning_rate": 0.00016039487017303805, + "loss": 0.0372, "step": 144200 }, { - "epoch": 1.56, - "learning_rate": 6.602959309494451e-05, - "loss": 0.031, + "epoch": 0.93, + "learning_rate": 0.00016038518881868113, + "loss": 0.0467, "step": 144210 }, { - "epoch": 1.56, - "learning_rate": 6.601336881043546e-05, - "loss": 0.0274, + "epoch": 0.93, + "learning_rate": 0.0001603755074643242, + "loss": 0.0448, "step": 144220 }, { - "epoch": 1.56, - "learning_rate": 6.59971445259264e-05, - "loss": 0.0258, + "epoch": 0.93, + "learning_rate": 0.00016036582610996729, + "loss": 0.0406, "step": 144230 }, { - "epoch": 1.56, - "learning_rate": 6.598092024141734e-05, - "loss": 0.025, + "epoch": 0.93, + "learning_rate": 0.0001603561447556103, + "loss": 0.0429, "step": 144240 }, { - "epoch": 1.56, - "learning_rate": 6.59646959569083e-05, - "loss": 0.0301, + "epoch": 0.93, + "learning_rate": 0.0001603464634012534, + "loss": 0.0404, "step": 144250 }, { - "epoch": 1.56, - "learning_rate": 6.594847167239924e-05, - "loss": 0.0323, + "epoch": 0.93, + "learning_rate": 0.00016033678204689647, + "loss": 0.0413, "step": 144260 }, { - "epoch": 1.56, - "learning_rate": 6.59322473878902e-05, - "loss": 0.0268, + "epoch": 0.93, + "learning_rate": 0.00016032710069253952, + "loss": 0.0374, "step": 144270 }, { - "epoch": 1.56, - "learning_rate": 6.591602310338113e-05, - "loss": 0.026, + "epoch": 0.93, + "learning_rate": 0.0001603174193381826, + "loss": 0.0447, "step": 144280 }, { - "epoch": 1.56, - "learning_rate": 6.589979881887208e-05, - "loss": 0.0255, + "epoch": 0.93, + "learning_rate": 0.00016030773798382568, + "loss": 0.0401, "step": 144290 }, { - "epoch": 1.56, - "learning_rate": 6.588357453436303e-05, - "loss": 0.0285, + "epoch": 0.93, + "learning_rate": 0.00016029805662946876, + "loss": 0.0418, "step": 144300 }, { - "epoch": 1.56, - "learning_rate": 6.586735024985398e-05, - "loss": 0.0213, + "epoch": 0.93, + "learning_rate": 0.0001602883752751118, + "loss": 0.0365, "step": 144310 }, { - "epoch": 1.56, - "learning_rate": 6.585112596534492e-05, - "loss": 0.0269, + "epoch": 0.93, + "learning_rate": 0.00016027869392075487, + "loss": 0.0383, "step": 144320 }, { - "epoch": 1.56, - "learning_rate": 6.583490168083587e-05, - "loss": 0.0327, + "epoch": 0.93, + "learning_rate": 0.00016026901256639795, + "loss": 0.0408, "step": 144330 }, { - "epoch": 1.56, - "learning_rate": 6.581867739632682e-05, - "loss": 0.0275, + "epoch": 0.93, + "learning_rate": 0.000160259331212041, + "loss": 0.0386, "step": 144340 }, { - "epoch": 1.56, - "learning_rate": 6.580245311181777e-05, - "loss": 0.0376, + "epoch": 0.93, + "learning_rate": 0.00016024964985768408, + "loss": 0.0379, "step": 144350 }, { - "epoch": 1.56, - "learning_rate": 6.578622882730871e-05, - "loss": 0.0282, + "epoch": 0.93, + "learning_rate": 0.00016023996850332716, + "loss": 0.0382, "step": 144360 }, { - "epoch": 1.56, - "learning_rate": 6.577000454279965e-05, - "loss": 0.0275, + "epoch": 0.93, + "learning_rate": 0.00016023028714897024, + "loss": 0.0415, "step": 144370 }, { - "epoch": 1.56, - "learning_rate": 6.57537802582906e-05, - "loss": 0.026, + "epoch": 0.93, + "learning_rate": 0.00016022060579461327, + "loss": 0.05, "step": 144380 }, { - "epoch": 1.56, - "learning_rate": 6.573755597378155e-05, - "loss": 0.0252, + "epoch": 0.93, + "learning_rate": 0.00016021092444025635, + "loss": 0.0368, "step": 144390 }, { - "epoch": 1.56, - "learning_rate": 6.57213316892725e-05, - "loss": 0.0352, + "epoch": 0.93, + "learning_rate": 0.0001602012430858994, + "loss": 0.0354, "step": 144400 }, { - "epoch": 1.56, - "learning_rate": 6.570510740476345e-05, - "loss": 0.0301, + "epoch": 0.93, + "learning_rate": 0.00016019156173154248, + "loss": 0.0369, "step": 144410 }, { - "epoch": 1.56, - "learning_rate": 6.568888312025439e-05, - "loss": 0.0269, + "epoch": 0.93, + "learning_rate": 0.00016018188037718556, + "loss": 0.0413, "step": 144420 }, { - "epoch": 1.56, - "learning_rate": 6.567265883574534e-05, - "loss": 0.0236, + "epoch": 0.93, + "learning_rate": 0.00016017219902282864, + "loss": 0.0375, "step": 144430 }, { - "epoch": 1.56, - "learning_rate": 6.565643455123629e-05, - "loss": 0.0384, + "epoch": 0.93, + "learning_rate": 0.0001601625176684717, + "loss": 0.0405, "step": 144440 }, { - "epoch": 1.56, - "learning_rate": 6.564021026672724e-05, - "loss": 0.0261, + "epoch": 0.93, + "learning_rate": 0.00016015283631411474, + "loss": 0.0321, "step": 144450 }, { - "epoch": 1.56, - "learning_rate": 6.562398598221817e-05, - "loss": 0.0368, + "epoch": 0.93, + "learning_rate": 0.00016014315495975782, + "loss": 0.0429, "step": 144460 }, { - "epoch": 1.56, - "learning_rate": 6.560776169770912e-05, - "loss": 0.0287, + "epoch": 0.93, + "learning_rate": 0.00016013347360540088, + "loss": 0.0383, "step": 144470 }, { - "epoch": 1.56, - "learning_rate": 6.559153741320007e-05, - "loss": 0.0322, + "epoch": 0.93, + "learning_rate": 0.00016012379225104395, + "loss": 0.0328, "step": 144480 }, { - "epoch": 1.56, - "learning_rate": 6.557531312869102e-05, - "loss": 0.0315, + "epoch": 0.93, + "learning_rate": 0.00016011411089668703, + "loss": 0.0393, "step": 144490 }, { - "epoch": 1.56, - "learning_rate": 6.555908884418197e-05, - "loss": 0.0259, + "epoch": 0.93, + "learning_rate": 0.00016010442954233011, + "loss": 0.0366, "step": 144500 }, { - "epoch": 1.56, - "learning_rate": 6.554286455967291e-05, - "loss": 0.0267, + "epoch": 0.93, + "learning_rate": 0.00016009474818797317, + "loss": 0.0413, "step": 144510 }, { - "epoch": 1.56, - "learning_rate": 6.552664027516386e-05, - "loss": 0.0277, + "epoch": 0.93, + "learning_rate": 0.00016008506683361622, + "loss": 0.038, "step": 144520 }, { - "epoch": 1.56, - "learning_rate": 6.55104159906548e-05, - "loss": 0.0267, + "epoch": 0.93, + "learning_rate": 0.0001600753854792593, + "loss": 0.0349, "step": 144530 }, { - "epoch": 1.56, - "learning_rate": 6.549419170614576e-05, - "loss": 0.0296, + "epoch": 0.93, + "learning_rate": 0.00016006570412490235, + "loss": 0.0393, "step": 144540 }, { - "epoch": 1.56, - "learning_rate": 6.547796742163669e-05, - "loss": 0.0294, + "epoch": 0.93, + "learning_rate": 0.00016005602277054543, + "loss": 0.0369, "step": 144550 }, { - "epoch": 1.56, - "learning_rate": 6.546174313712764e-05, - "loss": 0.0292, + "epoch": 0.93, + "learning_rate": 0.0001600463414161885, + "loss": 0.0377, "step": 144560 }, { - "epoch": 1.56, - "learning_rate": 6.544551885261859e-05, - "loss": 0.0304, + "epoch": 0.93, + "learning_rate": 0.0001600366600618316, + "loss": 0.0384, "step": 144570 }, { - "epoch": 1.56, - "learning_rate": 6.542929456810954e-05, - "loss": 0.0254, + "epoch": 0.93, + "learning_rate": 0.00016002697870747464, + "loss": 0.0426, "step": 144580 }, { - "epoch": 1.56, - "learning_rate": 6.541307028360049e-05, - "loss": 0.0308, + "epoch": 0.93, + "learning_rate": 0.0001600172973531177, + "loss": 0.0352, "step": 144590 }, { - "epoch": 1.56, - "learning_rate": 6.539684599909143e-05, - "loss": 0.0304, + "epoch": 0.93, + "learning_rate": 0.00016000761599876075, + "loss": 0.0377, "step": 144600 }, { - "epoch": 1.56, - "learning_rate": 6.538062171458238e-05, - "loss": 0.0294, + "epoch": 0.93, + "learning_rate": 0.00015999793464440383, + "loss": 0.0369, "step": 144610 }, { - "epoch": 1.56, - "learning_rate": 6.536439743007333e-05, - "loss": 0.0304, + "epoch": 0.93, + "learning_rate": 0.0001599882532900469, + "loss": 0.0399, "step": 144620 }, { - "epoch": 1.56, - "learning_rate": 6.534817314556428e-05, - "loss": 0.0375, + "epoch": 0.93, + "learning_rate": 0.00015997857193569, + "loss": 0.0386, "step": 144630 }, { - "epoch": 1.56, - "learning_rate": 6.533194886105521e-05, - "loss": 0.0299, + "epoch": 0.93, + "learning_rate": 0.00015996889058133304, + "loss": 0.0369, "step": 144640 }, { - "epoch": 1.56, - "learning_rate": 6.531572457654616e-05, - "loss": 0.0389, + "epoch": 0.93, + "learning_rate": 0.00015995920922697612, + "loss": 0.0404, "step": 144650 }, { - "epoch": 1.56, - "learning_rate": 6.529950029203711e-05, - "loss": 0.0295, + "epoch": 0.93, + "learning_rate": 0.00015994952787261917, + "loss": 0.038, "step": 144660 }, { - "epoch": 1.56, - "learning_rate": 6.528327600752806e-05, - "loss": 0.0279, + "epoch": 0.93, + "learning_rate": 0.00015993984651826223, + "loss": 0.0346, "step": 144670 }, { - "epoch": 1.56, - "learning_rate": 6.526705172301901e-05, - "loss": 0.0278, + "epoch": 0.93, + "learning_rate": 0.0001599301651639053, + "loss": 0.0327, "step": 144680 }, { - "epoch": 1.56, - "learning_rate": 6.525082743850995e-05, - "loss": 0.0267, + "epoch": 0.93, + "learning_rate": 0.0001599204838095484, + "loss": 0.0373, "step": 144690 }, { - "epoch": 1.57, - "learning_rate": 6.52346031540009e-05, - "loss": 0.025, + "epoch": 0.93, + "learning_rate": 0.00015991080245519147, + "loss": 0.0465, "step": 144700 }, { - "epoch": 1.57, - "learning_rate": 6.521837886949185e-05, - "loss": 0.0248, + "epoch": 0.93, + "learning_rate": 0.00015990112110083452, + "loss": 0.0408, "step": 144710 }, { - "epoch": 1.57, - "learning_rate": 6.52021545849828e-05, - "loss": 0.0329, + "epoch": 0.93, + "learning_rate": 0.0001598914397464776, + "loss": 0.0397, "step": 144720 }, { - "epoch": 1.57, - "learning_rate": 6.518593030047373e-05, - "loss": 0.0317, + "epoch": 0.93, + "learning_rate": 0.00015988175839212065, + "loss": 0.0466, "step": 144730 }, { - "epoch": 1.57, - "learning_rate": 6.516970601596468e-05, - "loss": 0.0226, + "epoch": 0.93, + "learning_rate": 0.0001598720770377637, + "loss": 0.043, "step": 144740 }, { - "epoch": 1.57, - "learning_rate": 6.515348173145563e-05, - "loss": 0.0281, + "epoch": 0.93, + "learning_rate": 0.00015986239568340678, + "loss": 0.0415, "step": 144750 }, { - "epoch": 1.57, - "learning_rate": 6.513725744694658e-05, - "loss": 0.0304, + "epoch": 0.93, + "learning_rate": 0.00015985271432904986, + "loss": 0.0388, "step": 144760 }, { - "epoch": 1.57, - "learning_rate": 6.512103316243753e-05, - "loss": 0.03, + "epoch": 0.93, + "learning_rate": 0.00015984303297469294, + "loss": 0.0413, "step": 144770 }, { - "epoch": 1.57, - "learning_rate": 6.510480887792847e-05, - "loss": 0.0261, + "epoch": 0.93, + "learning_rate": 0.000159833351620336, + "loss": 0.0421, "step": 144780 }, { - "epoch": 1.57, - "learning_rate": 6.508858459341942e-05, - "loss": 0.0282, + "epoch": 0.93, + "learning_rate": 0.00015982367026597908, + "loss": 0.0424, "step": 144790 }, { - "epoch": 1.57, - "learning_rate": 6.507236030891037e-05, - "loss": 0.026, + "epoch": 0.93, + "learning_rate": 0.0001598139889116221, + "loss": 0.0413, "step": 144800 }, { - "epoch": 1.57, - "learning_rate": 6.505613602440132e-05, - "loss": 0.0276, + "epoch": 0.93, + "learning_rate": 0.00015980430755726518, + "loss": 0.0379, "step": 144810 }, { - "epoch": 1.57, - "learning_rate": 6.503991173989226e-05, - "loss": 0.0316, + "epoch": 0.93, + "learning_rate": 0.00015979462620290826, + "loss": 0.0367, "step": 144820 }, { - "epoch": 1.57, - "learning_rate": 6.50236874553832e-05, - "loss": 0.0264, + "epoch": 0.93, + "learning_rate": 0.00015978494484855134, + "loss": 0.0352, "step": 144830 }, { - "epoch": 1.57, - "learning_rate": 6.500746317087415e-05, - "loss": 0.0356, + "epoch": 0.93, + "learning_rate": 0.0001597752634941944, + "loss": 0.0395, "step": 144840 }, { - "epoch": 1.57, - "learning_rate": 6.49912388863651e-05, - "loss": 0.0334, + "epoch": 0.93, + "learning_rate": 0.00015976558213983747, + "loss": 0.0342, "step": 144850 }, { - "epoch": 1.57, - "learning_rate": 6.497501460185605e-05, - "loss": 0.0266, + "epoch": 0.93, + "learning_rate": 0.00015975590078548055, + "loss": 0.0347, "step": 144860 }, { - "epoch": 1.57, - "learning_rate": 6.495879031734699e-05, - "loss": 0.0268, + "epoch": 0.94, + "learning_rate": 0.00015974621943112358, + "loss": 0.0358, "step": 144870 }, { - "epoch": 1.57, - "learning_rate": 6.494256603283794e-05, - "loss": 0.028, + "epoch": 0.94, + "learning_rate": 0.00015973653807676666, + "loss": 0.0407, "step": 144880 }, { - "epoch": 1.57, - "learning_rate": 6.492634174832889e-05, - "loss": 0.0311, + "epoch": 0.94, + "learning_rate": 0.00015972685672240974, + "loss": 0.0399, "step": 144890 }, { - "epoch": 1.57, - "learning_rate": 6.491011746381984e-05, - "loss": 0.0262, + "epoch": 0.94, + "learning_rate": 0.00015971717536805282, + "loss": 0.0343, "step": 144900 }, { - "epoch": 1.57, - "learning_rate": 6.489389317931079e-05, - "loss": 0.0269, + "epoch": 0.94, + "learning_rate": 0.00015970749401369587, + "loss": 0.042, "step": 144910 }, { - "epoch": 1.57, - "learning_rate": 6.487766889480174e-05, - "loss": 0.0289, + "epoch": 0.94, + "learning_rate": 0.00015969781265933895, + "loss": 0.0352, "step": 144920 }, { - "epoch": 1.57, - "learning_rate": 6.486144461029269e-05, - "loss": 0.0275, + "epoch": 0.94, + "learning_rate": 0.00015968813130498203, + "loss": 0.0401, "step": 144930 }, { - "epoch": 1.57, - "learning_rate": 6.484522032578363e-05, - "loss": 0.0256, + "epoch": 0.94, + "learning_rate": 0.00015967844995062506, + "loss": 0.0418, "step": 144940 }, { - "epoch": 1.57, - "learning_rate": 6.482899604127458e-05, - "loss": 0.0274, + "epoch": 0.94, + "learning_rate": 0.00015966876859626814, + "loss": 0.0414, "step": 144950 }, { - "epoch": 1.57, - "learning_rate": 6.481277175676552e-05, - "loss": 0.028, + "epoch": 0.94, + "learning_rate": 0.00015965908724191122, + "loss": 0.0352, "step": 144960 }, { - "epoch": 1.57, - "learning_rate": 6.479654747225647e-05, - "loss": 0.0283, + "epoch": 0.94, + "learning_rate": 0.0001596494058875543, + "loss": 0.0465, "step": 144970 }, { - "epoch": 1.57, - "learning_rate": 6.478032318774742e-05, - "loss": 0.0247, + "epoch": 0.94, + "learning_rate": 0.00015963972453319735, + "loss": 0.0421, "step": 144980 }, { - "epoch": 1.57, - "learning_rate": 6.476409890323836e-05, - "loss": 0.0256, + "epoch": 0.94, + "learning_rate": 0.00015963004317884043, + "loss": 0.0422, "step": 144990 }, { - "epoch": 1.57, - "learning_rate": 6.474787461872931e-05, - "loss": 0.0269, + "epoch": 0.94, + "learning_rate": 0.0001596203618244835, + "loss": 0.0413, "step": 145000 }, { - "epoch": 1.57, - "eval_cer": 0.9211260537759236, - "eval_loss": 0.022748522460460663, - "eval_runtime": 119.0779, - "eval_samples_per_second": 16.796, - "eval_steps_per_second": 4.199, + "epoch": 0.94, + "eval_cer": 0.9198535758671337, + "eval_loss": 0.02679886296391487, + "eval_runtime": 119.8861, + "eval_samples_per_second": 16.682, + "eval_steps_per_second": 4.171, "step": 145000 }, { - "epoch": 1.57, - "learning_rate": 6.473165033422026e-05, - "loss": 0.0267, + "epoch": 0.94, + "learning_rate": 0.00015961068047012653, + "loss": 0.0407, "step": 145010 }, { - "epoch": 1.57, - "learning_rate": 6.471542604971121e-05, - "loss": 0.0239, + "epoch": 0.94, + "learning_rate": 0.0001596009991157696, + "loss": 0.0393, "step": 145020 }, { - "epoch": 1.57, - "learning_rate": 6.469920176520215e-05, - "loss": 0.0307, + "epoch": 0.94, + "learning_rate": 0.0001595913177614127, + "loss": 0.0387, "step": 145030 }, { - "epoch": 1.57, - "learning_rate": 6.46829774806931e-05, - "loss": 0.0309, + "epoch": 0.94, + "learning_rate": 0.00015958163640705575, + "loss": 0.0418, "step": 145040 }, { - "epoch": 1.57, - "learning_rate": 6.466675319618405e-05, - "loss": 0.0268, + "epoch": 0.94, + "learning_rate": 0.00015957195505269883, + "loss": 0.041, "step": 145050 }, { - "epoch": 1.57, - "learning_rate": 6.4650528911675e-05, - "loss": 0.0278, + "epoch": 0.94, + "learning_rate": 0.0001595622736983419, + "loss": 0.0368, "step": 145060 }, { - "epoch": 1.57, - "learning_rate": 6.463430462716595e-05, - "loss": 0.0321, + "epoch": 0.94, + "learning_rate": 0.00015955259234398499, + "loss": 0.0405, "step": 145070 }, { - "epoch": 1.57, - "learning_rate": 6.461808034265688e-05, - "loss": 0.0292, + "epoch": 0.94, + "learning_rate": 0.000159542910989628, + "loss": 0.0362, "step": 145080 }, { - "epoch": 1.57, - "learning_rate": 6.460185605814783e-05, - "loss": 0.0294, + "epoch": 0.94, + "learning_rate": 0.0001595332296352711, + "loss": 0.0396, "step": 145090 }, { - "epoch": 1.57, - "learning_rate": 6.458563177363878e-05, - "loss": 0.0286, + "epoch": 0.94, + "learning_rate": 0.00015952354828091417, + "loss": 0.0383, "step": 145100 }, { - "epoch": 1.57, - "learning_rate": 6.456940748912973e-05, - "loss": 0.0316, + "epoch": 0.94, + "learning_rate": 0.00015951386692655722, + "loss": 0.0351, "step": 145110 }, { - "epoch": 1.57, - "learning_rate": 6.455318320462067e-05, - "loss": 0.0329, + "epoch": 0.94, + "learning_rate": 0.0001595041855722003, + "loss": 0.0343, "step": 145120 }, { - "epoch": 1.57, - "learning_rate": 6.453695892011162e-05, - "loss": 0.0334, + "epoch": 0.94, + "learning_rate": 0.00015949450421784338, + "loss": 0.0421, "step": 145130 }, { - "epoch": 1.57, - "learning_rate": 6.452073463560257e-05, - "loss": 0.0278, + "epoch": 0.94, + "learning_rate": 0.00015948482286348646, + "loss": 0.043, "step": 145140 }, { - "epoch": 1.57, - "learning_rate": 6.450451035109352e-05, - "loss": 0.0259, + "epoch": 0.94, + "learning_rate": 0.0001594751415091295, + "loss": 0.033, "step": 145150 }, { - "epoch": 1.57, - "learning_rate": 6.448828606658447e-05, - "loss": 0.0283, + "epoch": 0.94, + "learning_rate": 0.00015946546015477257, + "loss": 0.038, "step": 145160 }, { - "epoch": 1.57, - "learning_rate": 6.44720617820754e-05, - "loss": 0.0314, + "epoch": 0.94, + "learning_rate": 0.00015945577880041565, + "loss": 0.0382, "step": 145170 }, { - "epoch": 1.57, - "learning_rate": 6.445583749756635e-05, - "loss": 0.0285, + "epoch": 0.94, + "learning_rate": 0.0001594460974460587, + "loss": 0.0414, "step": 145180 }, { - "epoch": 1.57, - "learning_rate": 6.44396132130573e-05, - "loss": 0.0348, + "epoch": 0.94, + "learning_rate": 0.00015943641609170178, + "loss": 0.0449, "step": 145190 }, { - "epoch": 1.57, - "learning_rate": 6.442338892854825e-05, - "loss": 0.025, + "epoch": 0.94, + "learning_rate": 0.00015942673473734486, + "loss": 0.0379, "step": 145200 }, { - "epoch": 1.57, - "learning_rate": 6.440716464403919e-05, - "loss": 0.0283, + "epoch": 0.94, + "learning_rate": 0.0001594170533829879, + "loss": 0.0391, "step": 145210 }, { - "epoch": 1.57, - "learning_rate": 6.439094035953014e-05, - "loss": 0.0276, + "epoch": 0.94, + "learning_rate": 0.00015940737202863097, + "loss": 0.0336, "step": 145220 }, { - "epoch": 1.57, - "learning_rate": 6.437471607502109e-05, - "loss": 0.0366, + "epoch": 0.94, + "learning_rate": 0.00015939769067427404, + "loss": 0.0317, "step": 145230 }, { - "epoch": 1.57, - "learning_rate": 6.435849179051204e-05, - "loss": 0.0275, + "epoch": 0.94, + "learning_rate": 0.0001593880093199171, + "loss": 0.0349, "step": 145240 }, { - "epoch": 1.57, - "learning_rate": 6.434226750600299e-05, - "loss": 0.024, + "epoch": 0.94, + "learning_rate": 0.00015937832796556018, + "loss": 0.0364, "step": 145250 }, { - "epoch": 1.57, - "learning_rate": 6.432604322149392e-05, - "loss": 0.0272, + "epoch": 0.94, + "learning_rate": 0.00015936864661120326, + "loss": 0.0384, "step": 145260 }, { - "epoch": 1.57, - "learning_rate": 6.430981893698487e-05, - "loss": 0.0282, + "epoch": 0.94, + "learning_rate": 0.00015935896525684634, + "loss": 0.0359, "step": 145270 }, { - "epoch": 1.57, - "learning_rate": 6.429359465247582e-05, - "loss": 0.0276, + "epoch": 0.94, + "learning_rate": 0.0001593492839024894, + "loss": 0.0425, "step": 145280 }, { - "epoch": 1.57, - "learning_rate": 6.427737036796677e-05, - "loss": 0.0356, + "epoch": 0.94, + "learning_rate": 0.00015933960254813244, + "loss": 0.0476, "step": 145290 }, { - "epoch": 1.57, - "learning_rate": 6.426114608345771e-05, - "loss": 0.032, + "epoch": 0.94, + "learning_rate": 0.00015932992119377552, + "loss": 0.0374, "step": 145300 }, { - "epoch": 1.57, - "learning_rate": 6.424492179894866e-05, - "loss": 0.0289, + "epoch": 0.94, + "learning_rate": 0.00015932023983941857, + "loss": 0.0411, "step": 145310 }, { - "epoch": 1.57, - "learning_rate": 6.422869751443961e-05, - "loss": 0.0332, + "epoch": 0.94, + "learning_rate": 0.00015931055848506165, + "loss": 0.0386, "step": 145320 }, { - "epoch": 1.57, - "learning_rate": 6.421247322993056e-05, - "loss": 0.0265, + "epoch": 0.94, + "learning_rate": 0.00015930087713070473, + "loss": 0.0375, "step": 145330 }, { - "epoch": 1.57, - "learning_rate": 6.419624894542151e-05, - "loss": 0.0275, + "epoch": 0.94, + "learning_rate": 0.00015929119577634781, + "loss": 0.0384, "step": 145340 }, { - "epoch": 1.57, - "learning_rate": 6.418002466091244e-05, - "loss": 0.029, + "epoch": 0.94, + "learning_rate": 0.00015928151442199087, + "loss": 0.041, "step": 145350 }, { - "epoch": 1.57, - "learning_rate": 6.41638003764034e-05, - "loss": 0.0301, + "epoch": 0.94, + "learning_rate": 0.00015927183306763392, + "loss": 0.0447, "step": 145360 }, { - "epoch": 1.57, - "learning_rate": 6.414757609189434e-05, - "loss": 0.0283, + "epoch": 0.94, + "learning_rate": 0.000159262151713277, + "loss": 0.0409, "step": 145370 }, { - "epoch": 1.57, - "learning_rate": 6.41313518073853e-05, - "loss": 0.0347, + "epoch": 0.94, + "learning_rate": 0.00015925247035892005, + "loss": 0.0366, "step": 145380 }, { - "epoch": 1.57, - "learning_rate": 6.411512752287623e-05, - "loss": 0.0261, + "epoch": 0.94, + "learning_rate": 0.00015924278900456313, + "loss": 0.0384, "step": 145390 }, { - "epoch": 1.57, - "learning_rate": 6.409890323836718e-05, - "loss": 0.0269, + "epoch": 0.94, + "learning_rate": 0.0001592331076502062, + "loss": 0.0381, "step": 145400 }, { - "epoch": 1.57, - "learning_rate": 6.408267895385813e-05, - "loss": 0.0284, + "epoch": 0.94, + "learning_rate": 0.00015922342629584926, + "loss": 0.0377, "step": 145410 }, { - "epoch": 1.57, - "learning_rate": 6.406645466934908e-05, - "loss": 0.0326, + "epoch": 0.94, + "learning_rate": 0.00015921374494149234, + "loss": 0.0352, "step": 145420 }, { - "epoch": 1.57, - "learning_rate": 6.405023038484003e-05, - "loss": 0.0312, + "epoch": 0.94, + "learning_rate": 0.0001592040635871354, + "loss": 0.0367, "step": 145430 }, { - "epoch": 1.57, - "learning_rate": 6.403400610033096e-05, - "loss": 0.0259, + "epoch": 0.94, + "learning_rate": 0.00015919438223277845, + "loss": 0.0393, "step": 145440 }, { - "epoch": 1.57, - "learning_rate": 6.401778181582191e-05, - "loss": 0.0263, + "epoch": 0.94, + "learning_rate": 0.00015918470087842153, + "loss": 0.0354, "step": 145450 }, { - "epoch": 1.57, - "learning_rate": 6.400155753131286e-05, - "loss": 0.024, + "epoch": 0.94, + "learning_rate": 0.0001591750195240646, + "loss": 0.0369, "step": 145460 }, { - "epoch": 1.57, - "learning_rate": 6.398533324680381e-05, - "loss": 0.0305, + "epoch": 0.94, + "learning_rate": 0.0001591653381697077, + "loss": 0.0401, "step": 145470 }, { - "epoch": 1.57, - "learning_rate": 6.396910896229476e-05, - "loss": 0.0239, + "epoch": 0.94, + "learning_rate": 0.00015915565681535074, + "loss": 0.0376, "step": 145480 }, { - "epoch": 1.57, - "learning_rate": 6.39528846777857e-05, - "loss": 0.0305, + "epoch": 0.94, + "learning_rate": 0.00015914597546099382, + "loss": 0.0355, "step": 145490 }, { - "epoch": 1.57, - "learning_rate": 6.393666039327665e-05, - "loss": 0.0265, + "epoch": 0.94, + "learning_rate": 0.00015913629410663687, + "loss": 0.0373, "step": 145500 }, { - "epoch": 1.57, - "learning_rate": 6.39204361087676e-05, - "loss": 0.0276, + "epoch": 0.94, + "learning_rate": 0.00015912661275227993, + "loss": 0.0349, "step": 145510 }, { - "epoch": 1.57, - "learning_rate": 6.390421182425855e-05, - "loss": 0.026, + "epoch": 0.94, + "learning_rate": 0.000159116931397923, + "loss": 0.0382, "step": 145520 }, { - "epoch": 1.57, - "learning_rate": 6.388798753974949e-05, - "loss": 0.0289, + "epoch": 0.94, + "learning_rate": 0.00015910725004356609, + "loss": 0.0364, "step": 145530 }, { - "epoch": 1.57, - "learning_rate": 6.387176325524044e-05, - "loss": 0.0235, + "epoch": 0.94, + "learning_rate": 0.00015909756868920917, + "loss": 0.0359, "step": 145540 }, { - "epoch": 1.57, - "learning_rate": 6.385553897073139e-05, - "loss": 0.0221, + "epoch": 0.94, + "learning_rate": 0.00015908788733485222, + "loss": 0.0415, "step": 145550 }, { - "epoch": 1.57, - "learning_rate": 6.383931468622233e-05, - "loss": 0.0326, + "epoch": 0.94, + "learning_rate": 0.0001590782059804953, + "loss": 0.0415, "step": 145560 }, { - "epoch": 1.57, - "learning_rate": 6.382309040171328e-05, - "loss": 0.0273, + "epoch": 0.94, + "learning_rate": 0.00015906852462613835, + "loss": 0.0291, "step": 145570 }, { - "epoch": 1.57, - "learning_rate": 6.380686611720422e-05, - "loss": 0.0294, + "epoch": 0.94, + "learning_rate": 0.0001590588432717814, + "loss": 0.0379, "step": 145580 }, { - "epoch": 1.57, - "learning_rate": 6.379064183269517e-05, - "loss": 0.0294, + "epoch": 0.94, + "learning_rate": 0.00015904916191742448, + "loss": 0.0338, "step": 145590 }, { - "epoch": 1.57, - "learning_rate": 6.377441754818612e-05, - "loss": 0.0321, + "epoch": 0.94, + "learning_rate": 0.00015903948056306756, + "loss": 0.0324, "step": 145600 }, { - "epoch": 1.57, - "learning_rate": 6.375819326367707e-05, - "loss": 0.0251, + "epoch": 0.94, + "learning_rate": 0.00015902979920871062, + "loss": 0.0384, "step": 145610 }, { - "epoch": 1.58, - "learning_rate": 6.3741968979168e-05, - "loss": 0.0284, + "epoch": 0.94, + "learning_rate": 0.0001590201178543537, + "loss": 0.0398, "step": 145620 }, { - "epoch": 1.58, - "learning_rate": 6.372574469465896e-05, - "loss": 0.0268, + "epoch": 0.94, + "learning_rate": 0.00015901043649999678, + "loss": 0.0419, "step": 145630 }, { - "epoch": 1.58, - "learning_rate": 6.37095204101499e-05, - "loss": 0.0277, + "epoch": 0.94, + "learning_rate": 0.0001590007551456398, + "loss": 0.0406, "step": 145640 }, { - "epoch": 1.58, - "learning_rate": 6.369329612564086e-05, - "loss": 0.0293, + "epoch": 0.94, + "learning_rate": 0.00015899107379128288, + "loss": 0.041, "step": 145650 }, { - "epoch": 1.58, - "learning_rate": 6.36770718411318e-05, - "loss": 0.0288, + "epoch": 0.94, + "learning_rate": 0.00015898139243692596, + "loss": 0.0367, "step": 145660 }, { - "epoch": 1.58, - "learning_rate": 6.366084755662274e-05, - "loss": 0.0278, + "epoch": 0.94, + "learning_rate": 0.00015897171108256904, + "loss": 0.0377, "step": 145670 }, { - "epoch": 1.58, - "learning_rate": 6.364462327211369e-05, - "loss": 0.0265, + "epoch": 0.94, + "learning_rate": 0.0001589620297282121, + "loss": 0.0447, "step": 145680 }, { - "epoch": 1.58, - "learning_rate": 6.362839898760464e-05, - "loss": 0.0287, + "epoch": 0.94, + "learning_rate": 0.00015895234837385517, + "loss": 0.0413, "step": 145690 }, { - "epoch": 1.58, - "learning_rate": 6.361217470309559e-05, - "loss": 0.0288, + "epoch": 0.94, + "learning_rate": 0.00015894266701949825, + "loss": 0.0413, "step": 145700 }, { - "epoch": 1.58, - "learning_rate": 6.359595041858653e-05, - "loss": 0.0246, + "epoch": 0.94, + "learning_rate": 0.00015893298566514128, + "loss": 0.0453, "step": 145710 }, { - "epoch": 1.58, - "learning_rate": 6.357972613407748e-05, - "loss": 0.0263, + "epoch": 0.94, + "learning_rate": 0.00015892330431078436, + "loss": 0.0473, "step": 145720 }, { - "epoch": 1.58, - "learning_rate": 6.356350184956843e-05, - "loss": 0.0242, + "epoch": 0.94, + "learning_rate": 0.00015891362295642744, + "loss": 0.0369, "step": 145730 }, { - "epoch": 1.58, - "learning_rate": 6.354727756505938e-05, - "loss": 0.0306, + "epoch": 0.94, + "learning_rate": 0.00015890394160207052, + "loss": 0.0355, "step": 145740 }, { - "epoch": 1.58, - "learning_rate": 6.353105328055033e-05, - "loss": 0.0292, + "epoch": 0.94, + "learning_rate": 0.00015889426024771357, + "loss": 0.0379, "step": 145750 }, { - "epoch": 1.58, - "learning_rate": 6.351482899604126e-05, - "loss": 0.024, + "epoch": 0.94, + "learning_rate": 0.00015888457889335665, + "loss": 0.0473, "step": 145760 }, { - "epoch": 1.58, - "learning_rate": 6.349860471153221e-05, - "loss": 0.0313, + "epoch": 0.94, + "learning_rate": 0.00015887489753899973, + "loss": 0.0393, "step": 145770 }, { - "epoch": 1.58, - "learning_rate": 6.348238042702316e-05, - "loss": 0.0282, + "epoch": 0.94, + "learning_rate": 0.00015886521618464276, + "loss": 0.0392, "step": 145780 }, { - "epoch": 1.58, - "learning_rate": 6.346615614251411e-05, - "loss": 0.0288, + "epoch": 0.94, + "learning_rate": 0.00015885553483028584, + "loss": 0.0349, "step": 145790 }, { - "epoch": 1.58, - "learning_rate": 6.344993185800505e-05, - "loss": 0.03, + "epoch": 0.94, + "learning_rate": 0.00015884585347592892, + "loss": 0.0354, "step": 145800 }, { - "epoch": 1.58, - "learning_rate": 6.3433707573496e-05, - "loss": 0.0262, + "epoch": 0.94, + "learning_rate": 0.00015883617212157197, + "loss": 0.0375, "step": 145810 }, { - "epoch": 1.58, - "learning_rate": 6.341748328898695e-05, - "loss": 0.0261, + "epoch": 0.94, + "learning_rate": 0.00015882649076721505, + "loss": 0.043, "step": 145820 }, { - "epoch": 1.58, - "learning_rate": 6.34012590044779e-05, - "loss": 0.0259, + "epoch": 0.94, + "learning_rate": 0.00015881680941285813, + "loss": 0.0466, "step": 145830 }, { - "epoch": 1.58, - "learning_rate": 6.338503471996885e-05, - "loss": 0.0251, + "epoch": 0.94, + "learning_rate": 0.0001588071280585012, + "loss": 0.0368, "step": 145840 }, { - "epoch": 1.58, - "learning_rate": 6.336881043545978e-05, - "loss": 0.0291, + "epoch": 0.94, + "learning_rate": 0.00015879744670414423, + "loss": 0.04, "step": 145850 }, { - "epoch": 1.58, - "learning_rate": 6.335258615095073e-05, - "loss": 0.0271, + "epoch": 0.94, + "learning_rate": 0.0001587877653497873, + "loss": 0.0357, "step": 145860 }, { - "epoch": 1.58, - "learning_rate": 6.333636186644168e-05, - "loss": 0.0294, + "epoch": 0.94, + "learning_rate": 0.0001587780839954304, + "loss": 0.0341, "step": 145870 }, { - "epoch": 1.58, - "learning_rate": 6.332013758193263e-05, - "loss": 0.0346, + "epoch": 0.94, + "learning_rate": 0.00015876840264107345, + "loss": 0.036, "step": 145880 }, { - "epoch": 1.58, - "learning_rate": 6.330391329742357e-05, - "loss": 0.0304, + "epoch": 0.94, + "learning_rate": 0.00015875872128671653, + "loss": 0.0398, "step": 145890 }, { - "epoch": 1.58, - "learning_rate": 6.328768901291452e-05, - "loss": 0.0315, + "epoch": 0.94, + "learning_rate": 0.0001587490399323596, + "loss": 0.0409, "step": 145900 }, { - "epoch": 1.58, - "learning_rate": 6.327146472840547e-05, - "loss": 0.0295, + "epoch": 0.94, + "learning_rate": 0.00015873935857800268, + "loss": 0.0395, "step": 145910 }, { - "epoch": 1.58, - "learning_rate": 6.325524044389642e-05, - "loss": 0.0257, + "epoch": 0.94, + "learning_rate": 0.0001587296772236457, + "loss": 0.0399, "step": 145920 }, { - "epoch": 1.58, - "learning_rate": 6.323901615938737e-05, - "loss": 0.0263, + "epoch": 0.94, + "learning_rate": 0.0001587199958692888, + "loss": 0.0368, "step": 145930 }, { - "epoch": 1.58, - "learning_rate": 6.32227918748783e-05, - "loss": 0.0318, + "epoch": 0.94, + "learning_rate": 0.00015871031451493187, + "loss": 0.0389, "step": 145940 }, { - "epoch": 1.58, - "learning_rate": 6.320656759036925e-05, - "loss": 0.0294, + "epoch": 0.94, + "learning_rate": 0.00015870063316057492, + "loss": 0.0423, "step": 145950 }, { - "epoch": 1.58, - "learning_rate": 6.31903433058602e-05, - "loss": 0.0249, + "epoch": 0.94, + "learning_rate": 0.000158690951806218, + "loss": 0.0374, "step": 145960 }, { - "epoch": 1.58, - "learning_rate": 6.317411902135115e-05, - "loss": 0.0263, + "epoch": 0.94, + "learning_rate": 0.00015868127045186108, + "loss": 0.04, "step": 145970 }, { - "epoch": 1.58, - "learning_rate": 6.315789473684209e-05, - "loss": 0.0267, + "epoch": 0.94, + "learning_rate": 0.00015867158909750413, + "loss": 0.0471, "step": 145980 }, { - "epoch": 1.58, - "learning_rate": 6.314167045233304e-05, - "loss": 0.0313, + "epoch": 0.94, + "learning_rate": 0.0001586619077431472, + "loss": 0.0362, "step": 145990 }, { - "epoch": 1.58, - "learning_rate": 6.312544616782399e-05, - "loss": 0.0312, + "epoch": 0.94, + "learning_rate": 0.00015865222638879027, + "loss": 0.0383, "step": 146000 }, { - "epoch": 1.58, - "eval_cer": 0.9210915978874122, - "eval_loss": 0.022776592522859573, - "eval_runtime": 119.1144, - "eval_samples_per_second": 16.791, - "eval_steps_per_second": 4.198, + "epoch": 0.94, + "eval_cer": 0.9198969607953904, + "eval_loss": 0.02613520435988903, + "eval_runtime": 119.9802, + "eval_samples_per_second": 16.669, + "eval_steps_per_second": 4.167, "step": 146000 }, { - "epoch": 1.58, - "learning_rate": 6.310922188331494e-05, - "loss": 0.0313, + "epoch": 0.94, + "learning_rate": 0.00015864254503443332, + "loss": 0.041, "step": 146010 }, { - "epoch": 1.58, - "learning_rate": 6.309299759880589e-05, - "loss": 0.03, + "epoch": 0.94, + "learning_rate": 0.0001586328636800764, + "loss": 0.0376, "step": 146020 }, { - "epoch": 1.58, - "learning_rate": 6.307677331429683e-05, - "loss": 0.028, + "epoch": 0.94, + "learning_rate": 0.00015862318232571948, + "loss": 0.0348, "step": 146030 }, { - "epoch": 1.58, - "learning_rate": 6.306054902978777e-05, - "loss": 0.0232, + "epoch": 0.94, + "learning_rate": 0.00015861350097136256, + "loss": 0.0335, "step": 146040 }, { - "epoch": 1.58, - "learning_rate": 6.304432474527872e-05, - "loss": 0.0306, + "epoch": 0.94, + "learning_rate": 0.0001586038196170056, + "loss": 0.0393, "step": 146050 }, { - "epoch": 1.58, - "learning_rate": 6.302810046076967e-05, - "loss": 0.0241, + "epoch": 0.94, + "learning_rate": 0.00015859413826264866, + "loss": 0.0391, "step": 146060 }, { - "epoch": 1.58, - "learning_rate": 6.301187617626061e-05, - "loss": 0.0288, + "epoch": 0.94, + "learning_rate": 0.00015858445690829174, + "loss": 0.0396, "step": 146070 }, { - "epoch": 1.58, - "learning_rate": 6.299565189175157e-05, - "loss": 0.0299, + "epoch": 0.94, + "learning_rate": 0.0001585747755539348, + "loss": 0.0368, "step": 146080 }, { - "epoch": 1.58, - "learning_rate": 6.297942760724252e-05, - "loss": 0.0321, + "epoch": 0.94, + "learning_rate": 0.00015856509419957788, + "loss": 0.0364, "step": 146090 }, { - "epoch": 1.58, - "learning_rate": 6.296320332273346e-05, - "loss": 0.0241, + "epoch": 0.94, + "learning_rate": 0.00015855541284522096, + "loss": 0.044, "step": 146100 }, { - "epoch": 1.58, - "learning_rate": 6.294697903822441e-05, - "loss": 0.0263, + "epoch": 0.94, + "learning_rate": 0.00015854573149086404, + "loss": 0.0406, "step": 146110 }, { - "epoch": 1.58, - "learning_rate": 6.293075475371536e-05, - "loss": 0.0258, + "epoch": 0.94, + "learning_rate": 0.0001585360501365071, + "loss": 0.0359, "step": 146120 }, { - "epoch": 1.58, - "learning_rate": 6.291453046920631e-05, - "loss": 0.0307, + "epoch": 0.94, + "learning_rate": 0.00015852636878215014, + "loss": 0.0351, "step": 146130 }, { - "epoch": 1.58, - "learning_rate": 6.289830618469726e-05, - "loss": 0.0231, + "epoch": 0.94, + "learning_rate": 0.00015851668742779322, + "loss": 0.0391, "step": 146140 }, { - "epoch": 1.58, - "learning_rate": 6.28820819001882e-05, - "loss": 0.0296, + "epoch": 0.94, + "learning_rate": 0.00015850700607343627, + "loss": 0.0406, "step": 146150 }, { - "epoch": 1.58, - "learning_rate": 6.286585761567914e-05, - "loss": 0.03, + "epoch": 0.94, + "learning_rate": 0.00015849732471907935, + "loss": 0.0369, "step": 146160 }, { - "epoch": 1.58, - "learning_rate": 6.28496333311701e-05, - "loss": 0.026, + "epoch": 0.94, + "learning_rate": 0.00015848764336472243, + "loss": 0.0386, "step": 146170 }, { - "epoch": 1.58, - "learning_rate": 6.283340904666104e-05, - "loss": 0.0335, + "epoch": 0.94, + "learning_rate": 0.0001584779620103655, + "loss": 0.0453, "step": 146180 }, { - "epoch": 1.58, - "learning_rate": 6.281718476215198e-05, - "loss": 0.0272, + "epoch": 0.94, + "learning_rate": 0.00015846828065600857, + "loss": 0.0349, "step": 146190 }, { - "epoch": 1.58, - "learning_rate": 6.280096047764293e-05, - "loss": 0.027, + "epoch": 0.94, + "learning_rate": 0.00015845859930165162, + "loss": 0.0346, "step": 146200 }, { - "epoch": 1.58, - "learning_rate": 6.278473619313388e-05, - "loss": 0.0309, + "epoch": 0.94, + "learning_rate": 0.00015844891794729467, + "loss": 0.0395, "step": 146210 }, { - "epoch": 1.58, - "learning_rate": 6.276851190862483e-05, - "loss": 0.0354, + "epoch": 0.94, + "learning_rate": 0.00015843923659293775, + "loss": 0.0397, "step": 146220 }, { - "epoch": 1.58, - "learning_rate": 6.275228762411578e-05, - "loss": 0.0317, + "epoch": 0.94, + "learning_rate": 0.00015842955523858083, + "loss": 0.0361, "step": 146230 }, { - "epoch": 1.58, - "learning_rate": 6.273606333960672e-05, - "loss": 0.0302, + "epoch": 0.94, + "learning_rate": 0.0001584198738842239, + "loss": 0.0286, "step": 146240 }, { - "epoch": 1.58, - "learning_rate": 6.271983905509767e-05, - "loss": 0.0288, + "epoch": 0.94, + "learning_rate": 0.00015841019252986696, + "loss": 0.0442, "step": 146250 }, { - "epoch": 1.58, - "learning_rate": 6.270361477058862e-05, - "loss": 0.0306, + "epoch": 0.94, + "learning_rate": 0.00015840051117551004, + "loss": 0.0383, "step": 146260 }, { - "epoch": 1.58, - "learning_rate": 6.268739048607957e-05, - "loss": 0.0305, + "epoch": 0.94, + "learning_rate": 0.0001583908298211531, + "loss": 0.0431, "step": 146270 }, { - "epoch": 1.58, - "learning_rate": 6.26711662015705e-05, - "loss": 0.0271, + "epoch": 0.94, + "learning_rate": 0.00015838114846679615, + "loss": 0.0406, "step": 146280 }, { - "epoch": 1.58, - "learning_rate": 6.265494191706145e-05, - "loss": 0.0354, + "epoch": 0.94, + "learning_rate": 0.00015837146711243923, + "loss": 0.0365, "step": 146290 }, { - "epoch": 1.58, - "learning_rate": 6.26387176325524e-05, - "loss": 0.0272, + "epoch": 0.94, + "learning_rate": 0.0001583617857580823, + "loss": 0.0392, "step": 146300 }, { - "epoch": 1.58, - "learning_rate": 6.262249334804335e-05, - "loss": 0.0227, + "epoch": 0.94, + "learning_rate": 0.0001583521044037254, + "loss": 0.0317, "step": 146310 }, { - "epoch": 1.58, - "learning_rate": 6.26062690635343e-05, - "loss": 0.0281, + "epoch": 0.94, + "learning_rate": 0.00015834242304936844, + "loss": 0.0324, "step": 146320 }, { - "epoch": 1.58, - "learning_rate": 6.259004477902524e-05, - "loss": 0.0261, + "epoch": 0.94, + "learning_rate": 0.00015833274169501152, + "loss": 0.0369, "step": 146330 }, { - "epoch": 1.58, - "learning_rate": 6.257382049451619e-05, - "loss": 0.027, + "epoch": 0.94, + "learning_rate": 0.00015832306034065457, + "loss": 0.0403, "step": 146340 }, { - "epoch": 1.58, - "learning_rate": 6.255759621000714e-05, - "loss": 0.0264, + "epoch": 0.94, + "learning_rate": 0.00015831337898629763, + "loss": 0.0366, "step": 146350 }, { - "epoch": 1.58, - "learning_rate": 6.254137192549809e-05, - "loss": 0.031, + "epoch": 0.94, + "learning_rate": 0.0001583036976319407, + "loss": 0.0383, "step": 146360 }, { - "epoch": 1.58, - "learning_rate": 6.252514764098902e-05, - "loss": 0.032, + "epoch": 0.94, + "learning_rate": 0.00015829401627758379, + "loss": 0.0375, "step": 146370 }, { - "epoch": 1.58, - "learning_rate": 6.250892335647997e-05, - "loss": 0.0303, + "epoch": 0.94, + "learning_rate": 0.00015828433492322684, + "loss": 0.0404, "step": 146380 }, { - "epoch": 1.58, - "learning_rate": 6.249269907197092e-05, - "loss": 0.0328, + "epoch": 0.94, + "learning_rate": 0.00015827465356886992, + "loss": 0.0429, "step": 146390 }, { - "epoch": 1.58, - "learning_rate": 6.247647478746187e-05, - "loss": 0.0286, + "epoch": 0.94, + "learning_rate": 0.000158264972214513, + "loss": 0.0402, "step": 146400 }, { - "epoch": 1.58, - "learning_rate": 6.246025050295282e-05, - "loss": 0.0295, + "epoch": 0.94, + "learning_rate": 0.00015825529086015602, + "loss": 0.042, "step": 146410 }, { - "epoch": 1.58, - "learning_rate": 6.244402621844376e-05, - "loss": 0.0288, + "epoch": 0.95, + "learning_rate": 0.0001582456095057991, + "loss": 0.0362, "step": 146420 }, { - "epoch": 1.58, - "learning_rate": 6.242780193393471e-05, - "loss": 0.0262, + "epoch": 0.95, + "learning_rate": 0.00015823592815144218, + "loss": 0.0387, "step": 146430 }, { - "epoch": 1.58, - "learning_rate": 6.241157764942566e-05, - "loss": 0.025, + "epoch": 0.95, + "learning_rate": 0.00015822624679708526, + "loss": 0.0411, "step": 146440 }, { - "epoch": 1.58, - "learning_rate": 6.239535336491661e-05, - "loss": 0.026, + "epoch": 0.95, + "learning_rate": 0.00015821656544272832, + "loss": 0.037, "step": 146450 }, { - "epoch": 1.58, - "learning_rate": 6.237912908040754e-05, - "loss": 0.0324, + "epoch": 0.95, + "learning_rate": 0.0001582068840883714, + "loss": 0.0368, "step": 146460 }, { - "epoch": 1.58, - "learning_rate": 6.236290479589849e-05, - "loss": 0.0299, + "epoch": 0.95, + "learning_rate": 0.00015819720273401448, + "loss": 0.0441, "step": 146470 }, { - "epoch": 1.58, - "learning_rate": 6.234668051138944e-05, - "loss": 0.0319, + "epoch": 0.95, + "learning_rate": 0.0001581875213796575, + "loss": 0.0442, "step": 146480 }, { - "epoch": 1.58, - "learning_rate": 6.233045622688039e-05, - "loss": 0.0305, + "epoch": 0.95, + "learning_rate": 0.00015817784002530058, + "loss": 0.0322, "step": 146490 }, { - "epoch": 1.58, - "learning_rate": 6.231423194237134e-05, - "loss": 0.0254, + "epoch": 0.95, + "learning_rate": 0.00015816815867094366, + "loss": 0.043, "step": 146500 }, { - "epoch": 1.58, - "learning_rate": 6.229800765786228e-05, - "loss": 0.0314, + "epoch": 0.95, + "learning_rate": 0.00015815847731658674, + "loss": 0.0403, "step": 146510 }, { - "epoch": 1.58, - "learning_rate": 6.228178337335323e-05, - "loss": 0.0304, + "epoch": 0.95, + "learning_rate": 0.0001581487959622298, + "loss": 0.0372, "step": 146520 }, { - "epoch": 1.58, - "learning_rate": 6.226555908884418e-05, - "loss": 0.0297, + "epoch": 0.95, + "learning_rate": 0.00015813911460787287, + "loss": 0.0388, "step": 146530 }, { - "epoch": 1.58, - "learning_rate": 6.224933480433513e-05, - "loss": 0.0267, + "epoch": 0.95, + "learning_rate": 0.00015812943325351595, + "loss": 0.0347, "step": 146540 }, { - "epoch": 1.59, - "learning_rate": 6.223311051982608e-05, - "loss": 0.0248, + "epoch": 0.95, + "learning_rate": 0.00015811975189915898, + "loss": 0.0416, "step": 146550 }, { - "epoch": 1.59, - "learning_rate": 6.221688623531701e-05, - "loss": 0.0229, + "epoch": 0.95, + "learning_rate": 0.00015811007054480206, + "loss": 0.0401, "step": 146560 }, { - "epoch": 1.59, - "learning_rate": 6.220066195080796e-05, - "loss": 0.0237, + "epoch": 0.95, + "learning_rate": 0.00015810038919044514, + "loss": 0.0455, "step": 146570 }, { - "epoch": 1.59, - "learning_rate": 6.218443766629891e-05, - "loss": 0.0309, + "epoch": 0.95, + "learning_rate": 0.00015809070783608822, + "loss": 0.039, "step": 146580 }, { - "epoch": 1.59, - "learning_rate": 6.216821338178986e-05, - "loss": 0.0298, + "epoch": 0.95, + "learning_rate": 0.00015808102648173127, + "loss": 0.0338, "step": 146590 }, { - "epoch": 1.59, - "learning_rate": 6.21519890972808e-05, - "loss": 0.0215, + "epoch": 0.95, + "learning_rate": 0.00015807134512737435, + "loss": 0.0471, "step": 146600 }, { - "epoch": 1.59, - "learning_rate": 6.213576481277175e-05, - "loss": 0.0299, + "epoch": 0.95, + "learning_rate": 0.00015806166377301743, + "loss": 0.0389, "step": 146610 }, { - "epoch": 1.59, - "learning_rate": 6.21195405282627e-05, - "loss": 0.0232, + "epoch": 0.95, + "learning_rate": 0.00015805198241866046, + "loss": 0.0392, "step": 146620 }, { - "epoch": 1.59, - "learning_rate": 6.210331624375365e-05, - "loss": 0.0265, + "epoch": 0.95, + "learning_rate": 0.00015804230106430354, + "loss": 0.0443, "step": 146630 }, { - "epoch": 1.59, - "learning_rate": 6.20870919592446e-05, - "loss": 0.0273, + "epoch": 0.95, + "learning_rate": 0.00015803261970994661, + "loss": 0.0392, "step": 146640 }, { - "epoch": 1.59, - "learning_rate": 6.207086767473553e-05, - "loss": 0.0292, + "epoch": 0.95, + "learning_rate": 0.00015802293835558967, + "loss": 0.0382, "step": 146650 }, { - "epoch": 1.59, - "learning_rate": 6.205464339022648e-05, - "loss": 0.032, + "epoch": 0.95, + "learning_rate": 0.00015801325700123275, + "loss": 0.0401, "step": 146660 }, { - "epoch": 1.59, - "learning_rate": 6.203841910571743e-05, - "loss": 0.0268, + "epoch": 0.95, + "learning_rate": 0.00015800357564687583, + "loss": 0.0349, "step": 146670 }, { - "epoch": 1.59, - "learning_rate": 6.202219482120838e-05, - "loss": 0.0286, + "epoch": 0.95, + "learning_rate": 0.0001579938942925189, + "loss": 0.0388, "step": 146680 }, { - "epoch": 1.59, - "learning_rate": 6.200597053669932e-05, - "loss": 0.0304, + "epoch": 0.95, + "learning_rate": 0.00015798421293816193, + "loss": 0.0414, "step": 146690 }, { - "epoch": 1.59, - "learning_rate": 6.198974625219027e-05, - "loss": 0.0306, + "epoch": 0.95, + "learning_rate": 0.000157974531583805, + "loss": 0.0492, "step": 146700 }, { - "epoch": 1.59, - "learning_rate": 6.197352196768122e-05, - "loss": 0.0328, + "epoch": 0.95, + "learning_rate": 0.0001579648502294481, + "loss": 0.0387, "step": 146710 }, { - "epoch": 1.59, - "learning_rate": 6.195729768317217e-05, - "loss": 0.0295, + "epoch": 0.95, + "learning_rate": 0.00015795516887509114, + "loss": 0.0467, "step": 146720 }, { - "epoch": 1.59, - "learning_rate": 6.194107339866312e-05, - "loss": 0.0256, + "epoch": 0.95, + "learning_rate": 0.00015794548752073422, + "loss": 0.0401, "step": 146730 }, { - "epoch": 1.59, - "learning_rate": 6.192484911415406e-05, - "loss": 0.042, + "epoch": 0.95, + "learning_rate": 0.0001579358061663773, + "loss": 0.0355, "step": 146740 }, { - "epoch": 1.59, - "learning_rate": 6.1908624829645e-05, - "loss": 0.0264, + "epoch": 0.95, + "learning_rate": 0.00015792612481202038, + "loss": 0.0366, "step": 146750 }, { - "epoch": 1.59, - "learning_rate": 6.189240054513596e-05, - "loss": 0.0333, + "epoch": 0.95, + "learning_rate": 0.0001579164434576634, + "loss": 0.0392, "step": 146760 }, { - "epoch": 1.59, - "learning_rate": 6.18761762606269e-05, - "loss": 0.0301, + "epoch": 0.95, + "learning_rate": 0.0001579067621033065, + "loss": 0.0408, "step": 146770 }, { - "epoch": 1.59, - "learning_rate": 6.185995197611784e-05, - "loss": 0.0325, + "epoch": 0.95, + "learning_rate": 0.00015789708074894957, + "loss": 0.0366, "step": 146780 }, { - "epoch": 1.59, - "learning_rate": 6.184372769160879e-05, - "loss": 0.0286, + "epoch": 0.95, + "learning_rate": 0.00015788739939459262, + "loss": 0.0358, "step": 146790 }, { - "epoch": 1.59, - "learning_rate": 6.182750340709974e-05, - "loss": 0.022, + "epoch": 0.95, + "learning_rate": 0.0001578777180402357, + "loss": 0.0363, "step": 146800 }, { - "epoch": 1.59, - "learning_rate": 6.181127912259069e-05, - "loss": 0.0304, + "epoch": 0.95, + "learning_rate": 0.00015786803668587878, + "loss": 0.0333, "step": 146810 }, { - "epoch": 1.59, - "learning_rate": 6.179505483808164e-05, - "loss": 0.0334, + "epoch": 0.95, + "learning_rate": 0.00015785835533152183, + "loss": 0.0363, "step": 146820 }, { - "epoch": 1.59, - "learning_rate": 6.177883055357258e-05, - "loss": 0.032, + "epoch": 0.95, + "learning_rate": 0.0001578486739771649, + "loss": 0.0398, "step": 146830 }, { - "epoch": 1.59, - "learning_rate": 6.176260626906353e-05, - "loss": 0.0287, + "epoch": 0.95, + "learning_rate": 0.00015783899262280797, + "loss": 0.038, "step": 146840 }, { - "epoch": 1.59, - "learning_rate": 6.174638198455448e-05, - "loss": 0.0248, + "epoch": 0.95, + "learning_rate": 0.00015782931126845102, + "loss": 0.0333, "step": 146850 }, { - "epoch": 1.59, - "learning_rate": 6.173015770004543e-05, - "loss": 0.0217, + "epoch": 0.95, + "learning_rate": 0.0001578196299140941, + "loss": 0.0333, "step": 146860 }, { - "epoch": 1.59, - "learning_rate": 6.171393341553636e-05, - "loss": 0.0291, + "epoch": 0.95, + "learning_rate": 0.00015780994855973718, + "loss": 0.0365, "step": 146870 }, { - "epoch": 1.59, - "learning_rate": 6.169770913102731e-05, - "loss": 0.0251, + "epoch": 0.95, + "learning_rate": 0.00015780026720538026, + "loss": 0.0361, "step": 146880 }, { - "epoch": 1.59, - "learning_rate": 6.168148484651826e-05, - "loss": 0.0252, + "epoch": 0.95, + "learning_rate": 0.0001577905858510233, + "loss": 0.0383, "step": 146890 }, { - "epoch": 1.59, - "learning_rate": 6.166526056200921e-05, - "loss": 0.0296, + "epoch": 0.95, + "learning_rate": 0.00015778090449666636, + "loss": 0.0372, "step": 146900 }, { - "epoch": 1.59, - "learning_rate": 6.164903627750016e-05, - "loss": 0.0351, + "epoch": 0.95, + "learning_rate": 0.00015777122314230944, + "loss": 0.0324, "step": 146910 }, { - "epoch": 1.59, - "learning_rate": 6.16328119929911e-05, - "loss": 0.0262, + "epoch": 0.95, + "learning_rate": 0.0001577615417879525, + "loss": 0.0429, "step": 146920 }, { - "epoch": 1.59, - "learning_rate": 6.161658770848205e-05, - "loss": 0.0255, + "epoch": 0.95, + "learning_rate": 0.00015775186043359558, + "loss": 0.0356, "step": 146930 }, { - "epoch": 1.59, - "learning_rate": 6.1600363423973e-05, - "loss": 0.025, + "epoch": 0.95, + "learning_rate": 0.00015774217907923866, + "loss": 0.0363, "step": 146940 }, { - "epoch": 1.59, - "learning_rate": 6.158413913946395e-05, - "loss": 0.0307, + "epoch": 0.95, + "learning_rate": 0.00015773249772488174, + "loss": 0.0379, "step": 146950 }, { - "epoch": 1.59, - "learning_rate": 6.156791485495488e-05, - "loss": 0.0279, + "epoch": 0.95, + "learning_rate": 0.0001577228163705248, + "loss": 0.0389, "step": 146960 }, { - "epoch": 1.59, - "learning_rate": 6.155169057044583e-05, - "loss": 0.025, + "epoch": 0.95, + "learning_rate": 0.00015771313501616784, + "loss": 0.0429, "step": 146970 }, { - "epoch": 1.59, - "learning_rate": 6.153546628593678e-05, - "loss": 0.0283, + "epoch": 0.95, + "learning_rate": 0.00015770345366181092, + "loss": 0.0318, "step": 146980 }, { - "epoch": 1.59, - "learning_rate": 6.151924200142773e-05, - "loss": 0.0302, + "epoch": 0.95, + "learning_rate": 0.00015769377230745397, + "loss": 0.0457, "step": 146990 }, { - "epoch": 1.59, - "learning_rate": 6.150301771691868e-05, - "loss": 0.0298, + "epoch": 0.95, + "learning_rate": 0.00015768409095309705, + "loss": 0.0396, "step": 147000 }, { - "epoch": 1.59, - "eval_cer": 0.9210739282009962, - "eval_loss": 0.023059368133544922, - "eval_runtime": 118.9803, - "eval_samples_per_second": 16.81, - "eval_steps_per_second": 4.202, + "epoch": 0.95, + "eval_cer": 0.9198553835724776, + "eval_loss": 0.025865597650408745, + "eval_runtime": 120.0422, + "eval_samples_per_second": 16.661, + "eval_steps_per_second": 4.165, "step": 147000 }, { - "epoch": 1.59, - "learning_rate": 6.148679343240962e-05, - "loss": 0.0293, + "epoch": 0.95, + "learning_rate": 0.00015767440959874013, + "loss": 0.039, "step": 147010 }, { - "epoch": 1.59, - "learning_rate": 6.147056914790057e-05, - "loss": 0.0294, + "epoch": 0.95, + "learning_rate": 0.00015766472824438319, + "loss": 0.0467, "step": 147020 }, { - "epoch": 1.59, - "learning_rate": 6.145434486339152e-05, - "loss": 0.0258, + "epoch": 0.95, + "learning_rate": 0.00015765504689002627, + "loss": 0.0376, "step": 147030 }, { - "epoch": 1.59, - "learning_rate": 6.143812057888247e-05, - "loss": 0.0286, + "epoch": 0.95, + "learning_rate": 0.00015764536553566932, + "loss": 0.0404, "step": 147040 }, { - "epoch": 1.59, - "learning_rate": 6.14218962943734e-05, - "loss": 0.0286, + "epoch": 0.95, + "learning_rate": 0.00015763568418131237, + "loss": 0.0419, "step": 147050 }, { - "epoch": 1.59, - "learning_rate": 6.140567200986435e-05, - "loss": 0.0285, + "epoch": 0.95, + "learning_rate": 0.00015762600282695545, + "loss": 0.0366, "step": 147060 }, { - "epoch": 1.59, - "learning_rate": 6.13894477253553e-05, - "loss": 0.0278, + "epoch": 0.95, + "learning_rate": 0.00015761632147259853, + "loss": 0.037, "step": 147070 }, { - "epoch": 1.59, - "learning_rate": 6.137322344084625e-05, - "loss": 0.0316, + "epoch": 0.95, + "learning_rate": 0.0001576066401182416, + "loss": 0.0452, "step": 147080 }, { - "epoch": 1.59, - "learning_rate": 6.13569991563372e-05, - "loss": 0.0325, + "epoch": 0.95, + "learning_rate": 0.00015759695876388466, + "loss": 0.0361, "step": 147090 }, { - "epoch": 1.59, - "learning_rate": 6.134077487182814e-05, - "loss": 0.0284, + "epoch": 0.95, + "learning_rate": 0.00015758727740952774, + "loss": 0.0392, "step": 147100 }, { - "epoch": 1.59, - "learning_rate": 6.132455058731909e-05, - "loss": 0.0308, + "epoch": 0.95, + "learning_rate": 0.0001575775960551708, + "loss": 0.0371, "step": 147110 }, { - "epoch": 1.59, - "learning_rate": 6.130832630281004e-05, - "loss": 0.0307, + "epoch": 0.95, + "learning_rate": 0.00015756791470081385, + "loss": 0.0378, "step": 147120 }, { - "epoch": 1.59, - "learning_rate": 6.129210201830099e-05, - "loss": 0.0343, + "epoch": 0.95, + "learning_rate": 0.00015755823334645693, + "loss": 0.0407, "step": 147130 }, { - "epoch": 1.59, - "learning_rate": 6.127587773379192e-05, - "loss": 0.0289, + "epoch": 0.95, + "learning_rate": 0.0001575485519921, + "loss": 0.04, "step": 147140 }, { - "epoch": 1.59, - "learning_rate": 6.125965344928287e-05, - "loss": 0.0284, + "epoch": 0.95, + "learning_rate": 0.0001575388706377431, + "loss": 0.0348, "step": 147150 }, { - "epoch": 1.59, - "learning_rate": 6.124342916477382e-05, - "loss": 0.0285, + "epoch": 0.95, + "learning_rate": 0.00015752918928338614, + "loss": 0.0355, "step": 147160 }, { - "epoch": 1.59, - "learning_rate": 6.122720488026477e-05, - "loss": 0.0271, + "epoch": 0.95, + "learning_rate": 0.00015751950792902922, + "loss": 0.0426, "step": 147170 }, { - "epoch": 1.59, - "learning_rate": 6.121098059575572e-05, - "loss": 0.03, + "epoch": 0.95, + "learning_rate": 0.00015750982657467227, + "loss": 0.0363, "step": 147180 }, { - "epoch": 1.59, - "learning_rate": 6.119475631124666e-05, - "loss": 0.0307, + "epoch": 0.95, + "learning_rate": 0.00015750014522031533, + "loss": 0.0321, "step": 147190 }, { - "epoch": 1.59, - "learning_rate": 6.117853202673761e-05, - "loss": 0.0274, + "epoch": 0.95, + "learning_rate": 0.0001574904638659584, + "loss": 0.0404, "step": 147200 }, { - "epoch": 1.59, - "learning_rate": 6.116230774222856e-05, - "loss": 0.0256, + "epoch": 0.95, + "learning_rate": 0.00015748078251160149, + "loss": 0.0329, "step": 147210 }, { - "epoch": 1.59, - "learning_rate": 6.114608345771951e-05, - "loss": 0.0256, + "epoch": 0.95, + "learning_rate": 0.00015747110115724454, + "loss": 0.0416, "step": 147220 }, { - "epoch": 1.59, - "learning_rate": 6.112985917321046e-05, - "loss": 0.0308, + "epoch": 0.95, + "learning_rate": 0.00015746141980288762, + "loss": 0.0439, "step": 147230 }, { - "epoch": 1.59, - "learning_rate": 6.11136348887014e-05, - "loss": 0.0264, + "epoch": 0.95, + "learning_rate": 0.0001574517384485307, + "loss": 0.0414, "step": 147240 }, { - "epoch": 1.59, - "learning_rate": 6.109741060419236e-05, - "loss": 0.0292, + "epoch": 0.95, + "learning_rate": 0.00015744205709417372, + "loss": 0.0377, "step": 147250 }, { - "epoch": 1.59, - "learning_rate": 6.10811863196833e-05, - "loss": 0.0316, + "epoch": 0.95, + "learning_rate": 0.0001574323757398168, + "loss": 0.0352, "step": 147260 }, { - "epoch": 1.59, - "learning_rate": 6.106496203517424e-05, - "loss": 0.0251, + "epoch": 0.95, + "learning_rate": 0.00015742269438545988, + "loss": 0.0427, "step": 147270 }, { - "epoch": 1.59, - "learning_rate": 6.10487377506652e-05, - "loss": 0.0306, + "epoch": 0.95, + "learning_rate": 0.00015741301303110296, + "loss": 0.0401, "step": 147280 }, { - "epoch": 1.59, - "learning_rate": 6.1032513466156144e-05, - "loss": 0.029, + "epoch": 0.95, + "learning_rate": 0.00015740333167674602, + "loss": 0.0338, "step": 147290 }, { - "epoch": 1.59, - "learning_rate": 6.101628918164709e-05, - "loss": 0.0266, + "epoch": 0.95, + "learning_rate": 0.0001573936503223891, + "loss": 0.0407, "step": 147300 }, { - "epoch": 1.59, - "learning_rate": 6.1000064897138037e-05, - "loss": 0.0275, + "epoch": 0.95, + "learning_rate": 0.00015738396896803217, + "loss": 0.0347, "step": 147310 }, { - "epoch": 1.59, - "learning_rate": 6.098384061262898e-05, - "loss": 0.0239, + "epoch": 0.95, + "learning_rate": 0.0001573742876136752, + "loss": 0.0364, "step": 147320 }, { - "epoch": 1.59, - "learning_rate": 6.096761632811993e-05, - "loss": 0.0319, + "epoch": 0.95, + "learning_rate": 0.00015736460625931828, + "loss": 0.0368, "step": 147330 }, { - "epoch": 1.59, - "learning_rate": 6.095139204361087e-05, - "loss": 0.0243, + "epoch": 0.95, + "learning_rate": 0.00015735492490496136, + "loss": 0.0445, "step": 147340 }, { - "epoch": 1.59, - "learning_rate": 6.093516775910182e-05, - "loss": 0.0249, + "epoch": 0.95, + "learning_rate": 0.00015734524355060444, + "loss": 0.0368, "step": 147350 }, { - "epoch": 1.59, - "learning_rate": 6.091894347459277e-05, - "loss": 0.0302, + "epoch": 0.95, + "learning_rate": 0.0001573355621962475, + "loss": 0.0462, "step": 147360 }, { - "epoch": 1.59, - "learning_rate": 6.0902719190083715e-05, - "loss": 0.0302, + "epoch": 0.95, + "learning_rate": 0.00015732588084189057, + "loss": 0.034, "step": 147370 }, { - "epoch": 1.59, - "learning_rate": 6.0886494905574665e-05, - "loss": 0.0268, + "epoch": 0.95, + "learning_rate": 0.00015731619948753365, + "loss": 0.0407, "step": 147380 }, { - "epoch": 1.59, - "learning_rate": 6.087027062106561e-05, - "loss": 0.0308, + "epoch": 0.95, + "learning_rate": 0.00015730651813317668, + "loss": 0.0435, "step": 147390 }, { - "epoch": 1.59, - "learning_rate": 6.085404633655656e-05, - "loss": 0.0309, + "epoch": 0.95, + "learning_rate": 0.00015729683677881976, + "loss": 0.0399, "step": 147400 }, { - "epoch": 1.59, - "learning_rate": 6.08378220520475e-05, - "loss": 0.0222, + "epoch": 0.95, + "learning_rate": 0.00015728715542446284, + "loss": 0.0434, "step": 147410 }, { - "epoch": 1.59, - "learning_rate": 6.082159776753845e-05, - "loss": 0.0257, + "epoch": 0.95, + "learning_rate": 0.0001572774740701059, + "loss": 0.0405, "step": 147420 }, { - "epoch": 1.59, - "learning_rate": 6.080537348302939e-05, - "loss": 0.0292, + "epoch": 0.95, + "learning_rate": 0.00015726779271574897, + "loss": 0.0344, "step": 147430 }, { - "epoch": 1.59, - "learning_rate": 6.078914919852034e-05, - "loss": 0.0262, + "epoch": 0.95, + "learning_rate": 0.00015725811136139205, + "loss": 0.0375, "step": 147440 }, { - "epoch": 1.59, - "learning_rate": 6.077292491401129e-05, - "loss": 0.0306, + "epoch": 0.95, + "learning_rate": 0.00015724843000703513, + "loss": 0.0411, "step": 147450 }, { - "epoch": 1.59, - "learning_rate": 6.0756700629502236e-05, - "loss": 0.0292, + "epoch": 0.95, + "learning_rate": 0.00015723874865267816, + "loss": 0.0405, "step": 147460 }, { - "epoch": 1.6, - "learning_rate": 6.0740476344993185e-05, - "loss": 0.0276, + "epoch": 0.95, + "learning_rate": 0.00015722906729832123, + "loss": 0.0383, "step": 147470 }, { - "epoch": 1.6, - "learning_rate": 6.072425206048413e-05, - "loss": 0.0296, + "epoch": 0.95, + "learning_rate": 0.00015721938594396431, + "loss": 0.0426, "step": 147480 }, { - "epoch": 1.6, - "learning_rate": 6.070802777597508e-05, - "loss": 0.0259, + "epoch": 0.95, + "learning_rate": 0.00015720970458960737, + "loss": 0.0409, "step": 147490 }, { - "epoch": 1.6, - "learning_rate": 6.069180349146602e-05, - "loss": 0.0255, + "epoch": 0.95, + "learning_rate": 0.00015720002323525045, + "loss": 0.0351, "step": 147500 }, { - "epoch": 1.6, - "learning_rate": 6.067557920695697e-05, - "loss": 0.0246, + "epoch": 0.95, + "learning_rate": 0.00015719034188089353, + "loss": 0.0371, "step": 147510 }, { - "epoch": 1.6, - "learning_rate": 6.0659354922447914e-05, - "loss": 0.0286, + "epoch": 0.95, + "learning_rate": 0.0001571806605265366, + "loss": 0.0358, "step": 147520 }, { - "epoch": 1.6, - "learning_rate": 6.0643130637938864e-05, - "loss": 0.0321, + "epoch": 0.95, + "learning_rate": 0.00015717097917217963, + "loss": 0.0425, "step": 147530 }, { - "epoch": 1.6, - "learning_rate": 6.0626906353429814e-05, - "loss": 0.0246, + "epoch": 0.95, + "learning_rate": 0.0001571612978178227, + "loss": 0.0398, "step": 147540 }, { - "epoch": 1.6, - "learning_rate": 6.0610682068920757e-05, - "loss": 0.028, + "epoch": 0.95, + "learning_rate": 0.0001571516164634658, + "loss": 0.0401, "step": 147550 }, { - "epoch": 1.6, - "learning_rate": 6.0594457784411706e-05, - "loss": 0.0242, + "epoch": 0.95, + "learning_rate": 0.00015714193510910884, + "loss": 0.0388, "step": 147560 }, { - "epoch": 1.6, - "learning_rate": 6.057823349990265e-05, - "loss": 0.0266, + "epoch": 0.95, + "learning_rate": 0.00015713225375475192, + "loss": 0.0383, "step": 147570 }, { - "epoch": 1.6, - "learning_rate": 6.05620092153936e-05, - "loss": 0.0272, + "epoch": 0.95, + "learning_rate": 0.000157122572400395, + "loss": 0.0353, "step": 147580 }, { - "epoch": 1.6, - "learning_rate": 6.054578493088454e-05, - "loss": 0.0205, + "epoch": 0.95, + "learning_rate": 0.00015711289104603806, + "loss": 0.0409, "step": 147590 }, { - "epoch": 1.6, - "learning_rate": 6.052956064637549e-05, - "loss": 0.023, + "epoch": 0.95, + "learning_rate": 0.0001571032096916811, + "loss": 0.0392, "step": 147600 }, { - "epoch": 1.6, - "learning_rate": 6.0513336361866435e-05, - "loss": 0.0255, + "epoch": 0.95, + "learning_rate": 0.0001570935283373242, + "loss": 0.0354, "step": 147610 }, { - "epoch": 1.6, - "learning_rate": 6.0497112077357385e-05, - "loss": 0.0262, + "epoch": 0.95, + "learning_rate": 0.00015708384698296724, + "loss": 0.0398, "step": 147620 }, { - "epoch": 1.6, - "learning_rate": 6.0480887792848334e-05, - "loss": 0.0291, + "epoch": 0.95, + "learning_rate": 0.00015707416562861032, + "loss": 0.0419, "step": 147630 }, { - "epoch": 1.6, - "learning_rate": 6.046466350833928e-05, - "loss": 0.0293, + "epoch": 0.95, + "learning_rate": 0.0001570644842742534, + "loss": 0.0353, "step": 147640 }, { - "epoch": 1.6, - "learning_rate": 6.044843922383023e-05, - "loss": 0.0312, + "epoch": 0.95, + "learning_rate": 0.00015705480291989648, + "loss": 0.0361, "step": 147650 }, { - "epoch": 1.6, - "learning_rate": 6.043221493932117e-05, - "loss": 0.0281, + "epoch": 0.95, + "learning_rate": 0.00015704512156553953, + "loss": 0.0446, "step": 147660 }, { - "epoch": 1.6, - "learning_rate": 6.041599065481212e-05, - "loss": 0.026, + "epoch": 0.95, + "learning_rate": 0.0001570354402111826, + "loss": 0.0387, "step": 147670 }, { - "epoch": 1.6, - "learning_rate": 6.039976637030306e-05, - "loss": 0.031, + "epoch": 0.95, + "learning_rate": 0.00015702575885682567, + "loss": 0.0351, "step": 147680 }, { - "epoch": 1.6, - "learning_rate": 6.038354208579401e-05, - "loss": 0.0281, + "epoch": 0.95, + "learning_rate": 0.00015701607750246872, + "loss": 0.0362, "step": 147690 }, { - "epoch": 1.6, - "learning_rate": 6.0367317801284956e-05, - "loss": 0.0284, + "epoch": 0.95, + "learning_rate": 0.0001570063961481118, + "loss": 0.0342, "step": 147700 }, { - "epoch": 1.6, - "learning_rate": 6.0351093516775905e-05, - "loss": 0.0289, + "epoch": 0.95, + "learning_rate": 0.00015699671479375488, + "loss": 0.0338, "step": 147710 }, { - "epoch": 1.6, - "learning_rate": 6.0334869232266855e-05, - "loss": 0.0286, + "epoch": 0.95, + "learning_rate": 0.00015698703343939796, + "loss": 0.0376, "step": 147720 }, { - "epoch": 1.6, - "learning_rate": 6.03186449477578e-05, - "loss": 0.0269, + "epoch": 0.95, + "learning_rate": 0.000156977352085041, + "loss": 0.0394, "step": 147730 }, { - "epoch": 1.6, - "learning_rate": 6.030242066324875e-05, - "loss": 0.0274, + "epoch": 0.95, + "learning_rate": 0.00015696767073068406, + "loss": 0.0528, "step": 147740 }, { - "epoch": 1.6, - "learning_rate": 6.028619637873969e-05, - "loss": 0.0305, + "epoch": 0.95, + "learning_rate": 0.00015695798937632714, + "loss": 0.0366, "step": 147750 }, { - "epoch": 1.6, - "learning_rate": 6.026997209423064e-05, - "loss": 0.0288, + "epoch": 0.95, + "learning_rate": 0.0001569483080219702, + "loss": 0.0454, "step": 147760 }, { - "epoch": 1.6, - "learning_rate": 6.0253747809721584e-05, - "loss": 0.0294, + "epoch": 0.95, + "learning_rate": 0.00015693862666761328, + "loss": 0.0365, "step": 147770 }, { - "epoch": 1.6, - "learning_rate": 6.0237523525212533e-05, - "loss": 0.0307, + "epoch": 0.95, + "learning_rate": 0.00015692894531325636, + "loss": 0.037, "step": 147780 }, { - "epoch": 1.6, - "learning_rate": 6.022129924070348e-05, - "loss": 0.0247, + "epoch": 0.95, + "learning_rate": 0.0001569192639588994, + "loss": 0.0395, "step": 147790 }, { - "epoch": 1.6, - "learning_rate": 6.0205074956194426e-05, - "loss": 0.0249, + "epoch": 0.95, + "learning_rate": 0.0001569095826045425, + "loss": 0.0449, "step": 147800 }, { - "epoch": 1.6, - "learning_rate": 6.0188850671685376e-05, - "loss": 0.0306, + "epoch": 0.95, + "learning_rate": 0.00015689990125018554, + "loss": 0.0407, "step": 147810 }, { - "epoch": 1.6, - "learning_rate": 6.017262638717632e-05, - "loss": 0.0245, + "epoch": 0.95, + "learning_rate": 0.0001568902198958286, + "loss": 0.0404, "step": 147820 }, { - "epoch": 1.6, - "learning_rate": 6.015640210266727e-05, - "loss": 0.0302, + "epoch": 0.95, + "learning_rate": 0.00015688053854147167, + "loss": 0.0328, "step": 147830 }, { - "epoch": 1.6, - "learning_rate": 6.014017781815821e-05, - "loss": 0.0252, + "epoch": 0.95, + "learning_rate": 0.00015687085718711475, + "loss": 0.0334, "step": 147840 }, { - "epoch": 1.6, - "learning_rate": 6.012395353364916e-05, - "loss": 0.024, + "epoch": 0.95, + "learning_rate": 0.00015686117583275783, + "loss": 0.0456, "step": 147850 }, { - "epoch": 1.6, - "learning_rate": 6.0107729249140105e-05, - "loss": 0.0281, + "epoch": 0.95, + "learning_rate": 0.00015685149447840089, + "loss": 0.0355, "step": 147860 }, { - "epoch": 1.6, - "learning_rate": 6.0091504964631054e-05, - "loss": 0.0257, + "epoch": 0.95, + "learning_rate": 0.00015684181312404397, + "loss": 0.042, "step": 147870 }, { - "epoch": 1.6, - "learning_rate": 6.0075280680122004e-05, - "loss": 0.0286, + "epoch": 0.95, + "learning_rate": 0.00015683213176968702, + "loss": 0.0478, "step": 147880 }, { - "epoch": 1.6, - "learning_rate": 6.005905639561295e-05, - "loss": 0.0322, + "epoch": 0.95, + "learning_rate": 0.00015682245041533007, + "loss": 0.033, "step": 147890 }, { - "epoch": 1.6, - "learning_rate": 6.00428321111039e-05, - "loss": 0.0329, + "epoch": 0.95, + "learning_rate": 0.00015681276906097315, + "loss": 0.0397, "step": 147900 }, { - "epoch": 1.6, - "learning_rate": 6.002660782659484e-05, - "loss": 0.031, + "epoch": 0.95, + "learning_rate": 0.00015680308770661623, + "loss": 0.0367, "step": 147910 }, { - "epoch": 1.6, - "learning_rate": 6.001038354208579e-05, - "loss": 0.0266, + "epoch": 0.95, + "learning_rate": 0.0001567934063522593, + "loss": 0.0378, "step": 147920 }, { - "epoch": 1.6, - "learning_rate": 5.999415925757673e-05, - "loss": 0.0238, + "epoch": 0.95, + "learning_rate": 0.00015678372499790236, + "loss": 0.0358, "step": 147930 }, { - "epoch": 1.6, - "learning_rate": 5.997793497306768e-05, - "loss": 0.029, + "epoch": 0.95, + "learning_rate": 0.00015677404364354544, + "loss": 0.0418, "step": 147940 }, { - "epoch": 1.6, - "learning_rate": 5.9961710688558625e-05, - "loss": 0.027, + "epoch": 0.95, + "learning_rate": 0.0001567643622891885, + "loss": 0.0383, "step": 147950 }, { - "epoch": 1.6, - "learning_rate": 5.9945486404049575e-05, - "loss": 0.0331, + "epoch": 0.95, + "learning_rate": 0.00015675468093483155, + "loss": 0.0366, "step": 147960 }, { - "epoch": 1.6, - "learning_rate": 5.9929262119540525e-05, - "loss": 0.0234, + "epoch": 0.96, + "learning_rate": 0.00015674499958047463, + "loss": 0.0429, "step": 147970 }, { - "epoch": 1.6, - "learning_rate": 5.991303783503147e-05, - "loss": 0.0338, + "epoch": 0.96, + "learning_rate": 0.0001567353182261177, + "loss": 0.0343, "step": 147980 }, { - "epoch": 1.6, - "learning_rate": 5.989681355052242e-05, - "loss": 0.0291, + "epoch": 0.96, + "learning_rate": 0.00015672563687176076, + "loss": 0.0539, "step": 147990 }, { - "epoch": 1.6, - "learning_rate": 5.988058926601336e-05, - "loss": 0.0281, + "epoch": 0.96, + "learning_rate": 0.00015671595551740384, + "loss": 0.0405, "step": 148000 }, { - "epoch": 1.6, - "eval_cer": 0.9211525583055478, - "eval_loss": 0.022573284804821014, - "eval_runtime": 119.1258, - "eval_samples_per_second": 16.789, - "eval_steps_per_second": 4.197, + "epoch": 0.96, + "eval_cer": 0.9198861145633261, + "eval_loss": 0.025960681959986687, + "eval_runtime": 119.8751, + "eval_samples_per_second": 16.684, + "eval_steps_per_second": 4.171, "step": 148000 }, { - "epoch": 1.6, - "learning_rate": 5.986436498150431e-05, - "loss": 0.0248, + "epoch": 0.96, + "learning_rate": 0.00015670627416304692, + "loss": 0.0314, "step": 148010 }, { - "epoch": 1.6, - "learning_rate": 5.9848140696995253e-05, - "loss": 0.0289, + "epoch": 0.96, + "learning_rate": 0.00015669659280868995, + "loss": 0.0357, "step": 148020 }, { - "epoch": 1.6, - "learning_rate": 5.98319164124862e-05, - "loss": 0.0325, + "epoch": 0.96, + "learning_rate": 0.00015668691145433303, + "loss": 0.0404, "step": 148030 }, { - "epoch": 1.6, - "learning_rate": 5.9815692127977146e-05, - "loss": 0.0238, + "epoch": 0.96, + "learning_rate": 0.0001566772300999761, + "loss": 0.0365, "step": 148040 }, { - "epoch": 1.6, - "learning_rate": 5.9799467843468096e-05, - "loss": 0.0278, + "epoch": 0.96, + "learning_rate": 0.00015666754874561919, + "loss": 0.0374, "step": 148050 }, { - "epoch": 1.6, - "learning_rate": 5.9783243558959046e-05, - "loss": 0.0258, + "epoch": 0.96, + "learning_rate": 0.00015665786739126224, + "loss": 0.0398, "step": 148060 }, { - "epoch": 1.6, - "learning_rate": 5.976701927444999e-05, - "loss": 0.033, + "epoch": 0.96, + "learning_rate": 0.00015664818603690532, + "loss": 0.0456, "step": 148070 }, { - "epoch": 1.6, - "learning_rate": 5.975079498994094e-05, - "loss": 0.0227, + "epoch": 0.96, + "learning_rate": 0.00015663850468254837, + "loss": 0.0348, "step": 148080 }, { - "epoch": 1.6, - "learning_rate": 5.973457070543188e-05, - "loss": 0.0254, + "epoch": 0.96, + "learning_rate": 0.00015662882332819142, + "loss": 0.0376, "step": 148090 }, { - "epoch": 1.6, - "learning_rate": 5.971834642092283e-05, - "loss": 0.0253, + "epoch": 0.96, + "learning_rate": 0.0001566191419738345, + "loss": 0.0396, "step": 148100 }, { - "epoch": 1.6, - "learning_rate": 5.9702122136413774e-05, - "loss": 0.0296, + "epoch": 0.96, + "learning_rate": 0.00015660946061947758, + "loss": 0.0393, "step": 148110 }, { - "epoch": 1.6, - "learning_rate": 5.9685897851904724e-05, - "loss": 0.0302, + "epoch": 0.96, + "learning_rate": 0.00015659977926512066, + "loss": 0.0374, "step": 148120 }, { - "epoch": 1.6, - "learning_rate": 5.9669673567395674e-05, - "loss": 0.0257, + "epoch": 0.96, + "learning_rate": 0.00015659009791076372, + "loss": 0.0426, "step": 148130 }, { - "epoch": 1.6, - "learning_rate": 5.965344928288662e-05, - "loss": 0.0288, + "epoch": 0.96, + "learning_rate": 0.0001565804165564068, + "loss": 0.0351, "step": 148140 }, { - "epoch": 1.6, - "learning_rate": 5.9637224998377567e-05, - "loss": 0.0278, + "epoch": 0.96, + "learning_rate": 0.00015657073520204985, + "loss": 0.0364, "step": 148150 }, { - "epoch": 1.6, - "learning_rate": 5.962100071386851e-05, - "loss": 0.0256, + "epoch": 0.96, + "learning_rate": 0.0001565610538476929, + "loss": 0.0413, "step": 148160 }, { - "epoch": 1.6, - "learning_rate": 5.960477642935946e-05, - "loss": 0.0264, + "epoch": 0.96, + "learning_rate": 0.00015655137249333598, + "loss": 0.0344, "step": 148170 }, { - "epoch": 1.6, - "learning_rate": 5.95885521448504e-05, - "loss": 0.0277, + "epoch": 0.96, + "learning_rate": 0.00015654169113897906, + "loss": 0.035, "step": 148180 }, { - "epoch": 1.6, - "learning_rate": 5.957232786034135e-05, - "loss": 0.0294, + "epoch": 0.96, + "learning_rate": 0.0001565320097846221, + "loss": 0.0417, "step": 148190 }, { - "epoch": 1.6, - "learning_rate": 5.9556103575832295e-05, - "loss": 0.0286, + "epoch": 0.96, + "learning_rate": 0.0001565223284302652, + "loss": 0.0349, "step": 148200 }, { - "epoch": 1.6, - "learning_rate": 5.9539879291323245e-05, - "loss": 0.0312, + "epoch": 0.96, + "learning_rate": 0.00015651264707590827, + "loss": 0.0405, "step": 148210 }, { - "epoch": 1.6, - "learning_rate": 5.9523655006814195e-05, - "loss": 0.0322, + "epoch": 0.96, + "learning_rate": 0.0001565029657215513, + "loss": 0.0426, "step": 148220 }, { - "epoch": 1.6, - "learning_rate": 5.950743072230514e-05, - "loss": 0.0274, + "epoch": 0.96, + "learning_rate": 0.00015649328436719438, + "loss": 0.0364, "step": 148230 }, { - "epoch": 1.6, - "learning_rate": 5.949120643779609e-05, - "loss": 0.0225, + "epoch": 0.96, + "learning_rate": 0.00015648360301283746, + "loss": 0.0356, "step": 148240 }, { - "epoch": 1.6, - "learning_rate": 5.947498215328703e-05, - "loss": 0.0283, + "epoch": 0.96, + "learning_rate": 0.00015647392165848054, + "loss": 0.0353, "step": 148250 }, { - "epoch": 1.6, - "learning_rate": 5.945875786877798e-05, - "loss": 0.027, + "epoch": 0.96, + "learning_rate": 0.0001564642403041236, + "loss": 0.043, "step": 148260 }, { - "epoch": 1.6, - "learning_rate": 5.944253358426892e-05, - "loss": 0.0352, + "epoch": 0.96, + "learning_rate": 0.00015645455894976667, + "loss": 0.0402, "step": 148270 }, { - "epoch": 1.6, - "learning_rate": 5.942630929975987e-05, - "loss": 0.029, + "epoch": 0.96, + "learning_rate": 0.00015644487759540975, + "loss": 0.039, "step": 148280 }, { - "epoch": 1.6, - "learning_rate": 5.9410085015250816e-05, - "loss": 0.0257, + "epoch": 0.96, + "learning_rate": 0.00015643519624105277, + "loss": 0.0365, "step": 148290 }, { - "epoch": 1.6, - "learning_rate": 5.9393860730741766e-05, - "loss": 0.0283, + "epoch": 0.96, + "learning_rate": 0.00015642551488669585, + "loss": 0.0373, "step": 148300 }, { - "epoch": 1.6, - "learning_rate": 5.9377636446232715e-05, - "loss": 0.0268, + "epoch": 0.96, + "learning_rate": 0.00015641583353233893, + "loss": 0.0321, "step": 148310 }, { - "epoch": 1.6, - "learning_rate": 5.936141216172366e-05, - "loss": 0.0263, + "epoch": 0.96, + "learning_rate": 0.00015640615217798201, + "loss": 0.0353, "step": 148320 }, { - "epoch": 1.6, - "learning_rate": 5.934518787721461e-05, - "loss": 0.0248, + "epoch": 0.96, + "learning_rate": 0.00015639647082362507, + "loss": 0.039, "step": 148330 }, { - "epoch": 1.6, - "learning_rate": 5.932896359270555e-05, - "loss": 0.0258, + "epoch": 0.96, + "learning_rate": 0.00015638678946926815, + "loss": 0.0429, "step": 148340 }, { - "epoch": 1.6, - "learning_rate": 5.93127393081965e-05, - "loss": 0.0282, + "epoch": 0.96, + "learning_rate": 0.00015637710811491123, + "loss": 0.035, "step": 148350 }, { - "epoch": 1.6, - "learning_rate": 5.9296515023687444e-05, - "loss": 0.0256, + "epoch": 0.96, + "learning_rate": 0.00015636742676055425, + "loss": 0.0575, "step": 148360 }, { - "epoch": 1.6, - "learning_rate": 5.9280290739178394e-05, - "loss": 0.0293, + "epoch": 0.96, + "learning_rate": 0.00015635774540619733, + "loss": 0.0481, "step": 148370 }, { - "epoch": 1.6, - "learning_rate": 5.926406645466934e-05, - "loss": 0.0264, + "epoch": 0.96, + "learning_rate": 0.0001563480640518404, + "loss": 0.0352, "step": 148380 }, { - "epoch": 1.6, - "learning_rate": 5.9247842170160287e-05, - "loss": 0.0272, + "epoch": 0.96, + "learning_rate": 0.00015633838269748346, + "loss": 0.0369, "step": 148390 }, { - "epoch": 1.61, - "learning_rate": 5.9231617885651236e-05, - "loss": 0.0295, + "epoch": 0.96, + "learning_rate": 0.00015632870134312654, + "loss": 0.0325, "step": 148400 }, { - "epoch": 1.61, - "learning_rate": 5.921539360114218e-05, - "loss": 0.0248, + "epoch": 0.96, + "learning_rate": 0.00015631901998876962, + "loss": 0.0458, "step": 148410 }, { - "epoch": 1.61, - "learning_rate": 5.9199169316633136e-05, - "loss": 0.0333, + "epoch": 0.96, + "learning_rate": 0.0001563093386344127, + "loss": 0.0425, "step": 148420 }, { - "epoch": 1.61, - "learning_rate": 5.9182945032124086e-05, - "loss": 0.0259, + "epoch": 0.96, + "learning_rate": 0.00015629965728005573, + "loss": 0.0332, "step": 148430 }, { - "epoch": 1.61, - "learning_rate": 5.916672074761503e-05, - "loss": 0.0258, + "epoch": 0.96, + "learning_rate": 0.0001562899759256988, + "loss": 0.0323, "step": 148440 }, { - "epoch": 1.61, - "learning_rate": 5.915049646310598e-05, - "loss": 0.0269, + "epoch": 0.96, + "learning_rate": 0.0001562802945713419, + "loss": 0.037, "step": 148450 }, { - "epoch": 1.61, - "learning_rate": 5.913427217859692e-05, - "loss": 0.0338, + "epoch": 0.96, + "learning_rate": 0.00015627061321698494, + "loss": 0.0469, "step": 148460 }, { - "epoch": 1.61, - "learning_rate": 5.911804789408787e-05, - "loss": 0.0251, + "epoch": 0.96, + "learning_rate": 0.00015626093186262802, + "loss": 0.0368, "step": 148470 }, { - "epoch": 1.61, - "learning_rate": 5.9101823609578814e-05, - "loss": 0.0337, + "epoch": 0.96, + "learning_rate": 0.0001562512505082711, + "loss": 0.0444, "step": 148480 }, { - "epoch": 1.61, - "learning_rate": 5.9085599325069764e-05, - "loss": 0.0306, + "epoch": 0.96, + "learning_rate": 0.00015624156915391418, + "loss": 0.0321, "step": 148490 }, { - "epoch": 1.61, - "learning_rate": 5.906937504056071e-05, - "loss": 0.0293, + "epoch": 0.96, + "learning_rate": 0.0001562318877995572, + "loss": 0.0499, "step": 148500 }, { - "epoch": 1.61, - "learning_rate": 5.905315075605166e-05, - "loss": 0.0309, + "epoch": 0.96, + "learning_rate": 0.00015622220644520029, + "loss": 0.034, "step": 148510 }, { - "epoch": 1.61, - "learning_rate": 5.9036926471542606e-05, - "loss": 0.0311, + "epoch": 0.96, + "learning_rate": 0.00015621252509084337, + "loss": 0.0405, "step": 148520 }, { - "epoch": 1.61, - "learning_rate": 5.902070218703355e-05, - "loss": 0.0298, + "epoch": 0.96, + "learning_rate": 0.00015620284373648642, + "loss": 0.0407, "step": 148530 }, { - "epoch": 1.61, - "learning_rate": 5.90044779025245e-05, - "loss": 0.0413, + "epoch": 0.96, + "learning_rate": 0.0001561931623821295, + "loss": 0.0486, "step": 148540 }, { - "epoch": 1.61, - "learning_rate": 5.898825361801544e-05, - "loss": 0.0309, + "epoch": 0.96, + "learning_rate": 0.00015618348102777258, + "loss": 0.0434, "step": 148550 }, { - "epoch": 1.61, - "learning_rate": 5.897202933350639e-05, - "loss": 0.0295, + "epoch": 0.96, + "learning_rate": 0.00015617379967341566, + "loss": 0.0437, "step": 148560 }, { - "epoch": 1.61, - "learning_rate": 5.8955805048997335e-05, - "loss": 0.026, + "epoch": 0.96, + "learning_rate": 0.00015616411831905868, + "loss": 0.0441, "step": 148570 }, { - "epoch": 1.61, - "learning_rate": 5.8939580764488285e-05, - "loss": 0.0344, + "epoch": 0.96, + "learning_rate": 0.00015615443696470176, + "loss": 0.0385, "step": 148580 }, { - "epoch": 1.61, - "learning_rate": 5.892335647997923e-05, - "loss": 0.025, + "epoch": 0.96, + "learning_rate": 0.00015614475561034482, + "loss": 0.0391, "step": 148590 }, { - "epoch": 1.61, - "learning_rate": 5.890713219547018e-05, - "loss": 0.0275, + "epoch": 0.96, + "learning_rate": 0.0001561350742559879, + "loss": 0.0329, "step": 148600 }, { - "epoch": 1.61, - "learning_rate": 5.889090791096113e-05, - "loss": 0.0268, + "epoch": 0.96, + "learning_rate": 0.00015612539290163098, + "loss": 0.0372, "step": 148610 }, { - "epoch": 1.61, - "learning_rate": 5.887468362645207e-05, - "loss": 0.024, + "epoch": 0.96, + "learning_rate": 0.00015611571154727406, + "loss": 0.0355, "step": 148620 }, { - "epoch": 1.61, - "learning_rate": 5.885845934194302e-05, - "loss": 0.0262, + "epoch": 0.96, + "learning_rate": 0.0001561060301929171, + "loss": 0.0409, "step": 148630 }, { - "epoch": 1.61, - "learning_rate": 5.884223505743396e-05, - "loss": 0.0314, + "epoch": 0.96, + "learning_rate": 0.00015609634883856016, + "loss": 0.0362, "step": 148640 }, { - "epoch": 1.61, - "learning_rate": 5.882601077292491e-05, - "loss": 0.0296, + "epoch": 0.96, + "learning_rate": 0.00015608666748420324, + "loss": 0.0393, "step": 148650 }, { - "epoch": 1.61, - "learning_rate": 5.8809786488415856e-05, - "loss": 0.0271, + "epoch": 0.96, + "learning_rate": 0.0001560769861298463, + "loss": 0.0352, "step": 148660 }, { - "epoch": 1.61, - "learning_rate": 5.8793562203906806e-05, - "loss": 0.0236, + "epoch": 0.96, + "learning_rate": 0.00015606730477548937, + "loss": 0.0405, "step": 148670 }, { - "epoch": 1.61, - "learning_rate": 5.877733791939775e-05, - "loss": 0.033, + "epoch": 0.96, + "learning_rate": 0.00015605762342113245, + "loss": 0.0377, "step": 148680 }, { - "epoch": 1.61, - "learning_rate": 5.87611136348887e-05, - "loss": 0.0231, + "epoch": 0.96, + "learning_rate": 0.00015604794206677553, + "loss": 0.033, "step": 148690 }, { - "epoch": 1.61, - "learning_rate": 5.874488935037965e-05, - "loss": 0.0298, + "epoch": 0.96, + "learning_rate": 0.00015603826071241859, + "loss": 0.0434, "step": 148700 }, { - "epoch": 1.61, - "learning_rate": 5.872866506587059e-05, - "loss": 0.0234, + "epoch": 0.96, + "learning_rate": 0.00015602857935806164, + "loss": 0.0443, "step": 148710 }, { - "epoch": 1.61, - "learning_rate": 5.871244078136154e-05, - "loss": 0.0277, + "epoch": 0.96, + "learning_rate": 0.00015601889800370472, + "loss": 0.0396, "step": 148720 }, { - "epoch": 1.61, - "learning_rate": 5.8696216496852484e-05, - "loss": 0.0313, + "epoch": 0.96, + "learning_rate": 0.00015600921664934777, + "loss": 0.0386, "step": 148730 }, { - "epoch": 1.61, - "learning_rate": 5.8679992212343434e-05, - "loss": 0.0261, + "epoch": 0.96, + "learning_rate": 0.00015599953529499085, + "loss": 0.0479, "step": 148740 }, { - "epoch": 1.61, - "learning_rate": 5.866376792783438e-05, - "loss": 0.0269, + "epoch": 0.96, + "learning_rate": 0.00015598985394063393, + "loss": 0.041, "step": 148750 }, { - "epoch": 1.61, - "learning_rate": 5.8647543643325326e-05, - "loss": 0.0328, + "epoch": 0.96, + "learning_rate": 0.000155980172586277, + "loss": 0.0386, "step": 148760 }, { - "epoch": 1.61, - "learning_rate": 5.863131935881627e-05, - "loss": 0.0279, + "epoch": 0.96, + "learning_rate": 0.00015597049123192006, + "loss": 0.0392, "step": 148770 }, { - "epoch": 1.61, - "learning_rate": 5.861509507430722e-05, - "loss": 0.0323, + "epoch": 0.96, + "learning_rate": 0.00015596080987756312, + "loss": 0.036, "step": 148780 }, { - "epoch": 1.61, - "learning_rate": 5.859887078979817e-05, - "loss": 0.0297, + "epoch": 0.96, + "learning_rate": 0.00015595112852320617, + "loss": 0.036, "step": 148790 }, { - "epoch": 1.61, - "learning_rate": 5.858264650528911e-05, - "loss": 0.0259, + "epoch": 0.96, + "learning_rate": 0.00015594144716884925, + "loss": 0.0355, "step": 148800 }, { - "epoch": 1.61, - "learning_rate": 5.856642222078006e-05, - "loss": 0.0274, + "epoch": 0.96, + "learning_rate": 0.00015593176581449233, + "loss": 0.0431, "step": 148810 }, { - "epoch": 1.61, - "learning_rate": 5.8550197936271005e-05, - "loss": 0.0284, + "epoch": 0.96, + "learning_rate": 0.0001559220844601354, + "loss": 0.0388, "step": 148820 }, { - "epoch": 1.61, - "learning_rate": 5.8533973651761954e-05, - "loss": 0.0284, + "epoch": 0.96, + "learning_rate": 0.00015591240310577846, + "loss": 0.0365, "step": 148830 }, { - "epoch": 1.61, - "learning_rate": 5.85177493672529e-05, - "loss": 0.0253, + "epoch": 0.96, + "learning_rate": 0.00015590272175142154, + "loss": 0.0385, "step": 148840 }, { - "epoch": 1.61, - "learning_rate": 5.850152508274385e-05, - "loss": 0.026, + "epoch": 0.96, + "learning_rate": 0.0001558930403970646, + "loss": 0.0406, "step": 148850 }, { - "epoch": 1.61, - "learning_rate": 5.84853007982348e-05, - "loss": 0.025, + "epoch": 0.96, + "learning_rate": 0.00015588335904270765, + "loss": 0.0348, "step": 148860 }, { - "epoch": 1.61, - "learning_rate": 5.846907651372574e-05, - "loss": 0.0277, + "epoch": 0.96, + "learning_rate": 0.00015587367768835073, + "loss": 0.043, "step": 148870 }, { - "epoch": 1.61, - "learning_rate": 5.845285222921669e-05, - "loss": 0.0242, + "epoch": 0.96, + "learning_rate": 0.0001558639963339938, + "loss": 0.0362, "step": 148880 }, { - "epoch": 1.61, - "learning_rate": 5.843662794470763e-05, - "loss": 0.032, + "epoch": 0.96, + "learning_rate": 0.00015585431497963688, + "loss": 0.0394, "step": 148890 }, { - "epoch": 1.61, - "learning_rate": 5.842040366019858e-05, - "loss": 0.0261, + "epoch": 0.96, + "learning_rate": 0.00015584463362527994, + "loss": 0.0374, "step": 148900 }, { - "epoch": 1.61, - "learning_rate": 5.8404179375689526e-05, - "loss": 0.0275, + "epoch": 0.96, + "learning_rate": 0.00015583495227092302, + "loss": 0.0467, "step": 148910 }, { - "epoch": 1.61, - "learning_rate": 5.8387955091180475e-05, - "loss": 0.0288, + "epoch": 0.96, + "learning_rate": 0.00015582527091656607, + "loss": 0.045, "step": 148920 }, { - "epoch": 1.61, - "learning_rate": 5.837173080667142e-05, - "loss": 0.034, + "epoch": 0.96, + "learning_rate": 0.00015581558956220912, + "loss": 0.0465, "step": 148930 }, { - "epoch": 1.61, - "learning_rate": 5.835550652216237e-05, - "loss": 0.0289, + "epoch": 0.96, + "learning_rate": 0.0001558059082078522, + "loss": 0.0378, "step": 148940 }, { - "epoch": 1.61, - "learning_rate": 5.833928223765332e-05, - "loss": 0.0358, + "epoch": 0.96, + "learning_rate": 0.00015579622685349528, + "loss": 0.0413, "step": 148950 }, { - "epoch": 1.61, - "learning_rate": 5.832305795314426e-05, - "loss": 0.0288, + "epoch": 0.96, + "learning_rate": 0.00015578654549913836, + "loss": 0.0397, "step": 148960 }, { - "epoch": 1.61, - "learning_rate": 5.830683366863521e-05, - "loss": 0.03, + "epoch": 0.96, + "learning_rate": 0.00015577686414478141, + "loss": 0.0363, "step": 148970 }, { - "epoch": 1.61, - "learning_rate": 5.8290609384126154e-05, - "loss": 0.0299, + "epoch": 0.96, + "learning_rate": 0.0001557671827904245, + "loss": 0.0481, "step": 148980 }, { - "epoch": 1.61, - "learning_rate": 5.82743850996171e-05, - "loss": 0.0264, + "epoch": 0.96, + "learning_rate": 0.00015575750143606752, + "loss": 0.0466, "step": 148990 }, { - "epoch": 1.61, - "learning_rate": 5.8258160815108046e-05, - "loss": 0.029, + "epoch": 0.96, + "learning_rate": 0.0001557478200817106, + "loss": 0.0433, "step": 149000 }, { - "epoch": 1.61, - "eval_cer": 0.9210995492462996, - "eval_loss": 0.022670477628707886, - "eval_runtime": 119.0552, - "eval_samples_per_second": 16.799, - "eval_steps_per_second": 4.2, + "epoch": 0.96, + "eval_cer": 0.919936730312959, + "eval_loss": 0.025839416310191154, + "eval_runtime": 119.7309, + "eval_samples_per_second": 16.704, + "eval_steps_per_second": 4.176, "step": 149000 }, { - "epoch": 1.61, - "learning_rate": 5.8241936530598996e-05, - "loss": 0.0348, + "epoch": 0.96, + "learning_rate": 0.00015573813872735368, + "loss": 0.0354, "step": 149010 }, { - "epoch": 1.61, - "learning_rate": 5.822571224608994e-05, - "loss": 0.0253, + "epoch": 0.96, + "learning_rate": 0.00015572845737299676, + "loss": 0.0353, "step": 149020 }, { - "epoch": 1.61, - "learning_rate": 5.820948796158089e-05, - "loss": 0.0298, + "epoch": 0.96, + "learning_rate": 0.0001557187760186398, + "loss": 0.0358, "step": 149030 }, { - "epoch": 1.61, - "learning_rate": 5.819326367707184e-05, - "loss": 0.03, + "epoch": 0.96, + "learning_rate": 0.0001557090946642829, + "loss": 0.0546, "step": 149040 }, { - "epoch": 1.61, - "learning_rate": 5.817703939256278e-05, - "loss": 0.0284, + "epoch": 0.96, + "learning_rate": 0.00015569941330992597, + "loss": 0.0436, "step": 149050 }, { - "epoch": 1.61, - "learning_rate": 5.816081510805373e-05, - "loss": 0.0287, + "epoch": 0.96, + "learning_rate": 0.000155689731955569, + "loss": 0.0369, "step": 149060 }, { - "epoch": 1.61, - "learning_rate": 5.8144590823544674e-05, - "loss": 0.0292, + "epoch": 0.96, + "learning_rate": 0.00015568005060121208, + "loss": 0.041, "step": 149070 }, { - "epoch": 1.61, - "learning_rate": 5.8128366539035624e-05, - "loss": 0.0237, + "epoch": 0.96, + "learning_rate": 0.00015567036924685516, + "loss": 0.0374, "step": 149080 }, { - "epoch": 1.61, - "learning_rate": 5.811214225452657e-05, - "loss": 0.0328, + "epoch": 0.96, + "learning_rate": 0.00015566068789249824, + "loss": 0.0366, "step": 149090 }, { - "epoch": 1.61, - "learning_rate": 5.809591797001752e-05, - "loss": 0.0311, + "epoch": 0.96, + "learning_rate": 0.0001556510065381413, + "loss": 0.0358, "step": 149100 }, { - "epoch": 1.61, - "learning_rate": 5.807969368550846e-05, - "loss": 0.0275, + "epoch": 0.96, + "learning_rate": 0.00015564132518378437, + "loss": 0.0375, "step": 149110 }, { - "epoch": 1.61, - "learning_rate": 5.806346940099941e-05, - "loss": 0.0266, + "epoch": 0.96, + "learning_rate": 0.00015563164382942745, + "loss": 0.0347, "step": 149120 }, { - "epoch": 1.61, - "learning_rate": 5.804724511649036e-05, - "loss": 0.0279, + "epoch": 0.96, + "learning_rate": 0.00015562196247507047, + "loss": 0.0363, "step": 149130 }, { - "epoch": 1.61, - "learning_rate": 5.80310208319813e-05, - "loss": 0.0272, + "epoch": 0.96, + "learning_rate": 0.00015561228112071355, + "loss": 0.0462, "step": 149140 }, { - "epoch": 1.61, - "learning_rate": 5.801479654747225e-05, - "loss": 0.0248, + "epoch": 0.96, + "learning_rate": 0.00015560259976635663, + "loss": 0.0369, "step": 149150 }, { - "epoch": 1.61, - "learning_rate": 5.7998572262963195e-05, - "loss": 0.0271, + "epoch": 0.96, + "learning_rate": 0.00015559291841199971, + "loss": 0.0406, "step": 149160 }, { - "epoch": 1.61, - "learning_rate": 5.7982347978454145e-05, - "loss": 0.0241, + "epoch": 0.96, + "learning_rate": 0.00015558323705764277, + "loss": 0.038, "step": 149170 }, { - "epoch": 1.61, - "learning_rate": 5.796612369394509e-05, - "loss": 0.0367, + "epoch": 0.96, + "learning_rate": 0.00015557355570328585, + "loss": 0.0402, "step": 149180 }, { - "epoch": 1.61, - "learning_rate": 5.794989940943604e-05, - "loss": 0.0272, + "epoch": 0.96, + "learning_rate": 0.00015556387434892893, + "loss": 0.0338, "step": 149190 }, { - "epoch": 1.61, - "learning_rate": 5.793367512492699e-05, - "loss": 0.029, + "epoch": 0.96, + "learning_rate": 0.00015555419299457195, + "loss": 0.0384, "step": 149200 }, { - "epoch": 1.61, - "learning_rate": 5.791745084041793e-05, - "loss": 0.0289, + "epoch": 0.96, + "learning_rate": 0.00015554451164021503, + "loss": 0.0304, "step": 149210 }, { - "epoch": 1.61, - "learning_rate": 5.790122655590888e-05, - "loss": 0.0308, + "epoch": 0.96, + "learning_rate": 0.0001555348302858581, + "loss": 0.0439, "step": 149220 }, { - "epoch": 1.61, - "learning_rate": 5.788500227139982e-05, - "loss": 0.0239, + "epoch": 0.96, + "learning_rate": 0.00015552514893150116, + "loss": 0.0399, "step": 149230 }, { - "epoch": 1.61, - "learning_rate": 5.786877798689077e-05, - "loss": 0.0331, + "epoch": 0.96, + "learning_rate": 0.00015551546757714424, + "loss": 0.0373, "step": 149240 }, { - "epoch": 1.61, - "learning_rate": 5.7852553702381716e-05, - "loss": 0.0298, + "epoch": 0.96, + "learning_rate": 0.00015550578622278732, + "loss": 0.0377, "step": 149250 }, { - "epoch": 1.61, - "learning_rate": 5.7836329417872666e-05, - "loss": 0.0256, + "epoch": 0.96, + "learning_rate": 0.0001554961048684304, + "loss": 0.0347, "step": 149260 }, { - "epoch": 1.61, - "learning_rate": 5.782010513336361e-05, - "loss": 0.0258, + "epoch": 0.96, + "learning_rate": 0.00015548642351407343, + "loss": 0.0401, "step": 149270 }, { - "epoch": 1.61, - "learning_rate": 5.780388084885456e-05, - "loss": 0.0243, + "epoch": 0.96, + "learning_rate": 0.0001554767421597165, + "loss": 0.0441, "step": 149280 }, { - "epoch": 1.61, - "learning_rate": 5.778765656434551e-05, - "loss": 0.0277, + "epoch": 0.96, + "learning_rate": 0.0001554670608053596, + "loss": 0.0388, "step": 149290 }, { - "epoch": 1.61, - "learning_rate": 5.777143227983645e-05, - "loss": 0.0259, + "epoch": 0.96, + "learning_rate": 0.00015545737945100264, + "loss": 0.0423, "step": 149300 }, { - "epoch": 1.61, - "learning_rate": 5.77552079953274e-05, - "loss": 0.0289, + "epoch": 0.96, + "learning_rate": 0.00015544769809664572, + "loss": 0.0311, "step": 149310 }, { - "epoch": 1.62, - "learning_rate": 5.7738983710818344e-05, - "loss": 0.0356, + "epoch": 0.96, + "learning_rate": 0.0001554380167422888, + "loss": 0.041, "step": 149320 }, { - "epoch": 1.62, - "learning_rate": 5.7722759426309294e-05, - "loss": 0.0291, + "epoch": 0.96, + "learning_rate": 0.00015542833538793188, + "loss": 0.0385, "step": 149330 }, { - "epoch": 1.62, - "learning_rate": 5.770653514180024e-05, - "loss": 0.0251, + "epoch": 0.96, + "learning_rate": 0.0001554186540335749, + "loss": 0.041, "step": 149340 }, { - "epoch": 1.62, - "learning_rate": 5.769031085729119e-05, - "loss": 0.0258, + "epoch": 0.96, + "learning_rate": 0.00015540897267921799, + "loss": 0.0342, "step": 149350 }, { - "epoch": 1.62, - "learning_rate": 5.767408657278213e-05, - "loss": 0.0306, + "epoch": 0.96, + "learning_rate": 0.00015539929132486107, + "loss": 0.0377, "step": 149360 }, { - "epoch": 1.62, - "learning_rate": 5.765786228827308e-05, - "loss": 0.0273, + "epoch": 0.96, + "learning_rate": 0.00015538960997050412, + "loss": 0.0317, "step": 149370 }, { - "epoch": 1.62, - "learning_rate": 5.764163800376403e-05, - "loss": 0.0314, + "epoch": 0.96, + "learning_rate": 0.0001553799286161472, + "loss": 0.0338, "step": 149380 }, { - "epoch": 1.62, - "learning_rate": 5.762541371925497e-05, - "loss": 0.0288, + "epoch": 0.96, + "learning_rate": 0.00015537024726179028, + "loss": 0.0346, "step": 149390 }, { - "epoch": 1.62, - "learning_rate": 5.760918943474592e-05, - "loss": 0.0318, + "epoch": 0.96, + "learning_rate": 0.00015536056590743333, + "loss": 0.0428, "step": 149400 }, { - "epoch": 1.62, - "learning_rate": 5.7592965150236865e-05, - "loss": 0.0314, + "epoch": 0.96, + "learning_rate": 0.00015535088455307638, + "loss": 0.0354, "step": 149410 }, { - "epoch": 1.62, - "learning_rate": 5.7576740865727815e-05, - "loss": 0.0302, + "epoch": 0.96, + "learning_rate": 0.00015534120319871946, + "loss": 0.0383, "step": 149420 }, { - "epoch": 1.62, - "learning_rate": 5.756051658121876e-05, - "loss": 0.0241, + "epoch": 0.96, + "learning_rate": 0.00015533152184436252, + "loss": 0.0398, "step": 149430 }, { - "epoch": 1.62, - "learning_rate": 5.754429229670971e-05, - "loss": 0.0292, + "epoch": 0.96, + "learning_rate": 0.0001553218404900056, + "loss": 0.0369, "step": 149440 }, { - "epoch": 1.62, - "learning_rate": 5.752806801220065e-05, - "loss": 0.0253, + "epoch": 0.96, + "learning_rate": 0.00015531215913564868, + "loss": 0.037, "step": 149450 }, { - "epoch": 1.62, - "learning_rate": 5.75118437276916e-05, - "loss": 0.026, + "epoch": 0.96, + "learning_rate": 0.00015530247778129176, + "loss": 0.0386, "step": 149460 }, { - "epoch": 1.62, - "learning_rate": 5.749561944318255e-05, - "loss": 0.0297, + "epoch": 0.96, + "learning_rate": 0.0001552927964269348, + "loss": 0.046, "step": 149470 }, { - "epoch": 1.62, - "learning_rate": 5.747939515867349e-05, - "loss": 0.0237, + "epoch": 0.96, + "learning_rate": 0.00015528311507257786, + "loss": 0.0466, "step": 149480 }, { - "epoch": 1.62, - "learning_rate": 5.746317087416444e-05, - "loss": 0.0244, + "epoch": 0.96, + "learning_rate": 0.00015527343371822094, + "loss": 0.0371, "step": 149490 }, { - "epoch": 1.62, - "learning_rate": 5.7446946589655386e-05, - "loss": 0.0239, + "epoch": 0.96, + "learning_rate": 0.000155263752363864, + "loss": 0.0417, "step": 149500 }, { - "epoch": 1.62, - "learning_rate": 5.7430722305146336e-05, - "loss": 0.0334, + "epoch": 0.96, + "learning_rate": 0.00015525407100950707, + "loss": 0.041, "step": 149510 }, { - "epoch": 1.62, - "learning_rate": 5.741449802063728e-05, - "loss": 0.0271, + "epoch": 0.97, + "learning_rate": 0.00015524438965515015, + "loss": 0.0344, "step": 149520 }, { - "epoch": 1.62, - "learning_rate": 5.739827373612823e-05, - "loss": 0.0306, + "epoch": 0.97, + "learning_rate": 0.00015523470830079323, + "loss": 0.0368, "step": 149530 }, { - "epoch": 1.62, - "learning_rate": 5.738204945161918e-05, - "loss": 0.0257, - "step": 149540 + "epoch": 0.97, + "learning_rate": 0.00015522502694643629, + "loss": 0.0313, + "step": 149540 }, { - "epoch": 1.62, - "learning_rate": 5.736582516711012e-05, - "loss": 0.0303, + "epoch": 0.97, + "learning_rate": 0.00015521534559207934, + "loss": 0.0371, "step": 149550 }, { - "epoch": 1.62, - "learning_rate": 5.734960088260107e-05, - "loss": 0.0325, + "epoch": 0.97, + "learning_rate": 0.00015520566423772242, + "loss": 0.0368, "step": 149560 }, { - "epoch": 1.62, - "learning_rate": 5.7333376598092014e-05, - "loss": 0.0263, + "epoch": 0.97, + "learning_rate": 0.00015519598288336547, + "loss": 0.0354, "step": 149570 }, { - "epoch": 1.62, - "learning_rate": 5.7317152313582964e-05, - "loss": 0.0309, + "epoch": 0.97, + "learning_rate": 0.00015518630152900855, + "loss": 0.0394, "step": 149580 }, { - "epoch": 1.62, - "learning_rate": 5.730092802907391e-05, - "loss": 0.0268, + "epoch": 0.97, + "learning_rate": 0.00015517662017465163, + "loss": 0.0357, "step": 149590 }, { - "epoch": 1.62, - "learning_rate": 5.728470374456486e-05, - "loss": 0.0241, + "epoch": 0.97, + "learning_rate": 0.00015516693882029468, + "loss": 0.0407, "step": 149600 }, { - "epoch": 1.62, - "learning_rate": 5.726847946005581e-05, - "loss": 0.0319, + "epoch": 0.97, + "learning_rate": 0.00015515725746593776, + "loss": 0.0464, "step": 149610 }, { - "epoch": 1.62, - "learning_rate": 5.7252255175546756e-05, - "loss": 0.0262, + "epoch": 0.97, + "learning_rate": 0.00015514757611158082, + "loss": 0.035, "step": 149620 }, { - "epoch": 1.62, - "learning_rate": 5.7236030891037706e-05, - "loss": 0.026, + "epoch": 0.97, + "learning_rate": 0.00015513789475722387, + "loss": 0.0482, "step": 149630 }, { - "epoch": 1.62, - "learning_rate": 5.721980660652865e-05, - "loss": 0.0289, + "epoch": 0.97, + "learning_rate": 0.00015512821340286695, + "loss": 0.033, "step": 149640 }, { - "epoch": 1.62, - "learning_rate": 5.72035823220196e-05, - "loss": 0.0351, + "epoch": 0.97, + "learning_rate": 0.00015511853204851003, + "loss": 0.0421, "step": 149650 }, { - "epoch": 1.62, - "learning_rate": 5.718735803751054e-05, - "loss": 0.0272, + "epoch": 0.97, + "learning_rate": 0.0001551088506941531, + "loss": 0.038, "step": 149660 }, { - "epoch": 1.62, - "learning_rate": 5.717113375300149e-05, - "loss": 0.026, + "epoch": 0.97, + "learning_rate": 0.00015509916933979616, + "loss": 0.0417, "step": 149670 }, { - "epoch": 1.62, - "learning_rate": 5.715490946849244e-05, - "loss": 0.0264, + "epoch": 0.97, + "learning_rate": 0.00015508948798543924, + "loss": 0.0415, "step": 149680 }, { - "epoch": 1.62, - "learning_rate": 5.7138685183983384e-05, - "loss": 0.0239, + "epoch": 0.97, + "learning_rate": 0.0001550798066310823, + "loss": 0.0405, "step": 149690 }, { - "epoch": 1.62, - "learning_rate": 5.7122460899474334e-05, - "loss": 0.0243, + "epoch": 0.97, + "learning_rate": 0.00015507012527672534, + "loss": 0.034, "step": 149700 }, { - "epoch": 1.62, - "learning_rate": 5.710623661496528e-05, - "loss": 0.0269, + "epoch": 0.97, + "learning_rate": 0.00015506044392236842, + "loss": 0.0386, "step": 149710 }, { - "epoch": 1.62, - "learning_rate": 5.7090012330456227e-05, - "loss": 0.031, + "epoch": 0.97, + "learning_rate": 0.0001550507625680115, + "loss": 0.0444, "step": 149720 }, { - "epoch": 1.62, - "learning_rate": 5.707378804594717e-05, - "loss": 0.0291, + "epoch": 0.97, + "learning_rate": 0.00015504108121365458, + "loss": 0.0398, "step": 149730 }, { - "epoch": 1.62, - "learning_rate": 5.705756376143812e-05, - "loss": 0.0268, + "epoch": 0.97, + "learning_rate": 0.00015503139985929764, + "loss": 0.0349, "step": 149740 }, { - "epoch": 1.62, - "learning_rate": 5.704133947692906e-05, - "loss": 0.0246, + "epoch": 0.97, + "learning_rate": 0.00015502171850494072, + "loss": 0.039, "step": 149750 }, { - "epoch": 1.62, - "learning_rate": 5.702511519242001e-05, - "loss": 0.0259, + "epoch": 0.97, + "learning_rate": 0.00015501203715058377, + "loss": 0.0375, "step": 149760 }, { - "epoch": 1.62, - "learning_rate": 5.700889090791096e-05, - "loss": 0.0265, + "epoch": 0.97, + "learning_rate": 0.00015500235579622682, + "loss": 0.0343, "step": 149770 }, { - "epoch": 1.62, - "learning_rate": 5.6992666623401905e-05, - "loss": 0.0268, + "epoch": 0.97, + "learning_rate": 0.0001549926744418699, + "loss": 0.0359, "step": 149780 }, { - "epoch": 1.62, - "learning_rate": 5.6976442338892855e-05, - "loss": 0.03, + "epoch": 0.97, + "learning_rate": 0.00015498299308751298, + "loss": 0.0394, "step": 149790 }, { - "epoch": 1.62, - "learning_rate": 5.69602180543838e-05, - "loss": 0.028, + "epoch": 0.97, + "learning_rate": 0.00015497331173315603, + "loss": 0.0368, "step": 149800 }, { - "epoch": 1.62, - "learning_rate": 5.694399376987475e-05, - "loss": 0.0262, + "epoch": 0.97, + "learning_rate": 0.00015496363037879911, + "loss": 0.0341, "step": 149810 }, { - "epoch": 1.62, - "learning_rate": 5.692776948536569e-05, - "loss": 0.0233, + "epoch": 0.97, + "learning_rate": 0.0001549539490244422, + "loss": 0.0437, "step": 149820 }, { - "epoch": 1.62, - "learning_rate": 5.691154520085664e-05, - "loss": 0.0215, + "epoch": 0.97, + "learning_rate": 0.00015494426767008522, + "loss": 0.0452, "step": 149830 }, { - "epoch": 1.62, - "learning_rate": 5.689532091634758e-05, - "loss": 0.0297, + "epoch": 0.97, + "learning_rate": 0.0001549345863157283, + "loss": 0.0433, "step": 149840 }, { - "epoch": 1.62, - "learning_rate": 5.687909663183853e-05, - "loss": 0.0254, + "epoch": 0.97, + "learning_rate": 0.00015492490496137138, + "loss": 0.0389, "step": 149850 }, { - "epoch": 1.62, - "learning_rate": 5.686287234732948e-05, - "loss": 0.0284, + "epoch": 0.97, + "learning_rate": 0.00015491522360701446, + "loss": 0.0413, "step": 149860 }, { - "epoch": 1.62, - "learning_rate": 5.6846648062820426e-05, - "loss": 0.0343, + "epoch": 0.97, + "learning_rate": 0.0001549055422526575, + "loss": 0.0334, "step": 149870 }, { - "epoch": 1.62, - "learning_rate": 5.6830423778311375e-05, - "loss": 0.0285, + "epoch": 0.97, + "learning_rate": 0.0001548958608983006, + "loss": 0.0389, "step": 149880 }, { - "epoch": 1.62, - "learning_rate": 5.681419949380232e-05, - "loss": 0.0305, + "epoch": 0.97, + "learning_rate": 0.00015488617954394367, + "loss": 0.0406, "step": 149890 }, { - "epoch": 1.62, - "learning_rate": 5.679797520929327e-05, - "loss": 0.0261, + "epoch": 0.97, + "learning_rate": 0.0001548764981895867, + "loss": 0.0366, "step": 149900 }, { - "epoch": 1.62, - "learning_rate": 5.678175092478421e-05, - "loss": 0.0313, + "epoch": 0.97, + "learning_rate": 0.00015486681683522978, + "loss": 0.0344, "step": 149910 }, { - "epoch": 1.62, - "learning_rate": 5.676552664027516e-05, - "loss": 0.0265, + "epoch": 0.97, + "learning_rate": 0.00015485713548087286, + "loss": 0.0366, "step": 149920 }, { - "epoch": 1.62, - "learning_rate": 5.674930235576611e-05, - "loss": 0.0328, + "epoch": 0.97, + "learning_rate": 0.00015484745412651594, + "loss": 0.0378, "step": 149930 }, { - "epoch": 1.62, - "learning_rate": 5.6733078071257054e-05, - "loss": 0.025, + "epoch": 0.97, + "learning_rate": 0.000154837772772159, + "loss": 0.0365, "step": 149940 }, { - "epoch": 1.62, - "learning_rate": 5.6716853786748004e-05, - "loss": 0.0265, + "epoch": 0.97, + "learning_rate": 0.00015482809141780207, + "loss": 0.0363, "step": 149950 }, { - "epoch": 1.62, - "learning_rate": 5.6700629502238947e-05, - "loss": 0.0255, + "epoch": 0.97, + "learning_rate": 0.00015481841006344515, + "loss": 0.0402, "step": 149960 }, { - "epoch": 1.62, - "learning_rate": 5.6684405217729896e-05, - "loss": 0.0268, + "epoch": 0.97, + "learning_rate": 0.00015480872870908817, + "loss": 0.042, "step": 149970 }, { - "epoch": 1.62, - "learning_rate": 5.666818093322084e-05, - "loss": 0.027, + "epoch": 0.97, + "learning_rate": 0.00015479904735473125, + "loss": 0.0349, "step": 149980 }, { - "epoch": 1.62, - "learning_rate": 5.665195664871179e-05, - "loss": 0.0297, + "epoch": 0.97, + "learning_rate": 0.00015478936600037433, + "loss": 0.0389, "step": 149990 }, { - "epoch": 1.62, - "learning_rate": 5.663573236420273e-05, - "loss": 0.0324, + "epoch": 0.97, + "learning_rate": 0.00015477968464601739, + "loss": 0.0378, "step": 150000 }, { - "epoch": 1.62, - "eval_cer": 0.9211136849954323, - "eval_loss": 0.02247888222336769, - "eval_runtime": 118.8982, - "eval_samples_per_second": 16.821, - "eval_steps_per_second": 4.205, + "epoch": 0.97, + "eval_cer": 0.9199909614732799, + "eval_loss": 0.026005547493696213, + "eval_runtime": 119.8926, + "eval_samples_per_second": 16.682, + "eval_steps_per_second": 4.17, "step": 150000 }, { - "epoch": 1.62, - "learning_rate": 5.661950807969368e-05, - "loss": 0.028, + "epoch": 0.97, + "learning_rate": 0.00015477000329166047, + "loss": 0.0436, "step": 150010 }, { - "epoch": 1.62, - "learning_rate": 5.660328379518463e-05, - "loss": 0.0327, + "epoch": 0.97, + "learning_rate": 0.00015476032193730355, + "loss": 0.0347, "step": 150020 }, { - "epoch": 1.62, - "learning_rate": 5.6587059510675575e-05, - "loss": 0.0245, + "epoch": 0.97, + "learning_rate": 0.00015475064058294663, + "loss": 0.0352, "step": 150030 }, { - "epoch": 1.62, - "learning_rate": 5.6570835226166524e-05, - "loss": 0.0271, + "epoch": 0.97, + "learning_rate": 0.00015474095922858965, + "loss": 0.0415, "step": 150040 }, { - "epoch": 1.62, - "learning_rate": 5.655461094165747e-05, - "loss": 0.0311, + "epoch": 0.97, + "learning_rate": 0.00015473127787423273, + "loss": 0.0391, "step": 150050 }, { - "epoch": 1.62, - "learning_rate": 5.653838665714842e-05, - "loss": 0.0286, + "epoch": 0.97, + "learning_rate": 0.0001547215965198758, + "loss": 0.0401, "step": 150060 }, { - "epoch": 1.62, - "learning_rate": 5.652216237263936e-05, - "loss": 0.0304, + "epoch": 0.97, + "learning_rate": 0.00015471191516551886, + "loss": 0.0407, "step": 150070 }, { - "epoch": 1.62, - "learning_rate": 5.650593808813031e-05, - "loss": 0.0274, + "epoch": 0.97, + "learning_rate": 0.00015470223381116194, + "loss": 0.043, "step": 150080 }, { - "epoch": 1.62, - "learning_rate": 5.648971380362125e-05, - "loss": 0.0258, + "epoch": 0.97, + "learning_rate": 0.00015469255245680502, + "loss": 0.0432, "step": 150090 }, { - "epoch": 1.62, - "learning_rate": 5.64734895191122e-05, - "loss": 0.0336, + "epoch": 0.97, + "learning_rate": 0.0001546828711024481, + "loss": 0.0341, "step": 150100 }, { - "epoch": 1.62, - "learning_rate": 5.645726523460315e-05, - "loss": 0.0252, + "epoch": 0.97, + "learning_rate": 0.00015467318974809113, + "loss": 0.0436, "step": 150110 }, { - "epoch": 1.62, - "learning_rate": 5.6441040950094095e-05, - "loss": 0.0222, + "epoch": 0.97, + "learning_rate": 0.0001546635083937342, + "loss": 0.0445, "step": 150120 }, { - "epoch": 1.62, - "learning_rate": 5.6424816665585045e-05, - "loss": 0.024, + "epoch": 0.97, + "learning_rate": 0.0001546538270393773, + "loss": 0.0388, "step": 150130 }, { - "epoch": 1.62, - "learning_rate": 5.640859238107599e-05, - "loss": 0.027, + "epoch": 0.97, + "learning_rate": 0.00015464414568502034, + "loss": 0.0377, "step": 150140 }, { - "epoch": 1.62, - "learning_rate": 5.639236809656694e-05, - "loss": 0.0325, + "epoch": 0.97, + "learning_rate": 0.00015463446433066342, + "loss": 0.04, "step": 150150 }, { - "epoch": 1.62, - "learning_rate": 5.637614381205788e-05, - "loss": 0.033, + "epoch": 0.97, + "learning_rate": 0.0001546247829763065, + "loss": 0.0361, "step": 150160 }, { - "epoch": 1.62, - "learning_rate": 5.635991952754883e-05, - "loss": 0.0278, + "epoch": 0.97, + "learning_rate": 0.00015461510162194955, + "loss": 0.0368, "step": 150170 }, { - "epoch": 1.62, - "learning_rate": 5.6343695243039774e-05, - "loss": 0.0311, + "epoch": 0.97, + "learning_rate": 0.0001546054202675926, + "loss": 0.0377, "step": 150180 }, { - "epoch": 1.62, - "learning_rate": 5.6327470958530723e-05, - "loss": 0.0234, + "epoch": 0.97, + "learning_rate": 0.00015459573891323569, + "loss": 0.0352, "step": 150190 }, { - "epoch": 1.62, - "learning_rate": 5.631124667402167e-05, - "loss": 0.0336, + "epoch": 0.97, + "learning_rate": 0.00015458605755887874, + "loss": 0.036, "step": 150200 }, { - "epoch": 1.62, - "learning_rate": 5.6295022389512616e-05, - "loss": 0.0293, + "epoch": 0.97, + "learning_rate": 0.00015457637620452182, + "loss": 0.0325, "step": 150210 }, { - "epoch": 1.62, - "learning_rate": 5.6278798105003566e-05, - "loss": 0.0282, + "epoch": 0.97, + "learning_rate": 0.0001545666948501649, + "loss": 0.0414, "step": 150220 }, { - "epoch": 1.62, - "learning_rate": 5.626257382049451e-05, - "loss": 0.0337, + "epoch": 0.97, + "learning_rate": 0.00015455701349580798, + "loss": 0.038, "step": 150230 }, { - "epoch": 1.63, - "learning_rate": 5.624634953598546e-05, - "loss": 0.0368, + "epoch": 0.97, + "learning_rate": 0.00015454733214145103, + "loss": 0.033, "step": 150240 }, { - "epoch": 1.63, - "learning_rate": 5.62301252514764e-05, - "loss": 0.0248, + "epoch": 0.97, + "learning_rate": 0.00015453765078709408, + "loss": 0.0421, "step": 150250 }, { - "epoch": 1.63, - "learning_rate": 5.621390096696735e-05, - "loss": 0.0303, + "epoch": 0.97, + "learning_rate": 0.00015452796943273716, + "loss": 0.038, "step": 150260 }, { - "epoch": 1.63, - "learning_rate": 5.61976766824583e-05, - "loss": 0.0254, + "epoch": 0.97, + "learning_rate": 0.00015451828807838022, + "loss": 0.0437, "step": 150270 }, { - "epoch": 1.63, - "learning_rate": 5.6181452397949244e-05, - "loss": 0.0264, + "epoch": 0.97, + "learning_rate": 0.0001545086067240233, + "loss": 0.0367, "step": 150280 }, { - "epoch": 1.63, - "learning_rate": 5.6165228113440194e-05, - "loss": 0.0301, + "epoch": 0.97, + "learning_rate": 0.00015449892536966638, + "loss": 0.0424, "step": 150290 }, { - "epoch": 1.63, - "learning_rate": 5.614900382893114e-05, - "loss": 0.0275, + "epoch": 0.97, + "learning_rate": 0.00015448924401530945, + "loss": 0.0457, "step": 150300 }, { - "epoch": 1.63, - "learning_rate": 5.613277954442209e-05, - "loss": 0.0246, + "epoch": 0.97, + "learning_rate": 0.0001544795626609525, + "loss": 0.0434, "step": 150310 }, { - "epoch": 1.63, - "learning_rate": 5.611655525991303e-05, - "loss": 0.0243, + "epoch": 0.97, + "learning_rate": 0.00015446988130659556, + "loss": 0.0466, "step": 150320 }, { - "epoch": 1.63, - "learning_rate": 5.610033097540398e-05, - "loss": 0.0267, + "epoch": 0.97, + "learning_rate": 0.00015446019995223864, + "loss": 0.0428, "step": 150330 }, { - "epoch": 1.63, - "learning_rate": 5.608410669089492e-05, - "loss": 0.0299, + "epoch": 0.97, + "learning_rate": 0.0001544505185978817, + "loss": 0.0432, "step": 150340 }, { - "epoch": 1.63, - "learning_rate": 5.606788240638587e-05, - "loss": 0.0276, + "epoch": 0.97, + "learning_rate": 0.00015444083724352477, + "loss": 0.0357, "step": 150350 }, { - "epoch": 1.63, - "learning_rate": 5.605165812187682e-05, - "loss": 0.023, + "epoch": 0.97, + "learning_rate": 0.00015443115588916785, + "loss": 0.0372, "step": 150360 }, { - "epoch": 1.63, - "learning_rate": 5.6035433837367765e-05, - "loss": 0.0264, + "epoch": 0.97, + "learning_rate": 0.0001544214745348109, + "loss": 0.0378, "step": 150370 }, { - "epoch": 1.63, - "learning_rate": 5.6019209552858715e-05, - "loss": 0.0269, + "epoch": 0.97, + "learning_rate": 0.00015441179318045398, + "loss": 0.0415, "step": 150380 }, { - "epoch": 1.63, - "learning_rate": 5.600298526834966e-05, - "loss": 0.0283, + "epoch": 0.97, + "learning_rate": 0.00015440211182609704, + "loss": 0.0408, "step": 150390 }, { - "epoch": 1.63, - "learning_rate": 5.598676098384061e-05, - "loss": 0.0274, + "epoch": 0.97, + "learning_rate": 0.0001543924304717401, + "loss": 0.0393, "step": 150400 }, { - "epoch": 1.63, - "learning_rate": 5.597053669933155e-05, - "loss": 0.0278, + "epoch": 0.97, + "learning_rate": 0.00015438274911738317, + "loss": 0.0369, "step": 150410 }, { - "epoch": 1.63, - "learning_rate": 5.59543124148225e-05, - "loss": 0.0257, + "epoch": 0.97, + "learning_rate": 0.00015437306776302625, + "loss": 0.0344, "step": 150420 }, { - "epoch": 1.63, - "learning_rate": 5.5938088130313443e-05, - "loss": 0.0325, + "epoch": 0.97, + "learning_rate": 0.00015436338640866933, + "loss": 0.0345, "step": 150430 }, { - "epoch": 1.63, - "learning_rate": 5.592186384580439e-05, - "loss": 0.0262, + "epoch": 0.97, + "learning_rate": 0.00015435370505431238, + "loss": 0.0417, "step": 150440 }, { - "epoch": 1.63, - "learning_rate": 5.590563956129534e-05, - "loss": 0.0239, + "epoch": 0.97, + "learning_rate": 0.00015434402369995546, + "loss": 0.0411, "step": 150450 }, { - "epoch": 1.63, - "learning_rate": 5.5889415276786286e-05, - "loss": 0.0276, + "epoch": 0.97, + "learning_rate": 0.00015433434234559851, + "loss": 0.0398, "step": 150460 }, { - "epoch": 1.63, - "learning_rate": 5.5873190992277236e-05, - "loss": 0.0266, + "epoch": 0.97, + "learning_rate": 0.00015432466099124157, + "loss": 0.0409, "step": 150470 }, { - "epoch": 1.63, - "learning_rate": 5.585696670776818e-05, - "loss": 0.0269, + "epoch": 0.97, + "learning_rate": 0.00015431497963688465, + "loss": 0.0346, "step": 150480 }, { - "epoch": 1.63, - "learning_rate": 5.584074242325913e-05, - "loss": 0.0259, + "epoch": 0.97, + "learning_rate": 0.00015430529828252773, + "loss": 0.0396, "step": 150490 }, { - "epoch": 1.63, - "learning_rate": 5.582451813875007e-05, - "loss": 0.0298, + "epoch": 0.97, + "learning_rate": 0.0001542956169281708, + "loss": 0.0427, "step": 150500 }, { - "epoch": 1.63, - "learning_rate": 5.580829385424102e-05, - "loss": 0.0286, + "epoch": 0.97, + "learning_rate": 0.00015428593557381386, + "loss": 0.0326, "step": 150510 }, { - "epoch": 1.63, - "learning_rate": 5.5792069569731964e-05, - "loss": 0.0269, + "epoch": 0.97, + "learning_rate": 0.00015427625421945694, + "loss": 0.0383, "step": 150520 }, { - "epoch": 1.63, - "learning_rate": 5.5775845285222914e-05, - "loss": 0.0304, + "epoch": 0.97, + "learning_rate": 0.0001542665728651, + "loss": 0.0364, "step": 150530 }, { - "epoch": 1.63, - "learning_rate": 5.5759621000713864e-05, - "loss": 0.0284, + "epoch": 0.97, + "learning_rate": 0.00015425689151074304, + "loss": 0.0401, "step": 150540 }, { - "epoch": 1.63, - "learning_rate": 5.574339671620481e-05, - "loss": 0.0291, + "epoch": 0.97, + "learning_rate": 0.00015424721015638612, + "loss": 0.0398, "step": 150550 }, { - "epoch": 1.63, - "learning_rate": 5.5727172431695757e-05, - "loss": 0.028, + "epoch": 0.97, + "learning_rate": 0.0001542375288020292, + "loss": 0.0379, "step": 150560 }, { - "epoch": 1.63, - "learning_rate": 5.57109481471867e-05, - "loss": 0.0235, + "epoch": 0.97, + "learning_rate": 0.00015422784744767226, + "loss": 0.0352, "step": 150570 }, { - "epoch": 1.63, - "learning_rate": 5.569472386267765e-05, - "loss": 0.0243, + "epoch": 0.97, + "learning_rate": 0.00015421816609331534, + "loss": 0.0399, "step": 150580 }, { - "epoch": 1.63, - "learning_rate": 5.567849957816859e-05, - "loss": 0.019, + "epoch": 0.97, + "learning_rate": 0.00015420848473895842, + "loss": 0.0377, "step": 150590 }, { - "epoch": 1.63, - "learning_rate": 5.566227529365954e-05, - "loss": 0.0329, + "epoch": 0.97, + "learning_rate": 0.00015419880338460144, + "loss": 0.0406, "step": 150600 }, { - "epoch": 1.63, - "learning_rate": 5.564605100915049e-05, - "loss": 0.0216, + "epoch": 0.97, + "learning_rate": 0.00015418912203024452, + "loss": 0.042, "step": 150610 }, { - "epoch": 1.63, - "learning_rate": 5.5629826724641435e-05, - "loss": 0.0241, + "epoch": 0.97, + "learning_rate": 0.0001541794406758876, + "loss": 0.0388, "step": 150620 }, { - "epoch": 1.63, - "learning_rate": 5.5613602440132385e-05, - "loss": 0.0324, + "epoch": 0.97, + "learning_rate": 0.00015416975932153068, + "loss": 0.04, "step": 150630 }, { - "epoch": 1.63, - "learning_rate": 5.559737815562333e-05, - "loss": 0.0235, + "epoch": 0.97, + "learning_rate": 0.00015416007796717373, + "loss": 0.0429, "step": 150640 }, { - "epoch": 1.63, - "learning_rate": 5.558115387111428e-05, - "loss": 0.0305, + "epoch": 0.97, + "learning_rate": 0.00015415039661281681, + "loss": 0.045, "step": 150650 }, { - "epoch": 1.63, - "learning_rate": 5.556492958660522e-05, - "loss": 0.0268, + "epoch": 0.97, + "learning_rate": 0.0001541407152584599, + "loss": 0.0354, "step": 150660 }, { - "epoch": 1.63, - "learning_rate": 5.554870530209617e-05, - "loss": 0.027, + "epoch": 0.97, + "learning_rate": 0.00015413103390410292, + "loss": 0.0438, "step": 150670 }, { - "epoch": 1.63, - "learning_rate": 5.553248101758711e-05, - "loss": 0.0258, + "epoch": 0.97, + "learning_rate": 0.000154121352549746, + "loss": 0.0426, "step": 150680 }, { - "epoch": 1.63, - "learning_rate": 5.551625673307806e-05, - "loss": 0.0296, + "epoch": 0.97, + "learning_rate": 0.00015411167119538908, + "loss": 0.0376, "step": 150690 }, { - "epoch": 1.63, - "learning_rate": 5.550003244856901e-05, - "loss": 0.0256, + "epoch": 0.97, + "learning_rate": 0.00015410198984103216, + "loss": 0.0329, "step": 150700 }, { - "epoch": 1.63, - "learning_rate": 5.5483808164059956e-05, - "loss": 0.0286, + "epoch": 0.97, + "learning_rate": 0.0001540923084866752, + "loss": 0.0392, "step": 150710 }, { - "epoch": 1.63, - "learning_rate": 5.5467583879550905e-05, - "loss": 0.024, + "epoch": 0.97, + "learning_rate": 0.0001540826271323183, + "loss": 0.032, "step": 150720 }, { - "epoch": 1.63, - "learning_rate": 5.545135959504185e-05, - "loss": 0.0268, + "epoch": 0.97, + "learning_rate": 0.00015407294577796137, + "loss": 0.0432, "step": 150730 }, { - "epoch": 1.63, - "learning_rate": 5.54351353105328e-05, - "loss": 0.0254, + "epoch": 0.97, + "learning_rate": 0.0001540632644236044, + "loss": 0.0302, "step": 150740 }, { - "epoch": 1.63, - "learning_rate": 5.541891102602374e-05, - "loss": 0.0266, + "epoch": 0.97, + "learning_rate": 0.00015405358306924748, + "loss": 0.0356, "step": 150750 }, { - "epoch": 1.63, - "learning_rate": 5.540268674151469e-05, - "loss": 0.0349, + "epoch": 0.97, + "learning_rate": 0.00015404390171489056, + "loss": 0.0354, "step": 150760 }, { - "epoch": 1.63, - "learning_rate": 5.538646245700565e-05, - "loss": 0.0279, + "epoch": 0.97, + "learning_rate": 0.0001540342203605336, + "loss": 0.0416, "step": 150770 }, { - "epoch": 1.63, - "learning_rate": 5.537023817249659e-05, - "loss": 0.0303, + "epoch": 0.97, + "learning_rate": 0.0001540245390061767, + "loss": 0.0379, "step": 150780 }, { - "epoch": 1.63, - "learning_rate": 5.535401388798754e-05, - "loss": 0.0325, + "epoch": 0.97, + "learning_rate": 0.00015401485765181977, + "loss": 0.033, "step": 150790 }, { - "epoch": 1.63, - "learning_rate": 5.533778960347848e-05, - "loss": 0.0283, + "epoch": 0.97, + "learning_rate": 0.00015400517629746285, + "loss": 0.0387, "step": 150800 }, { - "epoch": 1.63, - "learning_rate": 5.532156531896943e-05, - "loss": 0.0299, - "step": 150810 + "epoch": 0.97, + "learning_rate": 0.00015399549494310587, + "loss": 0.0393, + "step": 150810 }, { - "epoch": 1.63, - "learning_rate": 5.5305341034460376e-05, - "loss": 0.0304, + "epoch": 0.97, + "learning_rate": 0.00015398581358874895, + "loss": 0.0394, "step": 150820 }, { - "epoch": 1.63, - "learning_rate": 5.5289116749951326e-05, - "loss": 0.0216, + "epoch": 0.97, + "learning_rate": 0.00015397613223439203, + "loss": 0.0351, "step": 150830 }, { - "epoch": 1.63, - "learning_rate": 5.5272892465442276e-05, - "loss": 0.0236, + "epoch": 0.97, + "learning_rate": 0.00015396645088003509, + "loss": 0.045, "step": 150840 }, { - "epoch": 1.63, - "learning_rate": 5.525666818093322e-05, - "loss": 0.024, + "epoch": 0.97, + "learning_rate": 0.00015395676952567817, + "loss": 0.0394, "step": 150850 }, { - "epoch": 1.63, - "learning_rate": 5.524044389642417e-05, - "loss": 0.0245, + "epoch": 0.97, + "learning_rate": 0.00015394708817132125, + "loss": 0.0393, "step": 150860 }, { - "epoch": 1.63, - "learning_rate": 5.522421961191511e-05, - "loss": 0.0259, + "epoch": 0.97, + "learning_rate": 0.00015393740681696433, + "loss": 0.0394, "step": 150870 }, { - "epoch": 1.63, - "learning_rate": 5.520799532740606e-05, - "loss": 0.0329, + "epoch": 0.97, + "learning_rate": 0.00015392772546260735, + "loss": 0.0395, "step": 150880 }, { - "epoch": 1.63, - "learning_rate": 5.5191771042897004e-05, - "loss": 0.0234, + "epoch": 0.97, + "learning_rate": 0.00015391804410825043, + "loss": 0.0433, "step": 150890 }, { - "epoch": 1.63, - "learning_rate": 5.5175546758387954e-05, - "loss": 0.0278, + "epoch": 0.97, + "learning_rate": 0.0001539083627538935, + "loss": 0.0362, "step": 150900 }, { - "epoch": 1.63, - "learning_rate": 5.51593224738789e-05, - "loss": 0.028, + "epoch": 0.97, + "learning_rate": 0.00015389868139953656, + "loss": 0.0386, "step": 150910 }, { - "epoch": 1.63, - "learning_rate": 5.514309818936985e-05, - "loss": 0.0228, + "epoch": 0.97, + "learning_rate": 0.00015388900004517964, + "loss": 0.039, "step": 150920 }, { - "epoch": 1.63, - "learning_rate": 5.5126873904860796e-05, - "loss": 0.0285, + "epoch": 0.97, + "learning_rate": 0.00015387931869082272, + "loss": 0.0314, "step": 150930 }, { - "epoch": 1.63, - "learning_rate": 5.511064962035174e-05, - "loss": 0.0341, + "epoch": 0.97, + "learning_rate": 0.0001538696373364658, + "loss": 0.033, "step": 150940 }, { - "epoch": 1.63, - "learning_rate": 5.509442533584269e-05, - "loss": 0.0267, + "epoch": 0.97, + "learning_rate": 0.00015385995598210883, + "loss": 0.0386, "step": 150950 }, { - "epoch": 1.63, - "learning_rate": 5.507820105133363e-05, - "loss": 0.0272, + "epoch": 0.97, + "learning_rate": 0.0001538502746277519, + "loss": 0.0352, "step": 150960 }, { - "epoch": 1.63, - "learning_rate": 5.506197676682458e-05, - "loss": 0.0345, + "epoch": 0.97, + "learning_rate": 0.000153840593273395, + "loss": 0.0347, "step": 150970 }, { - "epoch": 1.63, - "learning_rate": 5.5045752482315525e-05, - "loss": 0.0286, + "epoch": 0.97, + "learning_rate": 0.00015383091191903804, + "loss": 0.035, "step": 150980 }, { - "epoch": 1.63, - "learning_rate": 5.5029528197806475e-05, - "loss": 0.0302, + "epoch": 0.97, + "learning_rate": 0.00015382123056468112, + "loss": 0.0362, "step": 150990 }, { - "epoch": 1.63, - "learning_rate": 5.5013303913297425e-05, - "loss": 0.0251, + "epoch": 0.97, + "learning_rate": 0.0001538115492103242, + "loss": 0.0337, "step": 151000 }, { - "epoch": 1.63, - "eval_cer": 0.921151674821227, - "eval_loss": 0.022289706394076347, - "eval_runtime": 118.8666, - "eval_samples_per_second": 16.826, - "eval_steps_per_second": 4.206, + "epoch": 0.97, + "eval_cer": 0.9198951530900463, + "eval_loss": 0.025833461433649063, + "eval_runtime": 120.3543, + "eval_samples_per_second": 16.618, + "eval_steps_per_second": 4.154, "step": 151000 }, { - "epoch": 1.63, - "learning_rate": 5.499707962878837e-05, - "loss": 0.0313, + "epoch": 0.97, + "learning_rate": 0.00015380186785596725, + "loss": 0.0423, "step": 151010 }, { - "epoch": 1.63, - "learning_rate": 5.498085534427932e-05, - "loss": 0.025, + "epoch": 0.97, + "learning_rate": 0.0001537921865016103, + "loss": 0.0407, "step": 151020 }, { - "epoch": 1.63, - "learning_rate": 5.496463105977026e-05, - "loss": 0.0263, + "epoch": 0.97, + "learning_rate": 0.00015378250514725339, + "loss": 0.0353, "step": 151030 }, { - "epoch": 1.63, - "learning_rate": 5.494840677526121e-05, - "loss": 0.0317, + "epoch": 0.97, + "learning_rate": 0.00015377282379289644, + "loss": 0.0353, "step": 151040 }, { - "epoch": 1.63, - "learning_rate": 5.493218249075215e-05, - "loss": 0.0247, + "epoch": 0.97, + "learning_rate": 0.00015376314243853952, + "loss": 0.0464, "step": 151050 }, { - "epoch": 1.63, - "learning_rate": 5.49159582062431e-05, - "loss": 0.0318, + "epoch": 0.97, + "learning_rate": 0.0001537534610841826, + "loss": 0.0385, "step": 151060 }, { - "epoch": 1.63, - "learning_rate": 5.4899733921734046e-05, - "loss": 0.0265, + "epoch": 0.98, + "learning_rate": 0.00015374377972982568, + "loss": 0.036, "step": 151070 }, { - "epoch": 1.63, - "learning_rate": 5.4883509637224996e-05, - "loss": 0.0295, + "epoch": 0.98, + "learning_rate": 0.00015373409837546873, + "loss": 0.0344, "step": 151080 }, { - "epoch": 1.63, - "learning_rate": 5.4867285352715945e-05, - "loss": 0.0281, + "epoch": 0.98, + "learning_rate": 0.00015372441702111178, + "loss": 0.0379, "step": 151090 }, { - "epoch": 1.63, - "learning_rate": 5.485106106820689e-05, - "loss": 0.0295, + "epoch": 0.98, + "learning_rate": 0.00015371473566675486, + "loss": 0.0339, "step": 151100 }, { - "epoch": 1.63, - "learning_rate": 5.483483678369784e-05, - "loss": 0.0278, + "epoch": 0.98, + "learning_rate": 0.00015370505431239792, + "loss": 0.0375, "step": 151110 }, { - "epoch": 1.63, - "learning_rate": 5.481861249918878e-05, - "loss": 0.0269, + "epoch": 0.98, + "learning_rate": 0.000153695372958041, + "loss": 0.0401, "step": 151120 }, { - "epoch": 1.63, - "learning_rate": 5.480238821467973e-05, - "loss": 0.0249, + "epoch": 0.98, + "learning_rate": 0.00015368569160368407, + "loss": 0.0346, "step": 151130 }, { - "epoch": 1.63, - "learning_rate": 5.4786163930170674e-05, - "loss": 0.0315, + "epoch": 0.98, + "learning_rate": 0.00015367601024932715, + "loss": 0.0402, "step": 151140 }, { - "epoch": 1.63, - "learning_rate": 5.4769939645661624e-05, - "loss": 0.0273, + "epoch": 0.98, + "learning_rate": 0.0001536663288949702, + "loss": 0.0422, "step": 151150 }, { - "epoch": 1.63, - "learning_rate": 5.475371536115257e-05, - "loss": 0.0257, + "epoch": 0.98, + "learning_rate": 0.00015365664754061326, + "loss": 0.0387, "step": 151160 }, { - "epoch": 1.64, - "learning_rate": 5.4737491076643516e-05, - "loss": 0.0289, + "epoch": 0.98, + "learning_rate": 0.00015364696618625634, + "loss": 0.0474, "step": 151170 }, { - "epoch": 1.64, - "learning_rate": 5.4721266792134466e-05, - "loss": 0.0253, + "epoch": 0.98, + "learning_rate": 0.0001536372848318994, + "loss": 0.0351, "step": 151180 }, { - "epoch": 1.64, - "learning_rate": 5.470504250762541e-05, - "loss": 0.0261, + "epoch": 0.98, + "learning_rate": 0.00015362760347754247, + "loss": 0.0356, "step": 151190 }, { - "epoch": 1.64, - "learning_rate": 5.468881822311636e-05, - "loss": 0.0283, + "epoch": 0.98, + "learning_rate": 0.00015361792212318555, + "loss": 0.042, "step": 151200 }, { - "epoch": 1.64, - "learning_rate": 5.46725939386073e-05, - "loss": 0.0322, + "epoch": 0.98, + "learning_rate": 0.0001536082407688286, + "loss": 0.0383, "step": 151210 }, { - "epoch": 1.64, - "learning_rate": 5.465636965409825e-05, - "loss": 0.0255, + "epoch": 0.98, + "learning_rate": 0.00015359855941447168, + "loss": 0.0397, "step": 151220 }, { - "epoch": 1.64, - "learning_rate": 5.4640145369589195e-05, - "loss": 0.0285, + "epoch": 0.98, + "learning_rate": 0.00015358887806011474, + "loss": 0.037, "step": 151230 }, { - "epoch": 1.64, - "learning_rate": 5.4623921085080144e-05, - "loss": 0.0301, + "epoch": 0.98, + "learning_rate": 0.0001535791967057578, + "loss": 0.0312, "step": 151240 }, { - "epoch": 1.64, - "learning_rate": 5.460769680057109e-05, - "loss": 0.0284, + "epoch": 0.98, + "learning_rate": 0.00015356951535140087, + "loss": 0.0376, "step": 151250 }, { - "epoch": 1.64, - "learning_rate": 5.459147251606204e-05, - "loss": 0.0257, + "epoch": 0.98, + "learning_rate": 0.00015355983399704395, + "loss": 0.0395, "step": 151260 }, { - "epoch": 1.64, - "learning_rate": 5.457524823155299e-05, - "loss": 0.0268, + "epoch": 0.98, + "learning_rate": 0.00015355015264268703, + "loss": 0.0402, "step": 151270 }, { - "epoch": 1.64, - "learning_rate": 5.455902394704393e-05, - "loss": 0.0235, + "epoch": 0.98, + "learning_rate": 0.00015354047128833008, + "loss": 0.0424, "step": 151280 }, { - "epoch": 1.64, - "learning_rate": 5.454279966253488e-05, - "loss": 0.0279, + "epoch": 0.98, + "learning_rate": 0.00015353078993397316, + "loss": 0.0395, "step": 151290 }, { - "epoch": 1.64, - "learning_rate": 5.452657537802582e-05, - "loss": 0.0269, + "epoch": 0.98, + "learning_rate": 0.00015352110857961621, + "loss": 0.0395, "step": 151300 }, { - "epoch": 1.64, - "learning_rate": 5.451035109351677e-05, - "loss": 0.0282, + "epoch": 0.98, + "learning_rate": 0.00015351142722525927, + "loss": 0.0432, "step": 151310 }, { - "epoch": 1.64, - "learning_rate": 5.4494126809007716e-05, - "loss": 0.0311, + "epoch": 0.98, + "learning_rate": 0.00015350174587090235, + "loss": 0.0384, "step": 151320 }, { - "epoch": 1.64, - "learning_rate": 5.4477902524498665e-05, - "loss": 0.0305, + "epoch": 0.98, + "learning_rate": 0.00015349206451654543, + "loss": 0.0428, "step": 151330 }, { - "epoch": 1.64, - "learning_rate": 5.4461678239989615e-05, - "loss": 0.0254, + "epoch": 0.98, + "learning_rate": 0.0001534823831621885, + "loss": 0.0403, "step": 151340 }, { - "epoch": 1.64, - "learning_rate": 5.444545395548056e-05, - "loss": 0.033, + "epoch": 0.98, + "learning_rate": 0.00015347270180783156, + "loss": 0.0393, "step": 151350 }, { - "epoch": 1.64, - "learning_rate": 5.442922967097151e-05, - "loss": 0.0217, + "epoch": 0.98, + "learning_rate": 0.00015346302045347464, + "loss": 0.0385, "step": 151360 }, { - "epoch": 1.64, - "learning_rate": 5.441300538646245e-05, - "loss": 0.0288, + "epoch": 0.98, + "learning_rate": 0.0001534533390991177, + "loss": 0.0333, "step": 151370 }, { - "epoch": 1.64, - "learning_rate": 5.43967811019534e-05, - "loss": 0.0278, + "epoch": 0.98, + "learning_rate": 0.00015344365774476074, + "loss": 0.0347, "step": 151380 }, { - "epoch": 1.64, - "learning_rate": 5.4380556817444344e-05, - "loss": 0.0263, + "epoch": 0.98, + "learning_rate": 0.00015343397639040382, + "loss": 0.0429, "step": 151390 }, { - "epoch": 1.64, - "learning_rate": 5.436433253293529e-05, - "loss": 0.0233, + "epoch": 0.98, + "learning_rate": 0.0001534242950360469, + "loss": 0.0475, "step": 151400 }, { - "epoch": 1.64, - "learning_rate": 5.4348108248426236e-05, - "loss": 0.0273, + "epoch": 0.98, + "learning_rate": 0.00015341461368168996, + "loss": 0.0348, "step": 151410 }, { - "epoch": 1.64, - "learning_rate": 5.4331883963917186e-05, - "loss": 0.0263, + "epoch": 0.98, + "learning_rate": 0.00015340493232733304, + "loss": 0.0377, "step": 151420 }, { - "epoch": 1.64, - "learning_rate": 5.4315659679408136e-05, - "loss": 0.027, + "epoch": 0.98, + "learning_rate": 0.00015339525097297612, + "loss": 0.0467, "step": 151430 }, { - "epoch": 1.64, - "learning_rate": 5.429943539489908e-05, - "loss": 0.0251, + "epoch": 0.98, + "learning_rate": 0.00015338556961861914, + "loss": 0.0356, "step": 151440 }, { - "epoch": 1.64, - "learning_rate": 5.428321111039003e-05, - "loss": 0.0261, + "epoch": 0.98, + "learning_rate": 0.00015337588826426222, + "loss": 0.0373, "step": 151450 }, { - "epoch": 1.64, - "learning_rate": 5.426698682588097e-05, - "loss": 0.0279, + "epoch": 0.98, + "learning_rate": 0.0001533662069099053, + "loss": 0.0411, "step": 151460 }, { - "epoch": 1.64, - "learning_rate": 5.425076254137192e-05, - "loss": 0.0245, + "epoch": 0.98, + "learning_rate": 0.00015335652555554838, + "loss": 0.0396, "step": 151470 }, { - "epoch": 1.64, - "learning_rate": 5.4234538256862864e-05, - "loss": 0.0285, + "epoch": 0.98, + "learning_rate": 0.00015334684420119143, + "loss": 0.0345, "step": 151480 }, { - "epoch": 1.64, - "learning_rate": 5.4218313972353814e-05, - "loss": 0.027, + "epoch": 0.98, + "learning_rate": 0.0001533371628468345, + "loss": 0.0408, "step": 151490 }, { - "epoch": 1.64, - "learning_rate": 5.420208968784476e-05, - "loss": 0.0299, + "epoch": 0.98, + "learning_rate": 0.0001533274814924776, + "loss": 0.0344, "step": 151500 }, { - "epoch": 1.64, - "learning_rate": 5.418586540333571e-05, - "loss": 0.0318, + "epoch": 0.98, + "learning_rate": 0.00015331780013812062, + "loss": 0.0414, "step": 151510 }, { - "epoch": 1.64, - "learning_rate": 5.416964111882666e-05, - "loss": 0.0315, + "epoch": 0.98, + "learning_rate": 0.0001533081187837637, + "loss": 0.046, "step": 151520 }, { - "epoch": 1.64, - "learning_rate": 5.41534168343176e-05, - "loss": 0.0267, + "epoch": 0.98, + "learning_rate": 0.00015329843742940678, + "loss": 0.042, "step": 151530 }, { - "epoch": 1.64, - "learning_rate": 5.413719254980855e-05, - "loss": 0.0239, + "epoch": 0.98, + "learning_rate": 0.00015328875607504986, + "loss": 0.0338, "step": 151540 }, { - "epoch": 1.64, - "learning_rate": 5.412096826529949e-05, - "loss": 0.028, + "epoch": 0.98, + "learning_rate": 0.0001532790747206929, + "loss": 0.0429, "step": 151550 }, { - "epoch": 1.64, - "learning_rate": 5.410474398079044e-05, - "loss": 0.028, + "epoch": 0.98, + "learning_rate": 0.000153269393366336, + "loss": 0.0354, "step": 151560 }, { - "epoch": 1.64, - "learning_rate": 5.4088519696281385e-05, - "loss": 0.0299, + "epoch": 0.98, + "learning_rate": 0.00015325971201197907, + "loss": 0.0374, "step": 151570 }, { - "epoch": 1.64, - "learning_rate": 5.4072295411772335e-05, - "loss": 0.0259, + "epoch": 0.98, + "learning_rate": 0.0001532500306576221, + "loss": 0.0329, "step": 151580 }, { - "epoch": 1.64, - "learning_rate": 5.405607112726328e-05, - "loss": 0.0336, + "epoch": 0.98, + "learning_rate": 0.00015324034930326518, + "loss": 0.0368, "step": 151590 }, { - "epoch": 1.64, - "learning_rate": 5.403984684275423e-05, - "loss": 0.0311, + "epoch": 0.98, + "learning_rate": 0.00015323066794890826, + "loss": 0.0449, "step": 151600 }, { - "epoch": 1.64, - "learning_rate": 5.402362255824518e-05, - "loss": 0.029, + "epoch": 0.98, + "learning_rate": 0.0001532209865945513, + "loss": 0.0379, "step": 151610 }, { - "epoch": 1.64, - "learning_rate": 5.400739827373612e-05, - "loss": 0.0265, + "epoch": 0.98, + "learning_rate": 0.0001532113052401944, + "loss": 0.0411, "step": 151620 }, { - "epoch": 1.64, - "learning_rate": 5.399117398922707e-05, - "loss": 0.0243, + "epoch": 0.98, + "learning_rate": 0.00015320162388583747, + "loss": 0.0426, "step": 151630 }, { - "epoch": 1.64, - "learning_rate": 5.397494970471801e-05, - "loss": 0.0257, + "epoch": 0.98, + "learning_rate": 0.00015319194253148055, + "loss": 0.0384, "step": 151640 }, { - "epoch": 1.64, - "learning_rate": 5.395872542020896e-05, - "loss": 0.0267, + "epoch": 0.98, + "learning_rate": 0.00015318226117712357, + "loss": 0.0365, "step": 151650 }, { - "epoch": 1.64, - "learning_rate": 5.3942501135699906e-05, - "loss": 0.0267, + "epoch": 0.98, + "learning_rate": 0.00015317257982276665, + "loss": 0.0421, "step": 151660 }, { - "epoch": 1.64, - "learning_rate": 5.3926276851190856e-05, - "loss": 0.0277, + "epoch": 0.98, + "learning_rate": 0.00015316289846840973, + "loss": 0.0323, "step": 151670 }, { - "epoch": 1.64, - "learning_rate": 5.3910052566681806e-05, - "loss": 0.021, + "epoch": 0.98, + "learning_rate": 0.00015315321711405279, + "loss": 0.0327, "step": 151680 }, { - "epoch": 1.64, - "learning_rate": 5.389382828217275e-05, - "loss": 0.0284, + "epoch": 0.98, + "learning_rate": 0.00015314353575969587, + "loss": 0.0418, "step": 151690 }, { - "epoch": 1.64, - "learning_rate": 5.38776039976637e-05, - "loss": 0.0322, + "epoch": 0.98, + "learning_rate": 0.00015313385440533895, + "loss": 0.0391, "step": 151700 }, { - "epoch": 1.64, - "learning_rate": 5.386137971315464e-05, - "loss": 0.0247, + "epoch": 0.98, + "learning_rate": 0.00015312417305098202, + "loss": 0.0359, "step": 151710 }, { - "epoch": 1.64, - "learning_rate": 5.384515542864559e-05, - "loss": 0.0259, + "epoch": 0.98, + "learning_rate": 0.00015311449169662505, + "loss": 0.0394, "step": 151720 }, { - "epoch": 1.64, - "learning_rate": 5.3828931144136534e-05, - "loss": 0.0281, + "epoch": 0.98, + "learning_rate": 0.00015310481034226813, + "loss": 0.0345, "step": 151730 }, { - "epoch": 1.64, - "learning_rate": 5.3812706859627484e-05, - "loss": 0.0299, + "epoch": 0.98, + "learning_rate": 0.0001530951289879112, + "loss": 0.0375, "step": 151740 }, { - "epoch": 1.64, - "learning_rate": 5.379648257511843e-05, - "loss": 0.0324, + "epoch": 0.98, + "learning_rate": 0.00015308544763355426, + "loss": 0.0342, "step": 151750 }, { - "epoch": 1.64, - "learning_rate": 5.378025829060938e-05, - "loss": 0.0255, + "epoch": 0.98, + "learning_rate": 0.00015307576627919734, + "loss": 0.0361, "step": 151760 }, { - "epoch": 1.64, - "learning_rate": 5.3764034006100326e-05, - "loss": 0.0265, + "epoch": 0.98, + "learning_rate": 0.00015306608492484042, + "loss": 0.0358, "step": 151770 }, { - "epoch": 1.64, - "learning_rate": 5.374780972159127e-05, - "loss": 0.0244, + "epoch": 0.98, + "learning_rate": 0.00015305640357048348, + "loss": 0.0432, "step": 151780 }, { - "epoch": 1.64, - "learning_rate": 5.373158543708222e-05, - "loss": 0.0266, + "epoch": 0.98, + "learning_rate": 0.00015304672221612653, + "loss": 0.0399, "step": 151790 }, { - "epoch": 1.64, - "learning_rate": 5.371536115257316e-05, - "loss": 0.0361, + "epoch": 0.98, + "learning_rate": 0.0001530370408617696, + "loss": 0.0458, "step": 151800 }, { - "epoch": 1.64, - "learning_rate": 5.369913686806411e-05, - "loss": 0.0354, + "epoch": 0.98, + "learning_rate": 0.00015302735950741266, + "loss": 0.0404, "step": 151810 }, { - "epoch": 1.64, - "learning_rate": 5.3682912583555055e-05, - "loss": 0.0251, + "epoch": 0.98, + "learning_rate": 0.00015301767815305574, + "loss": 0.0408, "step": 151820 }, { - "epoch": 1.64, - "learning_rate": 5.3666688299046005e-05, - "loss": 0.0298, + "epoch": 0.98, + "learning_rate": 0.00015300799679869882, + "loss": 0.0471, "step": 151830 }, { - "epoch": 1.64, - "learning_rate": 5.365046401453695e-05, - "loss": 0.0238, + "epoch": 0.98, + "learning_rate": 0.0001529983154443419, + "loss": 0.0351, "step": 151840 }, { - "epoch": 1.64, - "learning_rate": 5.36342397300279e-05, - "loss": 0.0242, + "epoch": 0.98, + "learning_rate": 0.00015298863408998495, + "loss": 0.0425, "step": 151850 }, { - "epoch": 1.64, - "learning_rate": 5.361801544551885e-05, - "loss": 0.0313, + "epoch": 0.98, + "learning_rate": 0.000152978952735628, + "loss": 0.0376, "step": 151860 }, { - "epoch": 1.64, - "learning_rate": 5.360179116100979e-05, - "loss": 0.0266, + "epoch": 0.98, + "learning_rate": 0.00015296927138127108, + "loss": 0.0421, "step": 151870 }, { - "epoch": 1.64, - "learning_rate": 5.358556687650074e-05, - "loss": 0.0327, + "epoch": 0.98, + "learning_rate": 0.00015295959002691414, + "loss": 0.0405, "step": 151880 }, { - "epoch": 1.64, - "learning_rate": 5.356934259199168e-05, - "loss": 0.0276, + "epoch": 0.98, + "learning_rate": 0.00015294990867255722, + "loss": 0.0349, "step": 151890 }, { - "epoch": 1.64, - "learning_rate": 5.355311830748263e-05, - "loss": 0.0225, + "epoch": 0.98, + "learning_rate": 0.0001529402273182003, + "loss": 0.0374, "step": 151900 }, { - "epoch": 1.64, - "learning_rate": 5.3536894022973576e-05, - "loss": 0.0268, + "epoch": 0.98, + "learning_rate": 0.00015293054596384338, + "loss": 0.0418, "step": 151910 }, { - "epoch": 1.64, - "learning_rate": 5.3520669738464526e-05, - "loss": 0.0327, + "epoch": 0.98, + "learning_rate": 0.00015292086460948643, + "loss": 0.035, "step": 151920 }, { - "epoch": 1.64, - "learning_rate": 5.350444545395547e-05, - "loss": 0.0289, + "epoch": 0.98, + "learning_rate": 0.00015291118325512948, + "loss": 0.0379, "step": 151930 }, { - "epoch": 1.64, - "learning_rate": 5.3488221169446425e-05, - "loss": 0.0283, + "epoch": 0.98, + "learning_rate": 0.00015290150190077256, + "loss": 0.0386, "step": 151940 }, { - "epoch": 1.64, - "learning_rate": 5.3471996884937375e-05, - "loss": 0.0272, + "epoch": 0.98, + "learning_rate": 0.00015289182054641561, + "loss": 0.042, "step": 151950 }, { - "epoch": 1.64, - "learning_rate": 5.345577260042832e-05, - "loss": 0.0321, + "epoch": 0.98, + "learning_rate": 0.0001528821391920587, + "loss": 0.0353, "step": 151960 }, { - "epoch": 1.64, - "learning_rate": 5.343954831591927e-05, - "loss": 0.0236, + "epoch": 0.98, + "learning_rate": 0.00015287245783770177, + "loss": 0.0349, "step": 151970 }, { - "epoch": 1.64, - "learning_rate": 5.342332403141021e-05, - "loss": 0.0214, + "epoch": 0.98, + "learning_rate": 0.00015286277648334483, + "loss": 0.0355, "step": 151980 }, { - "epoch": 1.64, - "learning_rate": 5.340709974690116e-05, - "loss": 0.0277, + "epoch": 0.98, + "learning_rate": 0.0001528530951289879, + "loss": 0.0446, "step": 151990 }, { - "epoch": 1.64, - "learning_rate": 5.339087546239211e-05, - "loss": 0.0278, + "epoch": 0.98, + "learning_rate": 0.00015284341377463096, + "loss": 0.0456, "step": 152000 }, { - "epoch": 1.64, - "eval_cer": 0.92111103454247, - "eval_loss": 0.022334229201078415, - "eval_runtime": 119.238, - "eval_samples_per_second": 16.773, - "eval_steps_per_second": 4.193, + "epoch": 0.98, + "eval_cer": 0.9199484803976952, + "eval_loss": 0.02544480562210083, + "eval_runtime": 119.9384, + "eval_samples_per_second": 16.675, + "eval_steps_per_second": 4.169, "step": 152000 }, { - "epoch": 1.64, - "learning_rate": 5.337465117788305e-05, - "loss": 0.0297, + "epoch": 0.98, + "learning_rate": 0.000152833732420274, + "loss": 0.0438, "step": 152010 }, { - "epoch": 1.64, - "learning_rate": 5.3358426893374e-05, - "loss": 0.0279, + "epoch": 0.98, + "learning_rate": 0.0001528240510659171, + "loss": 0.0327, "step": 152020 }, { - "epoch": 1.64, - "learning_rate": 5.3342202608864946e-05, - "loss": 0.0276, + "epoch": 0.98, + "learning_rate": 0.00015281436971156017, + "loss": 0.0362, "step": 152030 }, { - "epoch": 1.64, - "learning_rate": 5.3325978324355896e-05, - "loss": 0.0242, + "epoch": 0.98, + "learning_rate": 0.00015280468835720325, + "loss": 0.0365, "step": 152040 }, { - "epoch": 1.64, - "learning_rate": 5.330975403984684e-05, - "loss": 0.0317, + "epoch": 0.98, + "learning_rate": 0.0001527950070028463, + "loss": 0.0399, "step": 152050 }, { - "epoch": 1.64, - "learning_rate": 5.329352975533779e-05, - "loss": 0.0225, + "epoch": 0.98, + "learning_rate": 0.00015278532564848938, + "loss": 0.0367, "step": 152060 }, { - "epoch": 1.64, - "learning_rate": 5.327730547082874e-05, - "loss": 0.0279, + "epoch": 0.98, + "learning_rate": 0.00015277564429413244, + "loss": 0.0398, "step": 152070 }, { - "epoch": 1.64, - "learning_rate": 5.326108118631968e-05, - "loss": 0.026, + "epoch": 0.98, + "learning_rate": 0.0001527659629397755, + "loss": 0.0375, "step": 152080 }, { - "epoch": 1.65, - "learning_rate": 5.324485690181063e-05, - "loss": 0.0254, + "epoch": 0.98, + "learning_rate": 0.00015275628158541857, + "loss": 0.047, "step": 152090 }, { - "epoch": 1.65, - "learning_rate": 5.3228632617301574e-05, - "loss": 0.0293, + "epoch": 0.98, + "learning_rate": 0.00015274660023106165, + "loss": 0.0465, "step": 152100 }, { - "epoch": 1.65, - "learning_rate": 5.3212408332792524e-05, - "loss": 0.0389, + "epoch": 0.98, + "learning_rate": 0.00015273691887670473, + "loss": 0.0347, "step": 152110 }, { - "epoch": 1.65, - "learning_rate": 5.319618404828347e-05, - "loss": 0.0301, + "epoch": 0.98, + "learning_rate": 0.00015272723752234778, + "loss": 0.0374, "step": 152120 }, { - "epoch": 1.65, - "learning_rate": 5.3179959763774417e-05, - "loss": 0.0261, + "epoch": 0.98, + "learning_rate": 0.00015271755616799086, + "loss": 0.0392, "step": 152130 }, { - "epoch": 1.65, - "learning_rate": 5.316373547926536e-05, - "loss": 0.0283, + "epoch": 0.98, + "learning_rate": 0.00015270787481363391, + "loss": 0.0377, "step": 152140 }, { - "epoch": 1.65, - "learning_rate": 5.314751119475631e-05, - "loss": 0.0278, + "epoch": 0.98, + "learning_rate": 0.00015269819345927697, + "loss": 0.0395, "step": 152150 }, { - "epoch": 1.65, - "learning_rate": 5.313128691024726e-05, - "loss": 0.0261, + "epoch": 0.98, + "learning_rate": 0.00015268851210492005, + "loss": 0.0397, "step": 152160 }, { - "epoch": 1.65, - "learning_rate": 5.31150626257382e-05, - "loss": 0.0271, + "epoch": 0.98, + "learning_rate": 0.00015267883075056313, + "loss": 0.0378, "step": 152170 }, { - "epoch": 1.65, - "learning_rate": 5.309883834122915e-05, - "loss": 0.0278, + "epoch": 0.98, + "learning_rate": 0.00015266914939620618, + "loss": 0.0427, "step": 152180 }, { - "epoch": 1.65, - "learning_rate": 5.3082614056720095e-05, - "loss": 0.0266, + "epoch": 0.98, + "learning_rate": 0.00015265946804184926, + "loss": 0.042, "step": 152190 }, { - "epoch": 1.65, - "learning_rate": 5.3066389772211045e-05, - "loss": 0.0253, + "epoch": 0.98, + "learning_rate": 0.00015264978668749234, + "loss": 0.0388, "step": 152200 }, { - "epoch": 1.65, - "learning_rate": 5.305016548770199e-05, - "loss": 0.0242, + "epoch": 0.98, + "learning_rate": 0.00015264010533313536, + "loss": 0.0386, "step": 152210 }, { - "epoch": 1.65, - "learning_rate": 5.303394120319294e-05, - "loss": 0.0308, + "epoch": 0.98, + "learning_rate": 0.00015263042397877844, + "loss": 0.0355, "step": 152220 }, { - "epoch": 1.65, - "learning_rate": 5.301771691868388e-05, - "loss": 0.0279, + "epoch": 0.98, + "learning_rate": 0.00015262074262442152, + "loss": 0.0366, "step": 152230 }, { - "epoch": 1.65, - "learning_rate": 5.300149263417483e-05, - "loss": 0.0288, + "epoch": 0.98, + "learning_rate": 0.0001526110612700646, + "loss": 0.036, "step": 152240 }, { - "epoch": 1.65, - "learning_rate": 5.298526834966578e-05, - "loss": 0.0269, + "epoch": 0.98, + "learning_rate": 0.00015260137991570766, + "loss": 0.0445, "step": 152250 }, { - "epoch": 1.65, - "learning_rate": 5.296904406515672e-05, - "loss": 0.0233, + "epoch": 0.98, + "learning_rate": 0.00015259169856135074, + "loss": 0.043, "step": 152260 }, { - "epoch": 1.65, - "learning_rate": 5.295281978064767e-05, - "loss": 0.0242, + "epoch": 0.98, + "learning_rate": 0.00015258201720699382, + "loss": 0.037, "step": 152270 }, { - "epoch": 1.65, - "learning_rate": 5.2936595496138616e-05, - "loss": 0.0286, + "epoch": 0.98, + "learning_rate": 0.00015257233585263684, + "loss": 0.0329, "step": 152280 }, { - "epoch": 1.65, - "learning_rate": 5.2920371211629565e-05, - "loss": 0.0226, + "epoch": 0.98, + "learning_rate": 0.00015256265449827992, + "loss": 0.0393, "step": 152290 }, { - "epoch": 1.65, - "learning_rate": 5.290414692712051e-05, - "loss": 0.0287, + "epoch": 0.98, + "learning_rate": 0.000152552973143923, + "loss": 0.0466, "step": 152300 }, { - "epoch": 1.65, - "learning_rate": 5.288792264261146e-05, - "loss": 0.0315, + "epoch": 0.98, + "learning_rate": 0.00015254329178956608, + "loss": 0.0437, "step": 152310 }, { - "epoch": 1.65, - "learning_rate": 5.28716983581024e-05, - "loss": 0.0286, + "epoch": 0.98, + "learning_rate": 0.00015253361043520913, + "loss": 0.0381, "step": 152320 }, { - "epoch": 1.65, - "learning_rate": 5.285547407359335e-05, - "loss": 0.0253, + "epoch": 0.98, + "learning_rate": 0.0001525239290808522, + "loss": 0.0343, "step": 152330 }, { - "epoch": 1.65, - "learning_rate": 5.28392497890843e-05, - "loss": 0.0304, + "epoch": 0.98, + "learning_rate": 0.0001525142477264953, + "loss": 0.0322, "step": 152340 }, { - "epoch": 1.65, - "learning_rate": 5.2823025504575244e-05, - "loss": 0.0302, + "epoch": 0.98, + "learning_rate": 0.00015250456637213832, + "loss": 0.0397, "step": 152350 }, { - "epoch": 1.65, - "learning_rate": 5.2806801220066194e-05, - "loss": 0.0251, + "epoch": 0.98, + "learning_rate": 0.0001524948850177814, + "loss": 0.0374, "step": 152360 }, { - "epoch": 1.65, - "learning_rate": 5.2790576935557137e-05, - "loss": 0.0324, + "epoch": 0.98, + "learning_rate": 0.00015248520366342448, + "loss": 0.0413, "step": 152370 }, { - "epoch": 1.65, - "learning_rate": 5.2774352651048086e-05, - "loss": 0.0261, + "epoch": 0.98, + "learning_rate": 0.00015247552230906753, + "loss": 0.0384, "step": 152380 }, { - "epoch": 1.65, - "learning_rate": 5.275812836653903e-05, - "loss": 0.0266, + "epoch": 0.98, + "learning_rate": 0.0001524658409547106, + "loss": 0.0362, "step": 152390 }, { - "epoch": 1.65, - "learning_rate": 5.274190408202998e-05, - "loss": 0.0346, + "epoch": 0.98, + "learning_rate": 0.0001524561596003537, + "loss": 0.0385, "step": 152400 }, { - "epoch": 1.65, - "learning_rate": 5.272567979752093e-05, - "loss": 0.0289, + "epoch": 0.98, + "learning_rate": 0.00015244647824599677, + "loss": 0.0374, "step": 152410 }, { - "epoch": 1.65, - "learning_rate": 5.270945551301187e-05, - "loss": 0.0248, + "epoch": 0.98, + "learning_rate": 0.0001524367968916398, + "loss": 0.035, "step": 152420 }, { - "epoch": 1.65, - "learning_rate": 5.269323122850282e-05, - "loss": 0.0264, + "epoch": 0.98, + "learning_rate": 0.00015242711553728288, + "loss": 0.0402, "step": 152430 }, { - "epoch": 1.65, - "learning_rate": 5.2677006943993765e-05, - "loss": 0.0377, + "epoch": 0.98, + "learning_rate": 0.00015241743418292596, + "loss": 0.0361, "step": 152440 }, { - "epoch": 1.65, - "learning_rate": 5.2660782659484714e-05, - "loss": 0.0263, + "epoch": 0.98, + "learning_rate": 0.000152407752828569, + "loss": 0.0423, "step": 152450 }, { - "epoch": 1.65, - "learning_rate": 5.264455837497566e-05, - "loss": 0.0229, + "epoch": 0.98, + "learning_rate": 0.0001523980714742121, + "loss": 0.0298, "step": 152460 }, { - "epoch": 1.65, - "learning_rate": 5.262833409046661e-05, - "loss": 0.029, + "epoch": 0.98, + "learning_rate": 0.00015238839011985517, + "loss": 0.0347, "step": 152470 }, { - "epoch": 1.65, - "learning_rate": 5.261210980595755e-05, - "loss": 0.024, + "epoch": 0.98, + "learning_rate": 0.00015237870876549825, + "loss": 0.0326, "step": 152480 }, { - "epoch": 1.65, - "learning_rate": 5.25958855214485e-05, - "loss": 0.0261, + "epoch": 0.98, + "learning_rate": 0.00015236902741114127, + "loss": 0.0358, "step": 152490 }, { - "epoch": 1.65, - "learning_rate": 5.257966123693945e-05, - "loss": 0.0294, + "epoch": 0.98, + "learning_rate": 0.00015235934605678435, + "loss": 0.0341, "step": 152500 }, { - "epoch": 1.65, - "learning_rate": 5.256343695243039e-05, - "loss": 0.032, + "epoch": 0.98, + "learning_rate": 0.00015234966470242743, + "loss": 0.0368, "step": 152510 }, { - "epoch": 1.65, - "learning_rate": 5.254721266792134e-05, - "loss": 0.0229, + "epoch": 0.98, + "learning_rate": 0.00015233998334807049, + "loss": 0.044, "step": 152520 }, { - "epoch": 1.65, - "learning_rate": 5.2530988383412285e-05, - "loss": 0.0262, + "epoch": 0.98, + "learning_rate": 0.00015233030199371356, + "loss": 0.0375, "step": 152530 }, { - "epoch": 1.65, - "learning_rate": 5.2514764098903235e-05, - "loss": 0.0336, + "epoch": 0.98, + "learning_rate": 0.00015232062063935664, + "loss": 0.0377, "step": 152540 }, { - "epoch": 1.65, - "learning_rate": 5.249853981439418e-05, - "loss": 0.0252, + "epoch": 0.98, + "learning_rate": 0.00015231093928499972, + "loss": 0.0351, "step": 152550 }, { - "epoch": 1.65, - "learning_rate": 5.248231552988513e-05, - "loss": 0.0241, + "epoch": 0.98, + "learning_rate": 0.00015230125793064275, + "loss": 0.0376, "step": 152560 }, { - "epoch": 1.65, - "learning_rate": 5.246609124537607e-05, - "loss": 0.0278, + "epoch": 0.98, + "learning_rate": 0.00015229157657628583, + "loss": 0.042, "step": 152570 }, { - "epoch": 1.65, - "learning_rate": 5.244986696086702e-05, - "loss": 0.025, + "epoch": 0.98, + "learning_rate": 0.00015228189522192888, + "loss": 0.0349, "step": 152580 }, { - "epoch": 1.65, - "learning_rate": 5.243364267635797e-05, - "loss": 0.026, + "epoch": 0.98, + "learning_rate": 0.00015227221386757196, + "loss": 0.0361, "step": 152590 }, { - "epoch": 1.65, - "learning_rate": 5.2417418391848913e-05, - "loss": 0.0267, + "epoch": 0.98, + "learning_rate": 0.00015226253251321504, + "loss": 0.036, "step": 152600 }, { - "epoch": 1.65, - "learning_rate": 5.240119410733986e-05, - "loss": 0.0233, + "epoch": 0.98, + "learning_rate": 0.00015225285115885812, + "loss": 0.0379, "step": 152610 }, { - "epoch": 1.65, - "learning_rate": 5.2384969822830806e-05, - "loss": 0.0253, + "epoch": 0.99, + "learning_rate": 0.00015224316980450117, + "loss": 0.0378, "step": 152620 }, { - "epoch": 1.65, - "learning_rate": 5.2368745538321756e-05, - "loss": 0.0273, + "epoch": 0.99, + "learning_rate": 0.00015223348845014423, + "loss": 0.0365, "step": 152630 }, { - "epoch": 1.65, - "learning_rate": 5.23525212538127e-05, - "loss": 0.0276, + "epoch": 0.99, + "learning_rate": 0.0001522238070957873, + "loss": 0.0394, "step": 152640 }, { - "epoch": 1.65, - "learning_rate": 5.233629696930365e-05, - "loss": 0.0259, + "epoch": 0.99, + "learning_rate": 0.00015221412574143036, + "loss": 0.0395, "step": 152650 }, { - "epoch": 1.65, - "learning_rate": 5.232007268479459e-05, - "loss": 0.0256, + "epoch": 0.99, + "learning_rate": 0.00015220444438707344, + "loss": 0.0418, "step": 152660 }, { - "epoch": 1.65, - "learning_rate": 5.230384840028554e-05, - "loss": 0.0373, + "epoch": 0.99, + "learning_rate": 0.00015219476303271652, + "loss": 0.0337, "step": 152670 }, { - "epoch": 1.65, - "learning_rate": 5.228762411577649e-05, - "loss": 0.0274, + "epoch": 0.99, + "learning_rate": 0.0001521850816783596, + "loss": 0.0369, "step": 152680 }, { - "epoch": 1.65, - "learning_rate": 5.2271399831267434e-05, - "loss": 0.0291, + "epoch": 0.99, + "learning_rate": 0.00015217540032400265, + "loss": 0.0408, "step": 152690 }, { - "epoch": 1.65, - "learning_rate": 5.2255175546758384e-05, - "loss": 0.0257, + "epoch": 0.99, + "learning_rate": 0.0001521657189696457, + "loss": 0.0408, "step": 152700 }, { - "epoch": 1.65, - "learning_rate": 5.223895126224933e-05, - "loss": 0.0185, + "epoch": 0.99, + "learning_rate": 0.00015215603761528878, + "loss": 0.0344, "step": 152710 }, { - "epoch": 1.65, - "learning_rate": 5.222272697774028e-05, - "loss": 0.0279, + "epoch": 0.99, + "learning_rate": 0.00015214635626093184, + "loss": 0.0346, "step": 152720 }, { - "epoch": 1.65, - "learning_rate": 5.220650269323122e-05, - "loss": 0.0217, + "epoch": 0.99, + "learning_rate": 0.00015213667490657492, + "loss": 0.0329, "step": 152730 }, { - "epoch": 1.65, - "learning_rate": 5.219027840872217e-05, - "loss": 0.0256, + "epoch": 0.99, + "learning_rate": 0.000152126993552218, + "loss": 0.0378, "step": 152740 }, { - "epoch": 1.65, - "learning_rate": 5.217405412421312e-05, - "loss": 0.0277, + "epoch": 0.99, + "learning_rate": 0.00015211731219786108, + "loss": 0.0363, "step": 152750 }, { - "epoch": 1.65, - "learning_rate": 5.215782983970406e-05, - "loss": 0.0274, + "epoch": 0.99, + "learning_rate": 0.00015210763084350413, + "loss": 0.0375, "step": 152760 }, { - "epoch": 1.65, - "learning_rate": 5.214160555519501e-05, - "loss": 0.0276, + "epoch": 0.99, + "learning_rate": 0.00015209794948914718, + "loss": 0.044, "step": 152770 }, { - "epoch": 1.65, - "learning_rate": 5.2125381270685955e-05, - "loss": 0.0289, + "epoch": 0.99, + "learning_rate": 0.00015208826813479023, + "loss": 0.0331, "step": 152780 }, { - "epoch": 1.65, - "learning_rate": 5.2109156986176905e-05, - "loss": 0.0286, + "epoch": 0.99, + "learning_rate": 0.00015207858678043331, + "loss": 0.0323, "step": 152790 }, { - "epoch": 1.65, - "learning_rate": 5.209293270166785e-05, - "loss": 0.024, + "epoch": 0.99, + "learning_rate": 0.0001520689054260764, + "loss": 0.032, "step": 152800 }, { - "epoch": 1.65, - "learning_rate": 5.20767084171588e-05, - "loss": 0.0319, + "epoch": 0.99, + "learning_rate": 0.00015205922407171947, + "loss": 0.0359, "step": 152810 }, { - "epoch": 1.65, - "learning_rate": 5.206048413264974e-05, - "loss": 0.0282, + "epoch": 0.99, + "learning_rate": 0.00015204954271736253, + "loss": 0.0333, "step": 152820 }, { - "epoch": 1.65, - "learning_rate": 5.204425984814069e-05, - "loss": 0.0223, + "epoch": 0.99, + "learning_rate": 0.0001520398613630056, + "loss": 0.0323, "step": 152830 }, { - "epoch": 1.65, - "learning_rate": 5.202803556363164e-05, - "loss": 0.0302, + "epoch": 0.99, + "learning_rate": 0.00015203018000864866, + "loss": 0.0334, "step": 152840 }, { - "epoch": 1.65, - "learning_rate": 5.201181127912258e-05, - "loss": 0.024, + "epoch": 0.99, + "learning_rate": 0.0001520204986542917, + "loss": 0.0327, "step": 152850 }, { - "epoch": 1.65, - "learning_rate": 5.199558699461353e-05, - "loss": 0.0275, + "epoch": 0.99, + "learning_rate": 0.0001520108172999348, + "loss": 0.0384, "step": 152860 }, { - "epoch": 1.65, - "learning_rate": 5.1979362710104476e-05, - "loss": 0.0281, + "epoch": 0.99, + "learning_rate": 0.00015200113594557787, + "loss": 0.035, "step": 152870 }, { - "epoch": 1.65, - "learning_rate": 5.1963138425595426e-05, - "loss": 0.0285, + "epoch": 0.99, + "learning_rate": 0.00015199145459122095, + "loss": 0.0447, "step": 152880 }, { - "epoch": 1.65, - "learning_rate": 5.194691414108637e-05, - "loss": 0.031, + "epoch": 0.99, + "learning_rate": 0.000151981773236864, + "loss": 0.0348, "step": 152890 }, { - "epoch": 1.65, - "learning_rate": 5.193068985657732e-05, - "loss": 0.032, + "epoch": 0.99, + "learning_rate": 0.00015197209188250708, + "loss": 0.0357, "step": 152900 }, { - "epoch": 1.65, - "learning_rate": 5.191446557206826e-05, - "loss": 0.0288, + "epoch": 0.99, + "learning_rate": 0.00015196241052815014, + "loss": 0.0307, "step": 152910 }, { - "epoch": 1.65, - "learning_rate": 5.189824128755921e-05, - "loss": 0.0263, + "epoch": 0.99, + "learning_rate": 0.0001519527291737932, + "loss": 0.0346, "step": 152920 }, { - "epoch": 1.65, - "learning_rate": 5.188201700305016e-05, - "loss": 0.0236, + "epoch": 0.99, + "learning_rate": 0.00015194304781943627, + "loss": 0.0355, "step": 152930 }, { - "epoch": 1.65, - "learning_rate": 5.1865792718541104e-05, - "loss": 0.0277, + "epoch": 0.99, + "learning_rate": 0.00015193336646507935, + "loss": 0.0384, "step": 152940 }, { - "epoch": 1.65, - "learning_rate": 5.1849568434032054e-05, - "loss": 0.0257, + "epoch": 0.99, + "learning_rate": 0.00015192368511072243, + "loss": 0.0392, "step": 152950 }, { - "epoch": 1.65, - "learning_rate": 5.1833344149523e-05, - "loss": 0.0265, + "epoch": 0.99, + "learning_rate": 0.00015191400375636548, + "loss": 0.0386, "step": 152960 }, { - "epoch": 1.65, - "learning_rate": 5.1817119865013947e-05, - "loss": 0.0243, + "epoch": 0.99, + "learning_rate": 0.00015190432240200856, + "loss": 0.0352, "step": 152970 }, { - "epoch": 1.65, - "learning_rate": 5.180089558050489e-05, - "loss": 0.0278, + "epoch": 0.99, + "learning_rate": 0.00015189464104765159, + "loss": 0.0438, "step": 152980 }, { - "epoch": 1.65, - "learning_rate": 5.178467129599584e-05, - "loss": 0.032, + "epoch": 0.99, + "learning_rate": 0.00015188495969329467, + "loss": 0.0362, "step": 152990 }, { - "epoch": 1.65, - "learning_rate": 5.176844701148678e-05, - "loss": 0.0284, + "epoch": 0.99, + "learning_rate": 0.00015187527833893775, + "loss": 0.0355, "step": 153000 }, { - "epoch": 1.65, - "eval_cer": 0.9210315209535976, - "eval_loss": 0.02240966632962227, - "eval_runtime": 118.9535, - "eval_samples_per_second": 16.813, - "eval_steps_per_second": 4.203, + "epoch": 0.99, + "eval_cer": 0.9198879222686702, + "eval_loss": 0.02557929791510105, + "eval_runtime": 119.8042, + "eval_samples_per_second": 16.694, + "eval_steps_per_second": 4.173, "step": 153000 }, { - "epoch": 1.65, - "learning_rate": 5.175222272697773e-05, - "loss": 0.0262, + "epoch": 0.99, + "learning_rate": 0.00015186559698458083, + "loss": 0.0425, "step": 153010 }, { - "epoch": 1.66, - "learning_rate": 5.173599844246868e-05, - "loss": 0.0253, + "epoch": 0.99, + "learning_rate": 0.00015185591563022388, + "loss": 0.0391, "step": 153020 }, { - "epoch": 1.66, - "learning_rate": 5.1719774157959625e-05, - "loss": 0.0275, + "epoch": 0.99, + "learning_rate": 0.00015184623427586696, + "loss": 0.0404, "step": 153030 }, { - "epoch": 1.66, - "learning_rate": 5.1703549873450575e-05, - "loss": 0.026, + "epoch": 0.99, + "learning_rate": 0.00015183655292151004, + "loss": 0.031, "step": 153040 }, { - "epoch": 1.66, - "learning_rate": 5.168732558894152e-05, - "loss": 0.0255, + "epoch": 0.99, + "learning_rate": 0.00015182687156715306, + "loss": 0.0379, "step": 153050 }, { - "epoch": 1.66, - "learning_rate": 5.167110130443247e-05, - "loss": 0.0286, + "epoch": 0.99, + "learning_rate": 0.00015181719021279614, + "loss": 0.0362, "step": 153060 }, { - "epoch": 1.66, - "learning_rate": 5.165487701992341e-05, - "loss": 0.026, + "epoch": 0.99, + "learning_rate": 0.00015180750885843922, + "loss": 0.0426, "step": 153070 }, { - "epoch": 1.66, - "learning_rate": 5.163865273541436e-05, - "loss": 0.0299, + "epoch": 0.99, + "learning_rate": 0.0001517978275040823, + "loss": 0.0393, "step": 153080 }, { - "epoch": 1.66, - "learning_rate": 5.162242845090531e-05, - "loss": 0.0233, + "epoch": 0.99, + "learning_rate": 0.00015178814614972536, + "loss": 0.0409, "step": 153090 }, { - "epoch": 1.66, - "learning_rate": 5.160620416639625e-05, - "loss": 0.0252, + "epoch": 0.99, + "learning_rate": 0.00015177846479536844, + "loss": 0.0344, "step": 153100 }, { - "epoch": 1.66, - "learning_rate": 5.15899798818872e-05, - "loss": 0.0273, + "epoch": 0.99, + "learning_rate": 0.00015176878344101152, + "loss": 0.0465, "step": 153110 }, { - "epoch": 1.66, - "learning_rate": 5.157375559737815e-05, - "loss": 0.0241, + "epoch": 0.99, + "learning_rate": 0.00015175910208665454, + "loss": 0.0384, "step": 153120 }, { - "epoch": 1.66, - "learning_rate": 5.15575313128691e-05, - "loss": 0.0247, + "epoch": 0.99, + "learning_rate": 0.00015174942073229762, + "loss": 0.0392, "step": 153130 }, { - "epoch": 1.66, - "learning_rate": 5.154130702836005e-05, - "loss": 0.0275, + "epoch": 0.99, + "learning_rate": 0.0001517397393779407, + "loss": 0.0411, "step": 153140 }, { - "epoch": 1.66, - "learning_rate": 5.1525082743850995e-05, - "loss": 0.0284, + "epoch": 0.99, + "learning_rate": 0.00015173005802358378, + "loss": 0.0366, "step": 153150 }, { - "epoch": 1.66, - "learning_rate": 5.1508858459341945e-05, - "loss": 0.0306, + "epoch": 0.99, + "learning_rate": 0.00015172037666922683, + "loss": 0.0387, "step": 153160 }, { - "epoch": 1.66, - "learning_rate": 5.149263417483289e-05, - "loss": 0.0319, + "epoch": 0.99, + "learning_rate": 0.0001517106953148699, + "loss": 0.0325, "step": 153170 }, { - "epoch": 1.66, - "learning_rate": 5.147640989032384e-05, - "loss": 0.0248, + "epoch": 0.99, + "learning_rate": 0.000151701013960513, + "loss": 0.0402, "step": 153180 }, { - "epoch": 1.66, - "learning_rate": 5.146018560581478e-05, - "loss": 0.0324, + "epoch": 0.99, + "learning_rate": 0.00015169133260615602, + "loss": 0.0407, "step": 153190 }, { - "epoch": 1.66, - "learning_rate": 5.144396132130573e-05, - "loss": 0.0279, + "epoch": 0.99, + "learning_rate": 0.0001516816512517991, + "loss": 0.038, "step": 153200 }, { - "epoch": 1.66, - "learning_rate": 5.142773703679667e-05, - "loss": 0.0313, + "epoch": 0.99, + "learning_rate": 0.00015167196989744218, + "loss": 0.0362, "step": 153210 }, { - "epoch": 1.66, - "learning_rate": 5.141151275228762e-05, - "loss": 0.0227, + "epoch": 0.99, + "learning_rate": 0.00015166228854308523, + "loss": 0.037, "step": 153220 }, { - "epoch": 1.66, - "learning_rate": 5.139528846777857e-05, - "loss": 0.0268, + "epoch": 0.99, + "learning_rate": 0.0001516526071887283, + "loss": 0.0366, "step": 153230 }, { - "epoch": 1.66, - "learning_rate": 5.1379064183269516e-05, - "loss": 0.0307, + "epoch": 0.99, + "learning_rate": 0.0001516429258343714, + "loss": 0.0345, "step": 153240 }, { - "epoch": 1.66, - "learning_rate": 5.1362839898760466e-05, - "loss": 0.0298, + "epoch": 0.99, + "learning_rate": 0.00015163324448001447, + "loss": 0.038, "step": 153250 }, { - "epoch": 1.66, - "learning_rate": 5.134661561425141e-05, - "loss": 0.0265, + "epoch": 0.99, + "learning_rate": 0.0001516235631256575, + "loss": 0.0396, "step": 153260 }, { - "epoch": 1.66, - "learning_rate": 5.133039132974236e-05, - "loss": 0.0277, + "epoch": 0.99, + "learning_rate": 0.00015161388177130058, + "loss": 0.0327, "step": 153270 }, { - "epoch": 1.66, - "learning_rate": 5.13141670452333e-05, - "loss": 0.0276, + "epoch": 0.99, + "learning_rate": 0.00015160420041694365, + "loss": 0.0447, "step": 153280 }, { - "epoch": 1.66, - "learning_rate": 5.129794276072425e-05, - "loss": 0.0261, + "epoch": 0.99, + "learning_rate": 0.0001515945190625867, + "loss": 0.0414, "step": 153290 }, { - "epoch": 1.66, - "learning_rate": 5.1281718476215194e-05, - "loss": 0.0269, + "epoch": 0.99, + "learning_rate": 0.0001515848377082298, + "loss": 0.0441, "step": 153300 }, { - "epoch": 1.66, - "learning_rate": 5.1265494191706144e-05, - "loss": 0.0267, + "epoch": 0.99, + "learning_rate": 0.00015157515635387287, + "loss": 0.0344, "step": 153310 }, { - "epoch": 1.66, - "learning_rate": 5.1249269907197094e-05, - "loss": 0.0265, + "epoch": 0.99, + "learning_rate": 0.00015156547499951595, + "loss": 0.0416, "step": 153320 }, { - "epoch": 1.66, - "learning_rate": 5.123304562268804e-05, - "loss": 0.0256, + "epoch": 0.99, + "learning_rate": 0.00015155579364515897, + "loss": 0.0354, "step": 153330 }, { - "epoch": 1.66, - "learning_rate": 5.1216821338178986e-05, - "loss": 0.0276, + "epoch": 0.99, + "learning_rate": 0.00015154611229080205, + "loss": 0.0427, "step": 153340 }, { - "epoch": 1.66, - "learning_rate": 5.120059705366993e-05, - "loss": 0.0256, + "epoch": 0.99, + "learning_rate": 0.00015153643093644513, + "loss": 0.0309, "step": 153350 }, { - "epoch": 1.66, - "learning_rate": 5.118437276916088e-05, - "loss": 0.0287, + "epoch": 0.99, + "learning_rate": 0.00015152674958208818, + "loss": 0.041, "step": 153360 }, { - "epoch": 1.66, - "learning_rate": 5.116814848465182e-05, - "loss": 0.0262, + "epoch": 0.99, + "learning_rate": 0.00015151706822773126, + "loss": 0.0345, "step": 153370 }, { - "epoch": 1.66, - "learning_rate": 5.115192420014277e-05, - "loss": 0.0235, + "epoch": 0.99, + "learning_rate": 0.00015150738687337434, + "loss": 0.0355, "step": 153380 }, { - "epoch": 1.66, - "learning_rate": 5.1135699915633715e-05, - "loss": 0.0238, + "epoch": 0.99, + "learning_rate": 0.0001514977055190174, + "loss": 0.0341, "step": 153390 }, { - "epoch": 1.66, - "learning_rate": 5.1119475631124665e-05, - "loss": 0.0239, + "epoch": 0.99, + "learning_rate": 0.00015148802416466045, + "loss": 0.039, "step": 153400 }, { - "epoch": 1.66, - "learning_rate": 5.1103251346615615e-05, - "loss": 0.0269, + "epoch": 0.99, + "learning_rate": 0.00015147834281030353, + "loss": 0.047, "step": 153410 }, { - "epoch": 1.66, - "learning_rate": 5.108702706210656e-05, - "loss": 0.0353, + "epoch": 0.99, + "learning_rate": 0.00015146866145594658, + "loss": 0.0374, "step": 153420 }, { - "epoch": 1.66, - "learning_rate": 5.107080277759751e-05, - "loss": 0.0238, + "epoch": 0.99, + "learning_rate": 0.00015145898010158966, + "loss": 0.0427, "step": 153430 }, { - "epoch": 1.66, - "learning_rate": 5.105457849308845e-05, - "loss": 0.0311, + "epoch": 0.99, + "learning_rate": 0.00015144929874723274, + "loss": 0.0364, "step": 153440 }, { - "epoch": 1.66, - "learning_rate": 5.10383542085794e-05, - "loss": 0.022, + "epoch": 0.99, + "learning_rate": 0.00015143961739287582, + "loss": 0.0384, "step": 153450 }, { - "epoch": 1.66, - "learning_rate": 5.102212992407034e-05, - "loss": 0.0261, + "epoch": 0.99, + "learning_rate": 0.00015142993603851887, + "loss": 0.0386, "step": 153460 }, { - "epoch": 1.66, - "learning_rate": 5.100590563956129e-05, - "loss": 0.0228, + "epoch": 0.99, + "learning_rate": 0.00015142025468416193, + "loss": 0.0394, "step": 153470 }, { - "epoch": 1.66, - "learning_rate": 5.098968135505224e-05, - "loss": 0.0251, + "epoch": 0.99, + "learning_rate": 0.000151410573329805, + "loss": 0.0375, "step": 153480 }, { - "epoch": 1.66, - "learning_rate": 5.0973457070543186e-05, - "loss": 0.0269, + "epoch": 0.99, + "learning_rate": 0.00015140089197544806, + "loss": 0.0416, "step": 153490 }, { - "epoch": 1.66, - "learning_rate": 5.0957232786034135e-05, - "loss": 0.0248, + "epoch": 0.99, + "learning_rate": 0.00015139121062109114, + "loss": 0.0318, "step": 153500 }, { - "epoch": 1.66, - "learning_rate": 5.094100850152508e-05, - "loss": 0.0295, + "epoch": 0.99, + "learning_rate": 0.00015138152926673422, + "loss": 0.0408, "step": 153510 }, { - "epoch": 1.66, - "learning_rate": 5.092478421701603e-05, - "loss": 0.0298, + "epoch": 0.99, + "learning_rate": 0.0001513718479123773, + "loss": 0.0471, "step": 153520 }, { - "epoch": 1.66, - "learning_rate": 5.090855993250697e-05, - "loss": 0.0275, + "epoch": 0.99, + "learning_rate": 0.00015136216655802035, + "loss": 0.0348, "step": 153530 }, { - "epoch": 1.66, - "learning_rate": 5.089233564799792e-05, - "loss": 0.0249, + "epoch": 0.99, + "learning_rate": 0.0001513524852036634, + "loss": 0.0393, "step": 153540 }, { - "epoch": 1.66, - "learning_rate": 5.0876111363488864e-05, - "loss": 0.0259, + "epoch": 0.99, + "learning_rate": 0.00015134280384930648, + "loss": 0.0378, "step": 153550 }, { - "epoch": 1.66, - "learning_rate": 5.0859887078979814e-05, - "loss": 0.0385, + "epoch": 0.99, + "learning_rate": 0.00015133312249494954, + "loss": 0.0372, "step": 153560 }, { - "epoch": 1.66, - "learning_rate": 5.0843662794470763e-05, - "loss": 0.0258, + "epoch": 0.99, + "learning_rate": 0.00015132344114059262, + "loss": 0.0371, "step": 153570 }, { - "epoch": 1.66, - "learning_rate": 5.0827438509961706e-05, - "loss": 0.0307, + "epoch": 0.99, + "learning_rate": 0.0001513137597862357, + "loss": 0.0406, "step": 153580 }, { - "epoch": 1.66, - "learning_rate": 5.0811214225452656e-05, - "loss": 0.0288, + "epoch": 0.99, + "learning_rate": 0.00015130407843187875, + "loss": 0.0392, "step": 153590 }, { - "epoch": 1.66, - "learning_rate": 5.07949899409436e-05, - "loss": 0.0257, + "epoch": 0.99, + "learning_rate": 0.00015129439707752183, + "loss": 0.0424, "step": 153600 }, { - "epoch": 1.66, - "learning_rate": 5.077876565643455e-05, - "loss": 0.0258, + "epoch": 0.99, + "learning_rate": 0.00015128471572316488, + "loss": 0.0356, "step": 153610 }, { - "epoch": 1.66, - "learning_rate": 5.076254137192549e-05, - "loss": 0.0335, + "epoch": 0.99, + "learning_rate": 0.00015127503436880793, + "loss": 0.0429, "step": 153620 }, { - "epoch": 1.66, - "learning_rate": 5.074631708741644e-05, - "loss": 0.0335, + "epoch": 0.99, + "learning_rate": 0.00015126535301445101, + "loss": 0.0395, "step": 153630 }, { - "epoch": 1.66, - "learning_rate": 5.0730092802907385e-05, - "loss": 0.0278, + "epoch": 0.99, + "learning_rate": 0.0001512556716600941, + "loss": 0.042, "step": 153640 }, { - "epoch": 1.66, - "learning_rate": 5.0713868518398334e-05, - "loss": 0.026, + "epoch": 0.99, + "learning_rate": 0.00015124599030573717, + "loss": 0.0423, "step": 153650 }, { - "epoch": 1.66, - "learning_rate": 5.0697644233889284e-05, - "loss": 0.0271, + "epoch": 0.99, + "learning_rate": 0.00015123630895138023, + "loss": 0.0376, "step": 153660 }, { - "epoch": 1.66, - "learning_rate": 5.068141994938023e-05, - "loss": 0.0248, + "epoch": 0.99, + "learning_rate": 0.0001512266275970233, + "loss": 0.0343, "step": 153670 }, { - "epoch": 1.66, - "learning_rate": 5.066519566487118e-05, - "loss": 0.025, + "epoch": 0.99, + "learning_rate": 0.00015121694624266636, + "loss": 0.0331, "step": 153680 }, { - "epoch": 1.66, - "learning_rate": 5.064897138036212e-05, - "loss": 0.0252, + "epoch": 0.99, + "learning_rate": 0.0001512072648883094, + "loss": 0.0353, "step": 153690 }, { - "epoch": 1.66, - "learning_rate": 5.063274709585307e-05, - "loss": 0.0256, + "epoch": 0.99, + "learning_rate": 0.0001511975835339525, + "loss": 0.0396, "step": 153700 }, { - "epoch": 1.66, - "learning_rate": 5.061652281134401e-05, - "loss": 0.0266, + "epoch": 0.99, + "learning_rate": 0.00015118790217959557, + "loss": 0.0331, "step": 153710 }, { - "epoch": 1.66, - "learning_rate": 5.060029852683496e-05, - "loss": 0.0278, + "epoch": 0.99, + "learning_rate": 0.00015117822082523865, + "loss": 0.0341, "step": 153720 }, { - "epoch": 1.66, - "learning_rate": 5.0584074242325906e-05, - "loss": 0.0286, + "epoch": 0.99, + "learning_rate": 0.0001511685394708817, + "loss": 0.0409, "step": 153730 }, { - "epoch": 1.66, - "learning_rate": 5.0567849957816855e-05, - "loss": 0.0274, + "epoch": 0.99, + "learning_rate": 0.00015115885811652478, + "loss": 0.0355, "step": 153740 }, { - "epoch": 1.66, - "learning_rate": 5.0551625673307805e-05, - "loss": 0.0245, + "epoch": 0.99, + "learning_rate": 0.00015114917676216784, + "loss": 0.0358, "step": 153750 }, { - "epoch": 1.66, - "learning_rate": 5.053540138879875e-05, - "loss": 0.0272, + "epoch": 0.99, + "learning_rate": 0.0001511394954078109, + "loss": 0.0354, "step": 153760 }, { - "epoch": 1.66, - "learning_rate": 5.05191771042897e-05, - "loss": 0.0351, + "epoch": 0.99, + "learning_rate": 0.00015112981405345397, + "loss": 0.0332, "step": 153770 }, { - "epoch": 1.66, - "learning_rate": 5.050295281978064e-05, - "loss": 0.0319, + "epoch": 0.99, + "learning_rate": 0.00015112013269909705, + "loss": 0.0489, "step": 153780 }, { - "epoch": 1.66, - "learning_rate": 5.048672853527159e-05, - "loss": 0.0261, + "epoch": 0.99, + "learning_rate": 0.0001511104513447401, + "loss": 0.0394, "step": 153790 }, { - "epoch": 1.66, - "learning_rate": 5.0470504250762534e-05, - "loss": 0.0283, + "epoch": 0.99, + "learning_rate": 0.00015110076999038318, + "loss": 0.0351, "step": 153800 }, { - "epoch": 1.66, - "learning_rate": 5.045427996625348e-05, - "loss": 0.0312, + "epoch": 0.99, + "learning_rate": 0.00015109108863602626, + "loss": 0.0384, "step": 153810 }, { - "epoch": 1.66, - "learning_rate": 5.043805568174443e-05, - "loss": 0.0305, + "epoch": 0.99, + "learning_rate": 0.00015108140728166929, + "loss": 0.0358, "step": 153820 }, { - "epoch": 1.66, - "learning_rate": 5.0421831397235376e-05, - "loss": 0.0325, + "epoch": 0.99, + "learning_rate": 0.00015107172592731237, + "loss": 0.043, "step": 153830 }, { - "epoch": 1.66, - "learning_rate": 5.0405607112726326e-05, - "loss": 0.0284, + "epoch": 0.99, + "learning_rate": 0.00015106204457295545, + "loss": 0.04, "step": 153840 }, { - "epoch": 1.66, - "learning_rate": 5.038938282821727e-05, - "loss": 0.0236, + "epoch": 0.99, + "learning_rate": 0.00015105236321859853, + "loss": 0.0359, "step": 153850 }, { - "epoch": 1.66, - "learning_rate": 5.037315854370822e-05, - "loss": 0.0307, + "epoch": 0.99, + "learning_rate": 0.00015104268186424158, + "loss": 0.0402, "step": 153860 }, { - "epoch": 1.66, - "learning_rate": 5.035693425919916e-05, - "loss": 0.0238, + "epoch": 0.99, + "learning_rate": 0.00015103300050988466, + "loss": 0.0373, "step": 153870 }, { - "epoch": 1.66, - "learning_rate": 5.034070997469011e-05, - "loss": 0.0276, + "epoch": 0.99, + "learning_rate": 0.00015102331915552774, + "loss": 0.0422, "step": 153880 }, { - "epoch": 1.66, - "learning_rate": 5.0324485690181054e-05, - "loss": 0.0334, + "epoch": 0.99, + "learning_rate": 0.00015101363780117076, + "loss": 0.0354, "step": 153890 }, { - "epoch": 1.66, - "learning_rate": 5.0308261405672004e-05, - "loss": 0.0208, + "epoch": 0.99, + "learning_rate": 0.00015100395644681384, + "loss": 0.0377, "step": 153900 }, { - "epoch": 1.66, - "learning_rate": 5.0292037121162954e-05, - "loss": 0.0334, + "epoch": 0.99, + "learning_rate": 0.00015099427509245692, + "loss": 0.0322, "step": 153910 }, { - "epoch": 1.66, - "learning_rate": 5.02758128366539e-05, - "loss": 0.0214, + "epoch": 0.99, + "learning_rate": 0.0001509845937381, + "loss": 0.0385, "step": 153920 }, { - "epoch": 1.66, - "learning_rate": 5.025958855214485e-05, - "loss": 0.0311, + "epoch": 0.99, + "learning_rate": 0.00015097491238374306, + "loss": 0.0392, "step": 153930 }, { - "epoch": 1.67, - "learning_rate": 5.024336426763579e-05, - "loss": 0.0286, + "epoch": 0.99, + "learning_rate": 0.00015096523102938614, + "loss": 0.0372, "step": 153940 }, { - "epoch": 1.67, - "learning_rate": 5.022713998312674e-05, - "loss": 0.0235, + "epoch": 0.99, + "learning_rate": 0.00015095554967502921, + "loss": 0.0447, "step": 153950 }, { - "epoch": 1.67, - "learning_rate": 5.021091569861768e-05, - "loss": 0.0252, + "epoch": 0.99, + "learning_rate": 0.00015094586832067224, + "loss": 0.0374, "step": 153960 }, { - "epoch": 1.67, - "learning_rate": 5.019469141410863e-05, - "loss": 0.0301, + "epoch": 0.99, + "learning_rate": 0.00015093618696631532, + "loss": 0.039, "step": 153970 }, { - "epoch": 1.67, - "learning_rate": 5.0178467129599575e-05, - "loss": 0.0286, + "epoch": 0.99, + "learning_rate": 0.0001509265056119584, + "loss": 0.0325, "step": 153980 }, { - "epoch": 1.67, - "learning_rate": 5.0162242845090525e-05, - "loss": 0.0273, + "epoch": 0.99, + "learning_rate": 0.00015091682425760145, + "loss": 0.0432, "step": 153990 }, { - "epoch": 1.67, - "learning_rate": 5.0146018560581475e-05, - "loss": 0.0254, + "epoch": 0.99, + "learning_rate": 0.00015090714290324453, + "loss": 0.0396, "step": 154000 }, { - "epoch": 1.67, - "eval_cer": 0.9210889474344499, - "eval_loss": 0.022017398849129677, - "eval_runtime": 118.9259, - "eval_samples_per_second": 16.817, - "eval_steps_per_second": 4.204, + "epoch": 0.99, + "eval_cer": 0.9199123262908147, + "eval_loss": 0.025343097746372223, + "eval_runtime": 119.9926, + "eval_samples_per_second": 16.668, + "eval_steps_per_second": 4.167, "step": 154000 }, { - "epoch": 1.67, - "learning_rate": 5.012979427607242e-05, - "loss": 0.0278, + "epoch": 0.99, + "learning_rate": 0.0001508974615488876, + "loss": 0.0374, "step": 154010 }, { - "epoch": 1.67, - "learning_rate": 5.011356999156337e-05, - "loss": 0.0289, + "epoch": 0.99, + "learning_rate": 0.0001508877801945307, + "loss": 0.04, "step": 154020 }, { - "epoch": 1.67, - "learning_rate": 5.009734570705431e-05, - "loss": 0.0277, + "epoch": 0.99, + "learning_rate": 0.00015087809884017372, + "loss": 0.0331, "step": 154030 }, { - "epoch": 1.67, - "learning_rate": 5.008112142254526e-05, - "loss": 0.0303, + "epoch": 0.99, + "learning_rate": 0.0001508684174858168, + "loss": 0.038, "step": 154040 }, { - "epoch": 1.67, - "learning_rate": 5.00648971380362e-05, - "loss": 0.0334, + "epoch": 0.99, + "learning_rate": 0.00015085873613145988, + "loss": 0.0362, "step": 154050 }, { - "epoch": 1.67, - "learning_rate": 5.004867285352715e-05, - "loss": 0.0283, + "epoch": 0.99, + "learning_rate": 0.00015084905477710293, + "loss": 0.0374, "step": 154060 }, { - "epoch": 1.67, - "learning_rate": 5.0032448569018096e-05, - "loss": 0.026, + "epoch": 0.99, + "learning_rate": 0.000150839373422746, + "loss": 0.0358, "step": 154070 }, { - "epoch": 1.67, - "learning_rate": 5.0016224284509046e-05, - "loss": 0.0311, + "epoch": 0.99, + "learning_rate": 0.0001508296920683891, + "loss": 0.0405, "step": 154080 }, { - "epoch": 1.67, - "learning_rate": 4.9999999999999996e-05, - "loss": 0.0262, + "epoch": 0.99, + "learning_rate": 0.00015082001071403217, + "loss": 0.0442, "step": 154090 }, { - "epoch": 1.67, - "learning_rate": 4.998377571549094e-05, - "loss": 0.0259, + "epoch": 0.99, + "learning_rate": 0.0001508103293596752, + "loss": 0.0371, "step": 154100 }, { - "epoch": 1.67, - "learning_rate": 4.996755143098189e-05, - "loss": 0.026, + "epoch": 0.99, + "learning_rate": 0.00015080064800531827, + "loss": 0.036, "step": 154110 }, { - "epoch": 1.67, - "learning_rate": 4.995132714647283e-05, - "loss": 0.0294, + "epoch": 0.99, + "learning_rate": 0.00015079096665096135, + "loss": 0.0368, "step": 154120 }, { - "epoch": 1.67, - "learning_rate": 4.993510286196378e-05, - "loss": 0.0272, + "epoch": 0.99, + "learning_rate": 0.0001507812852966044, + "loss": 0.043, "step": 154130 }, { - "epoch": 1.67, - "learning_rate": 4.9918878577454724e-05, - "loss": 0.0348, + "epoch": 0.99, + "learning_rate": 0.0001507716039422475, + "loss": 0.0322, "step": 154140 }, { - "epoch": 1.67, - "learning_rate": 4.9902654292945674e-05, - "loss": 0.0278, + "epoch": 0.99, + "learning_rate": 0.00015076192258789057, + "loss": 0.0413, "step": 154150 }, { - "epoch": 1.67, - "learning_rate": 4.9886430008436624e-05, - "loss": 0.0246, + "epoch": 0.99, + "learning_rate": 0.00015075224123353362, + "loss": 0.033, "step": 154160 }, { - "epoch": 1.67, - "learning_rate": 4.987020572392757e-05, - "loss": 0.0351, + "epoch": 1.0, + "learning_rate": 0.00015074255987917667, + "loss": 0.0385, "step": 154170 }, { - "epoch": 1.67, - "learning_rate": 4.9853981439418516e-05, - "loss": 0.0246, + "epoch": 1.0, + "learning_rate": 0.00015073287852481975, + "loss": 0.0334, "step": 154180 }, { - "epoch": 1.67, - "learning_rate": 4.983775715490946e-05, - "loss": 0.0235, + "epoch": 1.0, + "learning_rate": 0.0001507231971704628, + "loss": 0.0389, "step": 154190 }, { - "epoch": 1.67, - "learning_rate": 4.982153287040041e-05, - "loss": 0.0263, + "epoch": 1.0, + "learning_rate": 0.00015071351581610588, + "loss": 0.0385, "step": 154200 }, { - "epoch": 1.67, - "learning_rate": 4.980530858589135e-05, - "loss": 0.0282, + "epoch": 1.0, + "learning_rate": 0.00015070383446174896, + "loss": 0.0392, "step": 154210 }, { - "epoch": 1.67, - "learning_rate": 4.97890843013823e-05, - "loss": 0.027, + "epoch": 1.0, + "learning_rate": 0.00015069415310739204, + "loss": 0.0396, "step": 154220 }, { - "epoch": 1.67, - "learning_rate": 4.9772860016873245e-05, - "loss": 0.0275, + "epoch": 1.0, + "learning_rate": 0.0001506844717530351, + "loss": 0.0373, "step": 154230 }, { - "epoch": 1.67, - "learning_rate": 4.9756635732364195e-05, - "loss": 0.0323, + "epoch": 1.0, + "learning_rate": 0.00015067479039867815, + "loss": 0.0387, "step": 154240 }, { - "epoch": 1.67, - "learning_rate": 4.9740411447855145e-05, - "loss": 0.0235, + "epoch": 1.0, + "learning_rate": 0.00015066510904432123, + "loss": 0.0381, "step": 154250 }, { - "epoch": 1.67, - "learning_rate": 4.972418716334609e-05, - "loss": 0.0265, + "epoch": 1.0, + "learning_rate": 0.00015065542768996428, + "loss": 0.0338, "step": 154260 }, { - "epoch": 1.67, - "learning_rate": 4.970796287883704e-05, - "loss": 0.0266, + "epoch": 1.0, + "learning_rate": 0.00015064574633560736, + "loss": 0.0395, "step": 154270 }, { - "epoch": 1.67, - "learning_rate": 4.969173859432798e-05, - "loss": 0.0248, + "epoch": 1.0, + "learning_rate": 0.00015063606498125044, + "loss": 0.0399, "step": 154280 }, { - "epoch": 1.67, - "learning_rate": 4.967551430981894e-05, - "loss": 0.0304, + "epoch": 1.0, + "learning_rate": 0.00015062638362689352, + "loss": 0.036, "step": 154290 }, { - "epoch": 1.67, - "learning_rate": 4.9659290025309887e-05, - "loss": 0.0313, + "epoch": 1.0, + "learning_rate": 0.00015061670227253657, + "loss": 0.0389, "step": 154300 }, { - "epoch": 1.67, - "learning_rate": 4.964306574080083e-05, - "loss": 0.0269, + "epoch": 1.0, + "learning_rate": 0.00015060702091817963, + "loss": 0.0396, "step": 154310 }, { - "epoch": 1.67, - "learning_rate": 4.962684145629178e-05, - "loss": 0.0242, + "epoch": 1.0, + "learning_rate": 0.0001505973395638227, + "loss": 0.0352, "step": 154320 }, { - "epoch": 1.67, - "learning_rate": 4.961061717178272e-05, - "loss": 0.0254, + "epoch": 1.0, + "learning_rate": 0.00015058765820946576, + "loss": 0.0362, "step": 154330 }, { - "epoch": 1.67, - "learning_rate": 4.959439288727367e-05, - "loss": 0.0257, + "epoch": 1.0, + "learning_rate": 0.00015057797685510884, + "loss": 0.0448, "step": 154340 }, { - "epoch": 1.67, - "learning_rate": 4.9578168602764615e-05, - "loss": 0.0238, + "epoch": 1.0, + "learning_rate": 0.00015056829550075192, + "loss": 0.0416, "step": 154350 }, { - "epoch": 1.67, - "learning_rate": 4.9561944318255565e-05, - "loss": 0.0264, + "epoch": 1.0, + "learning_rate": 0.00015055861414639497, + "loss": 0.0471, "step": 154360 }, { - "epoch": 1.67, - "learning_rate": 4.954572003374651e-05, - "loss": 0.0239, + "epoch": 1.0, + "learning_rate": 0.00015054893279203805, + "loss": 0.0417, "step": 154370 }, { - "epoch": 1.67, - "learning_rate": 4.952949574923746e-05, - "loss": 0.0273, + "epoch": 1.0, + "learning_rate": 0.0001505392514376811, + "loss": 0.0401, "step": 154380 }, { - "epoch": 1.67, - "learning_rate": 4.951327146472841e-05, - "loss": 0.0295, + "epoch": 1.0, + "learning_rate": 0.00015052957008332416, + "loss": 0.0378, "step": 154390 }, { - "epoch": 1.67, - "learning_rate": 4.949704718021935e-05, - "loss": 0.0329, + "epoch": 1.0, + "learning_rate": 0.00015051988872896724, + "loss": 0.036, "step": 154400 }, { - "epoch": 1.67, - "learning_rate": 4.94808228957103e-05, - "loss": 0.027, + "epoch": 1.0, + "learning_rate": 0.00015051020737461032, + "loss": 0.0337, "step": 154410 }, { - "epoch": 1.67, - "learning_rate": 4.946459861120124e-05, - "loss": 0.0223, + "epoch": 1.0, + "learning_rate": 0.0001505005260202534, + "loss": 0.0341, "step": 154420 }, { - "epoch": 1.67, - "learning_rate": 4.944837432669219e-05, - "loss": 0.0254, + "epoch": 1.0, + "learning_rate": 0.00015049084466589645, + "loss": 0.0363, "step": 154430 }, { - "epoch": 1.67, - "learning_rate": 4.9432150042183136e-05, - "loss": 0.0287, + "epoch": 1.0, + "learning_rate": 0.00015048116331153953, + "loss": 0.0313, "step": 154440 }, { - "epoch": 1.67, - "learning_rate": 4.9415925757674086e-05, - "loss": 0.0243, + "epoch": 1.0, + "learning_rate": 0.00015047148195718258, + "loss": 0.042, "step": 154450 }, { - "epoch": 1.67, - "learning_rate": 4.939970147316503e-05, - "loss": 0.0236, + "epoch": 1.0, + "learning_rate": 0.00015046180060282563, + "loss": 0.0382, "step": 154460 }, { - "epoch": 1.67, - "learning_rate": 4.938347718865598e-05, - "loss": 0.0253, + "epoch": 1.0, + "learning_rate": 0.0001504521192484687, + "loss": 0.0356, "step": 154470 }, { - "epoch": 1.67, - "learning_rate": 4.936725290414693e-05, - "loss": 0.0298, + "epoch": 1.0, + "learning_rate": 0.0001504424378941118, + "loss": 0.0415, "step": 154480 }, { - "epoch": 1.67, - "learning_rate": 4.935102861963787e-05, - "loss": 0.0237, + "epoch": 1.0, + "learning_rate": 0.00015043275653975487, + "loss": 0.0381, "step": 154490 }, { - "epoch": 1.67, - "learning_rate": 4.933480433512882e-05, - "loss": 0.0283, + "epoch": 1.0, + "learning_rate": 0.00015042307518539793, + "loss": 0.0363, "step": 154500 }, { - "epoch": 1.67, - "learning_rate": 4.9318580050619764e-05, - "loss": 0.0257, + "epoch": 1.0, + "learning_rate": 0.000150413393831041, + "loss": 0.0416, "step": 154510 }, { - "epoch": 1.67, - "learning_rate": 4.9302355766110714e-05, - "loss": 0.0218, + "epoch": 1.0, + "learning_rate": 0.00015040371247668406, + "loss": 0.0367, "step": 154520 }, { - "epoch": 1.67, - "learning_rate": 4.928613148160166e-05, - "loss": 0.0257, + "epoch": 1.0, + "learning_rate": 0.0001503940311223271, + "loss": 0.0426, "step": 154530 }, { - "epoch": 1.67, - "learning_rate": 4.9269907197092607e-05, - "loss": 0.0279, + "epoch": 1.0, + "learning_rate": 0.0001503843497679702, + "loss": 0.041, "step": 154540 }, { - "epoch": 1.67, - "learning_rate": 4.9253682912583556e-05, - "loss": 0.0294, + "epoch": 1.0, + "learning_rate": 0.00015037466841361327, + "loss": 0.0385, "step": 154550 }, { - "epoch": 1.67, - "learning_rate": 4.92374586280745e-05, - "loss": 0.0251, + "epoch": 1.0, + "learning_rate": 0.00015036498705925632, + "loss": 0.0358, "step": 154560 }, { - "epoch": 1.67, - "learning_rate": 4.922123434356545e-05, - "loss": 0.0245, + "epoch": 1.0, + "learning_rate": 0.0001503553057048994, + "loss": 0.0352, "step": 154570 }, { - "epoch": 1.67, - "learning_rate": 4.920501005905639e-05, - "loss": 0.0298, + "epoch": 1.0, + "learning_rate": 0.00015034562435054248, + "loss": 0.0429, "step": 154580 }, { - "epoch": 1.67, - "learning_rate": 4.918878577454734e-05, - "loss": 0.0311, + "epoch": 1.0, + "learning_rate": 0.0001503359429961855, + "loss": 0.0408, "step": 154590 }, { - "epoch": 1.67, - "learning_rate": 4.9172561490038285e-05, - "loss": 0.0237, + "epoch": 1.0, + "learning_rate": 0.0001503262616418286, + "loss": 0.042, "step": 154600 }, { - "epoch": 1.67, - "learning_rate": 4.9156337205529235e-05, - "loss": 0.026, + "epoch": 1.0, + "learning_rate": 0.00015031658028747167, + "loss": 0.0409, "step": 154610 }, { - "epoch": 1.67, - "learning_rate": 4.914011292102018e-05, - "loss": 0.0268, - "step": 154620 + "epoch": 1.0, + "learning_rate": 0.00015030689893311475, + "loss": 0.0341, + "step": 154620 }, { - "epoch": 1.67, - "learning_rate": 4.912388863651113e-05, - "loss": 0.0308, + "epoch": 1.0, + "learning_rate": 0.0001502972175787578, + "loss": 0.0332, "step": 154630 }, { - "epoch": 1.67, - "learning_rate": 4.910766435200208e-05, - "loss": 0.0254, + "epoch": 1.0, + "learning_rate": 0.00015028753622440088, + "loss": 0.0356, "step": 154640 }, { - "epoch": 1.67, - "learning_rate": 4.909144006749302e-05, - "loss": 0.0263, + "epoch": 1.0, + "learning_rate": 0.00015027785487004396, + "loss": 0.0365, "step": 154650 }, { - "epoch": 1.67, - "learning_rate": 4.907521578298397e-05, - "loss": 0.027, + "epoch": 1.0, + "learning_rate": 0.00015026817351568699, + "loss": 0.0426, "step": 154660 }, { - "epoch": 1.67, - "learning_rate": 4.905899149847491e-05, - "loss": 0.0212, + "epoch": 1.0, + "learning_rate": 0.00015025849216133007, + "loss": 0.0361, "step": 154670 }, { - "epoch": 1.67, - "learning_rate": 4.904276721396586e-05, - "loss": 0.0278, + "epoch": 1.0, + "learning_rate": 0.00015024881080697315, + "loss": 0.0363, "step": 154680 }, { - "epoch": 1.67, - "learning_rate": 4.9026542929456806e-05, - "loss": 0.0306, + "epoch": 1.0, + "learning_rate": 0.00015023912945261623, + "loss": 0.0419, "step": 154690 }, { - "epoch": 1.67, - "learning_rate": 4.9010318644947755e-05, - "loss": 0.0248, + "epoch": 1.0, + "learning_rate": 0.00015022944809825928, + "loss": 0.0399, "step": 154700 }, { - "epoch": 1.67, - "learning_rate": 4.89940943604387e-05, - "loss": 0.0243, + "epoch": 1.0, + "learning_rate": 0.00015021976674390236, + "loss": 0.0393, "step": 154710 }, { - "epoch": 1.67, - "learning_rate": 4.897787007592965e-05, - "loss": 0.0316, + "epoch": 1.0, + "learning_rate": 0.00015021008538954544, + "loss": 0.0381, "step": 154720 }, { - "epoch": 1.67, - "learning_rate": 4.89616457914206e-05, - "loss": 0.0276, + "epoch": 1.0, + "learning_rate": 0.00015020040403518846, + "loss": 0.0335, "step": 154730 }, { - "epoch": 1.67, - "learning_rate": 4.894542150691154e-05, - "loss": 0.0289, + "epoch": 1.0, + "learning_rate": 0.00015019072268083154, + "loss": 0.0371, "step": 154740 }, { - "epoch": 1.67, - "learning_rate": 4.892919722240249e-05, - "loss": 0.029, + "epoch": 1.0, + "learning_rate": 0.00015018104132647462, + "loss": 0.0339, "step": 154750 }, { - "epoch": 1.67, - "learning_rate": 4.8912972937893434e-05, - "loss": 0.0409, + "epoch": 1.0, + "learning_rate": 0.00015017135997211768, + "loss": 0.0367, "step": 154760 }, { - "epoch": 1.67, - "learning_rate": 4.8896748653384384e-05, - "loss": 0.0275, + "epoch": 1.0, + "learning_rate": 0.00015016167861776075, + "loss": 0.0408, "step": 154770 }, { - "epoch": 1.67, - "learning_rate": 4.8880524368875327e-05, - "loss": 0.0311, + "epoch": 1.0, + "learning_rate": 0.00015015199726340383, + "loss": 0.0344, "step": 154780 }, { - "epoch": 1.67, - "learning_rate": 4.8864300084366276e-05, - "loss": 0.0224, + "epoch": 1.0, + "learning_rate": 0.00015014231590904691, + "loss": 0.0433, "step": 154790 }, { - "epoch": 1.67, - "learning_rate": 4.884807579985722e-05, - "loss": 0.0264, + "epoch": 1.0, + "learning_rate": 0.00015013263455468994, + "loss": 0.0355, "step": 154800 }, { - "epoch": 1.67, - "learning_rate": 4.883185151534817e-05, - "loss": 0.0319, + "epoch": 1.0, + "learning_rate": 0.00015012295320033302, + "loss": 0.0365, "step": 154810 }, { - "epoch": 1.67, - "learning_rate": 4.881562723083912e-05, - "loss": 0.0282, + "epoch": 1.0, + "learning_rate": 0.0001501132718459761, + "loss": 0.04, "step": 154820 }, { - "epoch": 1.67, - "learning_rate": 4.879940294633006e-05, - "loss": 0.0286, + "epoch": 1.0, + "learning_rate": 0.00015010359049161915, + "loss": 0.0355, "step": 154830 }, { - "epoch": 1.67, - "learning_rate": 4.878317866182101e-05, - "loss": 0.0333, + "epoch": 1.0, + "learning_rate": 0.00015009390913726223, + "loss": 0.0343, "step": 154840 }, { - "epoch": 1.67, - "learning_rate": 4.8766954377311955e-05, - "loss": 0.0276, + "epoch": 1.0, + "learning_rate": 0.0001500842277829053, + "loss": 0.0336, "step": 154850 }, { - "epoch": 1.67, - "learning_rate": 4.8750730092802904e-05, - "loss": 0.0272, + "epoch": 1.0, + "learning_rate": 0.0001500745464285484, + "loss": 0.0324, "step": 154860 }, { - "epoch": 1.68, - "learning_rate": 4.873450580829385e-05, - "loss": 0.0243, + "epoch": 1.0, + "learning_rate": 0.00015006486507419142, + "loss": 0.0381, "step": 154870 }, { - "epoch": 1.68, - "learning_rate": 4.87182815237848e-05, - "loss": 0.0276, + "epoch": 1.0, + "learning_rate": 0.0001500551837198345, + "loss": 0.0397, "step": 154880 }, { - "epoch": 1.68, - "learning_rate": 4.870205723927575e-05, - "loss": 0.0228, + "epoch": 1.0, + "learning_rate": 0.00015004550236547758, + "loss": 0.0435, "step": 154890 }, { - "epoch": 1.68, - "learning_rate": 4.868583295476669e-05, - "loss": 0.0287, + "epoch": 1.0, + "learning_rate": 0.00015003582101112063, + "loss": 0.0382, "step": 154900 }, { - "epoch": 1.68, - "learning_rate": 4.866960867025764e-05, - "loss": 0.0284, + "epoch": 1.0, + "learning_rate": 0.0001500261396567637, + "loss": 0.0305, "step": 154910 }, { - "epoch": 1.68, - "learning_rate": 4.865338438574858e-05, - "loss": 0.0238, + "epoch": 1.0, + "learning_rate": 0.0001500164583024068, + "loss": 0.0357, "step": 154920 }, { - "epoch": 1.68, - "learning_rate": 4.863716010123953e-05, - "loss": 0.023, + "epoch": 1.0, + "learning_rate": 0.00015000677694804987, + "loss": 0.0422, "step": 154930 }, { - "epoch": 1.68, - "learning_rate": 4.8620935816730475e-05, - "loss": 0.0239, + "epoch": 1.0, + "learning_rate": 0.00014999709559369292, + "loss": 0.0439, "step": 154940 }, { - "epoch": 1.68, - "learning_rate": 4.8604711532221425e-05, - "loss": 0.0264, + "epoch": 1.0, + "learning_rate": 0.00014998741423933597, + "loss": 0.0317, "step": 154950 }, { - "epoch": 1.68, - "learning_rate": 4.858848724771237e-05, - "loss": 0.0243, + "epoch": 1.0, + "learning_rate": 0.00014997773288497903, + "loss": 0.0317, "step": 154960 }, { - "epoch": 1.68, - "learning_rate": 4.857226296320332e-05, - "loss": 0.0233, + "epoch": 1.0, + "learning_rate": 0.0001499680515306221, + "loss": 0.0352, "step": 154970 }, { - "epoch": 1.68, - "learning_rate": 4.855603867869427e-05, - "loss": 0.0293, + "epoch": 1.0, + "learning_rate": 0.0001499583701762652, + "loss": 0.0339, "step": 154980 }, { - "epoch": 1.68, - "learning_rate": 4.853981439418521e-05, - "loss": 0.0293, + "epoch": 1.0, + "learning_rate": 0.00014994868882190824, + "loss": 0.0411, "step": 154990 }, { - "epoch": 1.68, - "learning_rate": 4.852359010967616e-05, - "loss": 0.028, + "epoch": 1.0, + "learning_rate": 0.00014993900746755132, + "loss": 0.0353, "step": 155000 }, { - "epoch": 1.68, - "eval_cer": 0.9210173852044647, - "eval_loss": 0.02208337001502514, - "eval_runtime": 119.0358, - "eval_samples_per_second": 16.802, - "eval_steps_per_second": 4.2, + "epoch": 1.0, + "eval_cer": 0.9199014800587504, + "eval_loss": 0.025568395853042603, + "eval_runtime": 120.4271, + "eval_samples_per_second": 16.608, + "eval_steps_per_second": 4.152, "step": 155000 }, { - "epoch": 1.68, - "learning_rate": 4.8507365825167103e-05, - "loss": 0.0234, + "epoch": 1.0, + "learning_rate": 0.0001499293261131944, + "loss": 0.0359, "step": 155010 }, { - "epoch": 1.68, - "learning_rate": 4.849114154065805e-05, - "loss": 0.0256, + "epoch": 1.0, + "learning_rate": 0.00014991964475883745, + "loss": 0.0331, "step": 155020 }, { - "epoch": 1.68, - "learning_rate": 4.8474917256148996e-05, - "loss": 0.0238, + "epoch": 1.0, + "learning_rate": 0.0001499099634044805, + "loss": 0.0358, "step": 155030 }, { - "epoch": 1.68, - "learning_rate": 4.8458692971639946e-05, - "loss": 0.0294, + "epoch": 1.0, + "learning_rate": 0.00014990028205012358, + "loss": 0.0383, "step": 155040 }, { - "epoch": 1.68, - "learning_rate": 4.844246868713089e-05, - "loss": 0.0248, + "epoch": 1.0, + "learning_rate": 0.00014989060069576666, + "loss": 0.0365, "step": 155050 }, { - "epoch": 1.68, - "learning_rate": 4.842624440262184e-05, - "loss": 0.0234, + "epoch": 1.0, + "learning_rate": 0.00014988091934140972, + "loss": 0.0406, "step": 155060 }, { - "epoch": 1.68, - "learning_rate": 4.841002011811279e-05, - "loss": 0.0241, + "epoch": 1.0, + "learning_rate": 0.0001498712379870528, + "loss": 0.0346, "step": 155070 }, { - "epoch": 1.68, - "learning_rate": 4.839379583360373e-05, - "loss": 0.0335, + "epoch": 1.0, + "learning_rate": 0.00014986155663269585, + "loss": 0.0334, "step": 155080 }, { - "epoch": 1.68, - "learning_rate": 4.837757154909468e-05, - "loss": 0.0291, + "epoch": 1.0, + "learning_rate": 0.00014985187527833893, + "loss": 0.0312, "step": 155090 }, { - "epoch": 1.68, - "learning_rate": 4.8361347264585624e-05, - "loss": 0.0275, + "epoch": 1.0, + "learning_rate": 0.00014984219392398198, + "loss": 0.032, "step": 155100 }, { - "epoch": 1.68, - "learning_rate": 4.8345122980076574e-05, - "loss": 0.0224, + "epoch": 1.0, + "learning_rate": 0.00014983251256962506, + "loss": 0.0362, "step": 155110 }, { - "epoch": 1.68, - "learning_rate": 4.832889869556752e-05, - "loss": 0.0247, + "epoch": 1.0, + "learning_rate": 0.00014982283121526814, + "loss": 0.0304, "step": 155120 }, { - "epoch": 1.68, - "learning_rate": 4.831267441105847e-05, - "loss": 0.0288, + "epoch": 1.0, + "learning_rate": 0.0001498131498609112, + "loss": 0.0371, "step": 155130 }, { - "epoch": 1.68, - "learning_rate": 4.829645012654941e-05, - "loss": 0.0265, + "epoch": 1.0, + "learning_rate": 0.00014980346850655427, + "loss": 0.0348, "step": 155140 }, { - "epoch": 1.68, - "learning_rate": 4.828022584204036e-05, - "loss": 0.0222, + "epoch": 1.0, + "learning_rate": 0.00014979378715219733, + "loss": 0.0327, "step": 155150 }, { - "epoch": 1.68, - "learning_rate": 4.826400155753131e-05, - "loss": 0.0247, + "epoch": 1.0, + "learning_rate": 0.00014978410579784038, + "loss": 0.0399, "step": 155160 }, { - "epoch": 1.68, - "learning_rate": 4.824777727302225e-05, - "loss": 0.0269, + "epoch": 1.0, + "learning_rate": 0.00014977442444348346, + "loss": 0.0378, "step": 155170 }, { - "epoch": 1.68, - "learning_rate": 4.82315529885132e-05, - "loss": 0.0314, + "epoch": 1.0, + "learning_rate": 0.00014976474308912654, + "loss": 0.0295, "step": 155180 }, { - "epoch": 1.68, - "learning_rate": 4.8215328704004145e-05, - "loss": 0.0228, + "epoch": 1.0, + "learning_rate": 0.00014975506173476962, + "loss": 0.0385, "step": 155190 }, { - "epoch": 1.68, - "learning_rate": 4.8199104419495095e-05, - "loss": 0.0213, + "epoch": 1.0, + "learning_rate": 0.00014974538038041267, + "loss": 0.0422, "step": 155200 }, { - "epoch": 1.68, - "learning_rate": 4.818288013498604e-05, - "loss": 0.0288, + "epoch": 1.0, + "learning_rate": 0.00014973569902605575, + "loss": 0.0397, "step": 155210 }, { - "epoch": 1.68, - "learning_rate": 4.816665585047699e-05, - "loss": 0.0324, + "epoch": 1.0, + "learning_rate": 0.0001497260176716988, + "loss": 0.0359, "step": 155220 }, { - "epoch": 1.68, - "learning_rate": 4.815043156596794e-05, - "loss": 0.0259, + "epoch": 1.0, + "learning_rate": 0.00014971633631734186, + "loss": 0.0306, "step": 155230 }, { - "epoch": 1.68, - "learning_rate": 4.813420728145888e-05, - "loss": 0.0271, + "epoch": 1.0, + "learning_rate": 0.00014970665496298494, + "loss": 0.0316, "step": 155240 }, { - "epoch": 1.68, - "learning_rate": 4.811798299694983e-05, - "loss": 0.0382, + "epoch": 1.0, + "learning_rate": 0.00014969697360862802, + "loss": 0.033, "step": 155250 }, { - "epoch": 1.68, - "learning_rate": 4.810175871244077e-05, - "loss": 0.0245, + "epoch": 1.0, + "learning_rate": 0.0001496872922542711, + "loss": 0.0382, "step": 155260 }, { - "epoch": 1.68, - "learning_rate": 4.808553442793172e-05, - "loss": 0.0247, + "epoch": 1.0, + "learning_rate": 0.00014967761089991415, + "loss": 0.037, "step": 155270 }, { - "epoch": 1.68, - "learning_rate": 4.8069310143422666e-05, - "loss": 0.0248, + "epoch": 1.0, + "learning_rate": 0.0001496679295455572, + "loss": 0.0362, "step": 155280 }, { - "epoch": 1.68, - "learning_rate": 4.8053085858913616e-05, - "loss": 0.029, + "epoch": 1.0, + "learning_rate": 0.00014965824819120028, + "loss": 0.0328, "step": 155290 }, { - "epoch": 1.68, - "learning_rate": 4.803686157440456e-05, - "loss": 0.0231, + "epoch": 1.0, + "learning_rate": 0.00014964856683684333, + "loss": 0.033, "step": 155300 }, { - "epoch": 1.68, - "learning_rate": 4.802063728989551e-05, - "loss": 0.0261, + "epoch": 1.0, + "learning_rate": 0.0001496388854824864, + "loss": 0.0299, "step": 155310 }, { - "epoch": 1.68, - "learning_rate": 4.800441300538646e-05, - "loss": 0.03, + "epoch": 1.0, + "learning_rate": 0.0001496292041281295, + "loss": 0.0343, "step": 155320 }, { - "epoch": 1.68, - "learning_rate": 4.79881887208774e-05, - "loss": 0.0261, + "epoch": 1.0, + "learning_rate": 0.00014961952277377257, + "loss": 0.0366, "step": 155330 }, { - "epoch": 1.68, - "learning_rate": 4.797196443636835e-05, - "loss": 0.0257, + "epoch": 1.0, + "learning_rate": 0.00014960984141941563, + "loss": 0.0294, "step": 155340 }, { - "epoch": 1.68, - "learning_rate": 4.7955740151859294e-05, - "loss": 0.0258, + "epoch": 1.0, + "learning_rate": 0.00014960016006505868, + "loss": 0.0366, "step": 155350 }, { - "epoch": 1.68, - "learning_rate": 4.7939515867350244e-05, - "loss": 0.026, + "epoch": 1.0, + "learning_rate": 0.00014959047871070176, + "loss": 0.0372, "step": 155360 }, { - "epoch": 1.68, - "learning_rate": 4.792329158284119e-05, - "loss": 0.0287, + "epoch": 1.0, + "learning_rate": 0.0001495807973563448, + "loss": 0.0404, "step": 155370 }, { - "epoch": 1.68, - "learning_rate": 4.7907067298332137e-05, - "loss": 0.0297, + "epoch": 1.0, + "learning_rate": 0.0001495711160019879, + "loss": 0.0347, "step": 155380 }, { - "epoch": 1.68, - "learning_rate": 4.789084301382308e-05, - "loss": 0.0232, + "epoch": 1.0, + "learning_rate": 0.00014956143464763097, + "loss": 0.03, "step": 155390 }, { - "epoch": 1.68, - "learning_rate": 4.787461872931403e-05, - "loss": 0.0328, + "epoch": 1.0, + "learning_rate": 0.00014955175329327402, + "loss": 0.0377, "step": 155400 }, { - "epoch": 1.68, - "learning_rate": 4.785839444480498e-05, - "loss": 0.0315, + "epoch": 1.0, + "learning_rate": 0.0001495420719389171, + "loss": 0.0361, "step": 155410 }, { - "epoch": 1.68, - "learning_rate": 4.784217016029592e-05, - "loss": 0.0248, + "epoch": 1.0, + "learning_rate": 0.00014953239058456016, + "loss": 0.0376, "step": 155420 }, { - "epoch": 1.68, - "learning_rate": 4.782594587578687e-05, - "loss": 0.0265, + "epoch": 1.0, + "learning_rate": 0.00014952270923020324, + "loss": 0.0357, "step": 155430 }, { - "epoch": 1.68, - "learning_rate": 4.7809721591277815e-05, - "loss": 0.0281, + "epoch": 1.0, + "learning_rate": 0.0001495130278758463, + "loss": 0.0308, "step": 155440 }, { - "epoch": 1.68, - "learning_rate": 4.7793497306768765e-05, - "loss": 0.025, + "epoch": 1.0, + "learning_rate": 0.00014950334652148937, + "loss": 0.0361, "step": 155450 }, { - "epoch": 1.68, - "learning_rate": 4.777727302225972e-05, - "loss": 0.0282, + "epoch": 1.0, + "learning_rate": 0.00014949366516713245, + "loss": 0.0324, "step": 155460 }, { - "epoch": 1.68, - "learning_rate": 4.7761048737750664e-05, - "loss": 0.0346, + "epoch": 1.0, + "learning_rate": 0.0001494839838127755, + "loss": 0.0311, "step": 155470 }, { - "epoch": 1.68, - "learning_rate": 4.7744824453241614e-05, - "loss": 0.0267, + "epoch": 1.0, + "learning_rate": 0.00014947430245841855, + "loss": 0.0321, "step": 155480 }, { - "epoch": 1.68, - "learning_rate": 4.772860016873256e-05, - "loss": 0.0223, + "epoch": 1.0, + "learning_rate": 0.00014946462110406163, + "loss": 0.0379, "step": 155490 }, { - "epoch": 1.68, - "learning_rate": 4.771237588422351e-05, - "loss": 0.026, + "epoch": 1.0, + "learning_rate": 0.0001494549397497047, + "loss": 0.0357, "step": 155500 }, { - "epoch": 1.68, - "learning_rate": 4.769615159971445e-05, - "loss": 0.0303, + "epoch": 1.0, + "learning_rate": 0.00014944525839534777, + "loss": 0.0372, "step": 155510 }, { - "epoch": 1.68, - "learning_rate": 4.76799273152054e-05, - "loss": 0.0246, + "epoch": 1.0, + "learning_rate": 0.00014943557704099084, + "loss": 0.0326, "step": 155520 }, { - "epoch": 1.68, - "learning_rate": 4.766370303069634e-05, - "loss": 0.027, + "epoch": 1.0, + "learning_rate": 0.00014942589568663392, + "loss": 0.0331, "step": 155530 }, { - "epoch": 1.68, - "learning_rate": 4.764747874618729e-05, - "loss": 0.0251, + "epoch": 1.0, + "learning_rate": 0.00014941621433227698, + "loss": 0.0372, "step": 155540 }, { - "epoch": 1.68, - "learning_rate": 4.763125446167824e-05, - "loss": 0.0275, + "epoch": 1.0, + "learning_rate": 0.00014940653297792003, + "loss": 0.0385, "step": 155550 }, { - "epoch": 1.68, - "learning_rate": 4.7615030177169185e-05, - "loss": 0.0241, + "epoch": 1.0, + "learning_rate": 0.0001493968516235631, + "loss": 0.0402, "step": 155560 }, { - "epoch": 1.68, - "learning_rate": 4.7598805892660135e-05, - "loss": 0.0281, + "epoch": 1.0, + "learning_rate": 0.0001493871702692062, + "loss": 0.0312, "step": 155570 }, { - "epoch": 1.68, - "learning_rate": 4.758258160815108e-05, - "loss": 0.0256, + "epoch": 1.0, + "learning_rate": 0.00014937748891484924, + "loss": 0.0371, "step": 155580 }, { - "epoch": 1.68, - "learning_rate": 4.756635732364203e-05, - "loss": 0.0268, + "epoch": 1.0, + "learning_rate": 0.00014936780756049232, + "loss": 0.0378, "step": 155590 }, { - "epoch": 1.68, - "learning_rate": 4.755013303913297e-05, - "loss": 0.0265, + "epoch": 1.0, + "learning_rate": 0.00014935812620613537, + "loss": 0.0329, "step": 155600 }, { - "epoch": 1.68, - "learning_rate": 4.753390875462392e-05, - "loss": 0.028, + "epoch": 1.0, + "learning_rate": 0.00014934844485177845, + "loss": 0.0319, "step": 155610 }, { - "epoch": 1.68, - "learning_rate": 4.751768447011487e-05, - "loss": 0.0296, + "epoch": 1.0, + "learning_rate": 0.0001493387634974215, + "loss": 0.0376, "step": 155620 }, { - "epoch": 1.68, - "learning_rate": 4.750146018560581e-05, - "loss": 0.0268, + "epoch": 1.0, + "learning_rate": 0.0001493290821430646, + "loss": 0.0347, "step": 155630 }, { - "epoch": 1.68, - "learning_rate": 4.748523590109676e-05, - "loss": 0.0306, + "epoch": 1.0, + "learning_rate": 0.00014931940078870767, + "loss": 0.0371, "step": 155640 }, { - "epoch": 1.68, - "learning_rate": 4.7469011616587706e-05, - "loss": 0.023, + "epoch": 1.0, + "learning_rate": 0.00014930971943435072, + "loss": 0.0413, "step": 155650 }, { - "epoch": 1.68, - "learning_rate": 4.7452787332078656e-05, - "loss": 0.0207, + "epoch": 1.0, + "learning_rate": 0.0001493000380799938, + "loss": 0.0333, "step": 155660 }, { - "epoch": 1.68, - "learning_rate": 4.74365630475696e-05, - "loss": 0.0281, + "epoch": 1.0, + "learning_rate": 0.00014929035672563685, + "loss": 0.0375, "step": 155670 }, { - "epoch": 1.68, - "learning_rate": 4.742033876306055e-05, - "loss": 0.0251, + "epoch": 1.0, + "learning_rate": 0.00014928067537127993, + "loss": 0.0377, "step": 155680 }, { - "epoch": 1.68, - "learning_rate": 4.740411447855149e-05, - "loss": 0.0271, + "epoch": 1.0, + "learning_rate": 0.00014927099401692298, + "loss": 0.0347, "step": 155690 }, { - "epoch": 1.68, - "learning_rate": 4.738789019404244e-05, - "loss": 0.0297, + "epoch": 1.0, + "learning_rate": 0.00014926131266256606, + "loss": 0.0315, "step": 155700 }, { - "epoch": 1.68, - "learning_rate": 4.737166590953339e-05, - "loss": 0.0254, + "epoch": 1.0, + "learning_rate": 0.00014925163130820914, + "loss": 0.0374, "step": 155710 }, { - "epoch": 1.68, - "learning_rate": 4.7355441625024334e-05, - "loss": 0.0279, + "epoch": 1.01, + "learning_rate": 0.0001492419499538522, + "loss": 0.0337, "step": 155720 }, { - "epoch": 1.68, - "learning_rate": 4.7339217340515284e-05, - "loss": 0.0215, + "epoch": 1.01, + "learning_rate": 0.00014923226859949528, + "loss": 0.0357, "step": 155730 }, { - "epoch": 1.68, - "learning_rate": 4.732299305600623e-05, - "loss": 0.0283, + "epoch": 1.01, + "learning_rate": 0.00014922258724513833, + "loss": 0.036, "step": 155740 }, { - "epoch": 1.68, - "learning_rate": 4.7306768771497176e-05, - "loss": 0.0255, + "epoch": 1.01, + "learning_rate": 0.0001492129058907814, + "loss": 0.042, "step": 155750 }, { - "epoch": 1.68, - "learning_rate": 4.729054448698812e-05, - "loss": 0.0246, + "epoch": 1.01, + "learning_rate": 0.00014920322453642446, + "loss": 0.0397, "step": 155760 }, { - "epoch": 1.68, - "learning_rate": 4.727432020247907e-05, - "loss": 0.0306, + "epoch": 1.01, + "learning_rate": 0.00014919354318206754, + "loss": 0.0328, "step": 155770 }, { - "epoch": 1.68, - "learning_rate": 4.725809591797001e-05, - "loss": 0.0327, + "epoch": 1.01, + "learning_rate": 0.00014918386182771062, + "loss": 0.0395, "step": 155780 }, { - "epoch": 1.69, - "learning_rate": 4.724187163346096e-05, - "loss": 0.0286, + "epoch": 1.01, + "learning_rate": 0.00014917418047335367, + "loss": 0.0388, "step": 155790 }, { - "epoch": 1.69, - "learning_rate": 4.722564734895191e-05, - "loss": 0.0283, + "epoch": 1.01, + "learning_rate": 0.00014916449911899673, + "loss": 0.0373, "step": 155800 }, { - "epoch": 1.69, - "learning_rate": 4.7209423064442855e-05, - "loss": 0.0231, + "epoch": 1.01, + "learning_rate": 0.0001491548177646398, + "loss": 0.0382, "step": 155810 }, { - "epoch": 1.69, - "learning_rate": 4.7193198779933805e-05, - "loss": 0.0273, + "epoch": 1.01, + "learning_rate": 0.00014914513641028289, + "loss": 0.0438, "step": 155820 }, { - "epoch": 1.69, - "learning_rate": 4.717697449542475e-05, - "loss": 0.0236, + "epoch": 1.01, + "learning_rate": 0.00014913545505592594, + "loss": 0.0337, "step": 155830 }, { - "epoch": 1.69, - "learning_rate": 4.71607502109157e-05, - "loss": 0.0232, + "epoch": 1.01, + "learning_rate": 0.00014912577370156902, + "loss": 0.0339, "step": 155840 }, { - "epoch": 1.69, - "learning_rate": 4.714452592640664e-05, - "loss": 0.0235, + "epoch": 1.01, + "learning_rate": 0.0001491160923472121, + "loss": 0.0367, "step": 155850 }, { - "epoch": 1.69, - "learning_rate": 4.712830164189759e-05, - "loss": 0.0259, + "epoch": 1.01, + "learning_rate": 0.00014910641099285515, + "loss": 0.0343, "step": 155860 }, { - "epoch": 1.69, - "learning_rate": 4.711207735738853e-05, - "loss": 0.0273, + "epoch": 1.01, + "learning_rate": 0.0001490967296384982, + "loss": 0.032, "step": 155870 }, { - "epoch": 1.69, - "learning_rate": 4.709585307287948e-05, - "loss": 0.0278, + "epoch": 1.01, + "learning_rate": 0.00014908704828414128, + "loss": 0.0319, "step": 155880 }, { - "epoch": 1.69, - "learning_rate": 4.707962878837043e-05, - "loss": 0.0263, - "step": 155890 + "epoch": 1.01, + "learning_rate": 0.00014907736692978436, + "loss": 0.0325, + "step": 155890 }, { - "epoch": 1.69, - "learning_rate": 4.7063404503861376e-05, - "loss": 0.0279, + "epoch": 1.01, + "learning_rate": 0.00014906768557542742, + "loss": 0.0347, "step": 155900 }, { - "epoch": 1.69, - "learning_rate": 4.7047180219352325e-05, - "loss": 0.0224, + "epoch": 1.01, + "learning_rate": 0.0001490580042210705, + "loss": 0.0386, "step": 155910 }, { - "epoch": 1.69, - "learning_rate": 4.703095593484327e-05, - "loss": 0.0342, + "epoch": 1.01, + "learning_rate": 0.00014904832286671355, + "loss": 0.0361, "step": 155920 }, { - "epoch": 1.69, - "learning_rate": 4.701473165033422e-05, - "loss": 0.0276, + "epoch": 1.01, + "learning_rate": 0.00014903864151235663, + "loss": 0.0312, "step": 155930 }, { - "epoch": 1.69, - "learning_rate": 4.699850736582516e-05, - "loss": 0.0259, + "epoch": 1.01, + "learning_rate": 0.00014902896015799968, + "loss": 0.0369, "step": 155940 }, { - "epoch": 1.69, - "learning_rate": 4.698228308131611e-05, - "loss": 0.0257, + "epoch": 1.01, + "learning_rate": 0.00014901927880364276, + "loss": 0.0361, "step": 155950 }, { - "epoch": 1.69, - "learning_rate": 4.696605879680706e-05, - "loss": 0.0236, + "epoch": 1.01, + "learning_rate": 0.00014900959744928584, + "loss": 0.035, "step": 155960 }, { - "epoch": 1.69, - "learning_rate": 4.6949834512298004e-05, - "loss": 0.0246, + "epoch": 1.01, + "learning_rate": 0.0001489999160949289, + "loss": 0.0373, "step": 155970 }, { - "epoch": 1.69, - "learning_rate": 4.6933610227788953e-05, - "loss": 0.0249, + "epoch": 1.01, + "learning_rate": 0.00014899023474057197, + "loss": 0.035, "step": 155980 }, { - "epoch": 1.69, - "learning_rate": 4.6917385943279896e-05, - "loss": 0.0267, + "epoch": 1.01, + "learning_rate": 0.00014898055338621503, + "loss": 0.0393, "step": 155990 }, { - "epoch": 1.69, - "learning_rate": 4.6901161658770846e-05, - "loss": 0.0247, + "epoch": 1.01, + "learning_rate": 0.00014897087203185808, + "loss": 0.036, "step": 156000 }, { - "epoch": 1.69, - "eval_cer": 0.9210942483403747, - "eval_loss": 0.02218388393521309, - "eval_runtime": 118.9596, - "eval_samples_per_second": 16.812, - "eval_steps_per_second": 4.203, + "epoch": 1.01, + "eval_cer": 0.9199502881030392, + "eval_loss": 0.02528407983481884, + "eval_runtime": 120.345, + "eval_samples_per_second": 16.619, + "eval_steps_per_second": 4.155, "step": 156000 }, { - "epoch": 1.69, - "learning_rate": 4.688493737426179e-05, - "loss": 0.0235, + "epoch": 1.01, + "learning_rate": 0.00014896119067750116, + "loss": 0.033, "step": 156010 }, { - "epoch": 1.69, - "learning_rate": 4.686871308975274e-05, - "loss": 0.0252, + "epoch": 1.01, + "learning_rate": 0.00014895150932314424, + "loss": 0.0362, "step": 156020 }, { - "epoch": 1.69, - "learning_rate": 4.685248880524368e-05, - "loss": 0.0252, + "epoch": 1.01, + "learning_rate": 0.00014894182796878732, + "loss": 0.0361, "step": 156030 }, { - "epoch": 1.69, - "learning_rate": 4.683626452073463e-05, - "loss": 0.024, + "epoch": 1.01, + "learning_rate": 0.00014893214661443037, + "loss": 0.0355, "step": 156040 }, { - "epoch": 1.69, - "learning_rate": 4.682004023622558e-05, - "loss": 0.0234, + "epoch": 1.01, + "learning_rate": 0.00014892246526007345, + "loss": 0.0323, "step": 156050 }, { - "epoch": 1.69, - "learning_rate": 4.6803815951716524e-05, - "loss": 0.0265, + "epoch": 1.01, + "learning_rate": 0.0001489127839057165, + "loss": 0.0364, "step": 156060 }, { - "epoch": 1.69, - "learning_rate": 4.6787591667207474e-05, - "loss": 0.0268, + "epoch": 1.01, + "learning_rate": 0.00014890310255135956, + "loss": 0.0345, "step": 156070 }, { - "epoch": 1.69, - "learning_rate": 4.677136738269842e-05, - "loss": 0.0241, + "epoch": 1.01, + "learning_rate": 0.00014889342119700264, + "loss": 0.0359, "step": 156080 }, { - "epoch": 1.69, - "learning_rate": 4.675514309818937e-05, - "loss": 0.0257, + "epoch": 1.01, + "learning_rate": 0.00014888373984264572, + "loss": 0.033, "step": 156090 }, { - "epoch": 1.69, - "learning_rate": 4.673891881368031e-05, - "loss": 0.0259, + "epoch": 1.01, + "learning_rate": 0.0001488740584882888, + "loss": 0.0332, "step": 156100 }, { - "epoch": 1.69, - "learning_rate": 4.672269452917126e-05, - "loss": 0.0278, + "epoch": 1.01, + "learning_rate": 0.00014886437713393185, + "loss": 0.035, "step": 156110 }, { - "epoch": 1.69, - "learning_rate": 4.67064702446622e-05, - "loss": 0.0227, + "epoch": 1.01, + "learning_rate": 0.0001488546957795749, + "loss": 0.0328, "step": 156120 }, { - "epoch": 1.69, - "learning_rate": 4.669024596015315e-05, - "loss": 0.0233, + "epoch": 1.01, + "learning_rate": 0.00014884501442521798, + "loss": 0.0366, "step": 156130 }, { - "epoch": 1.69, - "learning_rate": 4.66740216756441e-05, - "loss": 0.0237, + "epoch": 1.01, + "learning_rate": 0.00014883533307086103, + "loss": 0.0341, "step": 156140 }, { - "epoch": 1.69, - "learning_rate": 4.6657797391135045e-05, - "loss": 0.0296, + "epoch": 1.01, + "learning_rate": 0.0001488256517165041, + "loss": 0.0368, "step": 156150 }, { - "epoch": 1.69, - "learning_rate": 4.6641573106625995e-05, - "loss": 0.032, + "epoch": 1.01, + "learning_rate": 0.0001488159703621472, + "loss": 0.0365, "step": 156160 }, { - "epoch": 1.69, - "learning_rate": 4.662534882211694e-05, - "loss": 0.0234, + "epoch": 1.01, + "learning_rate": 0.00014880628900779025, + "loss": 0.0314, "step": 156170 }, { - "epoch": 1.69, - "learning_rate": 4.660912453760789e-05, - "loss": 0.0276, + "epoch": 1.01, + "learning_rate": 0.00014879660765343333, + "loss": 0.0368, "step": 156180 }, { - "epoch": 1.69, - "learning_rate": 4.659290025309883e-05, - "loss": 0.0261, + "epoch": 1.01, + "learning_rate": 0.00014878692629907638, + "loss": 0.0358, "step": 156190 }, { - "epoch": 1.69, - "learning_rate": 4.657667596858978e-05, - "loss": 0.023, + "epoch": 1.01, + "learning_rate": 0.00014877724494471946, + "loss": 0.0384, "step": 156200 }, { - "epoch": 1.69, - "learning_rate": 4.6560451684080724e-05, - "loss": 0.0252, + "epoch": 1.01, + "learning_rate": 0.0001487675635903625, + "loss": 0.0436, "step": 156210 }, { - "epoch": 1.69, - "learning_rate": 4.654422739957167e-05, - "loss": 0.029, + "epoch": 1.01, + "learning_rate": 0.0001487578822360056, + "loss": 0.0323, "step": 156220 }, { - "epoch": 1.69, - "learning_rate": 4.652800311506262e-05, - "loss": 0.0238, + "epoch": 1.01, + "learning_rate": 0.00014874820088164867, + "loss": 0.0325, "step": 156230 }, { - "epoch": 1.69, - "learning_rate": 4.6511778830553566e-05, - "loss": 0.0298, + "epoch": 1.01, + "learning_rate": 0.00014873851952729172, + "loss": 0.0322, "step": 156240 }, { - "epoch": 1.69, - "learning_rate": 4.6495554546044516e-05, - "loss": 0.0238, + "epoch": 1.01, + "learning_rate": 0.0001487288381729348, + "loss": 0.0321, "step": 156250 }, { - "epoch": 1.69, - "learning_rate": 4.647933026153546e-05, - "loss": 0.026, + "epoch": 1.01, + "learning_rate": 0.00014871915681857785, + "loss": 0.0336, "step": 156260 }, { - "epoch": 1.69, - "learning_rate": 4.646310597702641e-05, - "loss": 0.0281, + "epoch": 1.01, + "learning_rate": 0.00014870947546422093, + "loss": 0.0343, "step": 156270 }, { - "epoch": 1.69, - "learning_rate": 4.644688169251735e-05, - "loss": 0.0295, + "epoch": 1.01, + "learning_rate": 0.000148699794109864, + "loss": 0.0333, "step": 156280 }, { - "epoch": 1.69, - "learning_rate": 4.64306574080083e-05, - "loss": 0.0289, + "epoch": 1.01, + "learning_rate": 0.00014869011275550707, + "loss": 0.035, "step": 156290 }, { - "epoch": 1.69, - "learning_rate": 4.641443312349925e-05, - "loss": 0.0314, + "epoch": 1.01, + "learning_rate": 0.00014868043140115015, + "loss": 0.0302, "step": 156300 }, { - "epoch": 1.69, - "learning_rate": 4.6398208838990194e-05, - "loss": 0.0281, + "epoch": 1.01, + "learning_rate": 0.0001486707500467932, + "loss": 0.0346, "step": 156310 }, { - "epoch": 1.69, - "learning_rate": 4.6381984554481144e-05, - "loss": 0.0254, + "epoch": 1.01, + "learning_rate": 0.00014866106869243625, + "loss": 0.0356, "step": 156320 }, { - "epoch": 1.69, - "learning_rate": 4.636576026997209e-05, - "loss": 0.0289, + "epoch": 1.01, + "learning_rate": 0.00014865138733807933, + "loss": 0.035, "step": 156330 }, { - "epoch": 1.69, - "learning_rate": 4.634953598546304e-05, - "loss": 0.0314, + "epoch": 1.01, + "learning_rate": 0.0001486417059837224, + "loss": 0.0325, "step": 156340 }, { - "epoch": 1.69, - "learning_rate": 4.633331170095398e-05, - "loss": 0.0246, + "epoch": 1.01, + "learning_rate": 0.00014863202462936546, + "loss": 0.0368, "step": 156350 }, { - "epoch": 1.69, - "learning_rate": 4.631708741644493e-05, - "loss": 0.023, + "epoch": 1.01, + "learning_rate": 0.00014862234327500854, + "loss": 0.0388, "step": 156360 }, { - "epoch": 1.69, - "learning_rate": 4.630086313193587e-05, - "loss": 0.0227, + "epoch": 1.01, + "learning_rate": 0.0001486126619206516, + "loss": 0.0395, "step": 156370 }, { - "epoch": 1.69, - "learning_rate": 4.628463884742682e-05, - "loss": 0.0275, + "epoch": 1.01, + "learning_rate": 0.00014860298056629468, + "loss": 0.0352, "step": 156380 }, { - "epoch": 1.69, - "learning_rate": 4.626841456291777e-05, - "loss": 0.0233, + "epoch": 1.01, + "learning_rate": 0.00014859329921193773, + "loss": 0.0396, "step": 156390 }, { - "epoch": 1.69, - "learning_rate": 4.6252190278408715e-05, - "loss": 0.0227, + "epoch": 1.01, + "learning_rate": 0.0001485836178575808, + "loss": 0.0346, "step": 156400 }, { - "epoch": 1.69, - "learning_rate": 4.6235965993899665e-05, - "loss": 0.0273, + "epoch": 1.01, + "learning_rate": 0.0001485739365032239, + "loss": 0.0322, "step": 156410 }, { - "epoch": 1.69, - "learning_rate": 4.621974170939061e-05, - "loss": 0.0255, + "epoch": 1.01, + "learning_rate": 0.00014856425514886694, + "loss": 0.0353, "step": 156420 }, { - "epoch": 1.69, - "learning_rate": 4.620351742488156e-05, - "loss": 0.0209, + "epoch": 1.01, + "learning_rate": 0.00014855457379451002, + "loss": 0.0328, "step": 156430 }, { - "epoch": 1.69, - "learning_rate": 4.61872931403725e-05, - "loss": 0.0249, + "epoch": 1.01, + "learning_rate": 0.00014854489244015307, + "loss": 0.0312, "step": 156440 }, { - "epoch": 1.69, - "learning_rate": 4.617106885586345e-05, - "loss": 0.0233, + "epoch": 1.01, + "learning_rate": 0.00014853521108579615, + "loss": 0.0401, "step": 156450 }, { - "epoch": 1.69, - "learning_rate": 4.615484457135439e-05, - "loss": 0.0251, + "epoch": 1.01, + "learning_rate": 0.0001485255297314392, + "loss": 0.0396, "step": 156460 }, { - "epoch": 1.69, - "learning_rate": 4.613862028684534e-05, - "loss": 0.0258, + "epoch": 1.01, + "learning_rate": 0.0001485158483770823, + "loss": 0.0359, "step": 156470 }, { - "epoch": 1.69, - "learning_rate": 4.612239600233629e-05, - "loss": 0.025, + "epoch": 1.01, + "learning_rate": 0.00014850616702272537, + "loss": 0.0315, "step": 156480 }, { - "epoch": 1.69, - "learning_rate": 4.6106171717827236e-05, - "loss": 0.0206, + "epoch": 1.01, + "learning_rate": 0.00014849648566836842, + "loss": 0.036, "step": 156490 }, { - "epoch": 1.69, - "learning_rate": 4.6089947433318186e-05, - "loss": 0.0297, + "epoch": 1.01, + "learning_rate": 0.0001484868043140115, + "loss": 0.0372, "step": 156500 }, { - "epoch": 1.69, - "learning_rate": 4.607372314880913e-05, - "loss": 0.0257, + "epoch": 1.01, + "learning_rate": 0.00014847712295965455, + "loss": 0.0349, "step": 156510 }, { - "epoch": 1.69, - "learning_rate": 4.605749886430008e-05, - "loss": 0.0338, + "epoch": 1.01, + "learning_rate": 0.00014846744160529763, + "loss": 0.0319, "step": 156520 }, { - "epoch": 1.69, - "learning_rate": 4.604127457979102e-05, - "loss": 0.0224, + "epoch": 1.01, + "learning_rate": 0.00014845776025094068, + "loss": 0.0339, "step": 156530 }, { - "epoch": 1.69, - "learning_rate": 4.602505029528197e-05, - "loss": 0.0279, + "epoch": 1.01, + "learning_rate": 0.00014844807889658376, + "loss": 0.0304, "step": 156540 }, { - "epoch": 1.69, - "learning_rate": 4.6008826010772914e-05, - "loss": 0.03, + "epoch": 1.01, + "learning_rate": 0.00014843839754222684, + "loss": 0.0333, "step": 156550 }, { - "epoch": 1.69, - "learning_rate": 4.5992601726263864e-05, - "loss": 0.021, + "epoch": 1.01, + "learning_rate": 0.0001484287161878699, + "loss": 0.0395, "step": 156560 }, { - "epoch": 1.69, - "learning_rate": 4.5976377441754814e-05, - "loss": 0.0249, + "epoch": 1.01, + "learning_rate": 0.00014841903483351295, + "loss": 0.0306, "step": 156570 }, { - "epoch": 1.69, - "learning_rate": 4.596015315724576e-05, - "loss": 0.0319, + "epoch": 1.01, + "learning_rate": 0.00014840935347915603, + "loss": 0.0392, "step": 156580 }, { - "epoch": 1.69, - "learning_rate": 4.5943928872736706e-05, - "loss": 0.0211, + "epoch": 1.01, + "learning_rate": 0.0001483996721247991, + "loss": 0.0362, "step": 156590 }, { - "epoch": 1.69, - "learning_rate": 4.592770458822765e-05, - "loss": 0.0282, + "epoch": 1.01, + "learning_rate": 0.00014838999077044216, + "loss": 0.0354, "step": 156600 }, { - "epoch": 1.69, - "learning_rate": 4.59114803037186e-05, - "loss": 0.0264, + "epoch": 1.01, + "learning_rate": 0.00014838030941608524, + "loss": 0.0394, "step": 156610 }, { - "epoch": 1.69, - "learning_rate": 4.589525601920954e-05, - "loss": 0.0267, + "epoch": 1.01, + "learning_rate": 0.00014837062806172832, + "loss": 0.0384, "step": 156620 }, { - "epoch": 1.69, - "learning_rate": 4.587903173470049e-05, - "loss": 0.0263, + "epoch": 1.01, + "learning_rate": 0.00014836094670737137, + "loss": 0.0371, "step": 156630 }, { - "epoch": 1.69, - "learning_rate": 4.586280745019145e-05, - "loss": 0.0277, + "epoch": 1.01, + "learning_rate": 0.00014835126535301443, + "loss": 0.0361, "step": 156640 }, { - "epoch": 1.69, - "learning_rate": 4.584658316568239e-05, - "loss": 0.0334, + "epoch": 1.01, + "learning_rate": 0.0001483415839986575, + "loss": 0.038, "step": 156650 }, { - "epoch": 1.69, - "learning_rate": 4.583035888117334e-05, - "loss": 0.0247, + "epoch": 1.01, + "learning_rate": 0.00014833190264430056, + "loss": 0.0401, "step": 156660 }, { - "epoch": 1.69, - "learning_rate": 4.5814134596664284e-05, - "loss": 0.0266, + "epoch": 1.01, + "learning_rate": 0.00014832222128994364, + "loss": 0.0358, "step": 156670 }, { - "epoch": 1.69, - "learning_rate": 4.5797910312155234e-05, - "loss": 0.0298, + "epoch": 1.01, + "learning_rate": 0.00014831253993558672, + "loss": 0.0357, "step": 156680 }, { - "epoch": 1.69, - "learning_rate": 4.5781686027646184e-05, - "loss": 0.0315, + "epoch": 1.01, + "learning_rate": 0.00014830285858122977, + "loss": 0.0317, "step": 156690 }, { - "epoch": 1.69, - "learning_rate": 4.576546174313713e-05, - "loss": 0.0254, + "epoch": 1.01, + "learning_rate": 0.00014829317722687285, + "loss": 0.0383, "step": 156700 }, { - "epoch": 1.69, - "learning_rate": 4.5749237458628077e-05, - "loss": 0.0219, + "epoch": 1.01, + "learning_rate": 0.0001482834958725159, + "loss": 0.0296, "step": 156710 }, { - "epoch": 1.7, - "learning_rate": 4.573301317411902e-05, - "loss": 0.0262, + "epoch": 1.01, + "learning_rate": 0.00014827381451815898, + "loss": 0.0369, "step": 156720 }, { - "epoch": 1.7, - "learning_rate": 4.571678888960997e-05, - "loss": 0.0223, + "epoch": 1.01, + "learning_rate": 0.00014826413316380204, + "loss": 0.041, "step": 156730 }, { - "epoch": 1.7, - "learning_rate": 4.570056460510091e-05, - "loss": 0.0309, + "epoch": 1.01, + "learning_rate": 0.00014825445180944512, + "loss": 0.0367, "step": 156740 }, { - "epoch": 1.7, - "learning_rate": 4.568434032059186e-05, - "loss": 0.0242, + "epoch": 1.01, + "learning_rate": 0.0001482447704550882, + "loss": 0.0366, "step": 156750 }, { - "epoch": 1.7, - "learning_rate": 4.5668116036082805e-05, - "loss": 0.0242, + "epoch": 1.01, + "learning_rate": 0.00014823508910073125, + "loss": 0.0356, "step": 156760 }, { - "epoch": 1.7, - "learning_rate": 4.5651891751573755e-05, - "loss": 0.0275, + "epoch": 1.01, + "learning_rate": 0.0001482254077463743, + "loss": 0.0386, "step": 156770 }, { - "epoch": 1.7, - "learning_rate": 4.5635667467064705e-05, - "loss": 0.0309, + "epoch": 1.01, + "learning_rate": 0.00014821572639201738, + "loss": 0.0351, "step": 156780 }, { - "epoch": 1.7, - "learning_rate": 4.561944318255565e-05, - "loss": 0.0302, + "epoch": 1.01, + "learning_rate": 0.00014820604503766046, + "loss": 0.0379, "step": 156790 }, { - "epoch": 1.7, - "learning_rate": 4.56032188980466e-05, - "loss": 0.0284, + "epoch": 1.01, + "learning_rate": 0.0001481963636833035, + "loss": 0.0347, "step": 156800 }, { - "epoch": 1.7, - "learning_rate": 4.558699461353754e-05, - "loss": 0.0282, + "epoch": 1.01, + "learning_rate": 0.0001481866823289466, + "loss": 0.036, "step": 156810 }, { - "epoch": 1.7, - "learning_rate": 4.557077032902849e-05, - "loss": 0.0291, + "epoch": 1.01, + "learning_rate": 0.00014817700097458967, + "loss": 0.0326, "step": 156820 }, { - "epoch": 1.7, - "learning_rate": 4.555454604451943e-05, - "loss": 0.0271, + "epoch": 1.01, + "learning_rate": 0.00014816731962023273, + "loss": 0.0337, "step": 156830 }, { - "epoch": 1.7, - "learning_rate": 4.553832176001038e-05, - "loss": 0.0218, + "epoch": 1.01, + "learning_rate": 0.00014815763826587578, + "loss": 0.039, "step": 156840 }, { - "epoch": 1.7, - "learning_rate": 4.5522097475501326e-05, - "loss": 0.0231, + "epoch": 1.01, + "learning_rate": 0.00014814795691151886, + "loss": 0.0376, "step": 156850 }, { - "epoch": 1.7, - "learning_rate": 4.5505873190992276e-05, - "loss": 0.0297, + "epoch": 1.01, + "learning_rate": 0.00014813827555716194, + "loss": 0.0338, "step": 156860 }, { - "epoch": 1.7, - "learning_rate": 4.5489648906483225e-05, - "loss": 0.0313, + "epoch": 1.01, + "learning_rate": 0.000148128594202805, + "loss": 0.0343, "step": 156870 }, { - "epoch": 1.7, - "learning_rate": 4.547342462197417e-05, + "epoch": 1.01, + "learning_rate": 0.00014811891284844807, "loss": 0.0305, "step": 156880 }, { - "epoch": 1.7, - "learning_rate": 4.545720033746512e-05, - "loss": 0.0247, + "epoch": 1.01, + "learning_rate": 0.00014810923149409112, + "loss": 0.0355, "step": 156890 }, { - "epoch": 1.7, - "learning_rate": 4.544097605295606e-05, - "loss": 0.0266, + "epoch": 1.01, + "learning_rate": 0.0001480995501397342, + "loss": 0.0377, "step": 156900 }, { - "epoch": 1.7, - "learning_rate": 4.542475176844701e-05, - "loss": 0.0258, + "epoch": 1.01, + "learning_rate": 0.00014808986878537726, + "loss": 0.0286, "step": 156910 }, { - "epoch": 1.7, - "learning_rate": 4.5408527483937954e-05, - "loss": 0.0315, + "epoch": 1.01, + "learning_rate": 0.00014808018743102034, + "loss": 0.042, "step": 156920 }, { - "epoch": 1.7, - "learning_rate": 4.5392303199428904e-05, - "loss": 0.0351, + "epoch": 1.01, + "learning_rate": 0.00014807050607666341, + "loss": 0.0347, "step": 156930 }, { - "epoch": 1.7, - "learning_rate": 4.537607891491985e-05, - "loss": 0.0297, + "epoch": 1.01, + "learning_rate": 0.00014806082472230647, + "loss": 0.0358, "step": 156940 }, { - "epoch": 1.7, - "learning_rate": 4.5359854630410797e-05, - "loss": 0.0283, + "epoch": 1.01, + "learning_rate": 0.00014805114336794955, + "loss": 0.0417, "step": 156950 }, { - "epoch": 1.7, - "learning_rate": 4.5343630345901746e-05, - "loss": 0.0236, + "epoch": 1.01, + "learning_rate": 0.0001480414620135926, + "loss": 0.0336, "step": 156960 }, { - "epoch": 1.7, - "learning_rate": 4.532740606139269e-05, - "loss": 0.0254, + "epoch": 1.01, + "learning_rate": 0.00014803178065923568, + "loss": 0.0333, "step": 156970 }, { - "epoch": 1.7, - "learning_rate": 4.531118177688364e-05, - "loss": 0.0266, + "epoch": 1.01, + "learning_rate": 0.00014802209930487873, + "loss": 0.032, "step": 156980 }, { - "epoch": 1.7, - "learning_rate": 4.529495749237458e-05, - "loss": 0.0272, + "epoch": 1.01, + "learning_rate": 0.0001480124179505218, + "loss": 0.0318, "step": 156990 }, { - "epoch": 1.7, - "learning_rate": 4.527873320786553e-05, - "loss": 0.0295, + "epoch": 1.01, + "learning_rate": 0.0001480027365961649, + "loss": 0.0345, "step": 157000 }, { - "epoch": 1.7, - "eval_cer": 0.921128704228886, - "eval_loss": 0.021839609369635582, - "eval_runtime": 118.9554, - "eval_samples_per_second": 16.813, - "eval_steps_per_second": 4.203, + "epoch": 1.01, + "eval_cer": 0.9199014800587504, + "eval_loss": 0.025441249832510948, + "eval_runtime": 120.9546, + "eval_samples_per_second": 16.535, + "eval_steps_per_second": 4.134, "step": 157000 }, { - "epoch": 1.7, - "learning_rate": 4.5262508923356475e-05, - "loss": 0.0246, + "epoch": 1.01, + "learning_rate": 0.00014799305524180794, + "loss": 0.0367, "step": 157010 }, { - "epoch": 1.7, - "learning_rate": 4.5246284638847425e-05, - "loss": 0.0267, + "epoch": 1.01, + "learning_rate": 0.00014798337388745102, + "loss": 0.0335, "step": 157020 }, { - "epoch": 1.7, - "learning_rate": 4.5230060354338374e-05, - "loss": 0.0225, + "epoch": 1.01, + "learning_rate": 0.00014797369253309408, + "loss": 0.0405, "step": 157030 }, { - "epoch": 1.7, - "learning_rate": 4.521383606982932e-05, - "loss": 0.0286, + "epoch": 1.01, + "learning_rate": 0.00014796401117873716, + "loss": 0.0323, "step": 157040 }, { - "epoch": 1.7, - "learning_rate": 4.519761178532027e-05, - "loss": 0.0254, + "epoch": 1.01, + "learning_rate": 0.0001479543298243802, + "loss": 0.0383, "step": 157050 }, { - "epoch": 1.7, - "learning_rate": 4.518138750081121e-05, - "loss": 0.0291, + "epoch": 1.01, + "learning_rate": 0.0001479446484700233, + "loss": 0.0342, "step": 157060 }, { - "epoch": 1.7, - "learning_rate": 4.516516321630216e-05, - "loss": 0.0328, + "epoch": 1.01, + "learning_rate": 0.00014793496711566637, + "loss": 0.0357, "step": 157070 }, { - "epoch": 1.7, - "learning_rate": 4.51489389317931e-05, - "loss": 0.022, + "epoch": 1.01, + "learning_rate": 0.00014792528576130942, + "loss": 0.0357, "step": 157080 }, { - "epoch": 1.7, - "learning_rate": 4.513271464728405e-05, - "loss": 0.0293, + "epoch": 1.01, + "learning_rate": 0.00014791560440695247, + "loss": 0.0307, "step": 157090 }, { - "epoch": 1.7, - "learning_rate": 4.5116490362774996e-05, - "loss": 0.0322, + "epoch": 1.01, + "learning_rate": 0.00014790592305259555, + "loss": 0.0318, "step": 157100 }, { - "epoch": 1.7, - "learning_rate": 4.5100266078265945e-05, - "loss": 0.0266, + "epoch": 1.01, + "learning_rate": 0.00014789624169823863, + "loss": 0.031, "step": 157110 }, { - "epoch": 1.7, - "learning_rate": 4.5084041793756895e-05, - "loss": 0.026, + "epoch": 1.01, + "learning_rate": 0.0001478865603438817, + "loss": 0.0341, "step": 157120 }, { - "epoch": 1.7, - "learning_rate": 4.506781750924784e-05, - "loss": 0.0253, + "epoch": 1.01, + "learning_rate": 0.00014787687898952477, + "loss": 0.0392, "step": 157130 }, { - "epoch": 1.7, - "learning_rate": 4.505159322473879e-05, - "loss": 0.0281, + "epoch": 1.01, + "learning_rate": 0.00014786719763516785, + "loss": 0.0325, "step": 157140 }, { - "epoch": 1.7, - "learning_rate": 4.503536894022973e-05, - "loss": 0.0277, + "epoch": 1.01, + "learning_rate": 0.0001478575162808109, + "loss": 0.0384, "step": 157150 }, { - "epoch": 1.7, - "learning_rate": 4.501914465572068e-05, - "loss": 0.0249, - "step": 157160 + "epoch": 1.01, + "learning_rate": 0.00014784783492645395, + "loss": 0.0354, + "step": 157160 }, { - "epoch": 1.7, - "learning_rate": 4.5002920371211624e-05, - "loss": 0.0308, + "epoch": 1.01, + "learning_rate": 0.00014783815357209703, + "loss": 0.0405, "step": 157170 }, { - "epoch": 1.7, - "learning_rate": 4.4986696086702574e-05, - "loss": 0.0275, + "epoch": 1.01, + "learning_rate": 0.0001478284722177401, + "loss": 0.0436, "step": 157180 }, { - "epoch": 1.7, - "learning_rate": 4.4970471802193517e-05, - "loss": 0.0262, + "epoch": 1.01, + "learning_rate": 0.00014781879086338316, + "loss": 0.0335, "step": 157190 }, { - "epoch": 1.7, - "learning_rate": 4.4954247517684466e-05, - "loss": 0.0232, + "epoch": 1.01, + "learning_rate": 0.00014780910950902624, + "loss": 0.0316, "step": 157200 }, { - "epoch": 1.7, - "learning_rate": 4.4938023233175416e-05, - "loss": 0.028, + "epoch": 1.01, + "learning_rate": 0.0001477994281546693, + "loss": 0.037, "step": 157210 }, { - "epoch": 1.7, - "learning_rate": 4.492179894866636e-05, - "loss": 0.0307, + "epoch": 1.01, + "learning_rate": 0.00014778974680031238, + "loss": 0.0349, "step": 157220 }, { - "epoch": 1.7, - "learning_rate": 4.490557466415731e-05, - "loss": 0.028, + "epoch": 1.01, + "learning_rate": 0.00014778006544595543, + "loss": 0.0392, "step": 157230 }, { - "epoch": 1.7, - "learning_rate": 4.488935037964825e-05, - "loss": 0.0311, + "epoch": 1.01, + "learning_rate": 0.0001477703840915985, + "loss": 0.0352, "step": 157240 }, { - "epoch": 1.7, - "learning_rate": 4.48731260951392e-05, - "loss": 0.0252, + "epoch": 1.01, + "learning_rate": 0.0001477607027372416, + "loss": 0.0312, "step": 157250 }, { - "epoch": 1.7, - "learning_rate": 4.4856901810630145e-05, - "loss": 0.0246, + "epoch": 1.01, + "learning_rate": 0.00014775102138288464, + "loss": 0.0348, "step": 157260 }, { - "epoch": 1.7, - "learning_rate": 4.4840677526121094e-05, - "loss": 0.0276, + "epoch": 1.02, + "learning_rate": 0.00014774134002852772, + "loss": 0.0364, "step": 157270 }, { - "epoch": 1.7, - "learning_rate": 4.482445324161204e-05, - "loss": 0.0302, + "epoch": 1.02, + "learning_rate": 0.00014773165867417077, + "loss": 0.0375, "step": 157280 }, { - "epoch": 1.7, - "learning_rate": 4.480822895710299e-05, - "loss": 0.0271, + "epoch": 1.02, + "learning_rate": 0.00014772197731981383, + "loss": 0.0359, "step": 157290 }, { - "epoch": 1.7, - "learning_rate": 4.479200467259394e-05, - "loss": 0.0238, + "epoch": 1.02, + "learning_rate": 0.0001477122959654569, + "loss": 0.0311, "step": 157300 }, { - "epoch": 1.7, - "learning_rate": 4.477578038808488e-05, - "loss": 0.0295, + "epoch": 1.02, + "learning_rate": 0.00014770261461109999, + "loss": 0.0327, "step": 157310 }, { - "epoch": 1.7, - "learning_rate": 4.475955610357583e-05, - "loss": 0.0205, + "epoch": 1.02, + "learning_rate": 0.00014769293325674307, + "loss": 0.0332, "step": 157320 }, { - "epoch": 1.7, - "learning_rate": 4.474333181906677e-05, - "loss": 0.0302, + "epoch": 1.02, + "learning_rate": 0.00014768325190238612, + "loss": 0.0377, "step": 157330 }, { - "epoch": 1.7, - "learning_rate": 4.472710753455772e-05, - "loss": 0.0258, + "epoch": 1.02, + "learning_rate": 0.0001476735705480292, + "loss": 0.0333, "step": 157340 }, { - "epoch": 1.7, - "learning_rate": 4.4710883250048665e-05, - "loss": 0.0308, + "epoch": 1.02, + "learning_rate": 0.00014766388919367225, + "loss": 0.0331, "step": 157350 }, { - "epoch": 1.7, - "learning_rate": 4.4694658965539615e-05, - "loss": 0.0298, + "epoch": 1.02, + "learning_rate": 0.0001476542078393153, + "loss": 0.036, "step": 157360 }, { - "epoch": 1.7, - "learning_rate": 4.4678434681030565e-05, - "loss": 0.0254, + "epoch": 1.02, + "learning_rate": 0.00014764452648495838, + "loss": 0.0385, "step": 157370 }, { - "epoch": 1.7, - "learning_rate": 4.466221039652151e-05, - "loss": 0.0237, + "epoch": 1.02, + "learning_rate": 0.00014763484513060146, + "loss": 0.038, "step": 157380 }, { - "epoch": 1.7, - "learning_rate": 4.464598611201246e-05, - "loss": 0.0272, + "epoch": 1.02, + "learning_rate": 0.00014762516377624454, + "loss": 0.0374, "step": 157390 }, { - "epoch": 1.7, - "learning_rate": 4.46297618275034e-05, - "loss": 0.0219, + "epoch": 1.02, + "learning_rate": 0.0001476154824218876, + "loss": 0.0381, "step": 157400 }, { - "epoch": 1.7, - "learning_rate": 4.461353754299435e-05, - "loss": 0.0251, + "epoch": 1.02, + "learning_rate": 0.00014760580106753065, + "loss": 0.0536, "step": 157410 }, { - "epoch": 1.7, - "learning_rate": 4.4597313258485293e-05, - "loss": 0.0288, + "epoch": 1.02, + "learning_rate": 0.00014759611971317373, + "loss": 0.0396, "step": 157420 }, { - "epoch": 1.7, - "learning_rate": 4.458108897397624e-05, - "loss": 0.0295, + "epoch": 1.02, + "learning_rate": 0.00014758643835881678, + "loss": 0.0348, "step": 157430 }, { - "epoch": 1.7, - "learning_rate": 4.4564864689467186e-05, - "loss": 0.027, + "epoch": 1.02, + "learning_rate": 0.00014757675700445986, + "loss": 0.0341, "step": 157440 }, { - "epoch": 1.7, - "learning_rate": 4.4548640404958136e-05, - "loss": 0.0264, + "epoch": 1.02, + "learning_rate": 0.00014756707565010294, + "loss": 0.0369, "step": 157450 }, { - "epoch": 1.7, - "learning_rate": 4.4532416120449086e-05, - "loss": 0.0305, + "epoch": 1.02, + "learning_rate": 0.000147557394295746, + "loss": 0.0337, "step": 157460 }, { - "epoch": 1.7, - "learning_rate": 4.451619183594003e-05, - "loss": 0.0283, + "epoch": 1.02, + "learning_rate": 0.00014754771294138907, + "loss": 0.0334, "step": 157470 }, { - "epoch": 1.7, - "learning_rate": 4.449996755143098e-05, - "loss": 0.0229, + "epoch": 1.02, + "learning_rate": 0.00014753803158703213, + "loss": 0.0362, "step": 157480 }, { - "epoch": 1.7, - "learning_rate": 4.448374326692192e-05, - "loss": 0.0272, + "epoch": 1.02, + "learning_rate": 0.0001475283502326752, + "loss": 0.0397, "step": 157490 }, { - "epoch": 1.7, - "learning_rate": 4.446751898241287e-05, - "loss": 0.0308, + "epoch": 1.02, + "learning_rate": 0.00014751866887831826, + "loss": 0.0341, "step": 157500 }, { - "epoch": 1.7, - "learning_rate": 4.4451294697903814e-05, - "loss": 0.025, + "epoch": 1.02, + "learning_rate": 0.00014750898752396134, + "loss": 0.0409, "step": 157510 }, { - "epoch": 1.7, - "learning_rate": 4.4435070413394764e-05, - "loss": 0.0255, + "epoch": 1.02, + "learning_rate": 0.00014749930616960442, + "loss": 0.0348, "step": 157520 }, { - "epoch": 1.7, - "learning_rate": 4.441884612888571e-05, - "loss": 0.0269, + "epoch": 1.02, + "learning_rate": 0.00014748962481524747, + "loss": 0.0352, "step": 157530 }, { - "epoch": 1.7, - "learning_rate": 4.440262184437666e-05, - "loss": 0.021, + "epoch": 1.02, + "learning_rate": 0.00014747994346089055, + "loss": 0.0374, "step": 157540 }, { - "epoch": 1.7, - "learning_rate": 4.4386397559867607e-05, - "loss": 0.0248, + "epoch": 1.02, + "learning_rate": 0.0001474702621065336, + "loss": 0.0375, "step": 157550 }, { - "epoch": 1.7, - "learning_rate": 4.437017327535855e-05, - "loss": 0.0235, + "epoch": 1.02, + "learning_rate": 0.00014746058075217668, + "loss": 0.035, "step": 157560 }, { - "epoch": 1.7, - "learning_rate": 4.43539489908495e-05, - "loss": 0.0237, + "epoch": 1.02, + "learning_rate": 0.00014745089939781974, + "loss": 0.0407, "step": 157570 }, { - "epoch": 1.7, - "learning_rate": 4.433772470634044e-05, - "loss": 0.0247, + "epoch": 1.02, + "learning_rate": 0.00014744121804346282, + "loss": 0.0288, "step": 157580 }, { - "epoch": 1.7, - "learning_rate": 4.432150042183139e-05, - "loss": 0.032, + "epoch": 1.02, + "learning_rate": 0.0001474315366891059, + "loss": 0.034, "step": 157590 }, { - "epoch": 1.7, - "learning_rate": 4.4305276137322335e-05, - "loss": 0.0233, + "epoch": 1.02, + "learning_rate": 0.00014742185533474895, + "loss": 0.0344, "step": 157600 }, { - "epoch": 1.7, - "learning_rate": 4.4289051852813285e-05, - "loss": 0.0298, + "epoch": 1.02, + "learning_rate": 0.000147412173980392, + "loss": 0.0349, "step": 157610 }, { - "epoch": 1.7, - "learning_rate": 4.427282756830423e-05, - "loss": 0.0265, + "epoch": 1.02, + "learning_rate": 0.00014740249262603508, + "loss": 0.0337, "step": 157620 }, { - "epoch": 1.7, - "learning_rate": 4.425660328379518e-05, - "loss": 0.0255, + "epoch": 1.02, + "learning_rate": 0.00014739281127167816, + "loss": 0.0397, "step": 157630 }, { - "epoch": 1.71, - "learning_rate": 4.424037899928613e-05, - "loss": 0.0261, + "epoch": 1.02, + "learning_rate": 0.0001473831299173212, + "loss": 0.0383, "step": 157640 }, { - "epoch": 1.71, - "learning_rate": 4.422415471477707e-05, - "loss": 0.032, + "epoch": 1.02, + "learning_rate": 0.0001473734485629643, + "loss": 0.0478, "step": 157650 }, { - "epoch": 1.71, - "learning_rate": 4.420793043026802e-05, - "loss": 0.0282, + "epoch": 1.02, + "learning_rate": 0.00014736376720860735, + "loss": 0.0402, "step": 157660 }, { - "epoch": 1.71, - "learning_rate": 4.419170614575896e-05, - "loss": 0.033, + "epoch": 1.02, + "learning_rate": 0.00014735408585425043, + "loss": 0.0348, "step": 157670 }, { - "epoch": 1.71, - "learning_rate": 4.417548186124991e-05, - "loss": 0.0257, + "epoch": 1.02, + "learning_rate": 0.00014734440449989348, + "loss": 0.036, "step": 157680 }, { - "epoch": 1.71, - "learning_rate": 4.4159257576740856e-05, - "loss": 0.0292, + "epoch": 1.02, + "learning_rate": 0.00014733472314553656, + "loss": 0.0552, "step": 157690 }, { - "epoch": 1.71, - "learning_rate": 4.4143033292231806e-05, - "loss": 0.0284, + "epoch": 1.02, + "learning_rate": 0.00014732504179117964, + "loss": 0.0389, "step": 157700 }, { - "epoch": 1.71, - "learning_rate": 4.412680900772275e-05, - "loss": 0.0307, + "epoch": 1.02, + "learning_rate": 0.0001473153604368227, + "loss": 0.0348, "step": 157710 }, { - "epoch": 1.71, - "learning_rate": 4.41105847232137e-05, - "loss": 0.0286, + "epoch": 1.02, + "learning_rate": 0.00014730567908246577, + "loss": 0.0346, "step": 157720 }, { - "epoch": 1.71, - "learning_rate": 4.409436043870465e-05, - "loss": 0.0273, + "epoch": 1.02, + "learning_rate": 0.00014729599772810882, + "loss": 0.0395, "step": 157730 }, { - "epoch": 1.71, - "learning_rate": 4.407813615419559e-05, - "loss": 0.0324, + "epoch": 1.02, + "learning_rate": 0.0001472863163737519, + "loss": 0.0343, "step": 157740 }, { - "epoch": 1.71, - "learning_rate": 4.406191186968654e-05, - "loss": 0.0295, + "epoch": 1.02, + "learning_rate": 0.00014727663501939495, + "loss": 0.0356, "step": 157750 }, { - "epoch": 1.71, - "learning_rate": 4.4045687585177484e-05, - "loss": 0.0312, + "epoch": 1.02, + "learning_rate": 0.00014726695366503803, + "loss": 0.0357, "step": 157760 }, { - "epoch": 1.71, - "learning_rate": 4.4029463300668434e-05, - "loss": 0.0243, + "epoch": 1.02, + "learning_rate": 0.00014725727231068111, + "loss": 0.0362, "step": 157770 }, { - "epoch": 1.71, - "learning_rate": 4.401323901615938e-05, - "loss": 0.0259, + "epoch": 1.02, + "learning_rate": 0.00014724759095632417, + "loss": 0.0354, "step": 157780 }, { - "epoch": 1.71, - "learning_rate": 4.3997014731650327e-05, - "loss": 0.0251, + "epoch": 1.02, + "learning_rate": 0.00014723790960196725, + "loss": 0.0387, "step": 157790 }, { - "epoch": 1.71, - "learning_rate": 4.3980790447141276e-05, - "loss": 0.0225, + "epoch": 1.02, + "learning_rate": 0.0001472282282476103, + "loss": 0.0343, "step": 157800 }, { - "epoch": 1.71, - "learning_rate": 4.3964566162632226e-05, - "loss": 0.0259, + "epoch": 1.02, + "learning_rate": 0.00014721854689325338, + "loss": 0.0421, "step": 157810 }, { - "epoch": 1.71, - "learning_rate": 4.3948341878123176e-05, - "loss": 0.024, + "epoch": 1.02, + "learning_rate": 0.00014720886553889643, + "loss": 0.033, "step": 157820 }, { - "epoch": 1.71, - "learning_rate": 4.393211759361412e-05, - "loss": 0.0264, + "epoch": 1.02, + "learning_rate": 0.0001471991841845395, + "loss": 0.0351, "step": 157830 }, { - "epoch": 1.71, - "learning_rate": 4.391589330910507e-05, - "loss": 0.0228, + "epoch": 1.02, + "learning_rate": 0.0001471895028301826, + "loss": 0.0346, "step": 157840 }, { - "epoch": 1.71, - "learning_rate": 4.389966902459602e-05, - "loss": 0.029, + "epoch": 1.02, + "learning_rate": 0.00014717982147582564, + "loss": 0.0371, "step": 157850 }, { - "epoch": 1.71, - "learning_rate": 4.388344474008696e-05, - "loss": 0.0238, + "epoch": 1.02, + "learning_rate": 0.0001471701401214687, + "loss": 0.0404, "step": 157860 }, { - "epoch": 1.71, - "learning_rate": 4.386722045557791e-05, - "loss": 0.0279, + "epoch": 1.02, + "learning_rate": 0.00014716045876711178, + "loss": 0.0418, "step": 157870 }, { - "epoch": 1.71, - "learning_rate": 4.3850996171068854e-05, - "loss": 0.035, + "epoch": 1.02, + "learning_rate": 0.00014715077741275486, + "loss": 0.0329, "step": 157880 }, { - "epoch": 1.71, - "learning_rate": 4.3834771886559804e-05, - "loss": 0.0263, + "epoch": 1.02, + "learning_rate": 0.0001471410960583979, + "loss": 0.0296, "step": 157890 }, { - "epoch": 1.71, - "learning_rate": 4.381854760205075e-05, - "loss": 0.0326, + "epoch": 1.02, + "learning_rate": 0.000147131414704041, + "loss": 0.0375, "step": 157900 }, { - "epoch": 1.71, - "learning_rate": 4.38023233175417e-05, - "loss": 0.0254, + "epoch": 1.02, + "learning_rate": 0.00014712173334968407, + "loss": 0.0395, "step": 157910 }, { - "epoch": 1.71, - "learning_rate": 4.378609903303264e-05, - "loss": 0.0272, + "epoch": 1.02, + "learning_rate": 0.00014711205199532712, + "loss": 0.0379, "step": 157920 }, { - "epoch": 1.71, - "learning_rate": 4.376987474852359e-05, - "loss": 0.0287, + "epoch": 1.02, + "learning_rate": 0.00014710237064097017, + "loss": 0.0392, "step": 157930 }, { - "epoch": 1.71, - "learning_rate": 4.375365046401454e-05, - "loss": 0.0293, + "epoch": 1.02, + "learning_rate": 0.00014709268928661325, + "loss": 0.0361, "step": 157940 }, { - "epoch": 1.71, - "learning_rate": 4.373742617950548e-05, - "loss": 0.0248, + "epoch": 1.02, + "learning_rate": 0.00014708300793225633, + "loss": 0.0304, "step": 157950 }, { - "epoch": 1.71, - "learning_rate": 4.372120189499643e-05, - "loss": 0.0302, + "epoch": 1.02, + "learning_rate": 0.0001470733265778994, + "loss": 0.0374, "step": 157960 }, { - "epoch": 1.71, - "learning_rate": 4.3704977610487375e-05, - "loss": 0.0265, + "epoch": 1.02, + "learning_rate": 0.00014706364522354247, + "loss": 0.0299, "step": 157970 }, { - "epoch": 1.71, - "learning_rate": 4.3688753325978325e-05, - "loss": 0.0215, + "epoch": 1.02, + "learning_rate": 0.00014705396386918552, + "loss": 0.0366, "step": 157980 }, { - "epoch": 1.71, - "learning_rate": 4.367252904146927e-05, - "loss": 0.0222, + "epoch": 1.02, + "learning_rate": 0.0001470442825148286, + "loss": 0.0374, "step": 157990 }, { - "epoch": 1.71, - "learning_rate": 4.365630475696022e-05, - "loss": 0.0283, + "epoch": 1.02, + "learning_rate": 0.00014703460116047165, + "loss": 0.0321, "step": 158000 }, { - "epoch": 1.71, - "eval_cer": 0.9211039666679035, - "eval_loss": 0.021647585555911064, - "eval_runtime": 119.2059, - "eval_samples_per_second": 16.778, - "eval_steps_per_second": 4.194, + "epoch": 1.02, + "eval_cer": 0.9197731329793244, + "eval_loss": 0.024751625955104828, + "eval_runtime": 120.2028, + "eval_samples_per_second": 16.639, + "eval_steps_per_second": 4.16, "step": 158000 }, { - "epoch": 1.71, - "learning_rate": 4.364008047245116e-05, - "loss": 0.0277, + "epoch": 1.02, + "learning_rate": 0.00014702491980611473, + "loss": 0.0361, "step": 158010 }, { - "epoch": 1.71, - "learning_rate": 4.362385618794211e-05, - "loss": 0.0222, + "epoch": 1.02, + "learning_rate": 0.0001470152384517578, + "loss": 0.0356, "step": 158020 }, { - "epoch": 1.71, - "learning_rate": 4.360763190343306e-05, + "epoch": 1.02, + "learning_rate": 0.00014700555709740086, "loss": 0.0295, "step": 158030 }, { - "epoch": 1.71, - "learning_rate": 4.3591407618924e-05, - "loss": 0.0214, + "epoch": 1.02, + "learning_rate": 0.00014699587574304394, + "loss": 0.0346, "step": 158040 }, { - "epoch": 1.71, - "learning_rate": 4.357518333441495e-05, - "loss": 0.0301, + "epoch": 1.02, + "learning_rate": 0.000146986194388687, + "loss": 0.0434, "step": 158050 }, { - "epoch": 1.71, - "learning_rate": 4.3558959049905896e-05, - "loss": 0.029, + "epoch": 1.02, + "learning_rate": 0.00014697651303433005, + "loss": 0.0352, "step": 158060 }, { - "epoch": 1.71, - "learning_rate": 4.3542734765396846e-05, - "loss": 0.0262, + "epoch": 1.02, + "learning_rate": 0.00014696683167997313, + "loss": 0.0357, "step": 158070 }, { - "epoch": 1.71, - "learning_rate": 4.352651048088779e-05, - "loss": 0.0235, + "epoch": 1.02, + "learning_rate": 0.0001469571503256162, + "loss": 0.0381, "step": 158080 }, { - "epoch": 1.71, - "learning_rate": 4.351028619637874e-05, - "loss": 0.0256, + "epoch": 1.02, + "learning_rate": 0.0001469474689712593, + "loss": 0.034, "step": 158090 }, { - "epoch": 1.71, - "learning_rate": 4.349406191186969e-05, - "loss": 0.0268, + "epoch": 1.02, + "learning_rate": 0.00014693778761690234, + "loss": 0.0342, "step": 158100 }, { - "epoch": 1.71, - "learning_rate": 4.347783762736063e-05, - "loss": 0.0238, + "epoch": 1.02, + "learning_rate": 0.00014692810626254542, + "loss": 0.0356, "step": 158110 }, { - "epoch": 1.71, - "learning_rate": 4.346161334285158e-05, - "loss": 0.0234, + "epoch": 1.02, + "learning_rate": 0.00014691842490818847, + "loss": 0.0314, "step": 158120 }, { - "epoch": 1.71, - "learning_rate": 4.3445389058342524e-05, - "loss": 0.03, + "epoch": 1.02, + "learning_rate": 0.00014690874355383153, + "loss": 0.0339, "step": 158130 }, { - "epoch": 1.71, - "learning_rate": 4.3429164773833474e-05, - "loss": 0.0277, + "epoch": 1.02, + "learning_rate": 0.0001468990621994746, + "loss": 0.0346, "step": 158140 }, { - "epoch": 1.71, - "learning_rate": 4.341294048932442e-05, - "loss": 0.0244, + "epoch": 1.02, + "learning_rate": 0.00014688938084511769, + "loss": 0.0309, "step": 158150 }, { - "epoch": 1.71, - "learning_rate": 4.3396716204815366e-05, - "loss": 0.0239, + "epoch": 1.02, + "learning_rate": 0.00014687969949076077, + "loss": 0.0368, "step": 158160 }, { - "epoch": 1.71, - "learning_rate": 4.338049192030631e-05, - "loss": 0.0269, + "epoch": 1.02, + "learning_rate": 0.00014687001813640382, + "loss": 0.0425, "step": 158170 }, { - "epoch": 1.71, - "learning_rate": 4.336426763579726e-05, - "loss": 0.0253, + "epoch": 1.02, + "learning_rate": 0.00014686033678204687, + "loss": 0.0353, "step": 158180 }, { - "epoch": 1.71, - "learning_rate": 4.334804335128821e-05, - "loss": 0.0248, + "epoch": 1.02, + "learning_rate": 0.00014685065542768995, + "loss": 0.0363, "step": 158190 }, { - "epoch": 1.71, - "learning_rate": 4.333181906677915e-05, - "loss": 0.0246, + "epoch": 1.02, + "learning_rate": 0.000146840974073333, + "loss": 0.0373, "step": 158200 }, { - "epoch": 1.71, - "learning_rate": 4.33155947822701e-05, - "loss": 0.0211, + "epoch": 1.02, + "learning_rate": 0.00014683129271897608, + "loss": 0.0338, "step": 158210 }, { - "epoch": 1.71, - "learning_rate": 4.3299370497761045e-05, - "loss": 0.0281, + "epoch": 1.02, + "learning_rate": 0.00014682161136461916, + "loss": 0.0429, "step": 158220 }, { - "epoch": 1.71, - "learning_rate": 4.3283146213251995e-05, - "loss": 0.0282, + "epoch": 1.02, + "learning_rate": 0.00014681193001026224, + "loss": 0.037, "step": 158230 }, { - "epoch": 1.71, - "learning_rate": 4.326692192874294e-05, - "loss": 0.0272, + "epoch": 1.02, + "learning_rate": 0.0001468022486559053, + "loss": 0.0435, "step": 158240 }, { - "epoch": 1.71, - "learning_rate": 4.325069764423389e-05, - "loss": 0.026, + "epoch": 1.02, + "learning_rate": 0.00014679256730154835, + "loss": 0.0355, "step": 158250 }, { - "epoch": 1.71, - "learning_rate": 4.323447335972483e-05, - "loss": 0.0296, + "epoch": 1.02, + "learning_rate": 0.00014678288594719143, + "loss": 0.036, "step": 158260 }, { - "epoch": 1.71, - "learning_rate": 4.321824907521578e-05, - "loss": 0.0204, + "epoch": 1.02, + "learning_rate": 0.00014677320459283448, + "loss": 0.0391, "step": 158270 }, { - "epoch": 1.71, - "learning_rate": 4.320202479070673e-05, - "loss": 0.0268, + "epoch": 1.02, + "learning_rate": 0.00014676352323847756, + "loss": 0.0373, "step": 158280 }, { - "epoch": 1.71, - "learning_rate": 4.318580050619767e-05, - "loss": 0.028, + "epoch": 1.02, + "learning_rate": 0.00014675384188412064, + "loss": 0.0349, "step": 158290 }, { - "epoch": 1.71, - "learning_rate": 4.316957622168862e-05, - "loss": 0.0295, + "epoch": 1.02, + "learning_rate": 0.0001467441605297637, + "loss": 0.0356, "step": 158300 }, { - "epoch": 1.71, - "learning_rate": 4.3153351937179566e-05, - "loss": 0.0254, + "epoch": 1.02, + "learning_rate": 0.00014673447917540677, + "loss": 0.0343, "step": 158310 }, { - "epoch": 1.71, - "learning_rate": 4.3137127652670515e-05, - "loss": 0.0257, + "epoch": 1.02, + "learning_rate": 0.00014672479782104983, + "loss": 0.036, "step": 158320 }, { - "epoch": 1.71, - "learning_rate": 4.312090336816146e-05, - "loss": 0.025, + "epoch": 1.02, + "learning_rate": 0.0001467151164666929, + "loss": 0.0341, "step": 158330 }, { - "epoch": 1.71, - "learning_rate": 4.310467908365241e-05, - "loss": 0.033, + "epoch": 1.02, + "learning_rate": 0.00014670543511233596, + "loss": 0.0362, "step": 158340 }, { - "epoch": 1.71, - "learning_rate": 4.308845479914335e-05, - "loss": 0.0224, + "epoch": 1.02, + "learning_rate": 0.00014669575375797904, + "loss": 0.0381, "step": 158350 }, { - "epoch": 1.71, - "learning_rate": 4.30722305146343e-05, - "loss": 0.0264, + "epoch": 1.02, + "learning_rate": 0.00014668607240362212, + "loss": 0.0357, "step": 158360 }, { - "epoch": 1.71, - "learning_rate": 4.305600623012525e-05, - "loss": 0.0237, + "epoch": 1.02, + "learning_rate": 0.00014667639104926517, + "loss": 0.0327, "step": 158370 }, { - "epoch": 1.71, - "learning_rate": 4.3039781945616194e-05, - "loss": 0.026, + "epoch": 1.02, + "learning_rate": 0.00014666670969490822, + "loss": 0.0295, "step": 158380 }, { - "epoch": 1.71, - "learning_rate": 4.3023557661107143e-05, - "loss": 0.03, + "epoch": 1.02, + "learning_rate": 0.0001466570283405513, + "loss": 0.0291, "step": 158390 }, { - "epoch": 1.71, - "learning_rate": 4.3007333376598086e-05, - "loss": 0.0275, + "epoch": 1.02, + "learning_rate": 0.00014664734698619438, + "loss": 0.0299, "step": 158400 }, { - "epoch": 1.71, - "learning_rate": 4.2991109092089036e-05, - "loss": 0.0285, + "epoch": 1.02, + "learning_rate": 0.00014663766563183744, + "loss": 0.036, "step": 158410 }, { - "epoch": 1.71, - "learning_rate": 4.297488480757998e-05, - "loss": 0.033, + "epoch": 1.02, + "learning_rate": 0.00014662798427748051, + "loss": 0.0321, "step": 158420 }, { - "epoch": 1.71, - "learning_rate": 4.295866052307093e-05, - "loss": 0.0244, + "epoch": 1.02, + "learning_rate": 0.0001466183029231236, + "loss": 0.034, "step": 158430 }, { - "epoch": 1.71, - "learning_rate": 4.294243623856188e-05, - "loss": 0.0252, + "epoch": 1.02, + "learning_rate": 0.00014660862156876665, + "loss": 0.037, "step": 158440 }, { - "epoch": 1.71, - "learning_rate": 4.292621195405282e-05, - "loss": 0.0246, + "epoch": 1.02, + "learning_rate": 0.0001465989402144097, + "loss": 0.0341, "step": 158450 }, { - "epoch": 1.71, - "learning_rate": 4.290998766954377e-05, - "loss": 0.0286, + "epoch": 1.02, + "learning_rate": 0.00014658925886005278, + "loss": 0.0363, "step": 158460 }, { - "epoch": 1.71, - "learning_rate": 4.2893763385034714e-05, - "loss": 0.0334, + "epoch": 1.02, + "learning_rate": 0.00014657957750569586, + "loss": 0.0301, "step": 158470 }, { - "epoch": 1.71, - "learning_rate": 4.2877539100525664e-05, - "loss": 0.0217, + "epoch": 1.02, + "learning_rate": 0.0001465698961513389, + "loss": 0.0314, "step": 158480 }, { - "epoch": 1.71, - "learning_rate": 4.286131481601661e-05, - "loss": 0.024, + "epoch": 1.02, + "learning_rate": 0.000146560214796982, + "loss": 0.0385, "step": 158490 }, { - "epoch": 1.71, - "learning_rate": 4.284509053150756e-05, - "loss": 0.0224, + "epoch": 1.02, + "learning_rate": 0.00014655053344262504, + "loss": 0.0327, "step": 158500 }, { - "epoch": 1.71, - "learning_rate": 4.28288662469985e-05, - "loss": 0.0293, + "epoch": 1.02, + "learning_rate": 0.00014654085208826812, + "loss": 0.0315, "step": 158510 }, { - "epoch": 1.71, - "learning_rate": 4.281264196248945e-05, - "loss": 0.0291, + "epoch": 1.02, + "learning_rate": 0.00014653117073391118, + "loss": 0.0366, "step": 158520 }, { - "epoch": 1.71, - "learning_rate": 4.27964176779804e-05, - "loss": 0.0255, + "epoch": 1.02, + "learning_rate": 0.00014652148937955426, + "loss": 0.0393, "step": 158530 }, { - "epoch": 1.71, - "learning_rate": 4.278019339347134e-05, - "loss": 0.0216, + "epoch": 1.02, + "learning_rate": 0.00014651180802519734, + "loss": 0.0343, "step": 158540 }, { - "epoch": 1.71, - "learning_rate": 4.276396910896229e-05, - "loss": 0.0285, + "epoch": 1.02, + "learning_rate": 0.0001465021266708404, + "loss": 0.0405, "step": 158550 }, { - "epoch": 1.71, - "learning_rate": 4.2747744824453235e-05, - "loss": 0.0322, + "epoch": 1.02, + "learning_rate": 0.00014649244531648347, + "loss": 0.0339, "step": 158560 }, { - "epoch": 1.72, - "learning_rate": 4.2731520539944185e-05, - "loss": 0.0241, + "epoch": 1.02, + "learning_rate": 0.00014648276396212652, + "loss": 0.0384, "step": 158570 }, { - "epoch": 1.72, - "learning_rate": 4.271529625543513e-05, - "loss": 0.0234, + "epoch": 1.02, + "learning_rate": 0.0001464730826077696, + "loss": 0.0349, "step": 158580 }, { - "epoch": 1.72, - "learning_rate": 4.269907197092608e-05, - "loss": 0.0253, + "epoch": 1.02, + "learning_rate": 0.00014646340125341265, + "loss": 0.0347, "step": 158590 }, { - "epoch": 1.72, - "learning_rate": 4.268284768641702e-05, - "loss": 0.0283, + "epoch": 1.02, + "learning_rate": 0.00014645371989905573, + "loss": 0.031, "step": 158600 }, { - "epoch": 1.72, - "learning_rate": 4.266662340190797e-05, - "loss": 0.0242, + "epoch": 1.02, + "learning_rate": 0.00014644403854469881, + "loss": 0.0358, "step": 158610 }, { - "epoch": 1.72, - "learning_rate": 4.265039911739892e-05, - "loss": 0.0276, + "epoch": 1.02, + "learning_rate": 0.00014643435719034187, + "loss": 0.0345, "step": 158620 }, { - "epoch": 1.72, - "learning_rate": 4.263417483288986e-05, - "loss": 0.021, + "epoch": 1.02, + "learning_rate": 0.00014642467583598495, + "loss": 0.0372, "step": 158630 }, { - "epoch": 1.72, - "learning_rate": 4.261795054838081e-05, - "loss": 0.0262, + "epoch": 1.02, + "learning_rate": 0.000146414994481628, + "loss": 0.0318, "step": 158640 }, { - "epoch": 1.72, - "learning_rate": 4.2601726263871756e-05, - "loss": 0.0293, + "epoch": 1.02, + "learning_rate": 0.00014640531312727108, + "loss": 0.0342, "step": 158650 }, { - "epoch": 1.72, - "learning_rate": 4.2585501979362706e-05, - "loss": 0.025, + "epoch": 1.02, + "learning_rate": 0.00014639563177291413, + "loss": 0.0302, "step": 158660 }, { - "epoch": 1.72, - "learning_rate": 4.256927769485365e-05, - "loss": 0.0234, + "epoch": 1.02, + "learning_rate": 0.0001463859504185572, + "loss": 0.0361, "step": 158670 }, { - "epoch": 1.72, - "learning_rate": 4.25530534103446e-05, - "loss": 0.0215, + "epoch": 1.02, + "learning_rate": 0.0001463762690642003, + "loss": 0.0402, "step": 158680 }, { - "epoch": 1.72, - "learning_rate": 4.253682912583554e-05, - "loss": 0.0214, + "epoch": 1.02, + "learning_rate": 0.00014636658770984334, + "loss": 0.0353, "step": 158690 }, { - "epoch": 1.72, - "learning_rate": 4.252060484132649e-05, - "loss": 0.0254, + "epoch": 1.02, + "learning_rate": 0.0001463569063554864, + "loss": 0.036, "step": 158700 }, { - "epoch": 1.72, - "learning_rate": 4.250438055681744e-05, - "loss": 0.0237, + "epoch": 1.02, + "learning_rate": 0.00014634722500112948, + "loss": 0.0341, "step": 158710 }, { - "epoch": 1.72, - "learning_rate": 4.2488156272308384e-05, - "loss": 0.024, + "epoch": 1.02, + "learning_rate": 0.00014633754364677256, + "loss": 0.0326, "step": 158720 }, { - "epoch": 1.72, - "learning_rate": 4.2471931987799334e-05, - "loss": 0.0313, + "epoch": 1.02, + "learning_rate": 0.0001463278622924156, + "loss": 0.0314, "step": 158730 }, { - "epoch": 1.72, - "learning_rate": 4.245570770329028e-05, - "loss": 0.0256, + "epoch": 1.02, + "learning_rate": 0.0001463181809380587, + "loss": 0.0318, "step": 158740 }, { - "epoch": 1.72, - "learning_rate": 4.243948341878123e-05, - "loss": 0.0233, + "epoch": 1.02, + "learning_rate": 0.00014630849958370174, + "loss": 0.0323, "step": 158750 }, { - "epoch": 1.72, - "learning_rate": 4.242325913427217e-05, - "loss": 0.0257, + "epoch": 1.02, + "learning_rate": 0.00014629881822934482, + "loss": 0.0323, "step": 158760 }, { - "epoch": 1.72, - "learning_rate": 4.240703484976312e-05, - "loss": 0.025, + "epoch": 1.02, + "learning_rate": 0.00014628913687498787, + "loss": 0.0395, "step": 158770 }, { - "epoch": 1.72, - "learning_rate": 4.239081056525406e-05, - "loss": 0.0246, + "epoch": 1.02, + "learning_rate": 0.00014627945552063095, + "loss": 0.0349, "step": 158780 }, { - "epoch": 1.72, - "learning_rate": 4.237458628074501e-05, - "loss": 0.0327, + "epoch": 1.02, + "learning_rate": 0.00014626977416627403, + "loss": 0.0402, "step": 158790 }, { - "epoch": 1.72, - "learning_rate": 4.235836199623596e-05, - "loss": 0.0211, + "epoch": 1.02, + "learning_rate": 0.00014626009281191709, + "loss": 0.0395, "step": 158800 }, { - "epoch": 1.72, - "learning_rate": 4.2342137711726905e-05, - "loss": 0.0278, + "epoch": 1.02, + "learning_rate": 0.00014625041145756017, + "loss": 0.0315, "step": 158810 }, { - "epoch": 1.72, - "learning_rate": 4.2325913427217855e-05, - "loss": 0.0257, + "epoch": 1.03, + "learning_rate": 0.00014624073010320322, + "loss": 0.0346, "step": 158820 }, { - "epoch": 1.72, - "learning_rate": 4.23096891427088e-05, - "loss": 0.0206, + "epoch": 1.03, + "learning_rate": 0.0001462310487488463, + "loss": 0.0308, "step": 158830 }, { - "epoch": 1.72, - "learning_rate": 4.229346485819975e-05, - "loss": 0.0265, + "epoch": 1.03, + "learning_rate": 0.00014622136739448935, + "loss": 0.0347, "step": 158840 }, { - "epoch": 1.72, - "learning_rate": 4.227724057369069e-05, - "loss": 0.0259, + "epoch": 1.03, + "learning_rate": 0.00014621168604013243, + "loss": 0.0408, "step": 158850 }, { - "epoch": 1.72, - "learning_rate": 4.226101628918164e-05, - "loss": 0.0262, + "epoch": 1.03, + "learning_rate": 0.0001462020046857755, + "loss": 0.0373, "step": 158860 }, { - "epoch": 1.72, - "learning_rate": 4.224479200467259e-05, - "loss": 0.0235, + "epoch": 1.03, + "learning_rate": 0.00014619232333141856, + "loss": 0.0296, "step": 158870 }, { - "epoch": 1.72, - "learning_rate": 4.222856772016353e-05, - "loss": 0.0265, + "epoch": 1.03, + "learning_rate": 0.00014618264197706164, + "loss": 0.0361, "step": 158880 }, { - "epoch": 1.72, - "learning_rate": 4.221234343565448e-05, - "loss": 0.0266, + "epoch": 1.03, + "learning_rate": 0.0001461729606227047, + "loss": 0.0293, "step": 158890 }, { - "epoch": 1.72, - "learning_rate": 4.2196119151145426e-05, - "loss": 0.0222, + "epoch": 1.03, + "learning_rate": 0.00014616327926834775, + "loss": 0.0312, "step": 158900 }, { - "epoch": 1.72, - "learning_rate": 4.2179894866636376e-05, - "loss": 0.0324, + "epoch": 1.03, + "learning_rate": 0.00014615359791399083, + "loss": 0.032, "step": 158910 }, { - "epoch": 1.72, - "learning_rate": 4.216367058212732e-05, - "loss": 0.0229, + "epoch": 1.03, + "learning_rate": 0.0001461439165596339, + "loss": 0.0288, "step": 158920 }, { - "epoch": 1.72, - "learning_rate": 4.214744629761827e-05, - "loss": 0.0288, + "epoch": 1.03, + "learning_rate": 0.000146134235205277, + "loss": 0.0335, "step": 158930 }, { - "epoch": 1.72, - "learning_rate": 4.213122201310921e-05, - "loss": 0.0242, + "epoch": 1.03, + "learning_rate": 0.00014612455385092004, + "loss": 0.0346, "step": 158940 }, { - "epoch": 1.72, - "learning_rate": 4.211499772860016e-05, - "loss": 0.023, + "epoch": 1.03, + "learning_rate": 0.0001461148724965631, + "loss": 0.031, "step": 158950 }, { - "epoch": 1.72, - "learning_rate": 4.209877344409111e-05, - "loss": 0.0297, + "epoch": 1.03, + "learning_rate": 0.00014610519114220617, + "loss": 0.0355, "step": 158960 }, { - "epoch": 1.72, - "learning_rate": 4.2082549159582054e-05, - "loss": 0.0267, + "epoch": 1.03, + "learning_rate": 0.00014609550978784923, + "loss": 0.0364, "step": 158970 }, { - "epoch": 1.72, - "learning_rate": 4.206632487507301e-05, - "loss": 0.0289, + "epoch": 1.03, + "learning_rate": 0.0001460858284334923, + "loss": 0.0331, "step": 158980 }, { - "epoch": 1.72, - "learning_rate": 4.2050100590563953e-05, - "loss": 0.025, + "epoch": 1.03, + "learning_rate": 0.00014607614707913539, + "loss": 0.0347, "step": 158990 }, { - "epoch": 1.72, - "learning_rate": 4.20338763060549e-05, - "loss": 0.0245, + "epoch": 1.03, + "learning_rate": 0.00014606646572477847, + "loss": 0.0366, "step": 159000 }, { - "epoch": 1.72, - "eval_cer": 0.9210633263891466, - "eval_loss": 0.021797267720103264, - "eval_runtime": 119.1593, - "eval_samples_per_second": 16.784, - "eval_steps_per_second": 4.196, + "epoch": 1.03, + "eval_cer": 0.9199665574511354, + "eval_loss": 0.02524988353252411, + "eval_runtime": 120.5727, + "eval_samples_per_second": 16.587, + "eval_steps_per_second": 4.147, "step": 159000 }, { - "epoch": 1.72, - "learning_rate": 4.201765202154585e-05, - "loss": 0.026, + "epoch": 1.03, + "learning_rate": 0.00014605678437042152, + "loss": 0.0339, "step": 159010 }, { - "epoch": 1.72, - "learning_rate": 4.2001427737036796e-05, - "loss": 0.0323, + "epoch": 1.03, + "learning_rate": 0.00014604710301606457, + "loss": 0.0347, "step": 159020 }, { - "epoch": 1.72, - "learning_rate": 4.1985203452527746e-05, - "loss": 0.0303, + "epoch": 1.03, + "learning_rate": 0.00014603742166170765, + "loss": 0.0381, "step": 159030 }, { - "epoch": 1.72, - "learning_rate": 4.196897916801869e-05, - "loss": 0.0297, + "epoch": 1.03, + "learning_rate": 0.0001460277403073507, + "loss": 0.0335, "step": 159040 }, { - "epoch": 1.72, - "learning_rate": 4.195275488350964e-05, - "loss": 0.0276, + "epoch": 1.03, + "learning_rate": 0.00014601805895299378, + "loss": 0.0321, "step": 159050 }, { - "epoch": 1.72, - "learning_rate": 4.193653059900058e-05, - "loss": 0.0315, + "epoch": 1.03, + "learning_rate": 0.00014600837759863686, + "loss": 0.0295, "step": 159060 }, { - "epoch": 1.72, - "learning_rate": 4.192030631449153e-05, - "loss": 0.0304, + "epoch": 1.03, + "learning_rate": 0.00014599869624427992, + "loss": 0.0345, "step": 159070 }, { - "epoch": 1.72, - "learning_rate": 4.1904082029982474e-05, - "loss": 0.0274, + "epoch": 1.03, + "learning_rate": 0.000145989014889923, + "loss": 0.0364, "step": 159080 }, { - "epoch": 1.72, - "learning_rate": 4.1887857745473424e-05, - "loss": 0.0246, + "epoch": 1.03, + "learning_rate": 0.00014597933353556605, + "loss": 0.0325, "step": 159090 }, { - "epoch": 1.72, - "learning_rate": 4.1871633460964374e-05, - "loss": 0.0232, + "epoch": 1.03, + "learning_rate": 0.00014596965218120913, + "loss": 0.0388, "step": 159100 }, { - "epoch": 1.72, - "learning_rate": 4.185540917645532e-05, - "loss": 0.0256, + "epoch": 1.03, + "learning_rate": 0.00014595997082685218, + "loss": 0.0381, "step": 159110 }, { - "epoch": 1.72, - "learning_rate": 4.1839184891946267e-05, - "loss": 0.0246, + "epoch": 1.03, + "learning_rate": 0.00014595028947249526, + "loss": 0.0344, "step": 159120 }, { - "epoch": 1.72, - "learning_rate": 4.182296060743721e-05, - "loss": 0.0298, + "epoch": 1.03, + "learning_rate": 0.00014594060811813834, + "loss": 0.0367, "step": 159130 }, { - "epoch": 1.72, - "learning_rate": 4.180673632292816e-05, - "loss": 0.0234, + "epoch": 1.03, + "learning_rate": 0.0001459309267637814, + "loss": 0.037, "step": 159140 }, { - "epoch": 1.72, - "learning_rate": 4.17905120384191e-05, - "loss": 0.0259, + "epoch": 1.03, + "learning_rate": 0.00014592124540942445, + "loss": 0.0363, "step": 159150 }, { - "epoch": 1.72, - "learning_rate": 4.177428775391005e-05, - "loss": 0.0247, + "epoch": 1.03, + "learning_rate": 0.00014591156405506753, + "loss": 0.0301, "step": 159160 }, { - "epoch": 1.72, - "learning_rate": 4.1758063469401e-05, - "loss": 0.0352, + "epoch": 1.03, + "learning_rate": 0.0001459018827007106, + "loss": 0.0356, "step": 159170 }, { - "epoch": 1.72, - "learning_rate": 4.1741839184891945e-05, - "loss": 0.0262, + "epoch": 1.03, + "learning_rate": 0.00014589220134635366, + "loss": 0.034, "step": 159180 }, { - "epoch": 1.72, - "learning_rate": 4.1725614900382895e-05, - "loss": 0.0279, + "epoch": 1.03, + "learning_rate": 0.00014588251999199674, + "loss": 0.0345, "step": 159190 }, { - "epoch": 1.72, - "learning_rate": 4.170939061587384e-05, - "loss": 0.0301, + "epoch": 1.03, + "learning_rate": 0.00014587283863763982, + "loss": 0.0394, "step": 159200 }, { - "epoch": 1.72, - "learning_rate": 4.169316633136479e-05, - "loss": 0.0221, + "epoch": 1.03, + "learning_rate": 0.00014586315728328287, + "loss": 0.0334, "step": 159210 }, { - "epoch": 1.72, - "learning_rate": 4.167694204685573e-05, - "loss": 0.022, + "epoch": 1.03, + "learning_rate": 0.00014585347592892592, + "loss": 0.0372, "step": 159220 }, { - "epoch": 1.72, - "learning_rate": 4.166071776234668e-05, - "loss": 0.0294, + "epoch": 1.03, + "learning_rate": 0.000145843794574569, + "loss": 0.0323, "step": 159230 }, { - "epoch": 1.72, - "learning_rate": 4.164449347783762e-05, - "loss": 0.0209, + "epoch": 1.03, + "learning_rate": 0.00014583411322021208, + "loss": 0.0393, "step": 159240 }, { - "epoch": 1.72, - "learning_rate": 4.162826919332857e-05, - "loss": 0.0235, + "epoch": 1.03, + "learning_rate": 0.00014582443186585513, + "loss": 0.0356, "step": 159250 }, { - "epoch": 1.72, - "learning_rate": 4.161204490881952e-05, - "loss": 0.0376, + "epoch": 1.03, + "learning_rate": 0.00014581475051149821, + "loss": 0.0378, "step": 159260 }, { - "epoch": 1.72, - "learning_rate": 4.1595820624310466e-05, - "loss": 0.0283, + "epoch": 1.03, + "learning_rate": 0.00014580506915714127, + "loss": 0.0331, "step": 159270 }, { - "epoch": 1.72, - "learning_rate": 4.1579596339801415e-05, - "loss": 0.0289, + "epoch": 1.03, + "learning_rate": 0.00014579538780278435, + "loss": 0.036, "step": 159280 }, { - "epoch": 1.72, - "learning_rate": 4.156337205529236e-05, - "loss": 0.0244, + "epoch": 1.03, + "learning_rate": 0.0001457857064484274, + "loss": 0.0357, "step": 159290 }, { - "epoch": 1.72, - "learning_rate": 4.154714777078331e-05, - "loss": 0.0272, + "epoch": 1.03, + "learning_rate": 0.00014577602509407048, + "loss": 0.0329, "step": 159300 }, { - "epoch": 1.72, - "learning_rate": 4.153092348627425e-05, - "loss": 0.0251, + "epoch": 1.03, + "learning_rate": 0.00014576634373971356, + "loss": 0.0352, "step": 159310 }, { - "epoch": 1.72, - "learning_rate": 4.15146992017652e-05, - "loss": 0.0264, + "epoch": 1.03, + "learning_rate": 0.0001457566623853566, + "loss": 0.0405, "step": 159320 }, { - "epoch": 1.72, - "learning_rate": 4.1498474917256144e-05, - "loss": 0.0215, + "epoch": 1.03, + "learning_rate": 0.0001457469810309997, + "loss": 0.0313, "step": 159330 }, { - "epoch": 1.72, - "learning_rate": 4.1482250632747094e-05, - "loss": 0.0246, + "epoch": 1.03, + "learning_rate": 0.00014573729967664274, + "loss": 0.0378, "step": 159340 }, { - "epoch": 1.72, - "learning_rate": 4.1466026348238044e-05, - "loss": 0.0283, + "epoch": 1.03, + "learning_rate": 0.00014572761832228582, + "loss": 0.0355, "step": 159350 }, { - "epoch": 1.72, - "learning_rate": 4.1449802063728987e-05, - "loss": 0.0243, + "epoch": 1.03, + "learning_rate": 0.00014571793696792888, + "loss": 0.0334, "step": 159360 }, { - "epoch": 1.72, - "learning_rate": 4.1433577779219936e-05, - "loss": 0.0204, + "epoch": 1.03, + "learning_rate": 0.00014570825561357196, + "loss": 0.0325, "step": 159370 }, { - "epoch": 1.72, - "learning_rate": 4.141735349471088e-05, - "loss": 0.0224, + "epoch": 1.03, + "learning_rate": 0.00014569857425921504, + "loss": 0.0342, "step": 159380 }, { - "epoch": 1.72, - "learning_rate": 4.140112921020183e-05, - "loss": 0.0264, + "epoch": 1.03, + "learning_rate": 0.0001456888929048581, + "loss": 0.037, "step": 159390 }, { - "epoch": 1.72, - "learning_rate": 4.138490492569277e-05, - "loss": 0.0202, + "epoch": 1.03, + "learning_rate": 0.00014567921155050117, + "loss": 0.0397, "step": 159400 }, { - "epoch": 1.72, - "learning_rate": 4.136868064118372e-05, - "loss": 0.0259, + "epoch": 1.03, + "learning_rate": 0.00014566953019614422, + "loss": 0.0342, "step": 159410 }, { - "epoch": 1.72, - "learning_rate": 4.1352456356674665e-05, - "loss": 0.0239, + "epoch": 1.03, + "learning_rate": 0.0001456598488417873, + "loss": 0.0357, "step": 159420 }, { - "epoch": 1.72, - "learning_rate": 4.1336232072165615e-05, - "loss": 0.0285, + "epoch": 1.03, + "learning_rate": 0.00014565016748743035, + "loss": 0.0393, "step": 159430 }, { - "epoch": 1.72, - "learning_rate": 4.1320007787656564e-05, - "loss": 0.0291, + "epoch": 1.03, + "learning_rate": 0.00014564048613307343, + "loss": 0.0369, "step": 159440 }, { - "epoch": 1.72, - "learning_rate": 4.130378350314751e-05, - "loss": 0.0266, + "epoch": 1.03, + "learning_rate": 0.00014563080477871651, + "loss": 0.0304, "step": 159450 }, { - "epoch": 1.72, - "learning_rate": 4.128755921863846e-05, - "loss": 0.0242, + "epoch": 1.03, + "learning_rate": 0.00014562112342435957, + "loss": 0.0335, "step": 159460 }, { - "epoch": 1.72, - "learning_rate": 4.12713349341294e-05, - "loss": 0.0237, + "epoch": 1.03, + "learning_rate": 0.00014561144207000262, + "loss": 0.0335, "step": 159470 }, { - "epoch": 1.72, - "learning_rate": 4.125511064962035e-05, - "loss": 0.0223, + "epoch": 1.03, + "learning_rate": 0.0001456017607156457, + "loss": 0.0314, "step": 159480 }, { - "epoch": 1.73, - "learning_rate": 4.123888636511129e-05, - "loss": 0.0203, + "epoch": 1.03, + "learning_rate": 0.00014559207936128878, + "loss": 0.0323, "step": 159490 }, { - "epoch": 1.73, - "learning_rate": 4.122266208060224e-05, - "loss": 0.0255, + "epoch": 1.03, + "learning_rate": 0.00014558239800693183, + "loss": 0.0375, "step": 159500 }, { - "epoch": 1.73, - "learning_rate": 4.120643779609319e-05, - "loss": 0.0304, + "epoch": 1.03, + "learning_rate": 0.0001455727166525749, + "loss": 0.0348, "step": 159510 }, { - "epoch": 1.73, - "learning_rate": 4.1190213511584135e-05, - "loss": 0.0284, + "epoch": 1.03, + "learning_rate": 0.000145563035298218, + "loss": 0.0321, "step": 159520 }, { - "epoch": 1.73, - "learning_rate": 4.1173989227075085e-05, - "loss": 0.0243, + "epoch": 1.03, + "learning_rate": 0.00014555335394386104, + "loss": 0.0324, "step": 159530 }, { - "epoch": 1.73, - "learning_rate": 4.115776494256603e-05, - "loss": 0.0238, + "epoch": 1.03, + "learning_rate": 0.0001455436725895041, + "loss": 0.0322, "step": 159540 }, { - "epoch": 1.73, - "learning_rate": 4.114154065805698e-05, - "loss": 0.0298, + "epoch": 1.03, + "learning_rate": 0.00014553399123514718, + "loss": 0.035, "step": 159550 }, { - "epoch": 1.73, - "learning_rate": 4.112531637354792e-05, - "loss": 0.0275, + "epoch": 1.03, + "learning_rate": 0.00014552430988079026, + "loss": 0.0357, "step": 159560 }, { - "epoch": 1.73, - "learning_rate": 4.110909208903887e-05, - "loss": 0.0272, + "epoch": 1.03, + "learning_rate": 0.0001455146285264333, + "loss": 0.0331, "step": 159570 }, { - "epoch": 1.73, - "learning_rate": 4.1092867804529814e-05, - "loss": 0.0286, + "epoch": 1.03, + "learning_rate": 0.0001455049471720764, + "loss": 0.0306, "step": 159580 }, { - "epoch": 1.73, - "learning_rate": 4.1076643520020764e-05, - "loss": 0.0275, + "epoch": 1.03, + "learning_rate": 0.00014549526581771944, + "loss": 0.0381, "step": 159590 }, { - "epoch": 1.73, - "learning_rate": 4.106041923551171e-05, - "loss": 0.0304, + "epoch": 1.03, + "learning_rate": 0.00014548558446336252, + "loss": 0.0341, "step": 159600 }, { - "epoch": 1.73, - "learning_rate": 4.1044194951002656e-05, - "loss": 0.0244, + "epoch": 1.03, + "learning_rate": 0.00014547590310900557, + "loss": 0.0332, "step": 159610 }, { - "epoch": 1.73, - "learning_rate": 4.1027970666493606e-05, - "loss": 0.0231, + "epoch": 1.03, + "learning_rate": 0.00014546622175464865, + "loss": 0.0371, "step": 159620 }, { - "epoch": 1.73, - "learning_rate": 4.101174638198455e-05, - "loss": 0.0237, + "epoch": 1.03, + "learning_rate": 0.00014545654040029173, + "loss": 0.0332, "step": 159630 }, { - "epoch": 1.73, - "learning_rate": 4.09955220974755e-05, - "loss": 0.0287, + "epoch": 1.03, + "learning_rate": 0.00014544685904593479, + "loss": 0.0366, "step": 159640 }, { - "epoch": 1.73, - "learning_rate": 4.097929781296644e-05, - "loss": 0.0237, + "epoch": 1.03, + "learning_rate": 0.00014543717769157787, + "loss": 0.0324, "step": 159650 }, { - "epoch": 1.73, - "learning_rate": 4.096307352845739e-05, - "loss": 0.027, + "epoch": 1.03, + "learning_rate": 0.00014542749633722092, + "loss": 0.032, "step": 159660 }, { - "epoch": 1.73, - "learning_rate": 4.0946849243948335e-05, - "loss": 0.0301, + "epoch": 1.03, + "learning_rate": 0.00014541781498286397, + "loss": 0.0333, "step": 159670 }, { - "epoch": 1.73, - "learning_rate": 4.0930624959439284e-05, - "loss": 0.0241, + "epoch": 1.03, + "learning_rate": 0.00014540813362850705, + "loss": 0.0271, "step": 159680 }, { - "epoch": 1.73, - "learning_rate": 4.0914400674930234e-05, - "loss": 0.0237, + "epoch": 1.03, + "learning_rate": 0.00014539845227415013, + "loss": 0.0347, "step": 159690 }, { - "epoch": 1.73, - "learning_rate": 4.089817639042118e-05, - "loss": 0.0259, + "epoch": 1.03, + "learning_rate": 0.0001453887709197932, + "loss": 0.0344, "step": 159700 }, { - "epoch": 1.73, - "learning_rate": 4.088195210591213e-05, - "loss": 0.0184, - "step": 159710 + "epoch": 1.03, + "learning_rate": 0.00014537908956543626, + "loss": 0.0391, + "step": 159710 }, { - "epoch": 1.73, - "learning_rate": 4.086572782140307e-05, - "loss": 0.0288, + "epoch": 1.03, + "learning_rate": 0.00014536940821107934, + "loss": 0.0395, "step": 159720 }, { - "epoch": 1.73, - "learning_rate": 4.084950353689402e-05, - "loss": 0.0242, + "epoch": 1.03, + "learning_rate": 0.0001453597268567224, + "loss": 0.0417, "step": 159730 }, { - "epoch": 1.73, - "learning_rate": 4.083327925238496e-05, - "loss": 0.0208, + "epoch": 1.03, + "learning_rate": 0.00014535004550236545, + "loss": 0.0404, "step": 159740 }, { - "epoch": 1.73, - "learning_rate": 4.081705496787591e-05, - "loss": 0.0244, + "epoch": 1.03, + "learning_rate": 0.00014534036414800853, + "loss": 0.0372, "step": 159750 }, { - "epoch": 1.73, - "learning_rate": 4.0800830683366855e-05, - "loss": 0.0224, + "epoch": 1.03, + "learning_rate": 0.0001453306827936516, + "loss": 0.0339, "step": 159760 }, { - "epoch": 1.73, - "learning_rate": 4.0784606398857805e-05, - "loss": 0.0246, + "epoch": 1.03, + "learning_rate": 0.0001453210014392947, + "loss": 0.0315, "step": 159770 }, { - "epoch": 1.73, - "learning_rate": 4.0768382114348755e-05, - "loss": 0.0252, + "epoch": 1.03, + "learning_rate": 0.00014531132008493774, + "loss": 0.032, "step": 159780 }, { - "epoch": 1.73, - "learning_rate": 4.07521578298397e-05, - "loss": 0.0272, + "epoch": 1.03, + "learning_rate": 0.0001453016387305808, + "loss": 0.0365, "step": 159790 }, { - "epoch": 1.73, - "learning_rate": 4.073593354533065e-05, - "loss": 0.0316, + "epoch": 1.03, + "learning_rate": 0.00014529195737622387, + "loss": 0.0362, "step": 159800 }, { - "epoch": 1.73, - "learning_rate": 4.071970926082159e-05, - "loss": 0.0245, + "epoch": 1.03, + "learning_rate": 0.00014528227602186693, + "loss": 0.0282, "step": 159810 }, { - "epoch": 1.73, - "learning_rate": 4.070348497631254e-05, - "loss": 0.0253, + "epoch": 1.03, + "learning_rate": 0.00014527259466751, + "loss": 0.0361, "step": 159820 }, { - "epoch": 1.73, - "learning_rate": 4.0687260691803483e-05, - "loss": 0.0227, + "epoch": 1.03, + "learning_rate": 0.00014526291331315309, + "loss": 0.0395, "step": 159830 }, { - "epoch": 1.73, - "learning_rate": 4.067103640729443e-05, - "loss": 0.0229, + "epoch": 1.03, + "learning_rate": 0.00014525323195879614, + "loss": 0.0347, "step": 159840 }, { - "epoch": 1.73, - "learning_rate": 4.0654812122785376e-05, - "loss": 0.0258, + "epoch": 1.03, + "learning_rate": 0.00014524355060443922, + "loss": 0.031, "step": 159850 }, { - "epoch": 1.73, - "learning_rate": 4.0638587838276326e-05, - "loss": 0.0245, + "epoch": 1.03, + "learning_rate": 0.00014523386925008227, + "loss": 0.0333, "step": 159860 }, { - "epoch": 1.73, - "learning_rate": 4.0622363553767276e-05, - "loss": 0.0273, + "epoch": 1.03, + "learning_rate": 0.00014522418789572535, + "loss": 0.035, "step": 159870 }, { - "epoch": 1.73, - "learning_rate": 4.060613926925822e-05, - "loss": 0.0247, + "epoch": 1.03, + "learning_rate": 0.0001452145065413684, + "loss": 0.0326, "step": 159880 }, { - "epoch": 1.73, - "learning_rate": 4.058991498474917e-05, - "loss": 0.0242, + "epoch": 1.03, + "learning_rate": 0.00014520482518701148, + "loss": 0.0392, "step": 159890 }, { - "epoch": 1.73, - "learning_rate": 4.057369070024011e-05, - "loss": 0.0268, + "epoch": 1.03, + "learning_rate": 0.00014519514383265456, + "loss": 0.0313, "step": 159900 }, { - "epoch": 1.73, - "learning_rate": 4.055746641573106e-05, - "loss": 0.0301, + "epoch": 1.03, + "learning_rate": 0.00014518546247829761, + "loss": 0.0378, "step": 159910 }, { - "epoch": 1.73, - "learning_rate": 4.0541242131222004e-05, - "loss": 0.0339, + "epoch": 1.03, + "learning_rate": 0.0001451757811239407, + "loss": 0.032, "step": 159920 }, { - "epoch": 1.73, - "learning_rate": 4.0525017846712954e-05, - "loss": 0.027, + "epoch": 1.03, + "learning_rate": 0.00014516609976958375, + "loss": 0.0359, "step": 159930 }, { - "epoch": 1.73, - "learning_rate": 4.0508793562203904e-05, - "loss": 0.0286, + "epoch": 1.03, + "learning_rate": 0.00014515641841522683, + "loss": 0.0361, "step": 159940 }, { - "epoch": 1.73, - "learning_rate": 4.049256927769485e-05, - "loss": 0.0315, + "epoch": 1.03, + "learning_rate": 0.00014514673706086988, + "loss": 0.0343, "step": 159950 }, { - "epoch": 1.73, - "learning_rate": 4.0476344993185797e-05, - "loss": 0.0267, + "epoch": 1.03, + "learning_rate": 0.00014513705570651296, + "loss": 0.0442, "step": 159960 }, { - "epoch": 1.73, - "learning_rate": 4.046012070867674e-05, - "loss": 0.0264, + "epoch": 1.03, + "learning_rate": 0.00014512737435215604, + "loss": 0.0358, "step": 159970 }, { - "epoch": 1.73, - "learning_rate": 4.044389642416769e-05, - "loss": 0.0308, + "epoch": 1.03, + "learning_rate": 0.0001451176929977991, + "loss": 0.0376, "step": 159980 }, { - "epoch": 1.73, - "learning_rate": 4.042767213965863e-05, - "loss": 0.0266, + "epoch": 1.03, + "learning_rate": 0.00014510801164344214, + "loss": 0.0335, "step": 159990 }, { - "epoch": 1.73, - "learning_rate": 4.041144785514958e-05, - "loss": 0.0249, + "epoch": 1.03, + "learning_rate": 0.00014509833028908522, + "loss": 0.0298, "step": 160000 }, { - "epoch": 1.73, - "eval_cer": 0.921070394263713, - "eval_loss": 0.02162080444395542, - "eval_runtime": 118.9899, - "eval_samples_per_second": 16.808, - "eval_steps_per_second": 4.202, + "epoch": 1.03, + "eval_cer": 0.919810190938877, + "eval_loss": 0.025443054735660553, + "eval_runtime": 120.5621, + "eval_samples_per_second": 16.589, + "eval_steps_per_second": 4.147, "step": 160000 }, { - "epoch": 1.73, - "learning_rate": 4.0395223570640525e-05, - "loss": 0.0296, + "epoch": 1.03, + "learning_rate": 0.0001450886489347283, + "loss": 0.0344, "step": 160010 }, { - "epoch": 1.73, - "learning_rate": 4.0378999286131475e-05, - "loss": 0.025, + "epoch": 1.03, + "learning_rate": 0.00014507896758037136, + "loss": 0.0417, "step": 160020 }, { - "epoch": 1.73, - "learning_rate": 4.0362775001622425e-05, - "loss": 0.0259, + "epoch": 1.03, + "learning_rate": 0.00014506928622601444, + "loss": 0.0344, "step": 160030 }, { - "epoch": 1.73, - "learning_rate": 4.034655071711337e-05, - "loss": 0.026, + "epoch": 1.03, + "learning_rate": 0.00014505960487165752, + "loss": 0.0317, "step": 160040 }, { - "epoch": 1.73, - "learning_rate": 4.033032643260432e-05, - "loss": 0.0263, + "epoch": 1.03, + "learning_rate": 0.00014504992351730057, + "loss": 0.0311, "step": 160050 }, { - "epoch": 1.73, - "learning_rate": 4.031410214809526e-05, - "loss": 0.0283, + "epoch": 1.03, + "learning_rate": 0.00014504024216294362, + "loss": 0.0316, "step": 160060 }, { - "epoch": 1.73, - "learning_rate": 4.029787786358621e-05, - "loss": 0.0223, + "epoch": 1.03, + "learning_rate": 0.0001450305608085867, + "loss": 0.0382, "step": 160070 }, { - "epoch": 1.73, - "learning_rate": 4.028165357907715e-05, - "loss": 0.0247, + "epoch": 1.03, + "learning_rate": 0.00014502087945422978, + "loss": 0.0411, "step": 160080 }, { - "epoch": 1.73, - "learning_rate": 4.02654292945681e-05, - "loss": 0.0242, + "epoch": 1.03, + "learning_rate": 0.00014501119809987283, + "loss": 0.0304, "step": 160090 }, { - "epoch": 1.73, - "learning_rate": 4.0249205010059046e-05, - "loss": 0.0262, + "epoch": 1.03, + "learning_rate": 0.00014500151674551591, + "loss": 0.0428, "step": 160100 }, { - "epoch": 1.73, - "learning_rate": 4.0232980725549996e-05, - "loss": 0.0282, + "epoch": 1.03, + "learning_rate": 0.00014499183539115897, + "loss": 0.0383, "step": 160110 }, { - "epoch": 1.73, - "learning_rate": 4.0216756441040946e-05, - "loss": 0.0234, + "epoch": 1.03, + "learning_rate": 0.00014498215403680205, + "loss": 0.0345, "step": 160120 }, { - "epoch": 1.73, - "learning_rate": 4.020053215653189e-05, - "loss": 0.0258, + "epoch": 1.03, + "learning_rate": 0.0001449724726824451, + "loss": 0.0293, "step": 160130 }, { - "epoch": 1.73, - "learning_rate": 4.018430787202284e-05, - "loss": 0.0259, + "epoch": 1.03, + "learning_rate": 0.00014496279132808818, + "loss": 0.0343, "step": 160140 }, { - "epoch": 1.73, - "learning_rate": 4.016808358751378e-05, - "loss": 0.0277, + "epoch": 1.03, + "learning_rate": 0.00014495310997373126, + "loss": 0.0378, "step": 160150 }, { - "epoch": 1.73, - "learning_rate": 4.015185930300474e-05, - "loss": 0.027, + "epoch": 1.03, + "learning_rate": 0.0001449434286193743, + "loss": 0.0283, "step": 160160 }, { - "epoch": 1.73, - "learning_rate": 4.013563501849569e-05, - "loss": 0.0285, + "epoch": 1.03, + "learning_rate": 0.0001449337472650174, + "loss": 0.0307, "step": 160170 }, { - "epoch": 1.73, - "learning_rate": 4.011941073398663e-05, - "loss": 0.0245, + "epoch": 1.03, + "learning_rate": 0.00014492406591066044, + "loss": 0.0331, "step": 160180 }, { - "epoch": 1.73, - "learning_rate": 4.010318644947758e-05, - "loss": 0.0253, + "epoch": 1.03, + "learning_rate": 0.0001449143845563035, + "loss": 0.0333, "step": 160190 }, { - "epoch": 1.73, - "learning_rate": 4.008696216496852e-05, - "loss": 0.0247, + "epoch": 1.03, + "learning_rate": 0.00014490470320194658, + "loss": 0.0395, "step": 160200 }, { - "epoch": 1.73, - "learning_rate": 4.007073788045947e-05, - "loss": 0.0268, + "epoch": 1.03, + "learning_rate": 0.00014489502184758966, + "loss": 0.037, "step": 160210 }, { - "epoch": 1.73, - "learning_rate": 4.0054513595950416e-05, - "loss": 0.0226, + "epoch": 1.03, + "learning_rate": 0.00014488534049323274, + "loss": 0.0434, "step": 160220 }, { - "epoch": 1.73, - "learning_rate": 4.0038289311441366e-05, - "loss": 0.0286, + "epoch": 1.03, + "learning_rate": 0.0001448756591388758, + "loss": 0.0345, "step": 160230 }, { - "epoch": 1.73, - "learning_rate": 4.0022065026932316e-05, - "loss": 0.0232, + "epoch": 1.03, + "learning_rate": 0.00014486597778451887, + "loss": 0.0339, "step": 160240 }, { - "epoch": 1.73, - "learning_rate": 4.000584074242326e-05, - "loss": 0.0298, + "epoch": 1.03, + "learning_rate": 0.00014485629643016192, + "loss": 0.0328, "step": 160250 }, { - "epoch": 1.73, - "learning_rate": 3.998961645791421e-05, - "loss": 0.0277, + "epoch": 1.03, + "learning_rate": 0.00014484661507580497, + "loss": 0.0346, "step": 160260 }, { - "epoch": 1.73, - "learning_rate": 3.997339217340515e-05, - "loss": 0.0291, + "epoch": 1.03, + "learning_rate": 0.00014483693372144805, + "loss": 0.0313, "step": 160270 }, { - "epoch": 1.73, - "learning_rate": 3.99571678888961e-05, - "loss": 0.0258, + "epoch": 1.03, + "learning_rate": 0.00014482725236709113, + "loss": 0.0323, "step": 160280 }, { - "epoch": 1.73, - "learning_rate": 3.9940943604387044e-05, - "loss": 0.028, + "epoch": 1.03, + "learning_rate": 0.0001448175710127342, + "loss": 0.0375, "step": 160290 }, { - "epoch": 1.73, - "learning_rate": 3.9924719319877994e-05, - "loss": 0.0274, + "epoch": 1.03, + "learning_rate": 0.00014480788965837727, + "loss": 0.0313, "step": 160300 }, { - "epoch": 1.73, - "learning_rate": 3.990849503536894e-05, - "loss": 0.0261, + "epoch": 1.03, + "learning_rate": 0.00014479820830402032, + "loss": 0.0317, "step": 160310 }, { - "epoch": 1.73, - "learning_rate": 3.989227075085989e-05, - "loss": 0.0357, + "epoch": 1.03, + "learning_rate": 0.0001447885269496634, + "loss": 0.039, "step": 160320 }, { - "epoch": 1.73, - "learning_rate": 3.9876046466350836e-05, - "loss": 0.0214, + "epoch": 1.03, + "learning_rate": 0.00014477884559530645, + "loss": 0.0325, "step": 160330 }, { - "epoch": 1.73, - "learning_rate": 3.985982218184178e-05, - "loss": 0.0257, + "epoch": 1.03, + "learning_rate": 0.00014476916424094953, + "loss": 0.0372, "step": 160340 }, { - "epoch": 1.73, - "learning_rate": 3.984359789733273e-05, - "loss": 0.0239, + "epoch": 1.03, + "learning_rate": 0.0001447594828865926, + "loss": 0.0346, "step": 160350 }, { - "epoch": 1.73, - "learning_rate": 3.982737361282367e-05, - "loss": 0.0317, + "epoch": 1.03, + "learning_rate": 0.00014474980153223566, + "loss": 0.0328, "step": 160360 }, { - "epoch": 1.73, - "learning_rate": 3.981114932831462e-05, - "loss": 0.0253, + "epoch": 1.04, + "learning_rate": 0.00014474012017787874, + "loss": 0.0338, "step": 160370 }, { - "epoch": 1.73, - "learning_rate": 3.9794925043805565e-05, - "loss": 0.0245, + "epoch": 1.04, + "learning_rate": 0.0001447304388235218, + "loss": 0.0317, "step": 160380 }, { - "epoch": 1.73, - "learning_rate": 3.9778700759296515e-05, - "loss": 0.0289, + "epoch": 1.04, + "learning_rate": 0.00014472075746916488, + "loss": 0.0336, "step": 160390 }, { - "epoch": 1.73, - "learning_rate": 3.976247647478746e-05, - "loss": 0.0242, + "epoch": 1.04, + "learning_rate": 0.00014471107611480793, + "loss": 0.0315, "step": 160400 }, { - "epoch": 1.74, - "learning_rate": 3.974625219027841e-05, - "loss": 0.0234, + "epoch": 1.04, + "learning_rate": 0.000144701394760451, + "loss": 0.0377, "step": 160410 }, { - "epoch": 1.74, - "learning_rate": 3.973002790576936e-05, - "loss": 0.0244, + "epoch": 1.04, + "learning_rate": 0.0001446917134060941, + "loss": 0.0368, "step": 160420 }, { - "epoch": 1.74, - "learning_rate": 3.97138036212603e-05, - "loss": 0.0288, + "epoch": 1.04, + "learning_rate": 0.00014468203205173714, + "loss": 0.0324, "step": 160430 }, { - "epoch": 1.74, - "learning_rate": 3.969757933675125e-05, - "loss": 0.0244, + "epoch": 1.04, + "learning_rate": 0.00014467235069738022, + "loss": 0.0344, "step": 160440 }, { - "epoch": 1.74, - "learning_rate": 3.968135505224219e-05, - "loss": 0.0224, + "epoch": 1.04, + "learning_rate": 0.00014466266934302327, + "loss": 0.0316, "step": 160450 }, { - "epoch": 1.74, - "learning_rate": 3.966513076773314e-05, - "loss": 0.0237, + "epoch": 1.04, + "learning_rate": 0.00014465298798866635, + "loss": 0.0374, "step": 160460 }, { - "epoch": 1.74, - "learning_rate": 3.9648906483224086e-05, - "loss": 0.0238, + "epoch": 1.04, + "learning_rate": 0.0001446433066343094, + "loss": 0.0327, "step": 160470 }, { - "epoch": 1.74, - "learning_rate": 3.9632682198715036e-05, - "loss": 0.022, + "epoch": 1.04, + "learning_rate": 0.00014463362527995249, + "loss": 0.0414, "step": 160480 }, { - "epoch": 1.74, - "learning_rate": 3.961645791420598e-05, - "loss": 0.0273, + "epoch": 1.04, + "learning_rate": 0.00014462394392559557, + "loss": 0.0388, "step": 160490 }, { - "epoch": 1.74, - "learning_rate": 3.960023362969693e-05, - "loss": 0.0326, + "epoch": 1.04, + "learning_rate": 0.00014461426257123862, + "loss": 0.0398, "step": 160500 }, { - "epoch": 1.74, - "learning_rate": 3.958400934518788e-05, - "loss": 0.033, + "epoch": 1.04, + "learning_rate": 0.00014460458121688167, + "loss": 0.0383, "step": 160510 }, { - "epoch": 1.74, - "learning_rate": 3.956778506067882e-05, - "loss": 0.0241, + "epoch": 1.04, + "learning_rate": 0.00014459489986252475, + "loss": 0.0366, "step": 160520 }, { - "epoch": 1.74, - "learning_rate": 3.955156077616977e-05, - "loss": 0.025, + "epoch": 1.04, + "learning_rate": 0.00014458521850816783, + "loss": 0.0397, "step": 160530 }, { - "epoch": 1.74, - "learning_rate": 3.9535336491660714e-05, - "loss": 0.0252, + "epoch": 1.04, + "learning_rate": 0.00014457553715381088, + "loss": 0.0353, "step": 160540 }, { - "epoch": 1.74, - "learning_rate": 3.9519112207151664e-05, - "loss": 0.0284, + "epoch": 1.04, + "learning_rate": 0.00014456585579945396, + "loss": 0.0341, "step": 160550 }, { - "epoch": 1.74, - "learning_rate": 3.950288792264261e-05, - "loss": 0.029, + "epoch": 1.04, + "learning_rate": 0.00014455617444509702, + "loss": 0.0397, "step": 160560 }, { - "epoch": 1.74, - "learning_rate": 3.9486663638133556e-05, - "loss": 0.02, + "epoch": 1.04, + "learning_rate": 0.0001445464930907401, + "loss": 0.0377, "step": 160570 }, { - "epoch": 1.74, - "learning_rate": 3.9470439353624506e-05, - "loss": 0.028, + "epoch": 1.04, + "learning_rate": 0.00014453681173638315, + "loss": 0.035, "step": 160580 }, { - "epoch": 1.74, - "learning_rate": 3.945421506911545e-05, - "loss": 0.0289, + "epoch": 1.04, + "learning_rate": 0.00014452713038202623, + "loss": 0.0321, "step": 160590 }, { - "epoch": 1.74, - "learning_rate": 3.94379907846064e-05, - "loss": 0.0187, + "epoch": 1.04, + "learning_rate": 0.0001445174490276693, + "loss": 0.0322, "step": 160600 }, { - "epoch": 1.74, - "learning_rate": 3.942176650009734e-05, - "loss": 0.0264, + "epoch": 1.04, + "learning_rate": 0.00014450776767331236, + "loss": 0.0348, "step": 160610 }, { - "epoch": 1.74, - "learning_rate": 3.940554221558829e-05, - "loss": 0.0261, + "epoch": 1.04, + "learning_rate": 0.00014449808631895544, + "loss": 0.0304, "step": 160620 }, { - "epoch": 1.74, - "learning_rate": 3.9389317931079235e-05, - "loss": 0.0268, + "epoch": 1.04, + "learning_rate": 0.0001444884049645985, + "loss": 0.037, "step": 160630 }, { - "epoch": 1.74, - "learning_rate": 3.9373093646570185e-05, - "loss": 0.026, + "epoch": 1.04, + "learning_rate": 0.00014447872361024157, + "loss": 0.0389, "step": 160640 }, { - "epoch": 1.74, - "learning_rate": 3.935686936206113e-05, - "loss": 0.029, + "epoch": 1.04, + "learning_rate": 0.00014446904225588463, + "loss": 0.0355, "step": 160650 }, { - "epoch": 1.74, - "learning_rate": 3.934064507755208e-05, - "loss": 0.0212, + "epoch": 1.04, + "learning_rate": 0.0001444593609015277, + "loss": 0.0343, "step": 160660 }, { - "epoch": 1.74, - "learning_rate": 3.932442079304303e-05, - "loss": 0.0273, + "epoch": 1.04, + "learning_rate": 0.00014444967954717078, + "loss": 0.032, "step": 160670 }, { - "epoch": 1.74, - "learning_rate": 3.930819650853397e-05, - "loss": 0.0259, + "epoch": 1.04, + "learning_rate": 0.00014443999819281384, + "loss": 0.0322, "step": 160680 }, { - "epoch": 1.74, - "learning_rate": 3.929197222402492e-05, - "loss": 0.0231, + "epoch": 1.04, + "learning_rate": 0.00014443031683845692, + "loss": 0.0308, "step": 160690 }, { - "epoch": 1.74, - "learning_rate": 3.927574793951586e-05, - "loss": 0.0243, + "epoch": 1.04, + "learning_rate": 0.00014442063548409997, + "loss": 0.0357, "step": 160700 }, { - "epoch": 1.74, - "learning_rate": 3.925952365500681e-05, - "loss": 0.0245, + "epoch": 1.04, + "learning_rate": 0.00014441095412974305, + "loss": 0.0352, "step": 160710 }, { - "epoch": 1.74, - "learning_rate": 3.9243299370497756e-05, - "loss": 0.0234, + "epoch": 1.04, + "learning_rate": 0.0001444012727753861, + "loss": 0.035, "step": 160720 }, { - "epoch": 1.74, - "learning_rate": 3.9227075085988705e-05, - "loss": 0.0244, + "epoch": 1.04, + "learning_rate": 0.00014439159142102918, + "loss": 0.0333, "step": 160730 }, { - "epoch": 1.74, - "learning_rate": 3.921085080147965e-05, - "loss": 0.0202, + "epoch": 1.04, + "learning_rate": 0.00014438191006667226, + "loss": 0.04, "step": 160740 }, { - "epoch": 1.74, - "learning_rate": 3.91946265169706e-05, - "loss": 0.0296, + "epoch": 1.04, + "learning_rate": 0.00014437222871231531, + "loss": 0.035, "step": 160750 }, { - "epoch": 1.74, - "learning_rate": 3.917840223246155e-05, - "loss": 0.0267, + "epoch": 1.04, + "learning_rate": 0.00014436254735795837, + "loss": 0.0377, "step": 160760 }, { - "epoch": 1.74, - "learning_rate": 3.916217794795249e-05, - "loss": 0.0306, + "epoch": 1.04, + "learning_rate": 0.00014435286600360145, + "loss": 0.034, "step": 160770 }, { - "epoch": 1.74, - "learning_rate": 3.914595366344344e-05, - "loss": 0.027, + "epoch": 1.04, + "learning_rate": 0.00014434318464924453, + "loss": 0.0359, "step": 160780 }, { - "epoch": 1.74, - "learning_rate": 3.9129729378934384e-05, - "loss": 0.0219, + "epoch": 1.04, + "learning_rate": 0.00014433350329488758, + "loss": 0.0313, "step": 160790 }, { - "epoch": 1.74, - "learning_rate": 3.9113505094425333e-05, - "loss": 0.0292, + "epoch": 1.04, + "learning_rate": 0.00014432382194053066, + "loss": 0.0316, "step": 160800 }, { - "epoch": 1.74, - "learning_rate": 3.9097280809916276e-05, - "loss": 0.0255, + "epoch": 1.04, + "learning_rate": 0.00014431414058617374, + "loss": 0.0324, "step": 160810 }, { - "epoch": 1.74, - "learning_rate": 3.9081056525407226e-05, - "loss": 0.0243, + "epoch": 1.04, + "learning_rate": 0.0001443044592318168, + "loss": 0.0376, "step": 160820 }, { - "epoch": 1.74, - "learning_rate": 3.906483224089817e-05, - "loss": 0.0271, + "epoch": 1.04, + "learning_rate": 0.00014429477787745984, + "loss": 0.0303, "step": 160830 }, { - "epoch": 1.74, - "learning_rate": 3.904860795638912e-05, - "loss": 0.0235, + "epoch": 1.04, + "learning_rate": 0.00014428509652310292, + "loss": 0.0359, "step": 160840 }, { - "epoch": 1.74, - "learning_rate": 3.903238367188007e-05, - "loss": 0.0293, + "epoch": 1.04, + "learning_rate": 0.000144275415168746, + "loss": 0.0341, "step": 160850 }, { - "epoch": 1.74, - "learning_rate": 3.901615938737101e-05, - "loss": 0.031, + "epoch": 1.04, + "learning_rate": 0.00014426573381438906, + "loss": 0.0338, "step": 160860 }, { - "epoch": 1.74, - "learning_rate": 3.899993510286196e-05, - "loss": 0.0246, + "epoch": 1.04, + "learning_rate": 0.00014425605246003214, + "loss": 0.0329, "step": 160870 }, { - "epoch": 1.74, - "learning_rate": 3.8983710818352904e-05, - "loss": 0.023, + "epoch": 1.04, + "learning_rate": 0.0001442463711056752, + "loss": 0.0329, "step": 160880 }, { - "epoch": 1.74, - "learning_rate": 3.8967486533843854e-05, - "loss": 0.0306, + "epoch": 1.04, + "learning_rate": 0.00014423668975131827, + "loss": 0.0366, "step": 160890 }, { - "epoch": 1.74, - "learning_rate": 3.89512622493348e-05, - "loss": 0.0216, + "epoch": 1.04, + "learning_rate": 0.00014422700839696132, + "loss": 0.0303, "step": 160900 }, { - "epoch": 1.74, - "learning_rate": 3.893503796482575e-05, - "loss": 0.0298, + "epoch": 1.04, + "learning_rate": 0.0001442173270426044, + "loss": 0.0371, "step": 160910 }, { - "epoch": 1.74, - "learning_rate": 3.891881368031669e-05, - "loss": 0.0208, + "epoch": 1.04, + "learning_rate": 0.00014420764568824748, + "loss": 0.0332, "step": 160920 }, { - "epoch": 1.74, - "learning_rate": 3.890258939580764e-05, - "loss": 0.0296, + "epoch": 1.04, + "learning_rate": 0.00014419796433389053, + "loss": 0.0335, "step": 160930 }, { - "epoch": 1.74, - "learning_rate": 3.888636511129859e-05, - "loss": 0.0255, + "epoch": 1.04, + "learning_rate": 0.00014418828297953361, + "loss": 0.0317, "step": 160940 }, { - "epoch": 1.74, - "learning_rate": 3.887014082678953e-05, - "loss": 0.0218, + "epoch": 1.04, + "learning_rate": 0.00014417860162517667, + "loss": 0.0398, "step": 160950 }, { - "epoch": 1.74, - "learning_rate": 3.885391654228048e-05, - "loss": 0.026, + "epoch": 1.04, + "learning_rate": 0.00014416892027081972, + "loss": 0.0311, "step": 160960 }, { - "epoch": 1.74, - "learning_rate": 3.8837692257771425e-05, - "loss": 0.0236, + "epoch": 1.04, + "learning_rate": 0.0001441592389164628, + "loss": 0.035, "step": 160970 }, { - "epoch": 1.74, - "learning_rate": 3.8821467973262375e-05, - "loss": 0.0266, - "step": 160980 + "epoch": 1.04, + "learning_rate": 0.00014414955756210588, + "loss": 0.0365, + "step": 160980 }, { - "epoch": 1.74, - "learning_rate": 3.880524368875332e-05, - "loss": 0.0231, + "epoch": 1.04, + "learning_rate": 0.00014413987620774896, + "loss": 0.034, "step": 160990 }, { - "epoch": 1.74, - "learning_rate": 3.878901940424427e-05, - "loss": 0.0264, + "epoch": 1.04, + "learning_rate": 0.000144130194853392, + "loss": 0.0316, "step": 161000 }, { - "epoch": 1.74, - "eval_cer": 0.9210721612323546, - "eval_loss": 0.021502630785107613, - "eval_runtime": 118.9442, - "eval_samples_per_second": 16.815, - "eval_steps_per_second": 4.204, + "epoch": 1.04, + "eval_cer": 0.9198617105411818, + "eval_loss": 0.025041013956069946, + "eval_runtime": 120.0341, + "eval_samples_per_second": 16.662, + "eval_steps_per_second": 4.165, "step": 161000 }, { - "epoch": 1.74, - "learning_rate": 3.877279511973522e-05, - "loss": 0.0265, + "epoch": 1.04, + "learning_rate": 0.0001441205134990351, + "loss": 0.032, "step": 161010 }, { - "epoch": 1.74, - "learning_rate": 3.875657083522616e-05, - "loss": 0.0238, + "epoch": 1.04, + "learning_rate": 0.00014411083214467814, + "loss": 0.0337, "step": 161020 }, { - "epoch": 1.74, - "learning_rate": 3.874034655071711e-05, - "loss": 0.0211, + "epoch": 1.04, + "learning_rate": 0.0001441011507903212, + "loss": 0.037, "step": 161030 }, { - "epoch": 1.74, - "learning_rate": 3.872412226620805e-05, - "loss": 0.041, + "epoch": 1.04, + "learning_rate": 0.00014409146943596428, + "loss": 0.0404, "step": 161040 }, { - "epoch": 1.74, - "learning_rate": 3.8707897981699e-05, - "loss": 0.0308, + "epoch": 1.04, + "learning_rate": 0.00014408178808160736, + "loss": 0.0339, "step": 161050 }, { - "epoch": 1.74, - "learning_rate": 3.8691673697189946e-05, - "loss": 0.0248, + "epoch": 1.04, + "learning_rate": 0.00014407210672725044, + "loss": 0.0345, "step": 161060 }, { - "epoch": 1.74, - "learning_rate": 3.8675449412680896e-05, - "loss": 0.0255, + "epoch": 1.04, + "learning_rate": 0.0001440624253728935, + "loss": 0.0313, "step": 161070 }, { - "epoch": 1.74, - "learning_rate": 3.865922512817184e-05, - "loss": 0.0243, + "epoch": 1.04, + "learning_rate": 0.00014405274401853654, + "loss": 0.0331, "step": 161080 }, { - "epoch": 1.74, - "learning_rate": 3.864300084366279e-05, - "loss": 0.0278, + "epoch": 1.04, + "learning_rate": 0.00014404306266417962, + "loss": 0.0405, "step": 161090 }, { - "epoch": 1.74, - "learning_rate": 3.862677655915374e-05, - "loss": 0.0252, + "epoch": 1.04, + "learning_rate": 0.00014403338130982267, + "loss": 0.0336, "step": 161100 }, { - "epoch": 1.74, - "learning_rate": 3.861055227464468e-05, - "loss": 0.0254, + "epoch": 1.04, + "learning_rate": 0.00014402369995546575, + "loss": 0.0392, "step": 161110 }, { - "epoch": 1.74, - "learning_rate": 3.859432799013563e-05, - "loss": 0.029, + "epoch": 1.04, + "learning_rate": 0.00014401401860110883, + "loss": 0.0355, "step": 161120 }, { - "epoch": 1.74, - "learning_rate": 3.8578103705626574e-05, - "loss": 0.0261, + "epoch": 1.04, + "learning_rate": 0.0001440043372467519, + "loss": 0.0292, "step": 161130 }, { - "epoch": 1.74, - "learning_rate": 3.8561879421117524e-05, - "loss": 0.0292, + "epoch": 1.04, + "learning_rate": 0.00014399465589239497, + "loss": 0.0356, "step": 161140 }, { - "epoch": 1.74, - "learning_rate": 3.854565513660847e-05, - "loss": 0.0232, + "epoch": 1.04, + "learning_rate": 0.00014398497453803802, + "loss": 0.0335, "step": 161150 }, { - "epoch": 1.74, - "learning_rate": 3.852943085209942e-05, - "loss": 0.0221, + "epoch": 1.04, + "learning_rate": 0.0001439752931836811, + "loss": 0.0311, "step": 161160 }, { - "epoch": 1.74, - "learning_rate": 3.851320656759036e-05, - "loss": 0.0258, + "epoch": 1.04, + "learning_rate": 0.00014396561182932415, + "loss": 0.0333, "step": 161170 }, { - "epoch": 1.74, - "learning_rate": 3.849698228308131e-05, - "loss": 0.0239, + "epoch": 1.04, + "learning_rate": 0.00014395593047496723, + "loss": 0.0313, "step": 161180 }, { - "epoch": 1.74, - "learning_rate": 3.848075799857226e-05, - "loss": 0.0224, + "epoch": 1.04, + "learning_rate": 0.0001439462491206103, + "loss": 0.0322, "step": 161190 }, { - "epoch": 1.74, - "learning_rate": 3.84645337140632e-05, - "loss": 0.0261, + "epoch": 1.04, + "learning_rate": 0.00014393656776625336, + "loss": 0.0306, "step": 161200 }, { - "epoch": 1.74, - "learning_rate": 3.844830942955415e-05, - "loss": 0.0257, + "epoch": 1.04, + "learning_rate": 0.00014392688641189644, + "loss": 0.0392, "step": 161210 }, { - "epoch": 1.74, - "learning_rate": 3.8432085145045095e-05, - "loss": 0.0284, + "epoch": 1.04, + "learning_rate": 0.0001439172050575395, + "loss": 0.0408, "step": 161220 }, { - "epoch": 1.74, - "learning_rate": 3.8415860860536045e-05, - "loss": 0.0243, + "epoch": 1.04, + "learning_rate": 0.00014390752370318258, + "loss": 0.0371, "step": 161230 }, { - "epoch": 1.74, - "learning_rate": 3.839963657602699e-05, - "loss": 0.0228, + "epoch": 1.04, + "learning_rate": 0.00014389784234882563, + "loss": 0.0369, "step": 161240 }, { - "epoch": 1.74, - "learning_rate": 3.838341229151794e-05, - "loss": 0.029, + "epoch": 1.04, + "learning_rate": 0.0001438881609944687, + "loss": 0.032, "step": 161250 }, { - "epoch": 1.74, - "learning_rate": 3.836718800700888e-05, - "loss": 0.0272, + "epoch": 1.04, + "learning_rate": 0.0001438784796401118, + "loss": 0.0369, "step": 161260 }, { - "epoch": 1.74, - "learning_rate": 3.835096372249983e-05, - "loss": 0.0282, + "epoch": 1.04, + "learning_rate": 0.00014386879828575484, + "loss": 0.0318, "step": 161270 }, { - "epoch": 1.74, - "learning_rate": 3.833473943799078e-05, - "loss": 0.0224, + "epoch": 1.04, + "learning_rate": 0.0001438591169313979, + "loss": 0.0352, "step": 161280 }, { - "epoch": 1.74, - "learning_rate": 3.831851515348172e-05, - "loss": 0.0231, + "epoch": 1.04, + "learning_rate": 0.00014384943557704097, + "loss": 0.0365, "step": 161290 }, { - "epoch": 1.74, - "learning_rate": 3.830229086897267e-05, - "loss": 0.028, + "epoch": 1.04, + "learning_rate": 0.00014383975422268405, + "loss": 0.0364, "step": 161300 }, { - "epoch": 1.74, - "learning_rate": 3.8286066584463616e-05, - "loss": 0.0272, + "epoch": 1.04, + "learning_rate": 0.0001438300728683271, + "loss": 0.0351, "step": 161310 }, { - "epoch": 1.74, - "learning_rate": 3.8269842299954566e-05, - "loss": 0.0225, + "epoch": 1.04, + "learning_rate": 0.00014382039151397019, + "loss": 0.0339, "step": 161320 }, { - "epoch": 1.74, - "learning_rate": 3.825361801544552e-05, - "loss": 0.0227, + "epoch": 1.04, + "learning_rate": 0.00014381071015961326, + "loss": 0.0363, "step": 161330 }, { - "epoch": 1.75, - "learning_rate": 3.8237393730936465e-05, - "loss": 0.0284, + "epoch": 1.04, + "learning_rate": 0.00014380102880525632, + "loss": 0.0315, "step": 161340 }, { - "epoch": 1.75, - "learning_rate": 3.8221169446427415e-05, - "loss": 0.0248, + "epoch": 1.04, + "learning_rate": 0.00014379134745089937, + "loss": 0.0338, "step": 161350 }, { - "epoch": 1.75, - "learning_rate": 3.820494516191836e-05, - "loss": 0.0216, + "epoch": 1.04, + "learning_rate": 0.00014378166609654245, + "loss": 0.0319, "step": 161360 }, { - "epoch": 1.75, - "learning_rate": 3.818872087740931e-05, - "loss": 0.0238, + "epoch": 1.04, + "learning_rate": 0.00014377198474218553, + "loss": 0.0321, "step": 161370 }, { - "epoch": 1.75, - "learning_rate": 3.817249659290025e-05, - "loss": 0.0258, + "epoch": 1.04, + "learning_rate": 0.00014376230338782858, + "loss": 0.0412, "step": 161380 }, { - "epoch": 1.75, - "learning_rate": 3.81562723083912e-05, - "loss": 0.023, + "epoch": 1.04, + "learning_rate": 0.00014375262203347166, + "loss": 0.03, "step": 161390 }, { - "epoch": 1.75, - "learning_rate": 3.814004802388215e-05, - "loss": 0.0315, + "epoch": 1.04, + "learning_rate": 0.00014374294067911472, + "loss": 0.0345, "step": 161400 }, { - "epoch": 1.75, - "learning_rate": 3.812382373937309e-05, - "loss": 0.0303, + "epoch": 1.04, + "learning_rate": 0.0001437332593247578, + "loss": 0.0305, "step": 161410 }, { - "epoch": 1.75, - "learning_rate": 3.810759945486404e-05, - "loss": 0.0253, + "epoch": 1.04, + "learning_rate": 0.00014372357797040085, + "loss": 0.0329, "step": 161420 }, { - "epoch": 1.75, - "learning_rate": 3.8091375170354986e-05, - "loss": 0.0228, + "epoch": 1.04, + "learning_rate": 0.00014371389661604393, + "loss": 0.0335, "step": 161430 }, { - "epoch": 1.75, - "learning_rate": 3.8075150885845936e-05, - "loss": 0.0297, + "epoch": 1.04, + "learning_rate": 0.000143704215261687, + "loss": 0.0335, "step": 161440 }, { - "epoch": 1.75, - "learning_rate": 3.805892660133688e-05, - "loss": 0.0273, + "epoch": 1.04, + "learning_rate": 0.00014369453390733006, + "loss": 0.0368, "step": 161450 }, { - "epoch": 1.75, - "learning_rate": 3.804270231682783e-05, - "loss": 0.0246, + "epoch": 1.04, + "learning_rate": 0.00014368485255297314, + "loss": 0.039, "step": 161460 }, { - "epoch": 1.75, - "learning_rate": 3.802647803231877e-05, - "loss": 0.0244, + "epoch": 1.04, + "learning_rate": 0.0001436751711986162, + "loss": 0.0306, "step": 161470 }, { - "epoch": 1.75, - "learning_rate": 3.801025374780972e-05, - "loss": 0.0258, + "epoch": 1.04, + "learning_rate": 0.00014366548984425927, + "loss": 0.0313, "step": 161480 }, { - "epoch": 1.75, - "learning_rate": 3.799402946330067e-05, - "loss": 0.0268, + "epoch": 1.04, + "learning_rate": 0.00014365580848990232, + "loss": 0.0342, "step": 161490 }, { - "epoch": 1.75, - "learning_rate": 3.7977805178791614e-05, - "loss": 0.0253, + "epoch": 1.04, + "learning_rate": 0.0001436461271355454, + "loss": 0.039, "step": 161500 }, { - "epoch": 1.75, - "learning_rate": 3.7961580894282564e-05, - "loss": 0.0305, + "epoch": 1.04, + "learning_rate": 0.00014363644578118848, + "loss": 0.0386, "step": 161510 }, { - "epoch": 1.75, - "learning_rate": 3.794535660977351e-05, - "loss": 0.0251, + "epoch": 1.04, + "learning_rate": 0.00014362676442683154, + "loss": 0.0367, "step": 161520 }, { - "epoch": 1.75, - "learning_rate": 3.7929132325264457e-05, - "loss": 0.0284, + "epoch": 1.04, + "learning_rate": 0.00014361708307247462, + "loss": 0.0331, "step": 161530 }, { - "epoch": 1.75, - "learning_rate": 3.79129080407554e-05, - "loss": 0.0256, + "epoch": 1.04, + "learning_rate": 0.00014360740171811767, + "loss": 0.0407, "step": 161540 }, { - "epoch": 1.75, - "learning_rate": 3.789668375624635e-05, - "loss": 0.0278, + "epoch": 1.04, + "learning_rate": 0.00014359772036376075, + "loss": 0.0338, "step": 161550 }, { - "epoch": 1.75, - "learning_rate": 3.788045947173729e-05, - "loss": 0.0241, + "epoch": 1.04, + "learning_rate": 0.0001435880390094038, + "loss": 0.0295, "step": 161560 }, { - "epoch": 1.75, - "learning_rate": 3.786423518722824e-05, - "loss": 0.0272, + "epoch": 1.04, + "learning_rate": 0.00014357835765504688, + "loss": 0.0356, "step": 161570 }, { - "epoch": 1.75, - "learning_rate": 3.784801090271919e-05, - "loss": 0.0288, + "epoch": 1.04, + "learning_rate": 0.00014356867630068996, + "loss": 0.0387, "step": 161580 }, { - "epoch": 1.75, - "learning_rate": 3.7831786618210135e-05, - "loss": 0.025, + "epoch": 1.04, + "learning_rate": 0.00014355899494633301, + "loss": 0.0398, "step": 161590 }, { - "epoch": 1.75, - "learning_rate": 3.7815562333701085e-05, - "loss": 0.0248, + "epoch": 1.04, + "learning_rate": 0.00014354931359197607, + "loss": 0.032, "step": 161600 }, { - "epoch": 1.75, - "learning_rate": 3.779933804919203e-05, - "loss": 0.0262, + "epoch": 1.04, + "learning_rate": 0.00014353963223761915, + "loss": 0.0315, "step": 161610 }, { - "epoch": 1.75, - "learning_rate": 3.778311376468298e-05, - "loss": 0.028, + "epoch": 1.04, + "learning_rate": 0.00014352995088326223, + "loss": 0.0406, "step": 161620 }, { - "epoch": 1.75, - "learning_rate": 3.776688948017392e-05, - "loss": 0.0241, + "epoch": 1.04, + "learning_rate": 0.00014352026952890528, + "loss": 0.036, "step": 161630 }, { - "epoch": 1.75, - "learning_rate": 3.775066519566487e-05, - "loss": 0.0274, + "epoch": 1.04, + "learning_rate": 0.00014351058817454836, + "loss": 0.0315, "step": 161640 }, { - "epoch": 1.75, - "learning_rate": 3.773444091115582e-05, - "loss": 0.0232, + "epoch": 1.04, + "learning_rate": 0.0001435009068201914, + "loss": 0.0396, "step": 161650 }, { - "epoch": 1.75, - "learning_rate": 3.771821662664676e-05, - "loss": 0.0301, + "epoch": 1.04, + "learning_rate": 0.0001434912254658345, + "loss": 0.0302, "step": 161660 }, { - "epoch": 1.75, - "learning_rate": 3.770199234213771e-05, - "loss": 0.0246, + "epoch": 1.04, + "learning_rate": 0.00014348154411147754, + "loss": 0.0387, "step": 161670 }, { - "epoch": 1.75, - "learning_rate": 3.7685768057628656e-05, - "loss": 0.0219, + "epoch": 1.04, + "learning_rate": 0.00014347186275712062, + "loss": 0.0354, "step": 161680 }, { - "epoch": 1.75, - "learning_rate": 3.7669543773119605e-05, - "loss": 0.0257, + "epoch": 1.04, + "learning_rate": 0.0001434621814027637, + "loss": 0.0361, "step": 161690 }, { - "epoch": 1.75, - "learning_rate": 3.765331948861055e-05, - "loss": 0.0263, + "epoch": 1.04, + "learning_rate": 0.00014345250004840676, + "loss": 0.0345, "step": 161700 }, { - "epoch": 1.75, - "learning_rate": 3.76370952041015e-05, - "loss": 0.0248, + "epoch": 1.04, + "learning_rate": 0.00014344281869404984, + "loss": 0.0311, "step": 161710 }, { - "epoch": 1.75, - "learning_rate": 3.762087091959244e-05, - "loss": 0.0298, + "epoch": 1.04, + "learning_rate": 0.0001434331373396929, + "loss": 0.0361, "step": 161720 }, { - "epoch": 1.75, - "learning_rate": 3.760464663508339e-05, - "loss": 0.0284, + "epoch": 1.04, + "learning_rate": 0.00014342345598533597, + "loss": 0.0336, "step": 161730 }, { - "epoch": 1.75, - "learning_rate": 3.758842235057434e-05, - "loss": 0.0276, + "epoch": 1.04, + "learning_rate": 0.00014341377463097902, + "loss": 0.04, "step": 161740 }, { - "epoch": 1.75, - "learning_rate": 3.7572198066065284e-05, - "loss": 0.0283, + "epoch": 1.04, + "learning_rate": 0.0001434040932766221, + "loss": 0.0311, "step": 161750 }, { - "epoch": 1.75, - "learning_rate": 3.7555973781556234e-05, - "loss": 0.0275, + "epoch": 1.04, + "learning_rate": 0.00014339441192226518, + "loss": 0.0383, "step": 161760 }, { - "epoch": 1.75, - "learning_rate": 3.7539749497047177e-05, - "loss": 0.0311, + "epoch": 1.04, + "learning_rate": 0.00014338473056790823, + "loss": 0.0318, "step": 161770 }, { - "epoch": 1.75, - "learning_rate": 3.7523525212538126e-05, - "loss": 0.023, + "epoch": 1.04, + "learning_rate": 0.0001433750492135513, + "loss": 0.032, "step": 161780 }, { - "epoch": 1.75, - "learning_rate": 3.750730092802907e-05, - "loss": 0.0226, + "epoch": 1.04, + "learning_rate": 0.00014336536785919437, + "loss": 0.0308, "step": 161790 }, { - "epoch": 1.75, - "learning_rate": 3.749107664352002e-05, - "loss": 0.0234, + "epoch": 1.04, + "learning_rate": 0.00014335568650483742, + "loss": 0.039, "step": 161800 }, { - "epoch": 1.75, - "learning_rate": 3.747485235901096e-05, - "loss": 0.0321, + "epoch": 1.04, + "learning_rate": 0.0001433460051504805, + "loss": 0.0333, "step": 161810 }, { - "epoch": 1.75, - "learning_rate": 3.745862807450191e-05, - "loss": 0.0247, + "epoch": 1.04, + "learning_rate": 0.00014333632379612358, + "loss": 0.0322, "step": 161820 }, { - "epoch": 1.75, - "learning_rate": 3.744240378999286e-05, - "loss": 0.0238, + "epoch": 1.04, + "learning_rate": 0.00014332664244176666, + "loss": 0.0376, "step": 161830 }, { - "epoch": 1.75, - "learning_rate": 3.7426179505483805e-05, - "loss": 0.0234, + "epoch": 1.04, + "learning_rate": 0.0001433169610874097, + "loss": 0.0414, "step": 161840 }, { - "epoch": 1.75, - "learning_rate": 3.7409955220974754e-05, - "loss": 0.0306, + "epoch": 1.04, + "learning_rate": 0.00014330727973305276, + "loss": 0.0359, "step": 161850 }, { - "epoch": 1.75, - "learning_rate": 3.73937309364657e-05, - "loss": 0.0253, + "epoch": 1.04, + "learning_rate": 0.00014329759837869584, + "loss": 0.0372, "step": 161860 }, { - "epoch": 1.75, - "learning_rate": 3.737750665195665e-05, - "loss": 0.0235, + "epoch": 1.04, + "learning_rate": 0.0001432879170243389, + "loss": 0.0341, "step": 161870 }, { - "epoch": 1.75, - "learning_rate": 3.736128236744759e-05, - "loss": 0.024, + "epoch": 1.04, + "learning_rate": 0.00014327823566998198, + "loss": 0.0334, "step": 161880 }, { - "epoch": 1.75, - "learning_rate": 3.734505808293854e-05, - "loss": 0.0274, + "epoch": 1.04, + "learning_rate": 0.00014326855431562506, + "loss": 0.0335, "step": 161890 }, { - "epoch": 1.75, - "learning_rate": 3.732883379842948e-05, - "loss": 0.0297, + "epoch": 1.04, + "learning_rate": 0.00014325887296126814, + "loss": 0.039, "step": 161900 }, { - "epoch": 1.75, - "learning_rate": 3.731260951392043e-05, - "loss": 0.0245, + "epoch": 1.05, + "learning_rate": 0.0001432491916069112, + "loss": 0.0415, "step": 161910 }, { - "epoch": 1.75, - "learning_rate": 3.729638522941138e-05, - "loss": 0.0249, + "epoch": 1.05, + "learning_rate": 0.00014323951025255424, + "loss": 0.0348, "step": 161920 }, { - "epoch": 1.75, - "learning_rate": 3.7280160944902325e-05, - "loss": 0.029, + "epoch": 1.05, + "learning_rate": 0.00014322982889819732, + "loss": 0.0309, "step": 161930 }, { - "epoch": 1.75, - "learning_rate": 3.7263936660393275e-05, - "loss": 0.0236, + "epoch": 1.05, + "learning_rate": 0.00014322014754384037, + "loss": 0.0333, "step": 161940 }, { - "epoch": 1.75, - "learning_rate": 3.724771237588422e-05, - "loss": 0.0251, + "epoch": 1.05, + "learning_rate": 0.00014321046618948345, + "loss": 0.0359, "step": 161950 }, { - "epoch": 1.75, - "learning_rate": 3.723148809137517e-05, - "loss": 0.0337, + "epoch": 1.05, + "learning_rate": 0.00014320078483512653, + "loss": 0.0324, "step": 161960 }, { - "epoch": 1.75, - "learning_rate": 3.721526380686611e-05, - "loss": 0.0215, + "epoch": 1.05, + "learning_rate": 0.00014319110348076959, + "loss": 0.0322, "step": 161970 }, { - "epoch": 1.75, - "learning_rate": 3.719903952235706e-05, - "loss": 0.027, + "epoch": 1.05, + "learning_rate": 0.00014318142212641267, + "loss": 0.0318, "step": 161980 }, { - "epoch": 1.75, - "learning_rate": 3.7182815237848004e-05, - "loss": 0.0258, + "epoch": 1.05, + "learning_rate": 0.00014317174077205572, + "loss": 0.0386, "step": 161990 }, { - "epoch": 1.75, - "learning_rate": 3.7166590953338954e-05, - "loss": 0.0264, + "epoch": 1.05, + "learning_rate": 0.0001431620594176988, + "loss": 0.0322, "step": 162000 }, { - "epoch": 1.75, - "eval_cer": 0.9211128015111116, - "eval_loss": 0.021288909018039703, - "eval_runtime": 119.0345, - "eval_samples_per_second": 16.802, - "eval_steps_per_second": 4.2, + "epoch": 1.05, + "eval_cer": 0.9199168455541746, + "eval_loss": 0.024344589561223984, + "eval_runtime": 120.0857, + "eval_samples_per_second": 16.655, + "eval_steps_per_second": 4.164, "step": 162000 }, { - "epoch": 1.75, - "learning_rate": 3.71503666688299e-05, - "loss": 0.0222, + "epoch": 1.05, + "learning_rate": 0.00014315237806334185, + "loss": 0.0327, "step": 162010 }, { - "epoch": 1.75, - "learning_rate": 3.7134142384320846e-05, - "loss": 0.031, + "epoch": 1.05, + "learning_rate": 0.00014314269670898493, + "loss": 0.0367, "step": 162020 }, { - "epoch": 1.75, - "learning_rate": 3.7117918099811796e-05, - "loss": 0.0263, + "epoch": 1.05, + "learning_rate": 0.000143133015354628, + "loss": 0.0369, "step": 162030 }, { - "epoch": 1.75, - "learning_rate": 3.710169381530274e-05, - "loss": 0.025, + "epoch": 1.05, + "learning_rate": 0.00014312333400027106, + "loss": 0.036, "step": 162040 }, { - "epoch": 1.75, - "learning_rate": 3.708546953079369e-05, - "loss": 0.0257, + "epoch": 1.05, + "learning_rate": 0.00014311365264591412, + "loss": 0.0399, "step": 162050 }, { - "epoch": 1.75, - "learning_rate": 3.706924524628463e-05, - "loss": 0.0213, + "epoch": 1.05, + "learning_rate": 0.0001431039712915572, + "loss": 0.0353, "step": 162060 }, { - "epoch": 1.75, - "learning_rate": 3.705302096177558e-05, - "loss": 0.0292, + "epoch": 1.05, + "learning_rate": 0.00014309428993720028, + "loss": 0.0294, "step": 162070 }, { - "epoch": 1.75, - "learning_rate": 3.703679667726653e-05, - "loss": 0.0257, + "epoch": 1.05, + "learning_rate": 0.00014308460858284333, + "loss": 0.0263, "step": 162080 }, { - "epoch": 1.75, - "learning_rate": 3.7020572392757474e-05, - "loss": 0.0253, + "epoch": 1.05, + "learning_rate": 0.0001430749272284864, + "loss": 0.0408, "step": 162090 }, { - "epoch": 1.75, - "learning_rate": 3.7004348108248424e-05, - "loss": 0.0324, + "epoch": 1.05, + "learning_rate": 0.0001430652458741295, + "loss": 0.0361, "step": 162100 }, { - "epoch": 1.75, - "learning_rate": 3.698812382373937e-05, - "loss": 0.0239, + "epoch": 1.05, + "learning_rate": 0.00014305556451977254, + "loss": 0.0347, "step": 162110 }, { - "epoch": 1.75, - "learning_rate": 3.697189953923032e-05, - "loss": 0.0274, + "epoch": 1.05, + "learning_rate": 0.0001430458831654156, + "loss": 0.0343, "step": 162120 }, { - "epoch": 1.75, - "learning_rate": 3.695567525472126e-05, - "loss": 0.0225, + "epoch": 1.05, + "learning_rate": 0.00014303620181105867, + "loss": 0.0348, "step": 162130 }, { - "epoch": 1.75, - "learning_rate": 3.693945097021221e-05, - "loss": 0.0258, + "epoch": 1.05, + "learning_rate": 0.00014302652045670175, + "loss": 0.0362, "step": 162140 }, { - "epoch": 1.75, - "learning_rate": 3.692322668570315e-05, - "loss": 0.022, + "epoch": 1.05, + "learning_rate": 0.0001430168391023448, + "loss": 0.0299, "step": 162150 }, { - "epoch": 1.75, - "learning_rate": 3.69070024011941e-05, - "loss": 0.0272, + "epoch": 1.05, + "learning_rate": 0.00014300715774798788, + "loss": 0.0363, "step": 162160 }, { - "epoch": 1.75, - "learning_rate": 3.689077811668505e-05, - "loss": 0.0269, + "epoch": 1.05, + "learning_rate": 0.00014299747639363094, + "loss": 0.0392, "step": 162170 }, { - "epoch": 1.75, - "learning_rate": 3.6874553832175995e-05, - "loss": 0.0275, + "epoch": 1.05, + "learning_rate": 0.00014298779503927402, + "loss": 0.0379, "step": 162180 }, { - "epoch": 1.75, - "learning_rate": 3.6858329547666945e-05, - "loss": 0.0251, + "epoch": 1.05, + "learning_rate": 0.00014297811368491707, + "loss": 0.0364, "step": 162190 }, { - "epoch": 1.75, - "learning_rate": 3.684210526315789e-05, - "loss": 0.0213, + "epoch": 1.05, + "learning_rate": 0.00014296843233056015, + "loss": 0.0308, "step": 162200 }, { - "epoch": 1.75, - "learning_rate": 3.682588097864884e-05, - "loss": 0.0259, + "epoch": 1.05, + "learning_rate": 0.00014295875097620323, + "loss": 0.0347, "step": 162210 }, { - "epoch": 1.75, - "learning_rate": 3.680965669413979e-05, - "loss": 0.0232, + "epoch": 1.05, + "learning_rate": 0.00014294906962184628, + "loss": 0.0368, "step": 162220 }, { - "epoch": 1.75, - "learning_rate": 3.679343240963074e-05, - "loss": 0.0305, + "epoch": 1.05, + "learning_rate": 0.00014293938826748936, + "loss": 0.0323, "step": 162230 }, { - "epoch": 1.75, - "learning_rate": 3.677720812512168e-05, - "loss": 0.0259, + "epoch": 1.05, + "learning_rate": 0.00014292970691313241, + "loss": 0.0317, "step": 162240 }, { - "epoch": 1.75, - "learning_rate": 3.676098384061263e-05, - "loss": 0.0276, + "epoch": 1.05, + "learning_rate": 0.0001429200255587755, + "loss": 0.0316, "step": 162250 }, { - "epoch": 1.76, - "learning_rate": 3.674475955610357e-05, - "loss": 0.0257, + "epoch": 1.05, + "learning_rate": 0.00014291034420441855, + "loss": 0.0337, "step": 162260 }, { - "epoch": 1.76, - "learning_rate": 3.672853527159452e-05, - "loss": 0.0205, + "epoch": 1.05, + "learning_rate": 0.00014290066285006163, + "loss": 0.0423, "step": 162270 }, { - "epoch": 1.76, - "learning_rate": 3.6712310987085466e-05, - "loss": 0.0304, + "epoch": 1.05, + "learning_rate": 0.0001428909814957047, + "loss": 0.0366, "step": 162280 }, { - "epoch": 1.76, - "learning_rate": 3.6696086702576416e-05, - "loss": 0.0268, + "epoch": 1.05, + "learning_rate": 0.00014288130014134776, + "loss": 0.0375, "step": 162290 }, { - "epoch": 1.76, - "learning_rate": 3.667986241806736e-05, - "loss": 0.0207, + "epoch": 1.05, + "learning_rate": 0.00014287161878699084, + "loss": 0.032, "step": 162300 }, { - "epoch": 1.76, - "learning_rate": 3.666363813355831e-05, - "loss": 0.0301, + "epoch": 1.05, + "learning_rate": 0.0001428619374326339, + "loss": 0.0325, "step": 162310 }, { - "epoch": 1.76, - "learning_rate": 3.664741384904926e-05, - "loss": 0.0252, + "epoch": 1.05, + "learning_rate": 0.00014285225607827697, + "loss": 0.0379, "step": 162320 }, { - "epoch": 1.76, - "learning_rate": 3.66311895645402e-05, - "loss": 0.0252, + "epoch": 1.05, + "learning_rate": 0.00014284257472392002, + "loss": 0.0308, "step": 162330 }, { - "epoch": 1.76, - "learning_rate": 3.661496528003115e-05, - "loss": 0.026, + "epoch": 1.05, + "learning_rate": 0.0001428328933695631, + "loss": 0.0324, "step": 162340 }, { - "epoch": 1.76, - "learning_rate": 3.6598740995522094e-05, - "loss": 0.0231, + "epoch": 1.05, + "learning_rate": 0.00014282321201520618, + "loss": 0.0318, "step": 162350 }, { - "epoch": 1.76, - "learning_rate": 3.6582516711013044e-05, - "loss": 0.0247, + "epoch": 1.05, + "learning_rate": 0.00014281353066084924, + "loss": 0.0311, "step": 162360 }, { - "epoch": 1.76, - "learning_rate": 3.6566292426503987e-05, - "loss": 0.0336, + "epoch": 1.05, + "learning_rate": 0.0001428038493064923, + "loss": 0.033, "step": 162370 }, { - "epoch": 1.76, - "learning_rate": 3.6550068141994936e-05, - "loss": 0.0303, + "epoch": 1.05, + "learning_rate": 0.00014279416795213537, + "loss": 0.0333, "step": 162380 }, { - "epoch": 1.76, - "learning_rate": 3.653384385748588e-05, - "loss": 0.0326, + "epoch": 1.05, + "learning_rate": 0.00014278448659777845, + "loss": 0.0345, "step": 162390 }, { - "epoch": 1.76, - "learning_rate": 3.651761957297683e-05, - "loss": 0.0252, + "epoch": 1.05, + "learning_rate": 0.0001427748052434215, + "loss": 0.0315, "step": 162400 }, { - "epoch": 1.76, - "learning_rate": 3.650139528846778e-05, - "loss": 0.0237, + "epoch": 1.05, + "learning_rate": 0.00014276512388906458, + "loss": 0.0312, "step": 162410 }, { - "epoch": 1.76, - "learning_rate": 3.648517100395872e-05, - "loss": 0.0244, + "epoch": 1.05, + "learning_rate": 0.00014275544253470766, + "loss": 0.0424, "step": 162420 }, { - "epoch": 1.76, - "learning_rate": 3.646894671944967e-05, - "loss": 0.0243, + "epoch": 1.05, + "learning_rate": 0.00014274576118035071, + "loss": 0.0336, "step": 162430 }, { - "epoch": 1.76, - "learning_rate": 3.6452722434940615e-05, - "loss": 0.0256, + "epoch": 1.05, + "learning_rate": 0.00014273607982599377, + "loss": 0.0317, "step": 162440 }, { - "epoch": 1.76, - "learning_rate": 3.6436498150431564e-05, - "loss": 0.0197, + "epoch": 1.05, + "learning_rate": 0.00014272639847163685, + "loss": 0.0346, "step": 162450 }, { - "epoch": 1.76, - "learning_rate": 3.642027386592251e-05, - "loss": 0.0333, + "epoch": 1.05, + "learning_rate": 0.00014271671711727993, + "loss": 0.0334, "step": 162460 }, { - "epoch": 1.76, - "learning_rate": 3.640404958141346e-05, - "loss": 0.0285, + "epoch": 1.05, + "learning_rate": 0.00014270703576292298, + "loss": 0.0361, "step": 162470 }, { - "epoch": 1.76, - "learning_rate": 3.63878252969044e-05, - "loss": 0.0252, + "epoch": 1.05, + "learning_rate": 0.00014269735440856606, + "loss": 0.0355, "step": 162480 }, { - "epoch": 1.76, - "learning_rate": 3.637160101239535e-05, - "loss": 0.0283, + "epoch": 1.05, + "learning_rate": 0.0001426876730542091, + "loss": 0.0408, "step": 162490 }, { - "epoch": 1.76, - "learning_rate": 3.63553767278863e-05, - "loss": 0.0237, + "epoch": 1.05, + "learning_rate": 0.0001426779916998522, + "loss": 0.0304, "step": 162500 }, { - "epoch": 1.76, - "learning_rate": 3.633915244337724e-05, - "loss": 0.028, + "epoch": 1.05, + "learning_rate": 0.00014266831034549524, + "loss": 0.0343, "step": 162510 }, { - "epoch": 1.76, - "learning_rate": 3.632292815886819e-05, - "loss": 0.0269, + "epoch": 1.05, + "learning_rate": 0.00014265862899113832, + "loss": 0.0369, "step": 162520 }, { - "epoch": 1.76, - "learning_rate": 3.6306703874359136e-05, - "loss": 0.023, + "epoch": 1.05, + "learning_rate": 0.0001426489476367814, + "loss": 0.0385, "step": 162530 }, { - "epoch": 1.76, - "learning_rate": 3.6290479589850085e-05, - "loss": 0.0307, + "epoch": 1.05, + "learning_rate": 0.00014263926628242446, + "loss": 0.033, "step": 162540 }, { - "epoch": 1.76, - "learning_rate": 3.627425530534103e-05, - "loss": 0.0284, + "epoch": 1.05, + "learning_rate": 0.00014262958492806754, + "loss": 0.0393, "step": 162550 }, { - "epoch": 1.76, - "learning_rate": 3.625803102083198e-05, - "loss": 0.0248, + "epoch": 1.05, + "learning_rate": 0.0001426199035737106, + "loss": 0.0363, "step": 162560 }, { - "epoch": 1.76, - "learning_rate": 3.624180673632293e-05, - "loss": 0.0235, + "epoch": 1.05, + "learning_rate": 0.00014261022221935364, + "loss": 0.035, "step": 162570 }, { - "epoch": 1.76, - "learning_rate": 3.622558245181387e-05, - "loss": 0.0223, + "epoch": 1.05, + "learning_rate": 0.00014260054086499672, + "loss": 0.0509, "step": 162580 }, { - "epoch": 1.76, - "learning_rate": 3.620935816730482e-05, - "loss": 0.0275, + "epoch": 1.05, + "learning_rate": 0.0001425908595106398, + "loss": 0.0344, "step": 162590 }, { - "epoch": 1.76, - "learning_rate": 3.6193133882795764e-05, - "loss": 0.0256, + "epoch": 1.05, + "learning_rate": 0.00014258117815628288, + "loss": 0.0312, "step": 162600 }, { - "epoch": 1.76, - "learning_rate": 3.617690959828671e-05, - "loss": 0.0266, + "epoch": 1.05, + "learning_rate": 0.00014257149680192593, + "loss": 0.0307, "step": 162610 }, { - "epoch": 1.76, - "learning_rate": 3.6160685313777656e-05, - "loss": 0.0253, + "epoch": 1.05, + "learning_rate": 0.000142561815447569, + "loss": 0.0284, "step": 162620 }, { - "epoch": 1.76, - "learning_rate": 3.6144461029268606e-05, - "loss": 0.0281, + "epoch": 1.05, + "learning_rate": 0.00014255213409321207, + "loss": 0.0342, "step": 162630 }, { - "epoch": 1.76, - "learning_rate": 3.612823674475955e-05, - "loss": 0.0259, + "epoch": 1.05, + "learning_rate": 0.00014254245273885512, + "loss": 0.0325, "step": 162640 }, { - "epoch": 1.76, - "learning_rate": 3.61120124602505e-05, - "loss": 0.0274, + "epoch": 1.05, + "learning_rate": 0.0001425327713844982, + "loss": 0.0302, "step": 162650 }, { - "epoch": 1.76, - "learning_rate": 3.609578817574145e-05, - "loss": 0.0286, + "epoch": 1.05, + "learning_rate": 0.00014252309003014128, + "loss": 0.0359, "step": 162660 }, { - "epoch": 1.76, - "learning_rate": 3.607956389123239e-05, - "loss": 0.0205, + "epoch": 1.05, + "learning_rate": 0.00014251340867578436, + "loss": 0.0333, "step": 162670 }, { - "epoch": 1.76, - "learning_rate": 3.606333960672334e-05, - "loss": 0.0228, + "epoch": 1.05, + "learning_rate": 0.0001425037273214274, + "loss": 0.0471, "step": 162680 }, { - "epoch": 1.76, - "learning_rate": 3.6047115322214284e-05, - "loss": 0.0304, + "epoch": 1.05, + "learning_rate": 0.00014249404596707046, + "loss": 0.0311, "step": 162690 }, { - "epoch": 1.76, - "learning_rate": 3.6030891037705234e-05, - "loss": 0.0224, + "epoch": 1.05, + "learning_rate": 0.00014248436461271354, + "loss": 0.0329, "step": 162700 }, { - "epoch": 1.76, - "learning_rate": 3.601466675319618e-05, - "loss": 0.0253, + "epoch": 1.05, + "learning_rate": 0.0001424746832583566, + "loss": 0.0355, "step": 162710 }, { - "epoch": 1.76, - "learning_rate": 3.599844246868713e-05, - "loss": 0.0273, + "epoch": 1.05, + "learning_rate": 0.00014246500190399968, + "loss": 0.0337, "step": 162720 }, { - "epoch": 1.76, - "learning_rate": 3.598221818417807e-05, - "loss": 0.0227, + "epoch": 1.05, + "learning_rate": 0.00014245532054964276, + "loss": 0.0348, "step": 162730 }, { - "epoch": 1.76, - "learning_rate": 3.596599389966902e-05, - "loss": 0.0228, + "epoch": 1.05, + "learning_rate": 0.0001424456391952858, + "loss": 0.029, "step": 162740 }, { - "epoch": 1.76, - "learning_rate": 3.594976961515997e-05, - "loss": 0.0216, + "epoch": 1.05, + "learning_rate": 0.0001424359578409289, + "loss": 0.0304, "step": 162750 }, { - "epoch": 1.76, - "learning_rate": 3.593354533065091e-05, - "loss": 0.0281, + "epoch": 1.05, + "learning_rate": 0.00014242627648657194, + "loss": 0.0341, "step": 162760 }, { - "epoch": 1.76, - "learning_rate": 3.591732104614186e-05, - "loss": 0.0221, + "epoch": 1.05, + "learning_rate": 0.00014241659513221502, + "loss": 0.0323, "step": 162770 }, { - "epoch": 1.76, - "learning_rate": 3.5901096761632805e-05, - "loss": 0.03, + "epoch": 1.05, + "learning_rate": 0.00014240691377785807, + "loss": 0.0365, "step": 162780 }, { - "epoch": 1.76, - "learning_rate": 3.5884872477123755e-05, - "loss": 0.0265, + "epoch": 1.05, + "learning_rate": 0.00014239723242350115, + "loss": 0.0326, "step": 162790 }, { - "epoch": 1.76, - "learning_rate": 3.5868648192614705e-05, - "loss": 0.0203, + "epoch": 1.05, + "learning_rate": 0.00014238755106914423, + "loss": 0.0305, "step": 162800 }, { - "epoch": 1.76, - "learning_rate": 3.5852423908105655e-05, - "loss": 0.0279, + "epoch": 1.05, + "learning_rate": 0.00014237786971478729, + "loss": 0.0324, "step": 162810 }, { - "epoch": 1.76, - "learning_rate": 3.58361996235966e-05, - "loss": 0.0233, + "epoch": 1.05, + "learning_rate": 0.00014236818836043036, + "loss": 0.0358, "step": 162820 }, { - "epoch": 1.76, - "learning_rate": 3.581997533908755e-05, - "loss": 0.0296, + "epoch": 1.05, + "learning_rate": 0.00014235850700607342, + "loss": 0.0343, "step": 162830 }, { - "epoch": 1.76, - "learning_rate": 3.580375105457849e-05, - "loss": 0.0222, + "epoch": 1.05, + "learning_rate": 0.0001423488256517165, + "loss": 0.0265, "step": 162840 }, { - "epoch": 1.76, - "learning_rate": 3.578752677006944e-05, - "loss": 0.0292, + "epoch": 1.05, + "learning_rate": 0.00014233914429735955, + "loss": 0.0336, "step": 162850 }, { - "epoch": 1.76, - "learning_rate": 3.577130248556038e-05, - "loss": 0.026, + "epoch": 1.05, + "learning_rate": 0.00014232946294300263, + "loss": 0.0346, "step": 162860 }, { - "epoch": 1.76, - "learning_rate": 3.575507820105133e-05, - "loss": 0.0322, + "epoch": 1.05, + "learning_rate": 0.0001423197815886457, + "loss": 0.0414, "step": 162870 }, { - "epoch": 1.76, - "learning_rate": 3.5738853916542276e-05, - "loss": 0.0222, + "epoch": 1.05, + "learning_rate": 0.00014231010023428876, + "loss": 0.0293, "step": 162880 }, { - "epoch": 1.76, - "learning_rate": 3.5722629632033226e-05, - "loss": 0.0239, + "epoch": 1.05, + "learning_rate": 0.00014230041887993182, + "loss": 0.0371, "step": 162890 }, { - "epoch": 1.76, - "learning_rate": 3.5706405347524175e-05, - "loss": 0.0267, + "epoch": 1.05, + "learning_rate": 0.0001422907375255749, + "loss": 0.0407, "step": 162900 }, { - "epoch": 1.76, - "learning_rate": 3.569018106301512e-05, - "loss": 0.0253, + "epoch": 1.05, + "learning_rate": 0.00014228105617121797, + "loss": 0.0293, "step": 162910 }, { - "epoch": 1.76, - "learning_rate": 3.567395677850607e-05, - "loss": 0.0293, + "epoch": 1.05, + "learning_rate": 0.00014227137481686103, + "loss": 0.0388, "step": 162920 }, { - "epoch": 1.76, - "learning_rate": 3.565773249399701e-05, - "loss": 0.0275, + "epoch": 1.05, + "learning_rate": 0.0001422616934625041, + "loss": 0.0318, "step": 162930 }, { - "epoch": 1.76, - "learning_rate": 3.564150820948796e-05, - "loss": 0.0284, + "epoch": 1.05, + "learning_rate": 0.00014225201210814716, + "loss": 0.035, "step": 162940 }, { - "epoch": 1.76, - "learning_rate": 3.5625283924978904e-05, - "loss": 0.0272, + "epoch": 1.05, + "learning_rate": 0.00014224233075379024, + "loss": 0.0376, "step": 162950 }, { - "epoch": 1.76, - "learning_rate": 3.5609059640469854e-05, - "loss": 0.0279, + "epoch": 1.05, + "learning_rate": 0.0001422326493994333, + "loss": 0.0311, "step": 162960 }, { - "epoch": 1.76, - "learning_rate": 3.55928353559608e-05, - "loss": 0.0298, + "epoch": 1.05, + "learning_rate": 0.00014222296804507637, + "loss": 0.0312, "step": 162970 }, { - "epoch": 1.76, - "learning_rate": 3.5576611071451746e-05, - "loss": 0.024, + "epoch": 1.05, + "learning_rate": 0.00014221328669071945, + "loss": 0.0327, "step": 162980 }, { - "epoch": 1.76, - "learning_rate": 3.5560386786942696e-05, - "loss": 0.031, + "epoch": 1.05, + "learning_rate": 0.0001422036053363625, + "loss": 0.0341, "step": 162990 }, { - "epoch": 1.76, - "learning_rate": 3.554416250243364e-05, - "loss": 0.0306, + "epoch": 1.05, + "learning_rate": 0.00014219392398200558, + "loss": 0.0313, "step": 163000 }, { - "epoch": 1.76, - "eval_cer": 0.9210951318246955, - "eval_loss": 0.02121070772409439, - "eval_runtime": 119.0044, - "eval_samples_per_second": 16.806, - "eval_steps_per_second": 4.202, + "epoch": 1.05, + "eval_cer": 0.9198481527511015, + "eval_loss": 0.024626342579722404, + "eval_runtime": 120.1691, + "eval_samples_per_second": 16.643, + "eval_steps_per_second": 4.161, "step": 163000 }, { - "epoch": 1.76, - "learning_rate": 3.552793821792459e-05, - "loss": 0.0287, + "epoch": 1.05, + "learning_rate": 0.00014218424262764864, + "loss": 0.0356, "step": 163010 }, { - "epoch": 1.76, - "learning_rate": 3.551171393341553e-05, - "loss": 0.0241, + "epoch": 1.05, + "learning_rate": 0.00014217456127329172, + "loss": 0.0372, "step": 163020 }, { - "epoch": 1.76, - "learning_rate": 3.549548964890648e-05, - "loss": 0.0248, + "epoch": 1.05, + "learning_rate": 0.00014216487991893477, + "loss": 0.0331, "step": 163030 }, { - "epoch": 1.76, - "learning_rate": 3.5479265364397425e-05, - "loss": 0.0219, + "epoch": 1.05, + "learning_rate": 0.00014215519856457785, + "loss": 0.0353, "step": 163040 }, { - "epoch": 1.76, - "learning_rate": 3.5463041079888375e-05, - "loss": 0.0229, + "epoch": 1.05, + "learning_rate": 0.00014214551721022093, + "loss": 0.0386, "step": 163050 }, { - "epoch": 1.76, - "learning_rate": 3.544681679537932e-05, - "loss": 0.0216, + "epoch": 1.05, + "learning_rate": 0.00014213583585586398, + "loss": 0.0388, "step": 163060 }, { - "epoch": 1.76, - "learning_rate": 3.543059251087027e-05, - "loss": 0.0296, + "epoch": 1.05, + "learning_rate": 0.00014212615450150706, + "loss": 0.0356, "step": 163070 }, { - "epoch": 1.76, - "learning_rate": 3.541436822636122e-05, - "loss": 0.0238, + "epoch": 1.05, + "learning_rate": 0.00014211647314715011, + "loss": 0.0364, "step": 163080 }, { - "epoch": 1.76, - "learning_rate": 3.539814394185216e-05, - "loss": 0.0291, + "epoch": 1.05, + "learning_rate": 0.0001421067917927932, + "loss": 0.0326, "step": 163090 }, { - "epoch": 1.76, - "learning_rate": 3.538191965734311e-05, - "loss": 0.0277, + "epoch": 1.05, + "learning_rate": 0.00014209711043843625, + "loss": 0.0318, "step": 163100 }, { - "epoch": 1.76, - "learning_rate": 3.536569537283405e-05, - "loss": 0.0256, + "epoch": 1.05, + "learning_rate": 0.00014208742908407933, + "loss": 0.0384, "step": 163110 }, { - "epoch": 1.76, - "learning_rate": 3.5349471088325e-05, - "loss": 0.0262, + "epoch": 1.05, + "learning_rate": 0.0001420777477297224, + "loss": 0.0364, "step": 163120 }, { - "epoch": 1.76, - "learning_rate": 3.5333246803815946e-05, - "loss": 0.0234, + "epoch": 1.05, + "learning_rate": 0.00014206806637536546, + "loss": 0.0329, "step": 163130 }, { - "epoch": 1.76, - "learning_rate": 3.5317022519306895e-05, - "loss": 0.0363, + "epoch": 1.05, + "learning_rate": 0.0001420583850210085, + "loss": 0.0339, "step": 163140 }, { - "epoch": 1.76, - "learning_rate": 3.5300798234797845e-05, - "loss": 0.0237, + "epoch": 1.05, + "learning_rate": 0.0001420487036666516, + "loss": 0.0342, "step": 163150 }, { - "epoch": 1.76, - "learning_rate": 3.528457395028879e-05, - "loss": 0.0295, + "epoch": 1.05, + "learning_rate": 0.00014203902231229467, + "loss": 0.0323, "step": 163160 }, { - "epoch": 1.76, - "learning_rate": 3.526834966577974e-05, - "loss": 0.0225, + "epoch": 1.05, + "learning_rate": 0.00014202934095793772, + "loss": 0.0323, "step": 163170 }, { - "epoch": 1.76, - "learning_rate": 3.525212538127068e-05, - "loss": 0.0226, + "epoch": 1.05, + "learning_rate": 0.0001420196596035808, + "loss": 0.0344, "step": 163180 }, { - "epoch": 1.77, - "learning_rate": 3.523590109676163e-05, - "loss": 0.0244, + "epoch": 1.05, + "learning_rate": 0.00014200997824922388, + "loss": 0.0347, "step": 163190 }, { - "epoch": 1.77, - "learning_rate": 3.5219676812252574e-05, - "loss": 0.0251, + "epoch": 1.05, + "learning_rate": 0.00014200029689486694, + "loss": 0.034, "step": 163200 }, { - "epoch": 1.77, - "learning_rate": 3.5203452527743523e-05, - "loss": 0.0265, + "epoch": 1.05, + "learning_rate": 0.00014199061554051, + "loss": 0.0452, "step": 163210 }, { - "epoch": 1.77, - "learning_rate": 3.5187228243234466e-05, - "loss": 0.0257, + "epoch": 1.05, + "learning_rate": 0.00014198093418615307, + "loss": 0.0346, "step": 163220 }, { - "epoch": 1.77, - "learning_rate": 3.5171003958725416e-05, - "loss": 0.0204, + "epoch": 1.05, + "learning_rate": 0.00014197125283179615, + "loss": 0.0352, "step": 163230 }, { - "epoch": 1.77, - "learning_rate": 3.5154779674216366e-05, - "loss": 0.023, + "epoch": 1.05, + "learning_rate": 0.0001419615714774392, + "loss": 0.0304, "step": 163240 }, { - "epoch": 1.77, - "learning_rate": 3.513855538970731e-05, - "loss": 0.0241, + "epoch": 1.05, + "learning_rate": 0.00014195189012308228, + "loss": 0.031, "step": 163250 }, { - "epoch": 1.77, - "learning_rate": 3.512233110519826e-05, - "loss": 0.0263, + "epoch": 1.05, + "learning_rate": 0.00014194220876872533, + "loss": 0.0404, "step": 163260 }, { - "epoch": 1.77, - "learning_rate": 3.51061068206892e-05, - "loss": 0.0254, + "epoch": 1.05, + "learning_rate": 0.0001419325274143684, + "loss": 0.0284, "step": 163270 }, { - "epoch": 1.77, - "learning_rate": 3.508988253618015e-05, - "loss": 0.0246, + "epoch": 1.05, + "learning_rate": 0.00014192284606001147, + "loss": 0.0363, "step": 163280 }, { - "epoch": 1.77, - "learning_rate": 3.5073658251671094e-05, - "loss": 0.0297, + "epoch": 1.05, + "learning_rate": 0.00014191316470565455, + "loss": 0.0363, "step": 163290 }, { - "epoch": 1.77, - "learning_rate": 3.5057433967162044e-05, - "loss": 0.0237, + "epoch": 1.05, + "learning_rate": 0.00014190348335129763, + "loss": 0.0344, "step": 163300 }, { - "epoch": 1.77, - "learning_rate": 3.504120968265299e-05, - "loss": 0.0262, + "epoch": 1.05, + "learning_rate": 0.00014189380199694068, + "loss": 0.0342, "step": 163310 }, { - "epoch": 1.77, - "learning_rate": 3.502498539814394e-05, - "loss": 0.025, + "epoch": 1.05, + "learning_rate": 0.00014188412064258376, + "loss": 0.0358, "step": 163320 }, { - "epoch": 1.77, - "learning_rate": 3.500876111363489e-05, - "loss": 0.0241, + "epoch": 1.05, + "learning_rate": 0.0001418744392882268, + "loss": 0.0325, "step": 163330 }, { - "epoch": 1.77, - "learning_rate": 3.499253682912583e-05, - "loss": 0.0254, + "epoch": 1.05, + "learning_rate": 0.00014186475793386986, + "loss": 0.0344, "step": 163340 }, { - "epoch": 1.77, - "learning_rate": 3.497631254461678e-05, - "loss": 0.0245, + "epoch": 1.05, + "learning_rate": 0.00014185507657951294, + "loss": 0.0332, "step": 163350 }, { - "epoch": 1.77, - "learning_rate": 3.496008826010772e-05, - "loss": 0.0258, + "epoch": 1.05, + "learning_rate": 0.00014184539522515602, + "loss": 0.0382, "step": 163360 }, { - "epoch": 1.77, - "learning_rate": 3.494386397559867e-05, - "loss": 0.0308, + "epoch": 1.05, + "learning_rate": 0.0001418357138707991, + "loss": 0.0396, "step": 163370 }, { - "epoch": 1.77, - "learning_rate": 3.492763969108962e-05, - "loss": 0.0288, + "epoch": 1.05, + "learning_rate": 0.00014182603251644216, + "loss": 0.0318, "step": 163380 }, { - "epoch": 1.77, - "learning_rate": 3.491141540658057e-05, - "loss": 0.0281, + "epoch": 1.05, + "learning_rate": 0.00014181635116208524, + "loss": 0.0374, "step": 163390 }, { - "epoch": 1.77, - "learning_rate": 3.4895191122071515e-05, - "loss": 0.0276, + "epoch": 1.05, + "learning_rate": 0.0001418066698077283, + "loss": 0.0368, "step": 163400 }, { - "epoch": 1.77, - "learning_rate": 3.4878966837562465e-05, - "loss": 0.0242, + "epoch": 1.05, + "learning_rate": 0.00014179698845337134, + "loss": 0.0345, "step": 163410 }, { - "epoch": 1.77, - "learning_rate": 3.486274255305341e-05, - "loss": 0.0267, + "epoch": 1.05, + "learning_rate": 0.00014178730709901442, + "loss": 0.0346, "step": 163420 }, { - "epoch": 1.77, - "learning_rate": 3.484651826854436e-05, - "loss": 0.0275, + "epoch": 1.05, + "learning_rate": 0.0001417776257446575, + "loss": 0.0435, "step": 163430 }, { - "epoch": 1.77, - "learning_rate": 3.48302939840353e-05, - "loss": 0.0277, + "epoch": 1.05, + "learning_rate": 0.00014176794439030058, + "loss": 0.04, "step": 163440 }, { - "epoch": 1.77, - "learning_rate": 3.481406969952625e-05, - "loss": 0.0265, + "epoch": 1.05, + "learning_rate": 0.00014175826303594363, + "loss": 0.0386, "step": 163450 }, { - "epoch": 1.77, - "learning_rate": 3.479784541501719e-05, - "loss": 0.0221, + "epoch": 1.06, + "learning_rate": 0.00014174858168158669, + "loss": 0.0358, "step": 163460 }, { - "epoch": 1.77, - "learning_rate": 3.478162113050814e-05, - "loss": 0.0268, + "epoch": 1.06, + "learning_rate": 0.00014173890032722977, + "loss": 0.0389, "step": 163470 }, { - "epoch": 1.77, - "learning_rate": 3.476539684599909e-05, - "loss": 0.0228, + "epoch": 1.06, + "learning_rate": 0.00014172921897287282, + "loss": 0.0333, "step": 163480 }, { - "epoch": 1.77, - "learning_rate": 3.4749172561490036e-05, - "loss": 0.0323, + "epoch": 1.06, + "learning_rate": 0.0001417195376185159, + "loss": 0.0359, "step": 163490 }, { - "epoch": 1.77, - "learning_rate": 3.4732948276980985e-05, - "loss": 0.0261, + "epoch": 1.06, + "learning_rate": 0.00014170985626415898, + "loss": 0.0337, "step": 163500 }, { - "epoch": 1.77, - "learning_rate": 3.471672399247193e-05, - "loss": 0.0274, + "epoch": 1.06, + "learning_rate": 0.00014170017490980206, + "loss": 0.0352, "step": 163510 }, { - "epoch": 1.77, - "learning_rate": 3.470049970796288e-05, - "loss": 0.0228, - "step": 163520 + "epoch": 1.06, + "learning_rate": 0.0001416904935554451, + "loss": 0.0351, + "step": 163520 }, { - "epoch": 1.77, - "learning_rate": 3.468427542345382e-05, - "loss": 0.0303, + "epoch": 1.06, + "learning_rate": 0.00014168081220108816, + "loss": 0.0414, "step": 163530 }, { - "epoch": 1.77, - "learning_rate": 3.466805113894477e-05, - "loss": 0.0254, + "epoch": 1.06, + "learning_rate": 0.00014167113084673124, + "loss": 0.0364, "step": 163540 }, { - "epoch": 1.77, - "learning_rate": 3.4651826854435714e-05, - "loss": 0.0237, + "epoch": 1.06, + "learning_rate": 0.0001416614494923743, + "loss": 0.0345, "step": 163550 }, { - "epoch": 1.77, - "learning_rate": 3.4635602569926664e-05, - "loss": 0.0278, + "epoch": 1.06, + "learning_rate": 0.00014165176813801738, + "loss": 0.0322, "step": 163560 }, { - "epoch": 1.77, - "learning_rate": 3.4619378285417614e-05, - "loss": 0.03, + "epoch": 1.06, + "learning_rate": 0.00014164208678366045, + "loss": 0.0313, "step": 163570 }, { - "epoch": 1.77, - "learning_rate": 3.4603154000908556e-05, - "loss": 0.0244, + "epoch": 1.06, + "learning_rate": 0.0001416324054293035, + "loss": 0.0355, "step": 163580 }, { - "epoch": 1.77, - "learning_rate": 3.4586929716399506e-05, - "loss": 0.0284, + "epoch": 1.06, + "learning_rate": 0.0001416227240749466, + "loss": 0.03, "step": 163590 }, { - "epoch": 1.77, - "learning_rate": 3.457070543189045e-05, - "loss": 0.0252, + "epoch": 1.06, + "learning_rate": 0.00014161304272058964, + "loss": 0.0314, "step": 163600 }, { - "epoch": 1.77, - "learning_rate": 3.45544811473814e-05, - "loss": 0.026, + "epoch": 1.06, + "learning_rate": 0.00014160336136623272, + "loss": 0.0329, "step": 163610 }, { - "epoch": 1.77, - "learning_rate": 3.453825686287234e-05, - "loss": 0.0257, + "epoch": 1.06, + "learning_rate": 0.00014159368001187577, + "loss": 0.0351, "step": 163620 }, { - "epoch": 1.77, - "learning_rate": 3.452203257836329e-05, - "loss": 0.024, + "epoch": 1.06, + "learning_rate": 0.00014158399865751885, + "loss": 0.0338, "step": 163630 }, { - "epoch": 1.77, - "learning_rate": 3.450580829385424e-05, - "loss": 0.0294, + "epoch": 1.06, + "learning_rate": 0.00014157431730316193, + "loss": 0.0323, "step": 163640 }, { - "epoch": 1.77, - "learning_rate": 3.4489584009345185e-05, - "loss": 0.0243, + "epoch": 1.06, + "learning_rate": 0.00014156463594880498, + "loss": 0.0297, "step": 163650 }, { - "epoch": 1.77, - "learning_rate": 3.4473359724836134e-05, - "loss": 0.0262, + "epoch": 1.06, + "learning_rate": 0.00014155495459444804, + "loss": 0.0349, "step": 163660 }, { - "epoch": 1.77, - "learning_rate": 3.445713544032708e-05, - "loss": 0.0326, + "epoch": 1.06, + "learning_rate": 0.00014154527324009112, + "loss": 0.0335, "step": 163670 }, { - "epoch": 1.77, - "learning_rate": 3.444091115581803e-05, - "loss": 0.0236, + "epoch": 1.06, + "learning_rate": 0.0001415355918857342, + "loss": 0.0342, "step": 163680 }, { - "epoch": 1.77, - "learning_rate": 3.442468687130897e-05, - "loss": 0.0275, + "epoch": 1.06, + "learning_rate": 0.00014152591053137725, + "loss": 0.0343, "step": 163690 }, { - "epoch": 1.77, - "learning_rate": 3.440846258679992e-05, - "loss": 0.0216, + "epoch": 1.06, + "learning_rate": 0.00014151622917702033, + "loss": 0.0293, "step": 163700 }, { - "epoch": 1.77, - "learning_rate": 3.439223830229086e-05, - "loss": 0.0261, + "epoch": 1.06, + "learning_rate": 0.0001415065478226634, + "loss": 0.036, "step": 163710 }, { - "epoch": 1.77, - "learning_rate": 3.437601401778181e-05, - "loss": 0.0219, + "epoch": 1.06, + "learning_rate": 0.00014149686646830646, + "loss": 0.0393, "step": 163720 }, { - "epoch": 1.77, - "learning_rate": 3.435978973327276e-05, - "loss": 0.0248, + "epoch": 1.06, + "learning_rate": 0.00014148718511394951, + "loss": 0.0341, "step": 163730 }, { - "epoch": 1.77, - "learning_rate": 3.4343565448763705e-05, - "loss": 0.026, + "epoch": 1.06, + "learning_rate": 0.0001414775037595926, + "loss": 0.0314, "step": 163740 }, { - "epoch": 1.77, - "learning_rate": 3.4327341164254655e-05, - "loss": 0.0267, + "epoch": 1.06, + "learning_rate": 0.00014146782240523567, + "loss": 0.038, "step": 163750 }, { - "epoch": 1.77, - "learning_rate": 3.43111168797456e-05, - "loss": 0.0233, + "epoch": 1.06, + "learning_rate": 0.00014145814105087873, + "loss": 0.0321, "step": 163760 }, { - "epoch": 1.77, - "learning_rate": 3.429489259523655e-05, - "loss": 0.0231, + "epoch": 1.06, + "learning_rate": 0.0001414484596965218, + "loss": 0.0301, "step": 163770 }, { - "epoch": 1.77, - "learning_rate": 3.427866831072749e-05, - "loss": 0.0281, + "epoch": 1.06, + "learning_rate": 0.00014143877834216486, + "loss": 0.0351, "step": 163780 }, { - "epoch": 1.77, - "learning_rate": 3.426244402621844e-05, - "loss": 0.0254, + "epoch": 1.06, + "learning_rate": 0.00014142909698780794, + "loss": 0.0356, "step": 163790 }, { - "epoch": 1.77, - "learning_rate": 3.4246219741709384e-05, - "loss": 0.0266, + "epoch": 1.06, + "learning_rate": 0.000141419415633451, + "loss": 0.0372, "step": 163800 }, { - "epoch": 1.77, - "learning_rate": 3.4229995457200333e-05, - "loss": 0.0257, + "epoch": 1.06, + "learning_rate": 0.00014140973427909407, + "loss": 0.0401, "step": 163810 }, { - "epoch": 1.77, - "learning_rate": 3.421377117269128e-05, - "loss": 0.0273, + "epoch": 1.06, + "learning_rate": 0.00014140005292473715, + "loss": 0.0363, "step": 163820 }, { - "epoch": 1.77, - "learning_rate": 3.4197546888182226e-05, - "loss": 0.0246, + "epoch": 1.06, + "learning_rate": 0.0001413903715703802, + "loss": 0.0398, "step": 163830 }, { - "epoch": 1.77, - "learning_rate": 3.4181322603673176e-05, - "loss": 0.0282, + "epoch": 1.06, + "learning_rate": 0.00014138069021602328, + "loss": 0.0307, "step": 163840 }, { - "epoch": 1.77, - "learning_rate": 3.416509831916412e-05, - "loss": 0.029, + "epoch": 1.06, + "learning_rate": 0.00014137100886166634, + "loss": 0.0351, "step": 163850 }, { - "epoch": 1.77, - "learning_rate": 3.414887403465507e-05, - "loss": 0.0239, + "epoch": 1.06, + "learning_rate": 0.0001413613275073094, + "loss": 0.0325, "step": 163860 }, { - "epoch": 1.77, - "learning_rate": 3.413264975014601e-05, - "loss": 0.0259, + "epoch": 1.06, + "learning_rate": 0.00014135164615295247, + "loss": 0.0356, "step": 163870 }, { - "epoch": 1.77, - "learning_rate": 3.411642546563696e-05, - "loss": 0.0296, + "epoch": 1.06, + "learning_rate": 0.00014134196479859555, + "loss": 0.032, "step": 163880 }, { - "epoch": 1.77, - "learning_rate": 3.4100201181127905e-05, - "loss": 0.0238, + "epoch": 1.06, + "learning_rate": 0.00014133228344423863, + "loss": 0.0332, "step": 163890 }, { - "epoch": 1.77, - "learning_rate": 3.4083976896618854e-05, - "loss": 0.0332, + "epoch": 1.06, + "learning_rate": 0.00014132260208988168, + "loss": 0.0274, "step": 163900 }, { - "epoch": 1.77, - "learning_rate": 3.4067752612109804e-05, - "loss": 0.0224, + "epoch": 1.06, + "learning_rate": 0.00014131292073552476, + "loss": 0.0346, "step": 163910 }, { - "epoch": 1.77, - "learning_rate": 3.405152832760075e-05, - "loss": 0.0196, + "epoch": 1.06, + "learning_rate": 0.00014130323938116781, + "loss": 0.0489, "step": 163920 }, { - "epoch": 1.77, - "learning_rate": 3.40353040430917e-05, - "loss": 0.0249, + "epoch": 1.06, + "learning_rate": 0.00014129355802681087, + "loss": 0.0384, "step": 163930 }, { - "epoch": 1.77, - "learning_rate": 3.401907975858264e-05, - "loss": 0.028, + "epoch": 1.06, + "learning_rate": 0.00014128387667245395, + "loss": 0.0361, "step": 163940 }, { - "epoch": 1.77, - "learning_rate": 3.400285547407359e-05, - "loss": 0.0245, + "epoch": 1.06, + "learning_rate": 0.00014127419531809703, + "loss": 0.0387, "step": 163950 }, { - "epoch": 1.77, - "learning_rate": 3.398663118956453e-05, - "loss": 0.0234, + "epoch": 1.06, + "learning_rate": 0.0001412645139637401, + "loss": 0.0358, "step": 163960 }, { - "epoch": 1.77, - "learning_rate": 3.397040690505549e-05, - "loss": 0.0263, + "epoch": 1.06, + "learning_rate": 0.00014125483260938316, + "loss": 0.035, "step": 163970 }, { - "epoch": 1.77, - "learning_rate": 3.395418262054643e-05, - "loss": 0.0284, + "epoch": 1.06, + "learning_rate": 0.0001412451512550262, + "loss": 0.0431, "step": 163980 }, { - "epoch": 1.77, - "learning_rate": 3.393795833603738e-05, - "loss": 0.0216, + "epoch": 1.06, + "learning_rate": 0.0001412354699006693, + "loss": 0.0316, "step": 163990 }, { - "epoch": 1.77, - "learning_rate": 3.3921734051528325e-05, - "loss": 0.0242, + "epoch": 1.06, + "learning_rate": 0.00014122578854631234, + "loss": 0.0329, "step": 164000 }, { - "epoch": 1.77, - "eval_cer": 0.9211543252741894, - "eval_loss": 0.021158745512366295, - "eval_runtime": 118.9895, - "eval_samples_per_second": 16.808, - "eval_steps_per_second": 4.202, + "epoch": 1.06, + "eval_cer": 0.9199502881030392, + "eval_loss": 0.024694031104445457, + "eval_runtime": 120.2156, + "eval_samples_per_second": 16.637, + "eval_steps_per_second": 4.159, "step": 164000 }, { - "epoch": 1.77, - "learning_rate": 3.3905509767019275e-05, - "loss": 0.0242, + "epoch": 1.06, + "learning_rate": 0.00014121610719195542, + "loss": 0.0348, "step": 164010 }, { - "epoch": 1.77, - "learning_rate": 3.388928548251022e-05, - "loss": 0.0333, + "epoch": 1.06, + "learning_rate": 0.0001412064258375985, + "loss": 0.0334, "step": 164020 }, { - "epoch": 1.77, - "learning_rate": 3.387306119800117e-05, - "loss": 0.0303, + "epoch": 1.06, + "learning_rate": 0.00014119674448324156, + "loss": 0.0377, "step": 164030 }, { - "epoch": 1.77, - "learning_rate": 3.385683691349211e-05, - "loss": 0.024, + "epoch": 1.06, + "learning_rate": 0.00014118706312888464, + "loss": 0.033, "step": 164040 }, { - "epoch": 1.77, - "learning_rate": 3.384061262898306e-05, - "loss": 0.025, + "epoch": 1.06, + "learning_rate": 0.0001411773817745277, + "loss": 0.0391, "step": 164050 }, { - "epoch": 1.77, - "learning_rate": 3.382438834447401e-05, - "loss": 0.0208, + "epoch": 1.06, + "learning_rate": 0.00014116770042017077, + "loss": 0.0366, "step": 164060 }, { - "epoch": 1.77, - "learning_rate": 3.380816405996495e-05, - "loss": 0.0354, + "epoch": 1.06, + "learning_rate": 0.00014115801906581382, + "loss": 0.0321, "step": 164070 }, { - "epoch": 1.77, - "learning_rate": 3.37919397754559e-05, - "loss": 0.0261, + "epoch": 1.06, + "learning_rate": 0.0001411483377114569, + "loss": 0.0377, "step": 164080 }, { - "epoch": 1.77, - "learning_rate": 3.3775715490946846e-05, - "loss": 0.0259, + "epoch": 1.06, + "learning_rate": 0.00014113865635709998, + "loss": 0.034, "step": 164090 }, { - "epoch": 1.77, - "learning_rate": 3.3759491206437795e-05, - "loss": 0.0307, + "epoch": 1.06, + "learning_rate": 0.00014112897500274303, + "loss": 0.0352, "step": 164100 }, { - "epoch": 1.78, - "learning_rate": 3.374326692192874e-05, - "loss": 0.0224, + "epoch": 1.06, + "learning_rate": 0.0001411192936483861, + "loss": 0.0418, "step": 164110 }, { - "epoch": 1.78, - "learning_rate": 3.372704263741969e-05, - "loss": 0.0226, + "epoch": 1.06, + "learning_rate": 0.00014110961229402917, + "loss": 0.032, "step": 164120 }, { - "epoch": 1.78, - "learning_rate": 3.371081835291063e-05, - "loss": 0.0211, + "epoch": 1.06, + "learning_rate": 0.00014109993093967225, + "loss": 0.0336, "step": 164130 }, { - "epoch": 1.78, - "learning_rate": 3.369459406840158e-05, - "loss": 0.0252, + "epoch": 1.06, + "learning_rate": 0.0001410902495853153, + "loss": 0.0342, "step": 164140 }, { - "epoch": 1.78, - "learning_rate": 3.367836978389253e-05, - "loss": 0.0262, + "epoch": 1.06, + "learning_rate": 0.00014108056823095838, + "loss": 0.0324, "step": 164150 }, { - "epoch": 1.78, - "learning_rate": 3.3662145499383474e-05, - "loss": 0.0233, + "epoch": 1.06, + "learning_rate": 0.00014107088687660146, + "loss": 0.0336, "step": 164160 }, { - "epoch": 1.78, - "learning_rate": 3.3645921214874424e-05, - "loss": 0.0217, + "epoch": 1.06, + "learning_rate": 0.0001410612055222445, + "loss": 0.0289, "step": 164170 }, { - "epoch": 1.78, - "learning_rate": 3.3629696930365367e-05, - "loss": 0.0298, + "epoch": 1.06, + "learning_rate": 0.00014105152416788756, + "loss": 0.0342, "step": 164180 }, { - "epoch": 1.78, - "learning_rate": 3.3613472645856316e-05, - "loss": 0.0233, + "epoch": 1.06, + "learning_rate": 0.00014104184281353064, + "loss": 0.0363, "step": 164190 }, { - "epoch": 1.78, - "learning_rate": 3.359724836134726e-05, - "loss": 0.0332, + "epoch": 1.06, + "learning_rate": 0.00014103216145917372, + "loss": 0.034, "step": 164200 }, { - "epoch": 1.78, - "learning_rate": 3.358102407683821e-05, - "loss": 0.0236, + "epoch": 1.06, + "learning_rate": 0.00014102248010481678, + "loss": 0.0322, "step": 164210 }, { - "epoch": 1.78, - "learning_rate": 3.356479979232916e-05, - "loss": 0.0267, + "epoch": 1.06, + "learning_rate": 0.00014101279875045986, + "loss": 0.0305, "step": 164220 }, { - "epoch": 1.78, - "learning_rate": 3.35485755078201e-05, - "loss": 0.0243, + "epoch": 1.06, + "learning_rate": 0.0001410031173961029, + "loss": 0.0365, "step": 164230 }, { - "epoch": 1.78, - "learning_rate": 3.353235122331105e-05, - "loss": 0.0274, + "epoch": 1.06, + "learning_rate": 0.000140993436041746, + "loss": 0.0333, "step": 164240 }, { - "epoch": 1.78, - "learning_rate": 3.3516126938801995e-05, - "loss": 0.0222, + "epoch": 1.06, + "learning_rate": 0.00014098375468738904, + "loss": 0.0355, "step": 164250 }, { - "epoch": 1.78, - "learning_rate": 3.3499902654292944e-05, - "loss": 0.0252, + "epoch": 1.06, + "learning_rate": 0.00014097407333303212, + "loss": 0.0353, "step": 164260 }, { - "epoch": 1.78, - "learning_rate": 3.348367836978389e-05, - "loss": 0.027, + "epoch": 1.06, + "learning_rate": 0.0001409643919786752, + "loss": 0.034, "step": 164270 }, { - "epoch": 1.78, - "learning_rate": 3.346745408527484e-05, - "loss": 0.0248, + "epoch": 1.06, + "learning_rate": 0.00014095471062431825, + "loss": 0.0327, "step": 164280 }, { - "epoch": 1.78, - "learning_rate": 3.345122980076578e-05, - "loss": 0.0293, + "epoch": 1.06, + "learning_rate": 0.00014094502926996133, + "loss": 0.0326, "step": 164290 }, { - "epoch": 1.78, - "learning_rate": 3.343500551625673e-05, - "loss": 0.0242, + "epoch": 1.06, + "learning_rate": 0.00014093534791560439, + "loss": 0.0334, "step": 164300 }, { - "epoch": 1.78, - "learning_rate": 3.341878123174768e-05, - "loss": 0.0228, + "epoch": 1.06, + "learning_rate": 0.00014092566656124746, + "loss": 0.0351, "step": 164310 }, { - "epoch": 1.78, - "learning_rate": 3.340255694723862e-05, - "loss": 0.0261, + "epoch": 1.06, + "learning_rate": 0.00014091598520689052, + "loss": 0.033, "step": 164320 }, { - "epoch": 1.78, - "learning_rate": 3.338633266272957e-05, - "loss": 0.0269, + "epoch": 1.06, + "learning_rate": 0.0001409063038525336, + "loss": 0.0319, "step": 164330 }, { - "epoch": 1.78, - "learning_rate": 3.3370108378220515e-05, - "loss": 0.0272, + "epoch": 1.06, + "learning_rate": 0.00014089662249817668, + "loss": 0.037, "step": 164340 }, { - "epoch": 1.78, - "learning_rate": 3.3353884093711465e-05, - "loss": 0.0257, + "epoch": 1.06, + "learning_rate": 0.00014088694114381973, + "loss": 0.0388, "step": 164350 }, { - "epoch": 1.78, - "learning_rate": 3.333765980920241e-05, - "loss": 0.0189, + "epoch": 1.06, + "learning_rate": 0.0001408772597894628, + "loss": 0.0339, "step": 164360 }, { - "epoch": 1.78, - "learning_rate": 3.332143552469336e-05, - "loss": 0.024, + "epoch": 1.06, + "learning_rate": 0.00014086757843510586, + "loss": 0.0359, "step": 164370 }, { - "epoch": 1.78, - "learning_rate": 3.33052112401843e-05, - "loss": 0.0255, + "epoch": 1.06, + "learning_rate": 0.00014085789708074894, + "loss": 0.0383, "step": 164380 }, { - "epoch": 1.78, - "learning_rate": 3.328898695567525e-05, - "loss": 0.0292, + "epoch": 1.06, + "learning_rate": 0.000140848215726392, + "loss": 0.0361, "step": 164390 }, { - "epoch": 1.78, - "learning_rate": 3.32727626711662e-05, - "loss": 0.0225, + "epoch": 1.06, + "learning_rate": 0.00014083853437203507, + "loss": 0.0302, "step": 164400 }, { - "epoch": 1.78, - "learning_rate": 3.3256538386657144e-05, - "loss": 0.0286, + "epoch": 1.06, + "learning_rate": 0.00014082885301767815, + "loss": 0.0361, "step": 164410 }, { - "epoch": 1.78, - "learning_rate": 3.324031410214809e-05, - "loss": 0.0209, + "epoch": 1.06, + "learning_rate": 0.0001408191716633212, + "loss": 0.0295, "step": 164420 }, { - "epoch": 1.78, - "learning_rate": 3.3224089817639036e-05, - "loss": 0.0288, + "epoch": 1.06, + "learning_rate": 0.0001408094903089643, + "loss": 0.0359, "step": 164430 }, { - "epoch": 1.78, - "learning_rate": 3.3207865533129986e-05, - "loss": 0.0239, + "epoch": 1.06, + "learning_rate": 0.00014079980895460734, + "loss": 0.034, "step": 164440 }, { - "epoch": 1.78, - "learning_rate": 3.319164124862093e-05, - "loss": 0.0275, + "epoch": 1.06, + "learning_rate": 0.00014079012760025042, + "loss": 0.0338, "step": 164450 }, { - "epoch": 1.78, - "learning_rate": 3.317541696411188e-05, - "loss": 0.0318, + "epoch": 1.06, + "learning_rate": 0.00014078044624589347, + "loss": 0.0343, "step": 164460 }, { - "epoch": 1.78, - "learning_rate": 3.315919267960282e-05, - "loss": 0.0264, + "epoch": 1.06, + "learning_rate": 0.00014077076489153655, + "loss": 0.0308, "step": 164470 }, { - "epoch": 1.78, - "learning_rate": 3.314296839509377e-05, - "loss": 0.0267, + "epoch": 1.06, + "learning_rate": 0.00014076108353717963, + "loss": 0.0335, "step": 164480 }, { - "epoch": 1.78, - "learning_rate": 3.312674411058472e-05, - "loss": 0.0274, + "epoch": 1.06, + "learning_rate": 0.00014075140218282268, + "loss": 0.0381, "step": 164490 }, { - "epoch": 1.78, - "learning_rate": 3.3110519826075664e-05, - "loss": 0.0254, + "epoch": 1.06, + "learning_rate": 0.00014074172082846574, + "loss": 0.031, "step": 164500 }, { - "epoch": 1.78, - "learning_rate": 3.3094295541566614e-05, - "loss": 0.028, + "epoch": 1.06, + "learning_rate": 0.00014073203947410882, + "loss": 0.0398, "step": 164510 }, { - "epoch": 1.78, - "learning_rate": 3.307807125705756e-05, - "loss": 0.0241, + "epoch": 1.06, + "learning_rate": 0.0001407223581197519, + "loss": 0.027, "step": 164520 }, { - "epoch": 1.78, - "learning_rate": 3.306184697254851e-05, - "loss": 0.0216, + "epoch": 1.06, + "learning_rate": 0.00014071267676539495, + "loss": 0.0364, "step": 164530 }, { - "epoch": 1.78, - "learning_rate": 3.304562268803945e-05, - "loss": 0.0241, + "epoch": 1.06, + "learning_rate": 0.00014070299541103803, + "loss": 0.0309, "step": 164540 }, { - "epoch": 1.78, - "learning_rate": 3.30293984035304e-05, - "loss": 0.0259, + "epoch": 1.06, + "learning_rate": 0.00014069331405668108, + "loss": 0.0321, "step": 164550 }, { - "epoch": 1.78, - "learning_rate": 3.301317411902135e-05, - "loss": 0.0256, + "epoch": 1.06, + "learning_rate": 0.00014068363270232416, + "loss": 0.0377, "step": 164560 }, { - "epoch": 1.78, - "learning_rate": 3.29969498345123e-05, - "loss": 0.0239, + "epoch": 1.06, + "learning_rate": 0.00014067395134796721, + "loss": 0.0385, "step": 164570 }, { - "epoch": 1.78, - "learning_rate": 3.298072555000324e-05, - "loss": 0.0227, + "epoch": 1.06, + "learning_rate": 0.0001406642699936103, + "loss": 0.0328, "step": 164580 }, { - "epoch": 1.78, - "learning_rate": 3.296450126549419e-05, - "loss": 0.0278, + "epoch": 1.06, + "learning_rate": 0.00014065458863925337, + "loss": 0.039, "step": 164590 }, { - "epoch": 1.78, - "learning_rate": 3.2948276980985135e-05, - "loss": 0.0295, + "epoch": 1.06, + "learning_rate": 0.00014064490728489643, + "loss": 0.0303, "step": 164600 }, { - "epoch": 1.78, - "learning_rate": 3.2932052696476085e-05, - "loss": 0.0271, + "epoch": 1.06, + "learning_rate": 0.0001406352259305395, + "loss": 0.0351, "step": 164610 }, { - "epoch": 1.78, - "learning_rate": 3.291582841196703e-05, - "loss": 0.0263, + "epoch": 1.06, + "learning_rate": 0.00014062554457618256, + "loss": 0.0317, "step": 164620 }, { - "epoch": 1.78, - "learning_rate": 3.289960412745798e-05, - "loss": 0.0241, + "epoch": 1.06, + "learning_rate": 0.00014061586322182564, + "loss": 0.0399, "step": 164630 }, { - "epoch": 1.78, - "learning_rate": 3.288337984294893e-05, - "loss": 0.0234, + "epoch": 1.06, + "learning_rate": 0.0001406061818674687, + "loss": 0.0332, "step": 164640 }, { - "epoch": 1.78, - "learning_rate": 3.286715555843987e-05, - "loss": 0.0256, + "epoch": 1.06, + "learning_rate": 0.00014059650051311177, + "loss": 0.0331, "step": 164650 }, { - "epoch": 1.78, - "learning_rate": 3.285093127393082e-05, - "loss": 0.0291, + "epoch": 1.06, + "learning_rate": 0.00014058681915875485, + "loss": 0.0324, "step": 164660 }, { - "epoch": 1.78, - "learning_rate": 3.283470698942176e-05, - "loss": 0.03, + "epoch": 1.06, + "learning_rate": 0.0001405771378043979, + "loss": 0.0368, "step": 164670 }, { - "epoch": 1.78, - "learning_rate": 3.281848270491271e-05, - "loss": 0.0225, + "epoch": 1.06, + "learning_rate": 0.00014056745645004098, + "loss": 0.0343, "step": 164680 }, { - "epoch": 1.78, - "learning_rate": 3.2802258420403656e-05, - "loss": 0.0265, + "epoch": 1.06, + "learning_rate": 0.00014055777509568404, + "loss": 0.031, "step": 164690 }, { - "epoch": 1.78, - "learning_rate": 3.2786034135894606e-05, - "loss": 0.0234, + "epoch": 1.06, + "learning_rate": 0.0001405480937413271, + "loss": 0.0325, "step": 164700 }, { - "epoch": 1.78, - "learning_rate": 3.2769809851385555e-05, - "loss": 0.0303, + "epoch": 1.06, + "learning_rate": 0.00014053841238697017, + "loss": 0.032, "step": 164710 }, { - "epoch": 1.78, - "learning_rate": 3.27535855668765e-05, - "loss": 0.0254, + "epoch": 1.06, + "learning_rate": 0.00014052873103261325, + "loss": 0.0392, "step": 164720 }, { - "epoch": 1.78, - "learning_rate": 3.273736128236745e-05, - "loss": 0.0207, + "epoch": 1.06, + "learning_rate": 0.00014051904967825633, + "loss": 0.0345, "step": 164730 }, { - "epoch": 1.78, - "learning_rate": 3.272113699785839e-05, - "loss": 0.0235, + "epoch": 1.06, + "learning_rate": 0.00014050936832389938, + "loss": 0.0394, "step": 164740 }, { - "epoch": 1.78, - "learning_rate": 3.270491271334934e-05, - "loss": 0.0238, + "epoch": 1.06, + "learning_rate": 0.00014049968696954243, + "loss": 0.0337, "step": 164750 }, { - "epoch": 1.78, - "learning_rate": 3.2688688428840284e-05, - "loss": 0.0314, + "epoch": 1.06, + "learning_rate": 0.0001404900056151855, + "loss": 0.039, "step": 164760 }, { - "epoch": 1.78, - "learning_rate": 3.2672464144331234e-05, - "loss": 0.027, + "epoch": 1.06, + "learning_rate": 0.00014048032426082857, + "loss": 0.0311, "step": 164770 }, { - "epoch": 1.78, - "learning_rate": 3.2656239859822177e-05, - "loss": 0.0296, + "epoch": 1.06, + "learning_rate": 0.00014047064290647165, + "loss": 0.0383, "step": 164780 }, { - "epoch": 1.78, - "learning_rate": 3.2640015575313126e-05, - "loss": 0.0248, - "step": 164790 + "epoch": 1.06, + "learning_rate": 0.00014046096155211473, + "loss": 0.0358, + "step": 164790 }, { - "epoch": 1.78, - "learning_rate": 3.2623791290804076e-05, - "loss": 0.0193, + "epoch": 1.06, + "learning_rate": 0.0001404512801977578, + "loss": 0.0366, "step": 164800 }, { - "epoch": 1.78, - "learning_rate": 3.260756700629502e-05, - "loss": 0.026, + "epoch": 1.06, + "learning_rate": 0.00014044159884340086, + "loss": 0.038, "step": 164810 }, { - "epoch": 1.78, - "learning_rate": 3.259134272178597e-05, - "loss": 0.0229, + "epoch": 1.06, + "learning_rate": 0.0001404319174890439, + "loss": 0.0387, "step": 164820 }, { - "epoch": 1.78, - "learning_rate": 3.257511843727691e-05, - "loss": 0.0252, + "epoch": 1.06, + "learning_rate": 0.000140422236134687, + "loss": 0.0398, "step": 164830 }, { - "epoch": 1.78, - "learning_rate": 3.255889415276786e-05, - "loss": 0.025, + "epoch": 1.06, + "learning_rate": 0.00014041255478033004, + "loss": 0.0356, "step": 164840 }, { - "epoch": 1.78, - "learning_rate": 3.2542669868258805e-05, - "loss": 0.0264, + "epoch": 1.06, + "learning_rate": 0.00014040287342597312, + "loss": 0.0333, "step": 164850 }, { - "epoch": 1.78, - "learning_rate": 3.2526445583749754e-05, - "loss": 0.0265, + "epoch": 1.06, + "learning_rate": 0.0001403931920716162, + "loss": 0.0345, "step": 164860 }, { - "epoch": 1.78, - "learning_rate": 3.25102212992407e-05, - "loss": 0.0225, + "epoch": 1.06, + "learning_rate": 0.00014038351071725926, + "loss": 0.0332, "step": 164870 }, { - "epoch": 1.78, - "learning_rate": 3.249399701473165e-05, - "loss": 0.0243, + "epoch": 1.06, + "learning_rate": 0.00014037382936290234, + "loss": 0.0325, "step": 164880 }, { - "epoch": 1.78, - "learning_rate": 3.24777727302226e-05, - "loss": 0.0287, + "epoch": 1.06, + "learning_rate": 0.0001403641480085454, + "loss": 0.0351, "step": 164890 }, { - "epoch": 1.78, - "learning_rate": 3.246154844571354e-05, - "loss": 0.0246, + "epoch": 1.06, + "learning_rate": 0.00014035446665418847, + "loss": 0.0366, "step": 164900 }, { - "epoch": 1.78, - "learning_rate": 3.244532416120449e-05, - "loss": 0.0223, + "epoch": 1.06, + "learning_rate": 0.00014034478529983152, + "loss": 0.0342, "step": 164910 }, { - "epoch": 1.78, - "learning_rate": 3.242909987669543e-05, - "loss": 0.0287, + "epoch": 1.06, + "learning_rate": 0.0001403351039454746, + "loss": 0.045, "step": 164920 }, { - "epoch": 1.78, - "learning_rate": 3.241287559218638e-05, - "loss": 0.0258, + "epoch": 1.06, + "learning_rate": 0.00014032542259111768, + "loss": 0.0308, "step": 164930 }, { - "epoch": 1.78, - "learning_rate": 3.2396651307677326e-05, - "loss": 0.0206, + "epoch": 1.06, + "learning_rate": 0.00014031574123676073, + "loss": 0.0359, "step": 164940 }, { - "epoch": 1.78, - "learning_rate": 3.2380427023168275e-05, - "loss": 0.0218, + "epoch": 1.06, + "learning_rate": 0.00014030605988240379, + "loss": 0.0403, "step": 164950 }, { - "epoch": 1.78, - "learning_rate": 3.236420273865922e-05, - "loss": 0.026, + "epoch": 1.06, + "learning_rate": 0.00014029637852804687, + "loss": 0.0343, "step": 164960 }, { - "epoch": 1.78, - "learning_rate": 3.234797845415017e-05, - "loss": 0.0292, + "epoch": 1.06, + "learning_rate": 0.00014028669717368995, + "loss": 0.0327, "step": 164970 }, { - "epoch": 1.78, - "learning_rate": 3.233175416964112e-05, - "loss": 0.0252, + "epoch": 1.06, + "learning_rate": 0.000140277015819333, + "loss": 0.0405, "step": 164980 }, { - "epoch": 1.78, - "learning_rate": 3.231552988513206e-05, - "loss": 0.0235, + "epoch": 1.06, + "learning_rate": 0.00014026733446497608, + "loss": 0.038, "step": 164990 }, { - "epoch": 1.78, - "learning_rate": 3.229930560062301e-05, - "loss": 0.0247, + "epoch": 1.06, + "learning_rate": 0.00014025765311061916, + "loss": 0.0393, "step": 165000 }, { - "epoch": 1.78, - "eval_cer": 0.9210818795598834, - "eval_loss": 0.021122341975569725, - "eval_runtime": 119.0675, - "eval_samples_per_second": 16.797, - "eval_steps_per_second": 4.199, + "epoch": 1.06, + "eval_cer": 0.9198345949610214, + "eval_loss": 0.02478347346186638, + "eval_runtime": 120.113, + "eval_samples_per_second": 16.651, + "eval_steps_per_second": 4.163, "step": 165000 }, { - "epoch": 1.78, - "learning_rate": 3.2283081316113954e-05, - "loss": 0.0243, + "epoch": 1.07, + "learning_rate": 0.0001402479717562622, + "loss": 0.0324, "step": 165010 }, { - "epoch": 1.78, - "learning_rate": 3.22668570316049e-05, - "loss": 0.0312, + "epoch": 1.07, + "learning_rate": 0.00014023829040190526, + "loss": 0.0342, "step": 165020 }, { - "epoch": 1.78, - "learning_rate": 3.2250632747095846e-05, - "loss": 0.0242, + "epoch": 1.07, + "learning_rate": 0.00014022860904754834, + "loss": 0.0368, "step": 165030 }, { - "epoch": 1.79, - "learning_rate": 3.2234408462586796e-05, - "loss": 0.0296, + "epoch": 1.07, + "learning_rate": 0.00014021892769319142, + "loss": 0.0332, "step": 165040 }, { - "epoch": 1.79, - "learning_rate": 3.2218184178077746e-05, - "loss": 0.033, + "epoch": 1.07, + "learning_rate": 0.00014020924633883448, + "loss": 0.0415, "step": 165050 }, { - "epoch": 1.79, - "learning_rate": 3.220195989356869e-05, - "loss": 0.025, + "epoch": 1.07, + "learning_rate": 0.00014019956498447755, + "loss": 0.0358, "step": 165060 }, { - "epoch": 1.79, - "learning_rate": 3.218573560905964e-05, - "loss": 0.0257, + "epoch": 1.07, + "learning_rate": 0.0001401898836301206, + "loss": 0.0396, "step": 165070 }, { - "epoch": 1.79, - "learning_rate": 3.216951132455058e-05, - "loss": 0.0309, + "epoch": 1.07, + "learning_rate": 0.0001401802022757637, + "loss": 0.0321, "step": 165080 }, { - "epoch": 1.79, - "learning_rate": 3.215328704004153e-05, - "loss": 0.0229, + "epoch": 1.07, + "learning_rate": 0.00014017052092140674, + "loss": 0.035, "step": 165090 }, { - "epoch": 1.79, - "learning_rate": 3.2137062755532474e-05, - "loss": 0.0293, + "epoch": 1.07, + "learning_rate": 0.00014016083956704982, + "loss": 0.0384, "step": 165100 }, { - "epoch": 1.79, - "learning_rate": 3.2120838471023424e-05, - "loss": 0.0219, + "epoch": 1.07, + "learning_rate": 0.0001401511582126929, + "loss": 0.0346, "step": 165110 }, { - "epoch": 1.79, - "learning_rate": 3.210461418651437e-05, - "loss": 0.0227, + "epoch": 1.07, + "learning_rate": 0.00014014147685833595, + "loss": 0.0337, "step": 165120 }, { - "epoch": 1.79, - "learning_rate": 3.208838990200532e-05, - "loss": 0.0218, + "epoch": 1.07, + "learning_rate": 0.00014013179550397903, + "loss": 0.0328, "step": 165130 }, { - "epoch": 1.79, - "learning_rate": 3.207216561749627e-05, - "loss": 0.0275, + "epoch": 1.07, + "learning_rate": 0.00014012211414962208, + "loss": 0.0376, "step": 165140 }, { - "epoch": 1.79, - "learning_rate": 3.2055941332987216e-05, - "loss": 0.0229, + "epoch": 1.07, + "learning_rate": 0.00014011243279526516, + "loss": 0.0354, "step": 165150 }, { - "epoch": 1.79, - "learning_rate": 3.203971704847816e-05, - "loss": 0.0249, + "epoch": 1.07, + "learning_rate": 0.00014010275144090822, + "loss": 0.036, "step": 165160 }, { - "epoch": 1.79, - "learning_rate": 3.202349276396911e-05, - "loss": 0.0285, + "epoch": 1.07, + "learning_rate": 0.0001400930700865513, + "loss": 0.0384, "step": 165170 }, { - "epoch": 1.79, - "learning_rate": 3.200726847946005e-05, - "loss": 0.0241, + "epoch": 1.07, + "learning_rate": 0.00014008338873219438, + "loss": 0.0339, "step": 165180 }, { - "epoch": 1.79, - "learning_rate": 3.1991044194951e-05, - "loss": 0.0239, + "epoch": 1.07, + "learning_rate": 0.00014007370737783743, + "loss": 0.0332, "step": 165190 }, { - "epoch": 1.79, - "learning_rate": 3.1974819910441945e-05, - "loss": 0.0253, + "epoch": 1.07, + "learning_rate": 0.0001400640260234805, + "loss": 0.0332, "step": 165200 }, { - "epoch": 1.79, - "learning_rate": 3.1958595625932895e-05, - "loss": 0.0294, + "epoch": 1.07, + "learning_rate": 0.00014005434466912356, + "loss": 0.0406, "step": 165210 }, { - "epoch": 1.79, - "learning_rate": 3.1942371341423845e-05, - "loss": 0.0296, + "epoch": 1.07, + "learning_rate": 0.00014004466331476664, + "loss": 0.0298, "step": 165220 }, { - "epoch": 1.79, - "learning_rate": 3.192614705691479e-05, - "loss": 0.0221, + "epoch": 1.07, + "learning_rate": 0.0001400349819604097, + "loss": 0.0386, "step": 165230 }, { - "epoch": 1.79, - "learning_rate": 3.190992277240574e-05, - "loss": 0.0217, + "epoch": 1.07, + "learning_rate": 0.00014002530060605277, + "loss": 0.0405, "step": 165240 }, { - "epoch": 1.79, - "learning_rate": 3.189369848789668e-05, - "loss": 0.0283, + "epoch": 1.07, + "learning_rate": 0.00014001561925169585, + "loss": 0.0315, "step": 165250 }, { - "epoch": 1.79, - "learning_rate": 3.187747420338763e-05, - "loss": 0.0254, + "epoch": 1.07, + "learning_rate": 0.0001400059378973389, + "loss": 0.0343, "step": 165260 }, { - "epoch": 1.79, - "learning_rate": 3.186124991887857e-05, - "loss": 0.0248, + "epoch": 1.07, + "learning_rate": 0.00013999625654298196, + "loss": 0.0331, "step": 165270 }, { - "epoch": 1.79, - "learning_rate": 3.184502563436952e-05, - "loss": 0.0284, + "epoch": 1.07, + "learning_rate": 0.00013998657518862504, + "loss": 0.0335, "step": 165280 }, { - "epoch": 1.79, - "learning_rate": 3.182880134986047e-05, - "loss": 0.0232, + "epoch": 1.07, + "learning_rate": 0.00013997689383426812, + "loss": 0.0327, "step": 165290 }, { - "epoch": 1.79, - "learning_rate": 3.1812577065351416e-05, - "loss": 0.0252, + "epoch": 1.07, + "learning_rate": 0.00013996721247991117, + "loss": 0.0336, "step": 165300 }, { - "epoch": 1.79, - "learning_rate": 3.1796352780842365e-05, - "loss": 0.0243, + "epoch": 1.07, + "learning_rate": 0.00013995753112555425, + "loss": 0.0289, "step": 165310 }, { - "epoch": 1.79, - "learning_rate": 3.178012849633331e-05, - "loss": 0.0239, + "epoch": 1.07, + "learning_rate": 0.00013994784977119733, + "loss": 0.0337, "step": 165320 }, { - "epoch": 1.79, - "learning_rate": 3.176390421182426e-05, - "loss": 0.0226, + "epoch": 1.07, + "learning_rate": 0.00013993816841684038, + "loss": 0.0315, "step": 165330 }, { - "epoch": 1.79, - "learning_rate": 3.17476799273152e-05, - "loss": 0.0245, + "epoch": 1.07, + "learning_rate": 0.00013992848706248344, + "loss": 0.0321, "step": 165340 }, { - "epoch": 1.79, - "learning_rate": 3.173145564280615e-05, - "loss": 0.0236, + "epoch": 1.07, + "learning_rate": 0.00013991880570812652, + "loss": 0.032, "step": 165350 }, { - "epoch": 1.79, - "learning_rate": 3.1715231358297094e-05, - "loss": 0.0302, + "epoch": 1.07, + "learning_rate": 0.0001399091243537696, + "loss": 0.0321, "step": 165360 }, { - "epoch": 1.79, - "learning_rate": 3.1699007073788044e-05, - "loss": 0.0288, + "epoch": 1.07, + "learning_rate": 0.00013989944299941265, + "loss": 0.041, "step": 165370 }, { - "epoch": 1.79, - "learning_rate": 3.1682782789278993e-05, - "loss": 0.0259, + "epoch": 1.07, + "learning_rate": 0.00013988976164505573, + "loss": 0.0325, "step": 165380 }, { - "epoch": 1.79, - "learning_rate": 3.1666558504769936e-05, - "loss": 0.026, + "epoch": 1.07, + "learning_rate": 0.00013988008029069878, + "loss": 0.0367, "step": 165390 }, { - "epoch": 1.79, - "learning_rate": 3.1650334220260886e-05, - "loss": 0.0271, + "epoch": 1.07, + "learning_rate": 0.00013987039893634186, + "loss": 0.0331, "step": 165400 }, { - "epoch": 1.79, - "learning_rate": 3.163410993575183e-05, - "loss": 0.0261, + "epoch": 1.07, + "learning_rate": 0.00013986071758198491, + "loss": 0.0361, "step": 165410 }, { - "epoch": 1.79, - "learning_rate": 3.161788565124278e-05, - "loss": 0.0265, + "epoch": 1.07, + "learning_rate": 0.000139851036227628, + "loss": 0.0335, "step": 165420 }, { - "epoch": 1.79, - "learning_rate": 3.160166136673372e-05, - "loss": 0.0266, + "epoch": 1.07, + "learning_rate": 0.00013984135487327107, + "loss": 0.0348, "step": 165430 }, { - "epoch": 1.79, - "learning_rate": 3.158543708222467e-05, - "loss": 0.0293, + "epoch": 1.07, + "learning_rate": 0.00013983167351891413, + "loss": 0.0336, "step": 165440 }, { - "epoch": 1.79, - "learning_rate": 3.1569212797715615e-05, - "loss": 0.0247, + "epoch": 1.07, + "learning_rate": 0.0001398219921645572, + "loss": 0.0376, "step": 165450 }, { - "epoch": 1.79, - "learning_rate": 3.1552988513206565e-05, - "loss": 0.0252, + "epoch": 1.07, + "learning_rate": 0.00013981231081020026, + "loss": 0.0304, "step": 165460 }, { - "epoch": 1.79, - "learning_rate": 3.1536764228697514e-05, - "loss": 0.0263, + "epoch": 1.07, + "learning_rate": 0.0001398026294558433, + "loss": 0.0325, "step": 165470 }, { - "epoch": 1.79, - "learning_rate": 3.152053994418846e-05, - "loss": 0.026, + "epoch": 1.07, + "learning_rate": 0.0001397929481014864, + "loss": 0.0334, "step": 165480 }, { - "epoch": 1.79, - "learning_rate": 3.150431565967941e-05, - "loss": 0.0227, + "epoch": 1.07, + "learning_rate": 0.00013978326674712947, + "loss": 0.0329, "step": 165490 }, { - "epoch": 1.79, - "learning_rate": 3.148809137517035e-05, - "loss": 0.0233, + "epoch": 1.07, + "learning_rate": 0.00013977358539277255, + "loss": 0.0343, "step": 165500 }, { - "epoch": 1.79, - "learning_rate": 3.14718670906613e-05, - "loss": 0.0231, + "epoch": 1.07, + "learning_rate": 0.0001397639040384156, + "loss": 0.0359, "step": 165510 }, { - "epoch": 1.79, - "learning_rate": 3.145564280615224e-05, - "loss": 0.0287, + "epoch": 1.07, + "learning_rate": 0.00013975422268405868, + "loss": 0.0354, "step": 165520 }, { - "epoch": 1.79, - "learning_rate": 3.143941852164319e-05, - "loss": 0.0214, + "epoch": 1.07, + "learning_rate": 0.00013974454132970174, + "loss": 0.0308, "step": 165530 }, { - "epoch": 1.79, - "learning_rate": 3.1423194237134136e-05, - "loss": 0.0257, + "epoch": 1.07, + "learning_rate": 0.0001397348599753448, + "loss": 0.0359, "step": 165540 }, { - "epoch": 1.79, - "learning_rate": 3.1406969952625085e-05, - "loss": 0.0281, + "epoch": 1.07, + "learning_rate": 0.00013972517862098787, + "loss": 0.0389, "step": 165550 }, { - "epoch": 1.79, - "learning_rate": 3.1390745668116035e-05, - "loss": 0.0301, + "epoch": 1.07, + "learning_rate": 0.00013971549726663095, + "loss": 0.0279, "step": 165560 }, { - "epoch": 1.79, - "learning_rate": 3.137452138360698e-05, - "loss": 0.0237, + "epoch": 1.07, + "learning_rate": 0.00013970581591227403, + "loss": 0.0295, "step": 165570 }, { - "epoch": 1.79, - "learning_rate": 3.135829709909793e-05, - "loss": 0.029, + "epoch": 1.07, + "learning_rate": 0.00013969613455791708, + "loss": 0.0285, "step": 165580 }, { - "epoch": 1.79, - "learning_rate": 3.134207281458887e-05, - "loss": 0.0241, + "epoch": 1.07, + "learning_rate": 0.00013968645320356013, + "loss": 0.0364, "step": 165590 }, { - "epoch": 1.79, - "learning_rate": 3.132584853007982e-05, - "loss": 0.0302, + "epoch": 1.07, + "learning_rate": 0.0001396767718492032, + "loss": 0.0274, "step": 165600 }, { - "epoch": 1.79, - "learning_rate": 3.1309624245570764e-05, - "loss": 0.0236, + "epoch": 1.07, + "learning_rate": 0.00013966709049484627, + "loss": 0.0344, "step": 165610 }, { - "epoch": 1.79, - "learning_rate": 3.1293399961061713e-05, - "loss": 0.0307, + "epoch": 1.07, + "learning_rate": 0.00013965740914048935, + "loss": 0.0304, "step": 165620 }, { - "epoch": 1.79, - "learning_rate": 3.127717567655266e-05, - "loss": 0.0224, + "epoch": 1.07, + "learning_rate": 0.00013964772778613243, + "loss": 0.0314, "step": 165630 }, { - "epoch": 1.79, - "learning_rate": 3.1260951392043606e-05, - "loss": 0.0262, + "epoch": 1.07, + "learning_rate": 0.00013963804643177548, + "loss": 0.0288, "step": 165640 }, { - "epoch": 1.79, - "learning_rate": 3.1244727107534556e-05, - "loss": 0.0245, + "epoch": 1.07, + "learning_rate": 0.00013962836507741856, + "loss": 0.0401, "step": 165650 }, { - "epoch": 1.79, - "learning_rate": 3.12285028230255e-05, - "loss": 0.0251, + "epoch": 1.07, + "learning_rate": 0.0001396186837230616, + "loss": 0.0314, "step": 165660 }, { - "epoch": 1.79, - "learning_rate": 3.121227853851645e-05, - "loss": 0.0304, + "epoch": 1.07, + "learning_rate": 0.0001396090023687047, + "loss": 0.0325, "step": 165670 }, { - "epoch": 1.79, - "learning_rate": 3.119605425400739e-05, - "loss": 0.0248, + "epoch": 1.07, + "learning_rate": 0.00013959932101434774, + "loss": 0.031, "step": 165680 }, { - "epoch": 1.79, - "learning_rate": 3.117982996949834e-05, - "loss": 0.0275, + "epoch": 1.07, + "learning_rate": 0.00013958963965999082, + "loss": 0.0371, "step": 165690 }, { - "epoch": 1.79, - "learning_rate": 3.1163605684989284e-05, - "loss": 0.0287, + "epoch": 1.07, + "learning_rate": 0.0001395799583056339, + "loss": 0.0367, "step": 165700 }, { - "epoch": 1.79, - "learning_rate": 3.1147381400480234e-05, - "loss": 0.0272, + "epoch": 1.07, + "learning_rate": 0.00013957027695127696, + "loss": 0.0376, "step": 165710 }, { - "epoch": 1.79, - "learning_rate": 3.1131157115971184e-05, - "loss": 0.0223, + "epoch": 1.07, + "learning_rate": 0.00013956059559692004, + "loss": 0.0356, "step": 165720 }, { - "epoch": 1.79, - "learning_rate": 3.1114932831462134e-05, - "loss": 0.023, + "epoch": 1.07, + "learning_rate": 0.0001395509142425631, + "loss": 0.0329, "step": 165730 }, { - "epoch": 1.79, - "learning_rate": 3.109870854695308e-05, - "loss": 0.0272, + "epoch": 1.07, + "learning_rate": 0.00013954123288820617, + "loss": 0.0365, "step": 165740 }, { - "epoch": 1.79, - "learning_rate": 3.1082484262444027e-05, - "loss": 0.0309, + "epoch": 1.07, + "learning_rate": 0.00013953155153384922, + "loss": 0.0436, "step": 165750 }, { - "epoch": 1.79, - "learning_rate": 3.106625997793497e-05, - "loss": 0.0188, + "epoch": 1.07, + "learning_rate": 0.0001395218701794923, + "loss": 0.0292, "step": 165760 }, { - "epoch": 1.79, - "learning_rate": 3.105003569342592e-05, - "loss": 0.0279, + "epoch": 1.07, + "learning_rate": 0.00013951218882513538, + "loss": 0.0336, "step": 165770 }, { - "epoch": 1.79, - "learning_rate": 3.103381140891687e-05, - "loss": 0.0221, + "epoch": 1.07, + "learning_rate": 0.00013950250747077843, + "loss": 0.0375, "step": 165780 }, { - "epoch": 1.79, - "learning_rate": 3.101758712440781e-05, - "loss": 0.0248, + "epoch": 1.07, + "learning_rate": 0.00013949282611642149, + "loss": 0.0303, "step": 165790 }, { - "epoch": 1.79, - "learning_rate": 3.100136283989876e-05, - "loss": 0.025, + "epoch": 1.07, + "learning_rate": 0.00013948314476206456, + "loss": 0.0289, "step": 165800 }, { - "epoch": 1.79, - "learning_rate": 3.0985138555389705e-05, - "loss": 0.024, + "epoch": 1.07, + "learning_rate": 0.00013947346340770764, + "loss": 0.0291, "step": 165810 }, { - "epoch": 1.79, - "learning_rate": 3.0968914270880655e-05, - "loss": 0.0275, + "epoch": 1.07, + "learning_rate": 0.0001394637820533507, + "loss": 0.0353, "step": 165820 }, { - "epoch": 1.79, - "learning_rate": 3.09526899863716e-05, - "loss": 0.0244, + "epoch": 1.07, + "learning_rate": 0.00013945410069899378, + "loss": 0.0315, "step": 165830 }, { - "epoch": 1.79, - "learning_rate": 3.093646570186255e-05, - "loss": 0.028, + "epoch": 1.07, + "learning_rate": 0.00013944441934463683, + "loss": 0.0369, "step": 165840 }, { - "epoch": 1.79, - "learning_rate": 3.092024141735349e-05, - "loss": 0.0239, + "epoch": 1.07, + "learning_rate": 0.0001394347379902799, + "loss": 0.0291, "step": 165850 }, { - "epoch": 1.79, - "learning_rate": 3.090401713284444e-05, - "loss": 0.027, + "epoch": 1.07, + "learning_rate": 0.00013942505663592296, + "loss": 0.0313, "step": 165860 }, { - "epoch": 1.79, - "learning_rate": 3.088779284833539e-05, - "loss": 0.0248, + "epoch": 1.07, + "learning_rate": 0.00013941537528156604, + "loss": 0.0317, "step": 165870 }, { - "epoch": 1.79, - "learning_rate": 3.087156856382633e-05, - "loss": 0.0253, + "epoch": 1.07, + "learning_rate": 0.00013940569392720912, + "loss": 0.0329, "step": 165880 }, { - "epoch": 1.79, - "learning_rate": 3.085534427931728e-05, - "loss": 0.0268, + "epoch": 1.07, + "learning_rate": 0.00013939601257285217, + "loss": 0.0367, "step": 165890 }, { - "epoch": 1.79, - "learning_rate": 3.0839119994808226e-05, - "loss": 0.0255, + "epoch": 1.07, + "learning_rate": 0.00013938633121849525, + "loss": 0.0344, "step": 165900 }, { - "epoch": 1.79, - "learning_rate": 3.0822895710299175e-05, - "loss": 0.0236, + "epoch": 1.07, + "learning_rate": 0.0001393766498641383, + "loss": 0.0281, "step": 165910 }, { - "epoch": 1.79, - "learning_rate": 3.080667142579012e-05, - "loss": 0.0259, + "epoch": 1.07, + "learning_rate": 0.0001393669685097814, + "loss": 0.0348, "step": 165920 }, { - "epoch": 1.79, - "learning_rate": 3.079044714128107e-05, - "loss": 0.0257, + "epoch": 1.07, + "learning_rate": 0.00013935728715542444, + "loss": 0.0336, "step": 165930 }, { - "epoch": 1.79, - "learning_rate": 3.077422285677201e-05, - "loss": 0.0232, + "epoch": 1.07, + "learning_rate": 0.00013934760580106752, + "loss": 0.0389, "step": 165940 }, { - "epoch": 1.79, - "learning_rate": 3.075799857226296e-05, - "loss": 0.0212, + "epoch": 1.07, + "learning_rate": 0.0001393379244467106, + "loss": 0.032, "step": 165950 }, { - "epoch": 1.8, - "learning_rate": 3.074177428775391e-05, - "loss": 0.0285, + "epoch": 1.07, + "learning_rate": 0.00013932824309235365, + "loss": 0.0386, "step": 165960 }, { - "epoch": 1.8, - "learning_rate": 3.0725550003244854e-05, - "loss": 0.027, + "epoch": 1.07, + "learning_rate": 0.00013931856173799673, + "loss": 0.0385, "step": 165970 }, { - "epoch": 1.8, - "learning_rate": 3.0709325718735804e-05, - "loss": 0.026, + "epoch": 1.07, + "learning_rate": 0.00013930888038363978, + "loss": 0.0404, "step": 165980 }, { - "epoch": 1.8, - "learning_rate": 3.0693101434226746e-05, - "loss": 0.023, + "epoch": 1.07, + "learning_rate": 0.00013929919902928286, + "loss": 0.0343, "step": 165990 }, { - "epoch": 1.8, - "learning_rate": 3.0676877149717696e-05, - "loss": 0.0227, + "epoch": 1.07, + "learning_rate": 0.00013928951767492592, + "loss": 0.0352, "step": 166000 }, { - "epoch": 1.8, - "eval_cer": 0.9210447732184097, - "eval_loss": 0.02108580619096756, - "eval_runtime": 119.0501, - "eval_samples_per_second": 16.8, - "eval_steps_per_second": 4.2, + "epoch": 1.07, + "eval_cer": 0.9198219410236131, + "eval_loss": 0.02429656684398651, + "eval_runtime": 120.1547, + "eval_samples_per_second": 16.645, + "eval_steps_per_second": 4.161, "step": 166000 }, { - "epoch": 1.8, - "learning_rate": 3.066065286520864e-05, - "loss": 0.0218, + "epoch": 1.07, + "learning_rate": 0.000139279836320569, + "loss": 0.0322, "step": 166010 }, { - "epoch": 1.8, - "learning_rate": 3.064442858069959e-05, - "loss": 0.0263, + "epoch": 1.07, + "learning_rate": 0.00013927015496621208, + "loss": 0.0341, "step": 166020 }, { - "epoch": 1.8, - "learning_rate": 3.062820429619053e-05, - "loss": 0.0217, + "epoch": 1.07, + "learning_rate": 0.00013926047361185513, + "loss": 0.0379, "step": 166030 }, { - "epoch": 1.8, - "learning_rate": 3.061198001168148e-05, - "loss": 0.0219, + "epoch": 1.07, + "learning_rate": 0.00013925079225749818, + "loss": 0.0401, "step": 166040 }, { - "epoch": 1.8, - "learning_rate": 3.059575572717243e-05, - "loss": 0.0253, + "epoch": 1.07, + "learning_rate": 0.00013924111090314126, + "loss": 0.0321, "step": 166050 }, { - "epoch": 1.8, - "learning_rate": 3.0579531442663375e-05, - "loss": 0.0324, + "epoch": 1.07, + "learning_rate": 0.00013923142954878434, + "loss": 0.0371, "step": 166060 }, { - "epoch": 1.8, - "learning_rate": 3.0563307158154324e-05, - "loss": 0.0241, + "epoch": 1.07, + "learning_rate": 0.0001392217481944274, + "loss": 0.0357, "step": 166070 }, { - "epoch": 1.8, - "learning_rate": 3.054708287364527e-05, - "loss": 0.031, + "epoch": 1.07, + "learning_rate": 0.00013921206684007047, + "loss": 0.033, "step": 166080 }, { - "epoch": 1.8, - "learning_rate": 3.053085858913622e-05, - "loss": 0.0271, + "epoch": 1.07, + "learning_rate": 0.00013920238548571355, + "loss": 0.0354, "step": 166090 }, { - "epoch": 1.8, - "learning_rate": 3.0514634304627163e-05, - "loss": 0.0234, + "epoch": 1.07, + "learning_rate": 0.0001391927041313566, + "loss": 0.0375, "step": 166100 }, { - "epoch": 1.8, - "learning_rate": 3.049841002011811e-05, - "loss": 0.0222, + "epoch": 1.07, + "learning_rate": 0.00013918302277699966, + "loss": 0.0396, "step": 166110 }, { - "epoch": 1.8, - "learning_rate": 3.0482185735609056e-05, - "loss": 0.0237, + "epoch": 1.07, + "learning_rate": 0.00013917334142264274, + "loss": 0.034, "step": 166120 }, { - "epoch": 1.8, - "learning_rate": 3.0465961451100003e-05, - "loss": 0.0303, + "epoch": 1.07, + "learning_rate": 0.00013916366006828582, + "loss": 0.0356, "step": 166130 }, { - "epoch": 1.8, - "learning_rate": 3.044973716659095e-05, - "loss": 0.0249, + "epoch": 1.07, + "learning_rate": 0.00013915397871392887, + "loss": 0.0329, "step": 166140 }, { - "epoch": 1.8, - "learning_rate": 3.0433512882081895e-05, - "loss": 0.0236, + "epoch": 1.07, + "learning_rate": 0.00013914429735957195, + "loss": 0.0275, "step": 166150 }, { - "epoch": 1.8, - "learning_rate": 3.0417288597572842e-05, - "loss": 0.0295, + "epoch": 1.07, + "learning_rate": 0.000139134616005215, + "loss": 0.0356, "step": 166160 }, { - "epoch": 1.8, - "learning_rate": 3.040106431306379e-05, - "loss": 0.0275, + "epoch": 1.07, + "learning_rate": 0.00013912493465085808, + "loss": 0.0338, "step": 166170 }, { - "epoch": 1.8, - "learning_rate": 3.0384840028554738e-05, - "loss": 0.0184, + "epoch": 1.07, + "learning_rate": 0.00013911525329650114, + "loss": 0.0357, "step": 166180 }, { - "epoch": 1.8, - "learning_rate": 3.0368615744045684e-05, - "loss": 0.0201, + "epoch": 1.07, + "learning_rate": 0.00013910557194214422, + "loss": 0.0349, "step": 166190 }, { - "epoch": 1.8, - "learning_rate": 3.035239145953663e-05, - "loss": 0.023, + "epoch": 1.07, + "learning_rate": 0.0001390958905877873, + "loss": 0.0367, "step": 166200 }, { - "epoch": 1.8, - "learning_rate": 3.0336167175027577e-05, - "loss": 0.0268, + "epoch": 1.07, + "learning_rate": 0.00013908620923343035, + "loss": 0.0328, "step": 166210 }, { - "epoch": 1.8, - "learning_rate": 3.0319942890518523e-05, - "loss": 0.0228, + "epoch": 1.07, + "learning_rate": 0.00013907652787907343, + "loss": 0.0365, "step": 166220 }, { - "epoch": 1.8, - "learning_rate": 3.030371860600947e-05, - "loss": 0.0257, + "epoch": 1.07, + "learning_rate": 0.00013906684652471648, + "loss": 0.0293, "step": 166230 }, { - "epoch": 1.8, - "learning_rate": 3.0287494321500416e-05, - "loss": 0.0282, + "epoch": 1.07, + "learning_rate": 0.00013905716517035953, + "loss": 0.0368, "step": 166240 }, { - "epoch": 1.8, - "learning_rate": 3.0271270036991366e-05, - "loss": 0.023, + "epoch": 1.07, + "learning_rate": 0.0001390474838160026, + "loss": 0.0335, "step": 166250 }, { - "epoch": 1.8, - "learning_rate": 3.0255045752482312e-05, - "loss": 0.0249, + "epoch": 1.07, + "learning_rate": 0.0001390378024616457, + "loss": 0.032, "step": 166260 }, { - "epoch": 1.8, - "learning_rate": 3.023882146797326e-05, - "loss": 0.0258, + "epoch": 1.07, + "learning_rate": 0.00013902812110728877, + "loss": 0.0345, "step": 166270 }, { - "epoch": 1.8, - "learning_rate": 3.0222597183464205e-05, - "loss": 0.0266, + "epoch": 1.07, + "learning_rate": 0.00013901843975293183, + "loss": 0.0338, "step": 166280 }, { - "epoch": 1.8, - "learning_rate": 3.020637289895515e-05, - "loss": 0.0275, + "epoch": 1.07, + "learning_rate": 0.0001390087583985749, + "loss": 0.0291, "step": 166290 }, { - "epoch": 1.8, - "learning_rate": 3.0190148614446098e-05, - "loss": 0.0229, + "epoch": 1.07, + "learning_rate": 0.00013899907704421796, + "loss": 0.0352, "step": 166300 }, { - "epoch": 1.8, - "learning_rate": 3.0173924329937044e-05, - "loss": 0.0244, + "epoch": 1.07, + "learning_rate": 0.000138989395689861, + "loss": 0.0365, "step": 166310 }, { - "epoch": 1.8, - "learning_rate": 3.0157700045427997e-05, - "loss": 0.0308, + "epoch": 1.07, + "learning_rate": 0.0001389797143355041, + "loss": 0.0347, "step": 166320 }, { - "epoch": 1.8, - "learning_rate": 3.0141475760918944e-05, - "loss": 0.0261, + "epoch": 1.07, + "learning_rate": 0.00013897003298114717, + "loss": 0.0336, "step": 166330 }, { - "epoch": 1.8, - "learning_rate": 3.012525147640989e-05, - "loss": 0.0341, + "epoch": 1.07, + "learning_rate": 0.00013896035162679025, + "loss": 0.0377, "step": 166340 }, { - "epoch": 1.8, - "learning_rate": 3.0109027191900837e-05, - "loss": 0.0216, + "epoch": 1.07, + "learning_rate": 0.0001389506702724333, + "loss": 0.0384, "step": 166350 }, { - "epoch": 1.8, - "learning_rate": 3.0092802907391783e-05, - "loss": 0.023, + "epoch": 1.07, + "learning_rate": 0.00013894098891807636, + "loss": 0.0386, "step": 166360 }, { - "epoch": 1.8, - "learning_rate": 3.007657862288273e-05, - "loss": 0.0263, + "epoch": 1.07, + "learning_rate": 0.00013893130756371944, + "loss": 0.0346, "step": 166370 }, { - "epoch": 1.8, - "learning_rate": 3.0060354338373676e-05, - "loss": 0.0251, + "epoch": 1.07, + "learning_rate": 0.0001389216262093625, + "loss": 0.0347, "step": 166380 }, { - "epoch": 1.8, - "learning_rate": 3.0044130053864622e-05, - "loss": 0.0284, + "epoch": 1.07, + "learning_rate": 0.00013891194485500557, + "loss": 0.0365, "step": 166390 }, { - "epoch": 1.8, - "learning_rate": 3.0027905769355572e-05, - "loss": 0.0268, + "epoch": 1.07, + "learning_rate": 0.00013890226350064865, + "loss": 0.0283, "step": 166400 }, { - "epoch": 1.8, - "learning_rate": 3.0011681484846518e-05, - "loss": 0.0281, + "epoch": 1.07, + "learning_rate": 0.00013889258214629173, + "loss": 0.0324, "step": 166410 }, { - "epoch": 1.8, - "learning_rate": 2.9995457200337465e-05, - "loss": 0.0212, + "epoch": 1.07, + "learning_rate": 0.00013888290079193478, + "loss": 0.0336, "step": 166420 }, { - "epoch": 1.8, - "learning_rate": 2.997923291582841e-05, - "loss": 0.0261, + "epoch": 1.07, + "learning_rate": 0.00013887321943757783, + "loss": 0.0355, "step": 166430 }, { - "epoch": 1.8, - "learning_rate": 2.9963008631319357e-05, - "loss": 0.026, + "epoch": 1.07, + "learning_rate": 0.0001388635380832209, + "loss": 0.0321, "step": 166440 }, { - "epoch": 1.8, - "learning_rate": 2.9946784346810304e-05, - "loss": 0.0214, + "epoch": 1.07, + "learning_rate": 0.00013885385672886397, + "loss": 0.0325, "step": 166450 }, { - "epoch": 1.8, - "learning_rate": 2.993056006230125e-05, - "loss": 0.0288, + "epoch": 1.07, + "learning_rate": 0.00013884417537450705, + "loss": 0.029, "step": 166460 }, { - "epoch": 1.8, - "learning_rate": 2.9914335777792197e-05, - "loss": 0.0285, + "epoch": 1.07, + "learning_rate": 0.00013883449402015012, + "loss": 0.0326, "step": 166470 }, { - "epoch": 1.8, - "learning_rate": 2.9898111493283143e-05, - "loss": 0.028, + "epoch": 1.07, + "learning_rate": 0.00013882481266579318, + "loss": 0.0334, "step": 166480 }, { - "epoch": 1.8, - "learning_rate": 2.9881887208774093e-05, - "loss": 0.0249, + "epoch": 1.07, + "learning_rate": 0.00013881513131143626, + "loss": 0.0348, "step": 166490 }, { - "epoch": 1.8, - "learning_rate": 2.986566292426504e-05, - "loss": 0.0234, + "epoch": 1.07, + "learning_rate": 0.0001388054499570793, + "loss": 0.0304, "step": 166500 }, { - "epoch": 1.8, - "learning_rate": 2.9849438639755985e-05, - "loss": 0.0326, + "epoch": 1.07, + "learning_rate": 0.0001387957686027224, + "loss": 0.0372, "step": 166510 }, { - "epoch": 1.8, - "learning_rate": 2.9833214355246932e-05, - "loss": 0.0318, + "epoch": 1.07, + "learning_rate": 0.00013878608724836544, + "loss": 0.0334, "step": 166520 }, { - "epoch": 1.8, - "learning_rate": 2.9816990070737878e-05, - "loss": 0.0243, + "epoch": 1.07, + "learning_rate": 0.00013877640589400852, + "loss": 0.0373, "step": 166530 }, { - "epoch": 1.8, - "learning_rate": 2.9800765786228825e-05, - "loss": 0.0205, + "epoch": 1.07, + "learning_rate": 0.0001387667245396516, + "loss": 0.0395, "step": 166540 }, { - "epoch": 1.8, - "learning_rate": 2.978454150171977e-05, - "loss": 0.0242, + "epoch": 1.07, + "learning_rate": 0.00013875704318529465, + "loss": 0.0346, "step": 166550 }, { - "epoch": 1.8, - "learning_rate": 2.9768317217210717e-05, - "loss": 0.0244, + "epoch": 1.08, + "learning_rate": 0.0001387473618309377, + "loss": 0.0359, "step": 166560 }, { - "epoch": 1.8, - "learning_rate": 2.9752092932701667e-05, - "loss": 0.0258, + "epoch": 1.08, + "learning_rate": 0.0001387376804765808, + "loss": 0.0331, "step": 166570 }, { - "epoch": 1.8, - "learning_rate": 2.9735868648192614e-05, - "loss": 0.0236, + "epoch": 1.08, + "learning_rate": 0.00013872799912222387, + "loss": 0.0318, "step": 166580 }, { - "epoch": 1.8, - "learning_rate": 2.971964436368356e-05, - "loss": 0.0281, + "epoch": 1.08, + "learning_rate": 0.00013871831776786692, + "loss": 0.0309, "step": 166590 }, { - "epoch": 1.8, - "learning_rate": 2.9703420079174506e-05, - "loss": 0.0247, + "epoch": 1.08, + "learning_rate": 0.00013870863641351, + "loss": 0.0336, "step": 166600 }, { - "epoch": 1.8, - "learning_rate": 2.9687195794665453e-05, - "loss": 0.0283, + "epoch": 1.08, + "learning_rate": 0.00013869895505915308, + "loss": 0.0339, "step": 166610 }, { - "epoch": 1.8, - "learning_rate": 2.96709715101564e-05, - "loss": 0.0225, + "epoch": 1.08, + "learning_rate": 0.00013868927370479613, + "loss": 0.0321, "step": 166620 }, { - "epoch": 1.8, - "learning_rate": 2.9654747225647345e-05, - "loss": 0.0249, + "epoch": 1.08, + "learning_rate": 0.00013867959235043918, + "loss": 0.0319, "step": 166630 }, { - "epoch": 1.8, - "learning_rate": 2.9638522941138292e-05, - "loss": 0.027, + "epoch": 1.08, + "learning_rate": 0.00013866991099608226, + "loss": 0.0401, "step": 166640 }, { - "epoch": 1.8, - "learning_rate": 2.9622298656629238e-05, - "loss": 0.0244, + "epoch": 1.08, + "learning_rate": 0.00013866022964172534, + "loss": 0.0326, "step": 166650 }, { - "epoch": 1.8, - "learning_rate": 2.9606074372120188e-05, - "loss": 0.0313, + "epoch": 1.08, + "learning_rate": 0.0001386505482873684, + "loss": 0.0336, "step": 166660 }, { - "epoch": 1.8, - "learning_rate": 2.9589850087611134e-05, - "loss": 0.0263, + "epoch": 1.08, + "learning_rate": 0.00013864086693301148, + "loss": 0.0397, "step": 166670 }, { - "epoch": 1.8, - "learning_rate": 2.957362580310208e-05, - "loss": 0.0223, + "epoch": 1.08, + "learning_rate": 0.00013863118557865453, + "loss": 0.0307, "step": 166680 }, { - "epoch": 1.8, - "learning_rate": 2.9557401518593027e-05, - "loss": 0.0331, + "epoch": 1.08, + "learning_rate": 0.0001386215042242976, + "loss": 0.0318, "step": 166690 }, { - "epoch": 1.8, - "learning_rate": 2.9541177234083974e-05, - "loss": 0.0293, + "epoch": 1.08, + "learning_rate": 0.00013861182286994066, + "loss": 0.0371, "step": 166700 }, { - "epoch": 1.8, - "learning_rate": 2.952495294957492e-05, - "loss": 0.0257, + "epoch": 1.08, + "learning_rate": 0.00013860214151558374, + "loss": 0.0343, "step": 166710 }, { - "epoch": 1.8, - "learning_rate": 2.9508728665065866e-05, - "loss": 0.0306, + "epoch": 1.08, + "learning_rate": 0.00013859246016122682, + "loss": 0.0311, "step": 166720 }, { - "epoch": 1.8, - "learning_rate": 2.9492504380556813e-05, - "loss": 0.0275, + "epoch": 1.08, + "learning_rate": 0.00013858277880686987, + "loss": 0.0279, "step": 166730 }, { - "epoch": 1.8, - "learning_rate": 2.947628009604776e-05, - "loss": 0.0249, + "epoch": 1.08, + "learning_rate": 0.00013857309745251295, + "loss": 0.0463, "step": 166740 }, { - "epoch": 1.8, - "learning_rate": 2.946005581153871e-05, - "loss": 0.0259, + "epoch": 1.08, + "learning_rate": 0.000138563416098156, + "loss": 0.0292, "step": 166750 }, { - "epoch": 1.8, - "learning_rate": 2.9443831527029655e-05, - "loss": 0.031, + "epoch": 1.08, + "learning_rate": 0.0001385537347437991, + "loss": 0.0314, "step": 166760 }, { - "epoch": 1.8, - "learning_rate": 2.94276072425206e-05, - "loss": 0.0226, + "epoch": 1.08, + "learning_rate": 0.00013854405338944214, + "loss": 0.0345, "step": 166770 }, { - "epoch": 1.8, - "learning_rate": 2.9411382958011548e-05, - "loss": 0.0253, + "epoch": 1.08, + "learning_rate": 0.00013853437203508522, + "loss": 0.0459, "step": 166780 }, { - "epoch": 1.8, - "learning_rate": 2.9395158673502494e-05, - "loss": 0.021, + "epoch": 1.08, + "learning_rate": 0.0001385246906807283, + "loss": 0.0378, "step": 166790 }, { - "epoch": 1.8, - "learning_rate": 2.937893438899344e-05, - "loss": 0.0196, + "epoch": 1.08, + "learning_rate": 0.00013851500932637135, + "loss": 0.034, "step": 166800 }, { - "epoch": 1.8, - "learning_rate": 2.9362710104484387e-05, - "loss": 0.0239, + "epoch": 1.08, + "learning_rate": 0.00013850532797201443, + "loss": 0.0325, "step": 166810 }, { - "epoch": 1.8, - "learning_rate": 2.9346485819975334e-05, - "loss": 0.025, + "epoch": 1.08, + "learning_rate": 0.00013849564661765748, + "loss": 0.0303, "step": 166820 }, { - "epoch": 1.8, - "learning_rate": 2.9330261535466283e-05, - "loss": 0.0207, + "epoch": 1.08, + "learning_rate": 0.00013848596526330056, + "loss": 0.0329, "step": 166830 }, { - "epoch": 1.8, - "learning_rate": 2.931403725095723e-05, - "loss": 0.0217, + "epoch": 1.08, + "learning_rate": 0.00013847628390894362, + "loss": 0.0344, "step": 166840 }, { - "epoch": 1.8, - "learning_rate": 2.9297812966448176e-05, - "loss": 0.0253, + "epoch": 1.08, + "learning_rate": 0.0001384666025545867, + "loss": 0.0326, "step": 166850 }, { - "epoch": 1.8, - "learning_rate": 2.9281588681939122e-05, - "loss": 0.0272, + "epoch": 1.08, + "learning_rate": 0.00013845692120022978, + "loss": 0.033, "step": 166860 }, { - "epoch": 1.8, - "learning_rate": 2.926536439743007e-05, - "loss": 0.0295, + "epoch": 1.08, + "learning_rate": 0.00013844723984587283, + "loss": 0.03, "step": 166870 }, { - "epoch": 1.8, - "learning_rate": 2.9249140112921015e-05, - "loss": 0.0226, + "epoch": 1.08, + "learning_rate": 0.00013843755849151588, + "loss": 0.0406, "step": 166880 }, { - "epoch": 1.81, - "learning_rate": 2.923291582841196e-05, - "loss": 0.0308, + "epoch": 1.08, + "learning_rate": 0.00013842787713715896, + "loss": 0.0331, "step": 166890 }, { - "epoch": 1.81, - "learning_rate": 2.9216691543902915e-05, - "loss": 0.0269, + "epoch": 1.08, + "learning_rate": 0.00013841819578280204, + "loss": 0.0316, "step": 166900 }, { - "epoch": 1.81, - "learning_rate": 2.920046725939386e-05, - "loss": 0.0223, + "epoch": 1.08, + "learning_rate": 0.0001384085144284451, + "loss": 0.0317, "step": 166910 }, { - "epoch": 1.81, - "learning_rate": 2.9184242974884808e-05, - "loss": 0.0289, + "epoch": 1.08, + "learning_rate": 0.00013839883307408817, + "loss": 0.0348, "step": 166920 }, { - "epoch": 1.81, - "learning_rate": 2.9168018690375754e-05, - "loss": 0.0206, + "epoch": 1.08, + "learning_rate": 0.00013838915171973123, + "loss": 0.0323, "step": 166930 }, { - "epoch": 1.81, - "learning_rate": 2.91517944058667e-05, - "loss": 0.0281, + "epoch": 1.08, + "learning_rate": 0.0001383794703653743, + "loss": 0.0344, "step": 166940 }, { - "epoch": 1.81, - "learning_rate": 2.9135570121357647e-05, - "loss": 0.0276, + "epoch": 1.08, + "learning_rate": 0.00013836978901101736, + "loss": 0.0346, "step": 166950 }, { - "epoch": 1.81, - "learning_rate": 2.9119345836848593e-05, - "loss": 0.0221, + "epoch": 1.08, + "learning_rate": 0.00013836010765666044, + "loss": 0.0354, "step": 166960 }, { - "epoch": 1.81, - "learning_rate": 2.910312155233954e-05, - "loss": 0.0244, + "epoch": 1.08, + "learning_rate": 0.00013835042630230352, + "loss": 0.0356, "step": 166970 }, { - "epoch": 1.81, - "learning_rate": 2.908689726783049e-05, - "loss": 0.0261, + "epoch": 1.08, + "learning_rate": 0.00013834074494794657, + "loss": 0.0316, "step": 166980 }, { - "epoch": 1.81, - "learning_rate": 2.9070672983321436e-05, - "loss": 0.0258, + "epoch": 1.08, + "learning_rate": 0.00013833106359358965, + "loss": 0.0351, "step": 166990 }, { - "epoch": 1.81, - "learning_rate": 2.9054448698812382e-05, - "loss": 0.0252, + "epoch": 1.08, + "learning_rate": 0.0001383213822392327, + "loss": 0.0319, "step": 167000 }, { - "epoch": 1.81, - "eval_cer": 0.9211393060407357, - "eval_loss": 0.021122299134731293, - "eval_runtime": 118.9682, - "eval_samples_per_second": 16.811, - "eval_steps_per_second": 4.203, + "epoch": 1.08, + "eval_cer": 0.919931307196927, + "eval_loss": 0.02439761720597744, + "eval_runtime": 120.0555, + "eval_samples_per_second": 16.659, + "eval_steps_per_second": 4.165, "step": 167000 }, { - "epoch": 1.81, - "learning_rate": 2.903822441430333e-05, - "loss": 0.0209, + "epoch": 1.08, + "learning_rate": 0.00013831170088487578, + "loss": 0.0326, "step": 167010 }, { - "epoch": 1.81, - "learning_rate": 2.9022000129794275e-05, - "loss": 0.028, + "epoch": 1.08, + "learning_rate": 0.00013830201953051884, + "loss": 0.0288, "step": 167020 }, { - "epoch": 1.81, - "learning_rate": 2.900577584528522e-05, - "loss": 0.0243, + "epoch": 1.08, + "learning_rate": 0.00013829233817616192, + "loss": 0.035, "step": 167030 }, { - "epoch": 1.81, - "learning_rate": 2.8989551560776167e-05, - "loss": 0.0239, + "epoch": 1.08, + "learning_rate": 0.00013828265682180497, + "loss": 0.0323, "step": 167040 }, { - "epoch": 1.81, - "learning_rate": 2.8973327276267114e-05, - "loss": 0.0268, + "epoch": 1.08, + "learning_rate": 0.00013827297546744805, + "loss": 0.038, "step": 167050 }, { - "epoch": 1.81, - "learning_rate": 2.895710299175806e-05, - "loss": 0.0291, + "epoch": 1.08, + "learning_rate": 0.00013826329411309113, + "loss": 0.0404, "step": 167060 }, { - "epoch": 1.81, - "learning_rate": 2.894087870724901e-05, - "loss": 0.0323, + "epoch": 1.08, + "learning_rate": 0.00013825361275873418, + "loss": 0.0308, "step": 167070 }, { - "epoch": 1.81, - "learning_rate": 2.8924654422739956e-05, - "loss": 0.0272, + "epoch": 1.08, + "learning_rate": 0.00013824393140437723, + "loss": 0.0345, "step": 167080 }, { - "epoch": 1.81, - "learning_rate": 2.8908430138230903e-05, - "loss": 0.029, + "epoch": 1.08, + "learning_rate": 0.0001382342500500203, + "loss": 0.0317, "step": 167090 }, { - "epoch": 1.81, - "learning_rate": 2.889220585372185e-05, - "loss": 0.0203, + "epoch": 1.08, + "learning_rate": 0.0001382245686956634, + "loss": 0.0316, "step": 167100 }, { - "epoch": 1.81, - "learning_rate": 2.8875981569212796e-05, - "loss": 0.0273, + "epoch": 1.08, + "learning_rate": 0.00013821488734130645, + "loss": 0.0335, "step": 167110 }, { - "epoch": 1.81, - "learning_rate": 2.8859757284703742e-05, - "loss": 0.0256, + "epoch": 1.08, + "learning_rate": 0.00013820520598694953, + "loss": 0.0366, "step": 167120 }, { - "epoch": 1.81, - "learning_rate": 2.884353300019469e-05, - "loss": 0.0241, + "epoch": 1.08, + "learning_rate": 0.00013819552463259258, + "loss": 0.0315, "step": 167130 }, { - "epoch": 1.81, - "learning_rate": 2.8827308715685635e-05, - "loss": 0.0291, + "epoch": 1.08, + "learning_rate": 0.00013818584327823566, + "loss": 0.0375, "step": 167140 }, { - "epoch": 1.81, - "learning_rate": 2.8811084431176584e-05, - "loss": 0.0285, + "epoch": 1.08, + "learning_rate": 0.0001381761619238787, + "loss": 0.034, "step": 167150 }, { - "epoch": 1.81, - "learning_rate": 2.879486014666753e-05, - "loss": 0.0227, + "epoch": 1.08, + "learning_rate": 0.0001381664805695218, + "loss": 0.0339, "step": 167160 }, { - "epoch": 1.81, - "learning_rate": 2.8778635862158477e-05, - "loss": 0.028, + "epoch": 1.08, + "learning_rate": 0.00013815679921516487, + "loss": 0.0314, "step": 167170 }, { - "epoch": 1.81, - "learning_rate": 2.8762411577649424e-05, - "loss": 0.0226, + "epoch": 1.08, + "learning_rate": 0.00013814711786080792, + "loss": 0.0292, "step": 167180 }, { - "epoch": 1.81, - "learning_rate": 2.874618729314037e-05, - "loss": 0.0259, + "epoch": 1.08, + "learning_rate": 0.000138137436506451, + "loss": 0.0315, "step": 167190 }, { - "epoch": 1.81, - "learning_rate": 2.8729963008631316e-05, - "loss": 0.0273, + "epoch": 1.08, + "learning_rate": 0.00013812775515209406, + "loss": 0.0322, "step": 167200 }, { - "epoch": 1.81, - "learning_rate": 2.8713738724122263e-05, - "loss": 0.0271, + "epoch": 1.08, + "learning_rate": 0.00013811807379773714, + "loss": 0.032, "step": 167210 }, { - "epoch": 1.81, - "learning_rate": 2.869751443961321e-05, - "loss": 0.0361, + "epoch": 1.08, + "learning_rate": 0.0001381083924433802, + "loss": 0.0318, "step": 167220 }, { - "epoch": 1.81, - "learning_rate": 2.8681290155104156e-05, - "loss": 0.0299, + "epoch": 1.08, + "learning_rate": 0.00013809871108902327, + "loss": 0.0293, "step": 167230 }, { - "epoch": 1.81, - "learning_rate": 2.8665065870595105e-05, - "loss": 0.0244, + "epoch": 1.08, + "learning_rate": 0.00013808902973466635, + "loss": 0.0304, "step": 167240 }, { - "epoch": 1.81, - "learning_rate": 2.864884158608605e-05, - "loss": 0.0223, + "epoch": 1.08, + "learning_rate": 0.0001380793483803094, + "loss": 0.0319, "step": 167250 }, { - "epoch": 1.81, - "learning_rate": 2.8632617301576998e-05, - "loss": 0.0336, + "epoch": 1.08, + "learning_rate": 0.00013806966702595248, + "loss": 0.0332, "step": 167260 }, { - "epoch": 1.81, - "learning_rate": 2.8616393017067944e-05, - "loss": 0.0215, + "epoch": 1.08, + "learning_rate": 0.00013805998567159553, + "loss": 0.0357, "step": 167270 }, { - "epoch": 1.81, - "learning_rate": 2.860016873255889e-05, - "loss": 0.0229, + "epoch": 1.08, + "learning_rate": 0.0001380503043172386, + "loss": 0.0307, "step": 167280 }, { - "epoch": 1.81, - "learning_rate": 2.8583944448049837e-05, - "loss": 0.0281, + "epoch": 1.08, + "learning_rate": 0.00013804062296288167, + "loss": 0.0365, "step": 167290 }, { - "epoch": 1.81, - "learning_rate": 2.8567720163540784e-05, - "loss": 0.0218, + "epoch": 1.08, + "learning_rate": 0.00013803094160852474, + "loss": 0.0352, "step": 167300 }, { - "epoch": 1.81, - "learning_rate": 2.855149587903173e-05, - "loss": 0.026, + "epoch": 1.08, + "learning_rate": 0.00013802126025416782, + "loss": 0.0307, "step": 167310 }, { - "epoch": 1.81, - "learning_rate": 2.853527159452268e-05, - "loss": 0.0236, + "epoch": 1.08, + "learning_rate": 0.00013801157889981088, + "loss": 0.0346, "step": 167320 }, { - "epoch": 1.81, - "learning_rate": 2.8519047310013626e-05, - "loss": 0.0273, - "step": 167330 + "epoch": 1.08, + "learning_rate": 0.00013800189754545393, + "loss": 0.0306, + "step": 167330 }, { - "epoch": 1.81, - "learning_rate": 2.8502823025504573e-05, - "loss": 0.0294, + "epoch": 1.08, + "learning_rate": 0.000137992216191097, + "loss": 0.0319, "step": 167340 }, { - "epoch": 1.81, - "learning_rate": 2.848659874099552e-05, - "loss": 0.031, + "epoch": 1.08, + "learning_rate": 0.0001379825348367401, + "loss": 0.0353, "step": 167350 }, { - "epoch": 1.81, - "learning_rate": 2.8470374456486465e-05, - "loss": 0.0278, + "epoch": 1.08, + "learning_rate": 0.00013797285348238314, + "loss": 0.0328, "step": 167360 }, { - "epoch": 1.81, - "learning_rate": 2.845415017197741e-05, - "loss": 0.0335, + "epoch": 1.08, + "learning_rate": 0.00013796317212802622, + "loss": 0.0346, "step": 167370 }, { - "epoch": 1.81, - "learning_rate": 2.8437925887468358e-05, - "loss": 0.0208, + "epoch": 1.08, + "learning_rate": 0.0001379534907736693, + "loss": 0.0356, "step": 167380 }, { - "epoch": 1.81, - "learning_rate": 2.8421701602959304e-05, - "loss": 0.022, + "epoch": 1.08, + "learning_rate": 0.00013794380941931235, + "loss": 0.0317, "step": 167390 }, { - "epoch": 1.81, - "learning_rate": 2.840547731845025e-05, - "loss": 0.0201, + "epoch": 1.08, + "learning_rate": 0.0001379341280649554, + "loss": 0.0312, "step": 167400 }, { - "epoch": 1.81, - "learning_rate": 2.83892530339412e-05, - "loss": 0.0281, + "epoch": 1.08, + "learning_rate": 0.0001379244467105985, + "loss": 0.0396, "step": 167410 }, { - "epoch": 1.81, - "learning_rate": 2.8373028749432147e-05, - "loss": 0.023, + "epoch": 1.08, + "learning_rate": 0.00013791476535624157, + "loss": 0.0307, "step": 167420 }, { - "epoch": 1.81, - "learning_rate": 2.8356804464923093e-05, - "loss": 0.0289, + "epoch": 1.08, + "learning_rate": 0.00013790508400188462, + "loss": 0.0302, "step": 167430 }, { - "epoch": 1.81, - "learning_rate": 2.834058018041404e-05, - "loss": 0.026, + "epoch": 1.08, + "learning_rate": 0.0001378954026475277, + "loss": 0.0299, "step": 167440 }, { - "epoch": 1.81, - "learning_rate": 2.8324355895904986e-05, - "loss": 0.0215, + "epoch": 1.08, + "learning_rate": 0.00013788572129317075, + "loss": 0.033, "step": 167450 }, { - "epoch": 1.81, - "learning_rate": 2.8308131611395932e-05, - "loss": 0.0265, + "epoch": 1.08, + "learning_rate": 0.00013787603993881383, + "loss": 0.0326, "step": 167460 }, { - "epoch": 1.81, - "learning_rate": 2.829190732688688e-05, - "loss": 0.0266, + "epoch": 1.08, + "learning_rate": 0.00013786635858445688, + "loss": 0.0327, "step": 167470 }, { - "epoch": 1.81, - "learning_rate": 2.8275683042377825e-05, - "loss": 0.0333, + "epoch": 1.08, + "learning_rate": 0.00013785667723009996, + "loss": 0.0368, "step": 167480 }, { - "epoch": 1.81, - "learning_rate": 2.825945875786878e-05, - "loss": 0.0289, + "epoch": 1.08, + "learning_rate": 0.00013784699587574304, + "loss": 0.0379, "step": 167490 }, { - "epoch": 1.81, - "learning_rate": 2.8243234473359725e-05, - "loss": 0.0208, + "epoch": 1.08, + "learning_rate": 0.0001378373145213861, + "loss": 0.0345, "step": 167500 }, { - "epoch": 1.81, - "learning_rate": 2.822701018885067e-05, - "loss": 0.0271, + "epoch": 1.08, + "learning_rate": 0.00013782763316702918, + "loss": 0.0305, "step": 167510 }, { - "epoch": 1.81, - "learning_rate": 2.8210785904341618e-05, - "loss": 0.0265, + "epoch": 1.08, + "learning_rate": 0.00013781795181267223, + "loss": 0.0362, "step": 167520 }, { - "epoch": 1.81, - "learning_rate": 2.8194561619832564e-05, - "loss": 0.0225, + "epoch": 1.08, + "learning_rate": 0.00013780827045831528, + "loss": 0.0323, "step": 167530 }, { - "epoch": 1.81, - "learning_rate": 2.817833733532351e-05, - "loss": 0.0222, + "epoch": 1.08, + "learning_rate": 0.00013779858910395836, + "loss": 0.0342, "step": 167540 }, { - "epoch": 1.81, - "learning_rate": 2.8162113050814457e-05, - "loss": 0.0257, + "epoch": 1.08, + "learning_rate": 0.00013778890774960144, + "loss": 0.0372, "step": 167550 }, { - "epoch": 1.81, - "learning_rate": 2.8145888766305406e-05, - "loss": 0.0208, + "epoch": 1.08, + "learning_rate": 0.00013777922639524452, + "loss": 0.0299, "step": 167560 }, { - "epoch": 1.81, - "learning_rate": 2.8129664481796353e-05, - "loss": 0.0261, + "epoch": 1.08, + "learning_rate": 0.00013776954504088757, + "loss": 0.0297, "step": 167570 }, { - "epoch": 1.81, - "learning_rate": 2.81134401972873e-05, - "loss": 0.0226, + "epoch": 1.08, + "learning_rate": 0.00013775986368653065, + "loss": 0.0283, "step": 167580 }, { - "epoch": 1.81, - "learning_rate": 2.8097215912778246e-05, - "loss": 0.0236, + "epoch": 1.08, + "learning_rate": 0.0001377501823321737, + "loss": 0.0304, "step": 167590 }, { - "epoch": 1.81, - "learning_rate": 2.8080991628269192e-05, - "loss": 0.0275, + "epoch": 1.08, + "learning_rate": 0.00013774050097781676, + "loss": 0.0383, "step": 167600 }, { - "epoch": 1.81, - "learning_rate": 2.806476734376014e-05, - "loss": 0.0259, + "epoch": 1.08, + "learning_rate": 0.00013773081962345984, + "loss": 0.0338, "step": 167610 }, { - "epoch": 1.81, - "learning_rate": 2.8048543059251085e-05, - "loss": 0.0271, + "epoch": 1.08, + "learning_rate": 0.00013772113826910292, + "loss": 0.0399, "step": 167620 }, { - "epoch": 1.81, - "learning_rate": 2.803231877474203e-05, - "loss": 0.025, + "epoch": 1.08, + "learning_rate": 0.000137711456914746, + "loss": 0.0384, "step": 167630 }, { - "epoch": 1.81, - "learning_rate": 2.801609449023298e-05, - "loss": 0.0271, + "epoch": 1.08, + "learning_rate": 0.00013770177556038905, + "loss": 0.0367, "step": 167640 }, { - "epoch": 1.81, - "learning_rate": 2.7999870205723927e-05, - "loss": 0.0265, + "epoch": 1.08, + "learning_rate": 0.0001376920942060321, + "loss": 0.0343, "step": 167650 }, { - "epoch": 1.81, - "learning_rate": 2.7983645921214874e-05, - "loss": 0.0268, + "epoch": 1.08, + "learning_rate": 0.00013768241285167518, + "loss": 0.0308, "step": 167660 }, { - "epoch": 1.81, - "learning_rate": 2.796742163670582e-05, - "loss": 0.0238, + "epoch": 1.08, + "learning_rate": 0.00013767273149731824, + "loss": 0.039, "step": 167670 }, { - "epoch": 1.81, - "learning_rate": 2.7951197352196766e-05, - "loss": 0.0319, + "epoch": 1.08, + "learning_rate": 0.00013766305014296132, + "loss": 0.0382, "step": 167680 }, { - "epoch": 1.81, - "learning_rate": 2.7934973067687713e-05, - "loss": 0.0234, + "epoch": 1.08, + "learning_rate": 0.0001376533687886044, + "loss": 0.0356, "step": 167690 }, { - "epoch": 1.81, - "learning_rate": 2.791874878317866e-05, - "loss": 0.0243, + "epoch": 1.08, + "learning_rate": 0.00013764368743424748, + "loss": 0.0326, "step": 167700 }, { - "epoch": 1.81, - "learning_rate": 2.7902524498669606e-05, - "loss": 0.0282, + "epoch": 1.08, + "learning_rate": 0.00013763400607989053, + "loss": 0.041, "step": 167710 }, { - "epoch": 1.81, - "learning_rate": 2.7886300214160552e-05, - "loss": 0.0216, + "epoch": 1.08, + "learning_rate": 0.00013762432472553358, + "loss": 0.033, "step": 167720 }, { - "epoch": 1.81, - "learning_rate": 2.7870075929651502e-05, - "loss": 0.0192, + "epoch": 1.08, + "learning_rate": 0.00013761464337117666, + "loss": 0.0327, "step": 167730 }, { - "epoch": 1.81, - "learning_rate": 2.7853851645142448e-05, - "loss": 0.0215, + "epoch": 1.08, + "learning_rate": 0.0001376049620168197, + "loss": 0.0359, "step": 167740 }, { - "epoch": 1.81, - "learning_rate": 2.7837627360633395e-05, - "loss": 0.0301, + "epoch": 1.08, + "learning_rate": 0.0001375952806624628, + "loss": 0.042, "step": 167750 }, { - "epoch": 1.81, - "learning_rate": 2.782140307612434e-05, - "loss": 0.0228, + "epoch": 1.08, + "learning_rate": 0.00013758559930810587, + "loss": 0.0335, "step": 167760 }, { - "epoch": 1.81, - "learning_rate": 2.7805178791615287e-05, - "loss": 0.0239, + "epoch": 1.08, + "learning_rate": 0.00013757591795374893, + "loss": 0.0358, "step": 167770 }, { - "epoch": 1.81, - "learning_rate": 2.7788954507106234e-05, - "loss": 0.0248, + "epoch": 1.08, + "learning_rate": 0.000137566236599392, + "loss": 0.0351, "step": 167780 }, { - "epoch": 1.81, - "learning_rate": 2.777273022259718e-05, - "loss": 0.0253, + "epoch": 1.08, + "learning_rate": 0.00013755655524503506, + "loss": 0.0363, "step": 167790 }, { - "epoch": 1.81, - "learning_rate": 2.7756505938088126e-05, - "loss": 0.0254, + "epoch": 1.08, + "learning_rate": 0.00013754687389067814, + "loss": 0.0387, "step": 167800 }, { - "epoch": 1.82, - "learning_rate": 2.7740281653579073e-05, - "loss": 0.0264, + "epoch": 1.08, + "learning_rate": 0.0001375371925363212, + "loss": 0.0339, "step": 167810 }, { - "epoch": 1.82, - "learning_rate": 2.7724057369070023e-05, - "loss": 0.0258, + "epoch": 1.08, + "learning_rate": 0.00013752751118196427, + "loss": 0.0275, "step": 167820 }, { - "epoch": 1.82, - "learning_rate": 2.770783308456097e-05, - "loss": 0.0241, + "epoch": 1.08, + "learning_rate": 0.00013751782982760735, + "loss": 0.0378, "step": 167830 }, { - "epoch": 1.82, - "learning_rate": 2.7691608800051915e-05, + "epoch": 1.08, + "learning_rate": 0.0001375081484732504, "loss": 0.0299, "step": 167840 }, { - "epoch": 1.82, - "learning_rate": 2.7675384515542862e-05, - "loss": 0.0226, + "epoch": 1.08, + "learning_rate": 0.00013749846711889346, + "loss": 0.0303, "step": 167850 }, { - "epoch": 1.82, - "learning_rate": 2.7659160231033808e-05, - "loss": 0.0287, + "epoch": 1.08, + "learning_rate": 0.00013748878576453654, + "loss": 0.0329, "step": 167860 }, { - "epoch": 1.82, - "learning_rate": 2.7642935946524755e-05, - "loss": 0.0209, + "epoch": 1.08, + "learning_rate": 0.00013747910441017962, + "loss": 0.0376, "step": 167870 }, { - "epoch": 1.82, - "learning_rate": 2.76267116620157e-05, - "loss": 0.0245, + "epoch": 1.08, + "learning_rate": 0.00013746942305582267, + "loss": 0.0287, "step": 167880 }, { - "epoch": 1.82, - "learning_rate": 2.7610487377506647e-05, - "loss": 0.0288, + "epoch": 1.08, + "learning_rate": 0.00013745974170146575, + "loss": 0.0306, "step": 167890 }, { - "epoch": 1.82, - "learning_rate": 2.7594263092997597e-05, - "loss": 0.0283, + "epoch": 1.08, + "learning_rate": 0.00013745006034710883, + "loss": 0.0363, "step": 167900 }, { - "epoch": 1.82, - "learning_rate": 2.7578038808488543e-05, - "loss": 0.0225, + "epoch": 1.08, + "learning_rate": 0.00013744037899275188, + "loss": 0.0311, "step": 167910 }, { - "epoch": 1.82, - "learning_rate": 2.756181452397949e-05, - "loss": 0.0342, + "epoch": 1.08, + "learning_rate": 0.00013743069763839493, + "loss": 0.0343, "step": 167920 }, { - "epoch": 1.82, - "learning_rate": 2.7545590239470436e-05, - "loss": 0.0224, + "epoch": 1.08, + "learning_rate": 0.000137421016284038, + "loss": 0.0344, "step": 167930 }, { - "epoch": 1.82, - "learning_rate": 2.7529365954961383e-05, - "loss": 0.0227, + "epoch": 1.08, + "learning_rate": 0.0001374113349296811, + "loss": 0.0298, "step": 167940 }, { - "epoch": 1.82, - "learning_rate": 2.751314167045233e-05, - "loss": 0.0222, + "epoch": 1.08, + "learning_rate": 0.00013740165357532415, + "loss": 0.0348, "step": 167950 }, { - "epoch": 1.82, - "learning_rate": 2.7496917385943275e-05, - "loss": 0.0227, + "epoch": 1.08, + "learning_rate": 0.00013739197222096722, + "loss": 0.0306, "step": 167960 }, { - "epoch": 1.82, - "learning_rate": 2.7480693101434222e-05, - "loss": 0.0287, + "epoch": 1.08, + "learning_rate": 0.00013738229086661028, + "loss": 0.0333, "step": 167970 }, { - "epoch": 1.82, - "learning_rate": 2.7464468816925168e-05, - "loss": 0.0259, + "epoch": 1.08, + "learning_rate": 0.00013737260951225336, + "loss": 0.0335, "step": 167980 }, { - "epoch": 1.82, - "learning_rate": 2.7448244532416118e-05, - "loss": 0.0243, + "epoch": 1.08, + "learning_rate": 0.0001373629281578964, + "loss": 0.0299, "step": 167990 }, { - "epoch": 1.82, - "learning_rate": 2.7432020247907064e-05, - "loss": 0.0269, + "epoch": 1.08, + "learning_rate": 0.0001373532468035395, + "loss": 0.0315, "step": 168000 }, { - "epoch": 1.82, - "eval_cer": 0.9210968987933371, - "eval_loss": 0.02078932523727417, - "eval_runtime": 119.0631, - "eval_samples_per_second": 16.798, - "eval_steps_per_second": 4.199, + "epoch": 1.08, + "eval_cer": 0.9197975370014687, + "eval_loss": 0.025038884952664375, + "eval_runtime": 120.1957, + "eval_samples_per_second": 16.64, + "eval_steps_per_second": 4.16, "step": 168000 }, { - "epoch": 1.82, - "learning_rate": 2.741579596339801e-05, - "loss": 0.0282, + "epoch": 1.08, + "learning_rate": 0.00013734356544918257, + "loss": 0.032, "step": 168010 }, { - "epoch": 1.82, - "learning_rate": 2.7399571678888957e-05, - "loss": 0.0241, + "epoch": 1.08, + "learning_rate": 0.00013733388409482562, + "loss": 0.0329, "step": 168020 }, { - "epoch": 1.82, - "learning_rate": 2.7383347394379903e-05, - "loss": 0.0221, + "epoch": 1.08, + "learning_rate": 0.0001373242027404687, + "loss": 0.0369, "step": 168030 }, { - "epoch": 1.82, - "learning_rate": 2.736712310987085e-05, - "loss": 0.0225, + "epoch": 1.08, + "learning_rate": 0.00013731452138611175, + "loss": 0.0352, "step": 168040 }, { - "epoch": 1.82, - "learning_rate": 2.7350898825361796e-05, - "loss": 0.026, + "epoch": 1.08, + "learning_rate": 0.00013730484003175483, + "loss": 0.0345, "step": 168050 }, { - "epoch": 1.82, - "learning_rate": 2.7334674540852743e-05, - "loss": 0.0242, + "epoch": 1.08, + "learning_rate": 0.0001372951586773979, + "loss": 0.0385, "step": 168060 }, { - "epoch": 1.82, - "learning_rate": 2.7318450256343692e-05, - "loss": 0.0289, + "epoch": 1.08, + "learning_rate": 0.00013728547732304097, + "loss": 0.0317, "step": 168070 }, { - "epoch": 1.82, - "learning_rate": 2.7302225971834642e-05, - "loss": 0.0205, + "epoch": 1.08, + "learning_rate": 0.00013727579596868405, + "loss": 0.0367, "step": 168080 }, { - "epoch": 1.82, - "learning_rate": 2.728600168732559e-05, - "loss": 0.027, + "epoch": 1.08, + "learning_rate": 0.0001372661146143271, + "loss": 0.0338, "step": 168090 }, { - "epoch": 1.82, - "learning_rate": 2.7269777402816535e-05, - "loss": 0.0259, + "epoch": 1.08, + "learning_rate": 0.00013725643325997018, + "loss": 0.0355, "step": 168100 }, { - "epoch": 1.82, - "learning_rate": 2.725355311830748e-05, - "loss": 0.0284, + "epoch": 1.09, + "learning_rate": 0.00013724675190561323, + "loss": 0.0461, "step": 168110 }, { - "epoch": 1.82, - "learning_rate": 2.7237328833798428e-05, - "loss": 0.0198, + "epoch": 1.09, + "learning_rate": 0.0001372370705512563, + "loss": 0.0359, "step": 168120 }, { - "epoch": 1.82, - "learning_rate": 2.7221104549289374e-05, - "loss": 0.0252, + "epoch": 1.09, + "learning_rate": 0.00013722738919689936, + "loss": 0.0339, "step": 168130 }, { - "epoch": 1.82, - "learning_rate": 2.7204880264780324e-05, - "loss": 0.0255, + "epoch": 1.09, + "learning_rate": 0.00013721770784254244, + "loss": 0.0359, "step": 168140 }, { - "epoch": 1.82, - "learning_rate": 2.718865598027127e-05, - "loss": 0.0219, + "epoch": 1.09, + "learning_rate": 0.00013720802648818552, + "loss": 0.0297, "step": 168150 }, { - "epoch": 1.82, - "learning_rate": 2.7172431695762217e-05, - "loss": 0.0232, + "epoch": 1.09, + "learning_rate": 0.00013719834513382858, + "loss": 0.0328, "step": 168160 }, { - "epoch": 1.82, - "learning_rate": 2.7156207411253163e-05, - "loss": 0.0245, + "epoch": 1.09, + "learning_rate": 0.00013718866377947163, + "loss": 0.0355, "step": 168170 }, { - "epoch": 1.82, - "learning_rate": 2.713998312674411e-05, - "loss": 0.0238, + "epoch": 1.09, + "learning_rate": 0.0001371789824251147, + "loss": 0.038, "step": 168180 }, { - "epoch": 1.82, - "learning_rate": 2.7123758842235056e-05, - "loss": 0.0227, + "epoch": 1.09, + "learning_rate": 0.0001371693010707578, + "loss": 0.0357, "step": 168190 }, { - "epoch": 1.82, - "learning_rate": 2.7107534557726002e-05, - "loss": 0.0272, + "epoch": 1.09, + "learning_rate": 0.00013715961971640084, + "loss": 0.0329, "step": 168200 }, { - "epoch": 1.82, - "learning_rate": 2.709131027321695e-05, - "loss": 0.0209, + "epoch": 1.09, + "learning_rate": 0.00013714993836204392, + "loss": 0.033, "step": 168210 }, { - "epoch": 1.82, - "learning_rate": 2.7075085988707898e-05, - "loss": 0.0268, + "epoch": 1.09, + "learning_rate": 0.00013714025700768697, + "loss": 0.0375, "step": 168220 }, { - "epoch": 1.82, - "learning_rate": 2.7058861704198845e-05, - "loss": 0.0266, + "epoch": 1.09, + "learning_rate": 0.00013713057565333005, + "loss": 0.0318, "step": 168230 }, { - "epoch": 1.82, - "learning_rate": 2.704263741968979e-05, - "loss": 0.0234, + "epoch": 1.09, + "learning_rate": 0.0001371208942989731, + "loss": 0.0323, "step": 168240 }, { - "epoch": 1.82, - "learning_rate": 2.7026413135180737e-05, - "loss": 0.0269, + "epoch": 1.09, + "learning_rate": 0.0001371112129446162, + "loss": 0.0343, "step": 168250 }, { - "epoch": 1.82, - "learning_rate": 2.7010188850671684e-05, - "loss": 0.0231, + "epoch": 1.09, + "learning_rate": 0.00013710153159025927, + "loss": 0.0303, "step": 168260 }, { - "epoch": 1.82, - "learning_rate": 2.699396456616263e-05, - "loss": 0.0207, + "epoch": 1.09, + "learning_rate": 0.00013709185023590232, + "loss": 0.0356, "step": 168270 }, { - "epoch": 1.82, - "learning_rate": 2.6977740281653577e-05, - "loss": 0.0236, + "epoch": 1.09, + "learning_rate": 0.0001370821688815454, + "loss": 0.0318, "step": 168280 }, { - "epoch": 1.82, - "learning_rate": 2.6961515997144523e-05, - "loss": 0.0271, + "epoch": 1.09, + "learning_rate": 0.00013707248752718845, + "loss": 0.032, "step": 168290 }, { - "epoch": 1.82, - "learning_rate": 2.694529171263547e-05, - "loss": 0.0234, + "epoch": 1.09, + "learning_rate": 0.00013706280617283153, + "loss": 0.0327, "step": 168300 }, { - "epoch": 1.82, - "learning_rate": 2.692906742812642e-05, - "loss": 0.026, + "epoch": 1.09, + "learning_rate": 0.00013705312481847458, + "loss": 0.0378, "step": 168310 }, { - "epoch": 1.82, - "learning_rate": 2.6912843143617365e-05, - "loss": 0.0229, + "epoch": 1.09, + "learning_rate": 0.00013704344346411766, + "loss": 0.0341, "step": 168320 }, { - "epoch": 1.82, - "learning_rate": 2.6896618859108312e-05, - "loss": 0.0233, + "epoch": 1.09, + "learning_rate": 0.00013703376210976074, + "loss": 0.0334, "step": 168330 }, { - "epoch": 1.82, - "learning_rate": 2.6880394574599258e-05, - "loss": 0.0243, + "epoch": 1.09, + "learning_rate": 0.0001370240807554038, + "loss": 0.04, "step": 168340 }, { - "epoch": 1.82, - "learning_rate": 2.6864170290090205e-05, - "loss": 0.0198, + "epoch": 1.09, + "learning_rate": 0.00013701439940104688, + "loss": 0.0299, "step": 168350 }, { - "epoch": 1.82, - "learning_rate": 2.684794600558115e-05, - "loss": 0.0237, + "epoch": 1.09, + "learning_rate": 0.00013700471804668993, + "loss": 0.0389, "step": 168360 }, { - "epoch": 1.82, - "learning_rate": 2.6831721721072097e-05, - "loss": 0.0239, + "epoch": 1.09, + "learning_rate": 0.00013699503669233298, + "loss": 0.0389, "step": 168370 }, { - "epoch": 1.82, - "learning_rate": 2.6815497436563044e-05, - "loss": 0.0269, + "epoch": 1.09, + "learning_rate": 0.00013698535533797606, + "loss": 0.032, "step": 168380 }, { - "epoch": 1.82, - "learning_rate": 2.6799273152053994e-05, - "loss": 0.0298, + "epoch": 1.09, + "learning_rate": 0.00013697567398361914, + "loss": 0.0352, "step": 168390 }, { - "epoch": 1.82, - "learning_rate": 2.678304886754494e-05, - "loss": 0.0255, + "epoch": 1.09, + "learning_rate": 0.00013696599262926222, + "loss": 0.0341, "step": 168400 }, { - "epoch": 1.82, - "learning_rate": 2.6766824583035886e-05, - "loss": 0.0288, + "epoch": 1.09, + "learning_rate": 0.00013695631127490527, + "loss": 0.0362, "step": 168410 }, { - "epoch": 1.82, - "learning_rate": 2.6750600298526833e-05, - "loss": 0.022, + "epoch": 1.09, + "learning_rate": 0.00013694662992054833, + "loss": 0.0329, "step": 168420 }, { - "epoch": 1.82, - "learning_rate": 2.673437601401778e-05, - "loss": 0.0223, + "epoch": 1.09, + "learning_rate": 0.0001369369485661914, + "loss": 0.0342, "step": 168430 }, { - "epoch": 1.82, - "learning_rate": 2.6718151729508725e-05, - "loss": 0.0258, + "epoch": 1.09, + "learning_rate": 0.00013692726721183446, + "loss": 0.0281, "step": 168440 }, { - "epoch": 1.82, - "learning_rate": 2.6701927444999672e-05, - "loss": 0.0261, + "epoch": 1.09, + "learning_rate": 0.00013691758585747754, + "loss": 0.0325, "step": 168450 }, { - "epoch": 1.82, - "learning_rate": 2.6685703160490618e-05, - "loss": 0.0252, + "epoch": 1.09, + "learning_rate": 0.00013690790450312062, + "loss": 0.03, "step": 168460 }, { - "epoch": 1.82, - "learning_rate": 2.6669478875981565e-05, - "loss": 0.0248, + "epoch": 1.09, + "learning_rate": 0.0001368982231487637, + "loss": 0.0342, "step": 168470 }, { - "epoch": 1.82, - "learning_rate": 2.6653254591472514e-05, - "loss": 0.0281, + "epoch": 1.09, + "learning_rate": 0.00013688854179440675, + "loss": 0.0316, "step": 168480 }, { - "epoch": 1.82, - "learning_rate": 2.663703030696346e-05, - "loss": 0.0233, + "epoch": 1.09, + "learning_rate": 0.0001368788604400498, + "loss": 0.0337, "step": 168490 }, { - "epoch": 1.82, - "learning_rate": 2.6620806022454407e-05, - "loss": 0.0249, + "epoch": 1.09, + "learning_rate": 0.00013686917908569288, + "loss": 0.0381, "step": 168500 }, { - "epoch": 1.82, - "learning_rate": 2.6604581737945353e-05, - "loss": 0.0215, + "epoch": 1.09, + "learning_rate": 0.00013685949773133594, + "loss": 0.0368, "step": 168510 }, { - "epoch": 1.82, - "learning_rate": 2.65883574534363e-05, - "loss": 0.0276, + "epoch": 1.09, + "learning_rate": 0.00013684981637697902, + "loss": 0.0306, "step": 168520 }, { - "epoch": 1.82, - "learning_rate": 2.6572133168927246e-05, - "loss": 0.023, + "epoch": 1.09, + "learning_rate": 0.0001368401350226221, + "loss": 0.0299, "step": 168530 }, { - "epoch": 1.82, - "learning_rate": 2.6555908884418193e-05, - "loss": 0.0273, + "epoch": 1.09, + "learning_rate": 0.00013683045366826515, + "loss": 0.0346, "step": 168540 }, { - "epoch": 1.82, - "learning_rate": 2.653968459990914e-05, - "loss": 0.0261, + "epoch": 1.09, + "learning_rate": 0.00013682077231390823, + "loss": 0.034, "step": 168550 }, { - "epoch": 1.82, - "learning_rate": 2.652346031540009e-05, - "loss": 0.0232, + "epoch": 1.09, + "learning_rate": 0.00013681109095955128, + "loss": 0.0348, "step": 168560 }, { - "epoch": 1.82, - "learning_rate": 2.6507236030891035e-05, - "loss": 0.0248, + "epoch": 1.09, + "learning_rate": 0.00013680140960519436, + "loss": 0.0326, "step": 168570 }, { - "epoch": 1.82, - "learning_rate": 2.649101174638198e-05, - "loss": 0.0273, + "epoch": 1.09, + "learning_rate": 0.0001367917282508374, + "loss": 0.0326, "step": 168580 }, { - "epoch": 1.82, - "learning_rate": 2.6474787461872928e-05, - "loss": 0.0254, + "epoch": 1.09, + "learning_rate": 0.0001367820468964805, + "loss": 0.0347, "step": 168590 }, { - "epoch": 1.82, - "learning_rate": 2.6458563177363874e-05, - "loss": 0.0252, + "epoch": 1.09, + "learning_rate": 0.00013677236554212357, + "loss": 0.0486, "step": 168600 }, { - "epoch": 1.82, - "learning_rate": 2.644233889285482e-05, - "loss": 0.0245, + "epoch": 1.09, + "learning_rate": 0.00013676268418776663, + "loss": 0.0364, "step": 168610 }, { - "epoch": 1.82, - "learning_rate": 2.6426114608345767e-05, - "loss": 0.0212, + "epoch": 1.09, + "learning_rate": 0.0001367530028334097, + "loss": 0.0375, "step": 168620 }, { - "epoch": 1.82, - "learning_rate": 2.6409890323836713e-05, - "loss": 0.0245, + "epoch": 1.09, + "learning_rate": 0.00013674332147905276, + "loss": 0.0357, "step": 168630 }, { - "epoch": 1.82, - "learning_rate": 2.639366603932766e-05, - "loss": 0.0287, + "epoch": 1.09, + "learning_rate": 0.00013673364012469584, + "loss": 0.0381, "step": 168640 }, { - "epoch": 1.82, - "learning_rate": 2.637744175481861e-05, - "loss": 0.0277, + "epoch": 1.09, + "learning_rate": 0.0001367239587703389, + "loss": 0.0317, "step": 168650 }, { - "epoch": 1.82, - "learning_rate": 2.636121747030956e-05, - "loss": 0.0267, + "epoch": 1.09, + "learning_rate": 0.00013671427741598197, + "loss": 0.0312, "step": 168660 }, { - "epoch": 1.82, - "learning_rate": 2.6344993185800506e-05, - "loss": 0.0259, + "epoch": 1.09, + "learning_rate": 0.00013670459606162505, + "loss": 0.0335, "step": 168670 }, { - "epoch": 1.82, - "learning_rate": 2.6328768901291452e-05, - "loss": 0.0238, + "epoch": 1.09, + "learning_rate": 0.0001366949147072681, + "loss": 0.0325, "step": 168680 }, { - "epoch": 1.82, - "learning_rate": 2.63125446167824e-05, - "loss": 0.0223, + "epoch": 1.09, + "learning_rate": 0.00013668523335291116, + "loss": 0.0338, "step": 168690 }, { - "epoch": 1.82, - "learning_rate": 2.6296320332273345e-05, - "loss": 0.0269, + "epoch": 1.09, + "learning_rate": 0.00013667555199855424, + "loss": 0.0318, "step": 168700 }, { - "epoch": 1.82, - "learning_rate": 2.6280096047764295e-05, - "loss": 0.0237, + "epoch": 1.09, + "learning_rate": 0.00013666587064419731, + "loss": 0.0339, "step": 168710 }, { - "epoch": 1.82, - "learning_rate": 2.626387176325524e-05, - "loss": 0.0257, + "epoch": 1.09, + "learning_rate": 0.00013665618928984037, + "loss": 0.0305, "step": 168720 }, { - "epoch": 1.82, - "learning_rate": 2.6247647478746187e-05, - "loss": 0.028, + "epoch": 1.09, + "learning_rate": 0.00013664650793548345, + "loss": 0.0352, "step": 168730 }, { - "epoch": 1.83, - "learning_rate": 2.6231423194237134e-05, - "loss": 0.0262, + "epoch": 1.09, + "learning_rate": 0.0001366368265811265, + "loss": 0.0374, "step": 168740 }, { - "epoch": 1.83, - "learning_rate": 2.621519890972808e-05, - "loss": 0.0237, + "epoch": 1.09, + "learning_rate": 0.00013662714522676958, + "loss": 0.0331, "step": 168750 }, { - "epoch": 1.83, - "learning_rate": 2.6198974625219027e-05, - "loss": 0.0327, + "epoch": 1.09, + "learning_rate": 0.00013661746387241263, + "loss": 0.0339, "step": 168760 }, { - "epoch": 1.83, - "learning_rate": 2.6182750340709973e-05, - "loss": 0.0285, + "epoch": 1.09, + "learning_rate": 0.0001366077825180557, + "loss": 0.0344, "step": 168770 }, { - "epoch": 1.83, - "learning_rate": 2.616652605620092e-05, - "loss": 0.0222, + "epoch": 1.09, + "learning_rate": 0.0001365981011636988, + "loss": 0.0322, "step": 168780 }, { - "epoch": 1.83, - "learning_rate": 2.6150301771691866e-05, - "loss": 0.0232, + "epoch": 1.09, + "learning_rate": 0.00013658841980934184, + "loss": 0.0329, "step": 168790 }, { - "epoch": 1.83, - "learning_rate": 2.6134077487182816e-05, - "loss": 0.0244, + "epoch": 1.09, + "learning_rate": 0.00013657873845498492, + "loss": 0.0415, "step": 168800 }, { - "epoch": 1.83, - "learning_rate": 2.6117853202673762e-05, - "loss": 0.027, + "epoch": 1.09, + "learning_rate": 0.00013656905710062798, + "loss": 0.0363, "step": 168810 }, { - "epoch": 1.83, - "learning_rate": 2.6101628918164708e-05, - "loss": 0.0246, + "epoch": 1.09, + "learning_rate": 0.00013655937574627106, + "loss": 0.0359, "step": 168820 }, { - "epoch": 1.83, - "learning_rate": 2.6085404633655655e-05, - "loss": 0.0217, + "epoch": 1.09, + "learning_rate": 0.0001365496943919141, + "loss": 0.0304, "step": 168830 }, { - "epoch": 1.83, - "learning_rate": 2.60691803491466e-05, - "loss": 0.0244, + "epoch": 1.09, + "learning_rate": 0.0001365400130375572, + "loss": 0.0377, "step": 168840 }, { - "epoch": 1.83, - "learning_rate": 2.6052956064637547e-05, - "loss": 0.023, + "epoch": 1.09, + "learning_rate": 0.00013653033168320027, + "loss": 0.0289, "step": 168850 }, { - "epoch": 1.83, - "learning_rate": 2.6036731780128494e-05, - "loss": 0.0272, + "epoch": 1.09, + "learning_rate": 0.00013652065032884332, + "loss": 0.0347, "step": 168860 }, { - "epoch": 1.83, - "learning_rate": 2.602050749561944e-05, - "loss": 0.0285, + "epoch": 1.09, + "learning_rate": 0.0001365109689744864, + "loss": 0.0384, "step": 168870 }, { - "epoch": 1.83, - "learning_rate": 2.6004283211110387e-05, - "loss": 0.0239, + "epoch": 1.09, + "learning_rate": 0.00013650128762012945, + "loss": 0.0294, "step": 168880 }, { - "epoch": 1.83, - "learning_rate": 2.5988058926601336e-05, - "loss": 0.0262, + "epoch": 1.09, + "learning_rate": 0.00013649160626577253, + "loss": 0.0401, "step": 168890 }, { - "epoch": 1.83, - "learning_rate": 2.5971834642092283e-05, - "loss": 0.0233, + "epoch": 1.09, + "learning_rate": 0.0001364819249114156, + "loss": 0.0321, "step": 168900 }, { - "epoch": 1.83, - "learning_rate": 2.595561035758323e-05, - "loss": 0.0255, + "epoch": 1.09, + "learning_rate": 0.00013647224355705867, + "loss": 0.0386, "step": 168910 }, { - "epoch": 1.83, - "learning_rate": 2.5939386073074175e-05, - "loss": 0.0266, + "epoch": 1.09, + "learning_rate": 0.00013646256220270175, + "loss": 0.0304, "step": 168920 }, { - "epoch": 1.83, - "learning_rate": 2.5923161788565122e-05, - "loss": 0.0245, + "epoch": 1.09, + "learning_rate": 0.0001364528808483448, + "loss": 0.0364, "step": 168930 }, { - "epoch": 1.83, - "learning_rate": 2.5906937504056068e-05, - "loss": 0.0237, + "epoch": 1.09, + "learning_rate": 0.00013644319949398785, + "loss": 0.0349, "step": 168940 }, { - "epoch": 1.83, - "learning_rate": 2.5890713219547015e-05, - "loss": 0.0327, + "epoch": 1.09, + "learning_rate": 0.00013643351813963093, + "loss": 0.0346, "step": 168950 }, { - "epoch": 1.83, - "learning_rate": 2.587448893503796e-05, - "loss": 0.0213, + "epoch": 1.09, + "learning_rate": 0.000136423836785274, + "loss": 0.029, "step": 168960 }, { - "epoch": 1.83, - "learning_rate": 2.585826465052891e-05, - "loss": 0.0287, + "epoch": 1.09, + "learning_rate": 0.00013641415543091706, + "loss": 0.0307, "step": 168970 }, { - "epoch": 1.83, - "learning_rate": 2.5842040366019857e-05, - "loss": 0.0258, + "epoch": 1.09, + "learning_rate": 0.00013640447407656014, + "loss": 0.031, "step": 168980 }, { - "epoch": 1.83, - "learning_rate": 2.5825816081510804e-05, - "loss": 0.023, + "epoch": 1.09, + "learning_rate": 0.00013639479272220322, + "loss": 0.0345, "step": 168990 }, { - "epoch": 1.83, - "learning_rate": 2.580959179700175e-05, - "loss": 0.0256, + "epoch": 1.09, + "learning_rate": 0.00013638511136784628, + "loss": 0.0345, "step": 169000 }, { - "epoch": 1.83, - "eval_cer": 0.9211092675738284, - "eval_loss": 0.020907822996377945, - "eval_runtime": 119.2241, - "eval_samples_per_second": 16.775, - "eval_steps_per_second": 4.194, + "epoch": 1.09, + "eval_cer": 0.9198879222686702, + "eval_loss": 0.0242831502109766, + "eval_runtime": 120.0326, + "eval_samples_per_second": 16.662, + "eval_steps_per_second": 4.166, "step": 169000 }, { - "epoch": 1.83, - "learning_rate": 2.5793367512492696e-05, - "loss": 0.0256, + "epoch": 1.09, + "learning_rate": 0.00013637543001348933, + "loss": 0.0327, "step": 169010 }, { - "epoch": 1.83, - "learning_rate": 2.5777143227983643e-05, - "loss": 0.0226, + "epoch": 1.09, + "learning_rate": 0.0001363657486591324, + "loss": 0.0332, "step": 169020 }, { - "epoch": 1.83, - "learning_rate": 2.576091894347459e-05, - "loss": 0.0233, + "epoch": 1.09, + "learning_rate": 0.0001363560673047755, + "loss": 0.0379, "step": 169030 }, { - "epoch": 1.83, - "learning_rate": 2.5744694658965535e-05, - "loss": 0.0227, + "epoch": 1.09, + "learning_rate": 0.00013634638595041854, + "loss": 0.0331, "step": 169040 }, { - "epoch": 1.83, - "learning_rate": 2.5728470374456482e-05, - "loss": 0.0259, + "epoch": 1.09, + "learning_rate": 0.00013633670459606162, + "loss": 0.0326, "step": 169050 }, { - "epoch": 1.83, - "learning_rate": 2.571224608994743e-05, - "loss": 0.0248, + "epoch": 1.09, + "learning_rate": 0.00013632702324170467, + "loss": 0.0342, "step": 169060 }, { - "epoch": 1.83, - "learning_rate": 2.5696021805438378e-05, - "loss": 0.0262, + "epoch": 1.09, + "learning_rate": 0.00013631734188734775, + "loss": 0.035, "step": 169070 }, { - "epoch": 1.83, - "learning_rate": 2.5679797520929324e-05, - "loss": 0.0235, + "epoch": 1.09, + "learning_rate": 0.0001363076605329908, + "loss": 0.0402, "step": 169080 }, { - "epoch": 1.83, - "learning_rate": 2.566357323642027e-05, - "loss": 0.0195, + "epoch": 1.09, + "learning_rate": 0.00013629797917863389, + "loss": 0.0369, "step": 169090 }, { - "epoch": 1.83, - "learning_rate": 2.5647348951911217e-05, - "loss": 0.0237, + "epoch": 1.09, + "learning_rate": 0.00013628829782427697, + "loss": 0.0314, "step": 169100 }, { - "epoch": 1.83, - "learning_rate": 2.5631124667402164e-05, - "loss": 0.0266, + "epoch": 1.09, + "learning_rate": 0.00013627861646992002, + "loss": 0.0357, "step": 169110 }, { - "epoch": 1.83, - "learning_rate": 2.561490038289311e-05, - "loss": 0.0259, + "epoch": 1.09, + "learning_rate": 0.0001362689351155631, + "loss": 0.0285, "step": 169120 }, { - "epoch": 1.83, - "learning_rate": 2.5598676098384056e-05, - "loss": 0.0242, + "epoch": 1.09, + "learning_rate": 0.00013625925376120615, + "loss": 0.0357, "step": 169130 }, { - "epoch": 1.83, - "learning_rate": 2.5582451813875006e-05, - "loss": 0.0254, + "epoch": 1.09, + "learning_rate": 0.0001362495724068492, + "loss": 0.0357, "step": 169140 }, { - "epoch": 1.83, - "learning_rate": 2.5566227529365952e-05, - "loss": 0.0189, + "epoch": 1.09, + "learning_rate": 0.00013623989105249228, + "loss": 0.0314, "step": 169150 }, { - "epoch": 1.83, - "learning_rate": 2.55500032448569e-05, - "loss": 0.0248, + "epoch": 1.09, + "learning_rate": 0.00013623020969813536, + "loss": 0.034, "step": 169160 }, { - "epoch": 1.83, - "learning_rate": 2.5533778960347845e-05, - "loss": 0.0245, + "epoch": 1.09, + "learning_rate": 0.00013622052834377844, + "loss": 0.0275, "step": 169170 }, { - "epoch": 1.83, - "learning_rate": 2.551755467583879e-05, - "loss": 0.0227, + "epoch": 1.09, + "learning_rate": 0.0001362108469894215, + "loss": 0.0358, "step": 169180 }, { - "epoch": 1.83, - "learning_rate": 2.5501330391329738e-05, - "loss": 0.0239, + "epoch": 1.09, + "learning_rate": 0.00013620116563506458, + "loss": 0.0365, "step": 169190 }, { - "epoch": 1.83, - "learning_rate": 2.5485106106820684e-05, - "loss": 0.0255, + "epoch": 1.09, + "learning_rate": 0.00013619148428070763, + "loss": 0.0341, "step": 169200 }, { - "epoch": 1.83, - "learning_rate": 2.546888182231163e-05, - "loss": 0.0227, + "epoch": 1.09, + "learning_rate": 0.00013618180292635068, + "loss": 0.035, "step": 169210 }, { - "epoch": 1.83, - "learning_rate": 2.5452657537802577e-05, - "loss": 0.0293, + "epoch": 1.09, + "learning_rate": 0.00013617212157199376, + "loss": 0.032, "step": 169220 }, { - "epoch": 1.83, - "learning_rate": 2.5436433253293527e-05, - "loss": 0.0286, + "epoch": 1.09, + "learning_rate": 0.00013616244021763684, + "loss": 0.0356, "step": 169230 }, { - "epoch": 1.83, - "learning_rate": 2.5420208968784473e-05, - "loss": 0.0234, + "epoch": 1.09, + "learning_rate": 0.00013615275886327992, + "loss": 0.0314, "step": 169240 }, { - "epoch": 1.83, - "learning_rate": 2.5403984684275423e-05, - "loss": 0.0255, + "epoch": 1.09, + "learning_rate": 0.00013614307750892297, + "loss": 0.0359, "step": 169250 }, { - "epoch": 1.83, - "learning_rate": 2.538776039976637e-05, - "loss": 0.0267, + "epoch": 1.09, + "learning_rate": 0.00013613339615456603, + "loss": 0.0381, "step": 169260 }, { - "epoch": 1.83, - "learning_rate": 2.5371536115257316e-05, - "loss": 0.0274, + "epoch": 1.09, + "learning_rate": 0.0001361237148002091, + "loss": 0.0356, "step": 169270 }, { - "epoch": 1.83, - "learning_rate": 2.5355311830748262e-05, - "loss": 0.0224, + "epoch": 1.09, + "learning_rate": 0.00013611403344585216, + "loss": 0.0323, "step": 169280 }, { - "epoch": 1.83, - "learning_rate": 2.5339087546239212e-05, - "loss": 0.0214, + "epoch": 1.09, + "learning_rate": 0.00013610435209149524, + "loss": 0.0299, "step": 169290 }, { - "epoch": 1.83, - "learning_rate": 2.532286326173016e-05, - "loss": 0.0256, + "epoch": 1.09, + "learning_rate": 0.00013609467073713832, + "loss": 0.0361, "step": 169300 }, { - "epoch": 1.83, - "learning_rate": 2.5306638977221105e-05, - "loss": 0.0279, + "epoch": 1.09, + "learning_rate": 0.0001360849893827814, + "loss": 0.0311, "step": 169310 }, { - "epoch": 1.83, - "learning_rate": 2.529041469271205e-05, - "loss": 0.0202, + "epoch": 1.09, + "learning_rate": 0.00013607530802842445, + "loss": 0.0301, "step": 169320 }, { - "epoch": 1.83, - "learning_rate": 2.5274190408202998e-05, - "loss": 0.022, + "epoch": 1.09, + "learning_rate": 0.0001360656266740675, + "loss": 0.0369, "step": 169330 }, { - "epoch": 1.83, - "learning_rate": 2.5257966123693944e-05, - "loss": 0.0262, + "epoch": 1.09, + "learning_rate": 0.00013605594531971058, + "loss": 0.0322, "step": 169340 }, { - "epoch": 1.83, - "learning_rate": 2.524174183918489e-05, - "loss": 0.021, + "epoch": 1.09, + "learning_rate": 0.00013604626396535364, + "loss": 0.0368, "step": 169350 }, { - "epoch": 1.83, - "learning_rate": 2.5225517554675837e-05, - "loss": 0.0287, + "epoch": 1.09, + "learning_rate": 0.00013603658261099672, + "loss": 0.0384, "step": 169360 }, { - "epoch": 1.83, - "learning_rate": 2.5209293270166783e-05, - "loss": 0.0228, + "epoch": 1.09, + "learning_rate": 0.0001360269012566398, + "loss": 0.0302, "step": 169370 }, { - "epoch": 1.83, - "learning_rate": 2.5193068985657733e-05, - "loss": 0.0288, + "epoch": 1.09, + "learning_rate": 0.00013601721990228285, + "loss": 0.031, "step": 169380 }, { - "epoch": 1.83, - "learning_rate": 2.517684470114868e-05, - "loss": 0.0249, + "epoch": 1.09, + "learning_rate": 0.00013600753854792593, + "loss": 0.0363, "step": 169390 }, { - "epoch": 1.83, - "learning_rate": 2.5160620416639626e-05, - "loss": 0.0218, + "epoch": 1.09, + "learning_rate": 0.00013599785719356898, + "loss": 0.0326, "step": 169400 }, { - "epoch": 1.83, - "learning_rate": 2.5144396132130572e-05, - "loss": 0.0235, + "epoch": 1.09, + "learning_rate": 0.00013598817583921206, + "loss": 0.0305, "step": 169410 }, { - "epoch": 1.83, - "learning_rate": 2.512817184762152e-05, - "loss": 0.0312, + "epoch": 1.09, + "learning_rate": 0.0001359784944848551, + "loss": 0.037, "step": 169420 }, { - "epoch": 1.83, - "learning_rate": 2.5111947563112465e-05, - "loss": 0.0269, + "epoch": 1.09, + "learning_rate": 0.0001359688131304982, + "loss": 0.0318, "step": 169430 }, { - "epoch": 1.83, - "learning_rate": 2.509572327860341e-05, - "loss": 0.0327, + "epoch": 1.09, + "learning_rate": 0.00013595913177614127, + "loss": 0.0275, "step": 169440 }, { - "epoch": 1.83, - "learning_rate": 2.5079498994094357e-05, - "loss": 0.0244, + "epoch": 1.09, + "learning_rate": 0.00013594945042178433, + "loss": 0.0314, "step": 169450 }, { - "epoch": 1.83, - "learning_rate": 2.5063274709585307e-05, - "loss": 0.0255, + "epoch": 1.09, + "learning_rate": 0.00013593976906742738, + "loss": 0.033, "step": 169460 }, { - "epoch": 1.83, - "learning_rate": 2.5047050425076254e-05, - "loss": 0.0194, + "epoch": 1.09, + "learning_rate": 0.00013593008771307046, + "loss": 0.0343, "step": 169470 }, { - "epoch": 1.83, - "learning_rate": 2.50308261405672e-05, - "loss": 0.0255, + "epoch": 1.09, + "learning_rate": 0.00013592040635871354, + "loss": 0.03, "step": 169480 }, { - "epoch": 1.83, - "learning_rate": 2.5014601856058146e-05, - "loss": 0.0271, + "epoch": 1.09, + "learning_rate": 0.0001359107250043566, + "loss": 0.0342, "step": 169490 }, { - "epoch": 1.83, - "learning_rate": 2.4998377571549093e-05, - "loss": 0.0299, + "epoch": 1.09, + "learning_rate": 0.00013590104364999967, + "loss": 0.0334, "step": 169500 }, { - "epoch": 1.83, - "learning_rate": 2.498215328704004e-05, - "loss": 0.0231, + "epoch": 1.09, + "learning_rate": 0.00013589136229564275, + "loss": 0.0363, "step": 169510 }, { - "epoch": 1.83, - "learning_rate": 2.4965929002530986e-05, - "loss": 0.0236, + "epoch": 1.09, + "learning_rate": 0.0001358816809412858, + "loss": 0.0346, "step": 169520 }, { - "epoch": 1.83, - "learning_rate": 2.4949704718021932e-05, - "loss": 0.0279, + "epoch": 1.09, + "learning_rate": 0.00013587199958692885, + "loss": 0.0286, "step": 169530 }, { - "epoch": 1.83, - "learning_rate": 2.493348043351288e-05, - "loss": 0.0273, + "epoch": 1.09, + "learning_rate": 0.00013586231823257193, + "loss": 0.0296, "step": 169540 }, { - "epoch": 1.83, - "learning_rate": 2.4917256149003828e-05, - "loss": 0.0237, + "epoch": 1.09, + "learning_rate": 0.00013585263687821501, + "loss": 0.0307, "step": 169550 }, { - "epoch": 1.83, - "learning_rate": 2.4901031864494774e-05, - "loss": 0.0244, + "epoch": 1.09, + "learning_rate": 0.00013584295552385807, + "loss": 0.0324, "step": 169560 }, { - "epoch": 1.83, - "learning_rate": 2.488480757998572e-05, - "loss": 0.0244, + "epoch": 1.09, + "learning_rate": 0.00013583327416950115, + "loss": 0.031, "step": 169570 }, { - "epoch": 1.83, - "learning_rate": 2.4868583295476667e-05, - "loss": 0.0225, + "epoch": 1.09, + "learning_rate": 0.0001358235928151442, + "loss": 0.0347, "step": 169580 }, { - "epoch": 1.83, - "learning_rate": 2.4852359010967614e-05, - "loss": 0.0257, + "epoch": 1.09, + "learning_rate": 0.00013581391146078728, + "loss": 0.037, "step": 169590 }, { - "epoch": 1.83, - "learning_rate": 2.483613472645856e-05, - "loss": 0.0229, + "epoch": 1.09, + "learning_rate": 0.00013580423010643033, + "loss": 0.0319, "step": 169600 }, { - "epoch": 1.83, - "learning_rate": 2.4819910441949506e-05, - "loss": 0.0228, + "epoch": 1.09, + "learning_rate": 0.0001357945487520734, + "loss": 0.0367, "step": 169610 }, { - "epoch": 1.83, - "learning_rate": 2.4803686157440453e-05, - "loss": 0.0253, + "epoch": 1.09, + "learning_rate": 0.0001357848673977165, + "loss": 0.0363, "step": 169620 }, { - "epoch": 1.83, - "learning_rate": 2.4787461872931403e-05, - "loss": 0.0252, + "epoch": 1.09, + "learning_rate": 0.00013577518604335954, + "loss": 0.0409, "step": 169630 }, { - "epoch": 1.83, - "learning_rate": 2.477123758842235e-05, - "loss": 0.0253, + "epoch": 1.09, + "learning_rate": 0.00013576550468900262, + "loss": 0.0356, "step": 169640 }, { - "epoch": 1.83, - "learning_rate": 2.4755013303913295e-05, - "loss": 0.027, + "epoch": 1.09, + "learning_rate": 0.00013575582333464568, + "loss": 0.0358, "step": 169650 }, { - "epoch": 1.84, - "learning_rate": 2.473878901940424e-05, - "loss": 0.0266, + "epoch": 1.1, + "learning_rate": 0.00013574614198028876, + "loss": 0.0378, "step": 169660 }, { - "epoch": 1.84, - "learning_rate": 2.4722564734895188e-05, - "loss": 0.0249, + "epoch": 1.1, + "learning_rate": 0.0001357364606259318, + "loss": 0.0391, "step": 169670 }, { - "epoch": 1.84, - "learning_rate": 2.4706340450386134e-05, - "loss": 0.0253, + "epoch": 1.1, + "learning_rate": 0.0001357267792715749, + "loss": 0.035, "step": 169680 }, { - "epoch": 1.84, - "learning_rate": 2.469011616587708e-05, - "loss": 0.0223, + "epoch": 1.1, + "learning_rate": 0.00013571709791721797, + "loss": 0.0315, "step": 169690 }, { - "epoch": 1.84, - "learning_rate": 2.4673891881368027e-05, - "loss": 0.0272, + "epoch": 1.1, + "learning_rate": 0.00013570741656286102, + "loss": 0.0344, "step": 169700 }, { - "epoch": 1.84, - "learning_rate": 2.4657667596858974e-05, - "loss": 0.0304, + "epoch": 1.1, + "learning_rate": 0.0001356977352085041, + "loss": 0.0352, "step": 169710 }, { - "epoch": 1.84, - "learning_rate": 2.4641443312349923e-05, - "loss": 0.0234, + "epoch": 1.1, + "learning_rate": 0.00013568805385414715, + "loss": 0.0336, "step": 169720 }, { - "epoch": 1.84, - "learning_rate": 2.462521902784087e-05, - "loss": 0.0321, + "epoch": 1.1, + "learning_rate": 0.00013567837249979023, + "loss": 0.0382, "step": 169730 }, { - "epoch": 1.84, - "learning_rate": 2.4608994743331816e-05, - "loss": 0.0266, + "epoch": 1.1, + "learning_rate": 0.0001356686911454333, + "loss": 0.0329, "step": 169740 }, { - "epoch": 1.84, - "learning_rate": 2.4592770458822763e-05, - "loss": 0.0232, + "epoch": 1.1, + "learning_rate": 0.00013565900979107637, + "loss": 0.032, "step": 169750 }, { - "epoch": 1.84, - "learning_rate": 2.457654617431371e-05, - "loss": 0.029, + "epoch": 1.1, + "learning_rate": 0.00013564932843671945, + "loss": 0.0374, "step": 169760 }, { - "epoch": 1.84, - "learning_rate": 2.4560321889804655e-05, - "loss": 0.0223, + "epoch": 1.1, + "learning_rate": 0.0001356396470823625, + "loss": 0.0308, "step": 169770 }, { - "epoch": 1.84, - "learning_rate": 2.45440976052956e-05, - "loss": 0.0204, + "epoch": 1.1, + "learning_rate": 0.00013562996572800555, + "loss": 0.0313, "step": 169780 }, { - "epoch": 1.84, - "learning_rate": 2.4527873320786548e-05, - "loss": 0.0225, + "epoch": 1.1, + "learning_rate": 0.00013562028437364863, + "loss": 0.0321, "step": 169790 }, { - "epoch": 1.84, - "learning_rate": 2.4511649036277498e-05, - "loss": 0.0259, + "epoch": 1.1, + "learning_rate": 0.0001356106030192917, + "loss": 0.0334, "step": 169800 }, { - "epoch": 1.84, - "learning_rate": 2.4495424751768444e-05, - "loss": 0.022, + "epoch": 1.1, + "learning_rate": 0.00013560092166493476, + "loss": 0.0335, "step": 169810 }, { - "epoch": 1.84, - "learning_rate": 2.447920046725939e-05, - "loss": 0.0296, + "epoch": 1.1, + "learning_rate": 0.00013559124031057784, + "loss": 0.0359, "step": 169820 }, { - "epoch": 1.84, - "learning_rate": 2.4462976182750337e-05, - "loss": 0.0243, + "epoch": 1.1, + "learning_rate": 0.0001355815589562209, + "loss": 0.0349, "step": 169830 }, { - "epoch": 1.84, - "learning_rate": 2.4446751898241287e-05, - "loss": 0.0213, + "epoch": 1.1, + "learning_rate": 0.00013557187760186398, + "loss": 0.0385, "step": 169840 }, { - "epoch": 1.84, - "learning_rate": 2.4430527613732233e-05, - "loss": 0.0254, + "epoch": 1.1, + "learning_rate": 0.00013556219624750703, + "loss": 0.0337, "step": 169850 }, { - "epoch": 1.84, - "learning_rate": 2.441430332922318e-05, - "loss": 0.0245, + "epoch": 1.1, + "learning_rate": 0.0001355525148931501, + "loss": 0.0369, "step": 169860 }, { - "epoch": 1.84, - "learning_rate": 2.439807904471413e-05, - "loss": 0.0255, + "epoch": 1.1, + "learning_rate": 0.0001355428335387932, + "loss": 0.034, "step": 169870 }, { - "epoch": 1.84, - "learning_rate": 2.4381854760205076e-05, - "loss": 0.0249, - "step": 169880 + "epoch": 1.1, + "learning_rate": 0.00013553315218443624, + "loss": 0.0321, + "step": 169880 }, { - "epoch": 1.84, - "learning_rate": 2.4365630475696022e-05, - "loss": 0.026, + "epoch": 1.1, + "learning_rate": 0.00013552347083007932, + "loss": 0.0295, "step": 169890 }, { - "epoch": 1.84, - "learning_rate": 2.434940619118697e-05, - "loss": 0.0302, + "epoch": 1.1, + "learning_rate": 0.00013551378947572237, + "loss": 0.0397, "step": 169900 }, { - "epoch": 1.84, - "learning_rate": 2.4333181906677915e-05, - "loss": 0.0227, + "epoch": 1.1, + "learning_rate": 0.00013550410812136545, + "loss": 0.0299, "step": 169910 }, { - "epoch": 1.84, - "learning_rate": 2.431695762216886e-05, - "loss": 0.0271, + "epoch": 1.1, + "learning_rate": 0.0001354944267670085, + "loss": 0.0391, "step": 169920 }, { - "epoch": 1.84, - "learning_rate": 2.4300733337659808e-05, - "loss": 0.0237, + "epoch": 1.1, + "learning_rate": 0.00013548474541265159, + "loss": 0.0381, "step": 169930 }, { - "epoch": 1.84, - "learning_rate": 2.4284509053150754e-05, - "loss": 0.0243, + "epoch": 1.1, + "learning_rate": 0.00013547506405829467, + "loss": 0.037, "step": 169940 }, { - "epoch": 1.84, - "learning_rate": 2.42682847686417e-05, - "loss": 0.0319, + "epoch": 1.1, + "learning_rate": 0.00013546538270393772, + "loss": 0.0291, "step": 169950 }, { - "epoch": 1.84, - "learning_rate": 2.425206048413265e-05, - "loss": 0.026, + "epoch": 1.1, + "learning_rate": 0.0001354557013495808, + "loss": 0.0314, "step": 169960 }, { - "epoch": 1.84, - "learning_rate": 2.4235836199623596e-05, - "loss": 0.0205, + "epoch": 1.1, + "learning_rate": 0.00013544601999522385, + "loss": 0.0286, "step": 169970 }, { - "epoch": 1.84, - "learning_rate": 2.4219611915114543e-05, - "loss": 0.0285, + "epoch": 1.1, + "learning_rate": 0.0001354363386408669, + "loss": 0.0317, "step": 169980 }, { - "epoch": 1.84, - "learning_rate": 2.420338763060549e-05, - "loss": 0.0276, + "epoch": 1.1, + "learning_rate": 0.00013542665728650998, + "loss": 0.0413, "step": 169990 }, { - "epoch": 1.84, - "learning_rate": 2.4187163346096436e-05, - "loss": 0.0234, + "epoch": 1.1, + "learning_rate": 0.00013541697593215306, + "loss": 0.0341, "step": 170000 }, { - "epoch": 1.84, - "eval_cer": 0.9210562585145802, - "eval_loss": 0.020689187571406364, - "eval_runtime": 119.1219, - "eval_samples_per_second": 16.79, - "eval_steps_per_second": 4.197, + "epoch": 1.1, + "eval_cer": 0.9198942492373743, + "eval_loss": 0.024668850004673004, + "eval_runtime": 120.0558, + "eval_samples_per_second": 16.659, + "eval_steps_per_second": 4.165, "step": 170000 }, { - "epoch": 1.84, - "learning_rate": 2.4170939061587382e-05, - "loss": 0.0296, + "epoch": 1.1, + "learning_rate": 0.00013540729457779614, + "loss": 0.0414, "step": 170010 }, { - "epoch": 1.84, - "learning_rate": 2.415471477707833e-05, - "loss": 0.0257, + "epoch": 1.1, + "learning_rate": 0.0001353976132234392, + "loss": 0.0341, "step": 170020 }, { - "epoch": 1.84, - "learning_rate": 2.4138490492569275e-05, - "loss": 0.0249, + "epoch": 1.1, + "learning_rate": 0.00013538793186908225, + "loss": 0.0359, "step": 170030 }, { - "epoch": 1.84, - "learning_rate": 2.4122266208060225e-05, - "loss": 0.0256, + "epoch": 1.1, + "learning_rate": 0.00013537825051472533, + "loss": 0.0384, "step": 170040 }, { - "epoch": 1.84, - "learning_rate": 2.410604192355117e-05, - "loss": 0.0262, + "epoch": 1.1, + "learning_rate": 0.00013536856916036838, + "loss": 0.0321, "step": 170050 }, { - "epoch": 1.84, - "learning_rate": 2.4089817639042117e-05, - "loss": 0.0226, + "epoch": 1.1, + "learning_rate": 0.00013535888780601146, + "loss": 0.0336, "step": 170060 }, { - "epoch": 1.84, - "learning_rate": 2.4073593354533064e-05, - "loss": 0.025, + "epoch": 1.1, + "learning_rate": 0.00013534920645165454, + "loss": 0.0315, "step": 170070 }, { - "epoch": 1.84, - "learning_rate": 2.405736907002401e-05, - "loss": 0.0271, + "epoch": 1.1, + "learning_rate": 0.00013533952509729762, + "loss": 0.042, "step": 170080 }, { - "epoch": 1.84, - "learning_rate": 2.4041144785514956e-05, - "loss": 0.0247, + "epoch": 1.1, + "learning_rate": 0.00013532984374294067, + "loss": 0.0338, "step": 170090 }, { - "epoch": 1.84, - "learning_rate": 2.4024920501005903e-05, - "loss": 0.0238, + "epoch": 1.1, + "learning_rate": 0.00013532016238858373, + "loss": 0.033, "step": 170100 }, { - "epoch": 1.84, - "learning_rate": 2.400869621649685e-05, - "loss": 0.023, + "epoch": 1.1, + "learning_rate": 0.0001353104810342268, + "loss": 0.0316, "step": 170110 }, { - "epoch": 1.84, - "learning_rate": 2.3992471931987796e-05, - "loss": 0.0225, + "epoch": 1.1, + "learning_rate": 0.00013530079967986986, + "loss": 0.0311, "step": 170120 }, { - "epoch": 1.84, - "learning_rate": 2.3976247647478745e-05, - "loss": 0.0259, + "epoch": 1.1, + "learning_rate": 0.00013529111832551294, + "loss": 0.0338, "step": 170130 }, { - "epoch": 1.84, - "learning_rate": 2.3960023362969692e-05, - "loss": 0.028, + "epoch": 1.1, + "learning_rate": 0.00013528143697115602, + "loss": 0.0346, "step": 170140 }, { - "epoch": 1.84, - "learning_rate": 2.3943799078460638e-05, - "loss": 0.0224, + "epoch": 1.1, + "learning_rate": 0.00013527175561679907, + "loss": 0.0355, "step": 170150 }, { - "epoch": 1.84, - "learning_rate": 2.3927574793951585e-05, - "loss": 0.0218, + "epoch": 1.1, + "learning_rate": 0.00013526207426244215, + "loss": 0.0343, "step": 170160 }, { - "epoch": 1.84, - "learning_rate": 2.391135050944253e-05, - "loss": 0.025, + "epoch": 1.1, + "learning_rate": 0.0001352523929080852, + "loss": 0.0349, "step": 170170 }, { - "epoch": 1.84, - "learning_rate": 2.3895126224933477e-05, - "loss": 0.0287, + "epoch": 1.1, + "learning_rate": 0.00013524271155372828, + "loss": 0.0359, "step": 170180 }, { - "epoch": 1.84, - "learning_rate": 2.3878901940424424e-05, - "loss": 0.0262, + "epoch": 1.1, + "learning_rate": 0.00013523303019937134, + "loss": 0.032, "step": 170190 }, { - "epoch": 1.84, - "learning_rate": 2.386267765591537e-05, - "loss": 0.0217, + "epoch": 1.1, + "learning_rate": 0.00013522334884501441, + "loss": 0.0331, "step": 170200 }, { - "epoch": 1.84, - "learning_rate": 2.384645337140632e-05, - "loss": 0.0274, + "epoch": 1.1, + "learning_rate": 0.0001352136674906575, + "loss": 0.0293, "step": 170210 }, { - "epoch": 1.84, - "learning_rate": 2.3830229086897266e-05, - "loss": 0.0269, + "epoch": 1.1, + "learning_rate": 0.00013520398613630055, + "loss": 0.0307, "step": 170220 }, { - "epoch": 1.84, - "learning_rate": 2.3814004802388213e-05, - "loss": 0.0329, + "epoch": 1.1, + "learning_rate": 0.0001351943047819436, + "loss": 0.0314, "step": 170230 }, { - "epoch": 1.84, - "learning_rate": 2.379778051787916e-05, - "loss": 0.031, + "epoch": 1.1, + "learning_rate": 0.00013518462342758668, + "loss": 0.0328, "step": 170240 }, { - "epoch": 1.84, - "learning_rate": 2.3781556233370105e-05, - "loss": 0.0263, + "epoch": 1.1, + "learning_rate": 0.00013517494207322976, + "loss": 0.0348, "step": 170250 }, { - "epoch": 1.84, - "learning_rate": 2.3765331948861052e-05, - "loss": 0.0235, + "epoch": 1.1, + "learning_rate": 0.0001351652607188728, + "loss": 0.0382, "step": 170260 }, { - "epoch": 1.84, - "learning_rate": 2.3749107664351998e-05, - "loss": 0.0223, + "epoch": 1.1, + "learning_rate": 0.0001351555793645159, + "loss": 0.0326, "step": 170270 }, { - "epoch": 1.84, - "learning_rate": 2.3732883379842945e-05, - "loss": 0.0263, + "epoch": 1.1, + "learning_rate": 0.00013514589801015897, + "loss": 0.033, "step": 170280 }, { - "epoch": 1.84, - "learning_rate": 2.371665909533389e-05, - "loss": 0.0258, + "epoch": 1.1, + "learning_rate": 0.00013513621665580202, + "loss": 0.0333, "step": 170290 }, { - "epoch": 1.84, - "learning_rate": 2.370043481082484e-05, - "loss": 0.026, + "epoch": 1.1, + "learning_rate": 0.00013512653530144508, + "loss": 0.0358, "step": 170300 }, { - "epoch": 1.84, - "learning_rate": 2.3684210526315787e-05, - "loss": 0.0255, + "epoch": 1.1, + "learning_rate": 0.00013511685394708816, + "loss": 0.0347, "step": 170310 }, { - "epoch": 1.84, - "learning_rate": 2.3667986241806733e-05, - "loss": 0.0239, + "epoch": 1.1, + "learning_rate": 0.00013510717259273124, + "loss": 0.0336, "step": 170320 }, { - "epoch": 1.84, - "learning_rate": 2.365176195729768e-05, - "loss": 0.0253, + "epoch": 1.1, + "learning_rate": 0.0001350974912383743, + "loss": 0.0362, "step": 170330 }, { - "epoch": 1.84, - "learning_rate": 2.3635537672788626e-05, - "loss": 0.026, + "epoch": 1.1, + "learning_rate": 0.00013508780988401737, + "loss": 0.0345, "step": 170340 }, { - "epoch": 1.84, - "learning_rate": 2.3619313388279573e-05, - "loss": 0.0222, + "epoch": 1.1, + "learning_rate": 0.00013507812852966042, + "loss": 0.0308, "step": 170350 }, { - "epoch": 1.84, - "learning_rate": 2.360308910377052e-05, - "loss": 0.0218, + "epoch": 1.1, + "learning_rate": 0.0001350684471753035, + "loss": 0.0326, "step": 170360 }, { - "epoch": 1.84, - "learning_rate": 2.3586864819261465e-05, - "loss": 0.0285, + "epoch": 1.1, + "learning_rate": 0.00013505876582094655, + "loss": 0.0371, "step": 170370 }, { - "epoch": 1.84, - "learning_rate": 2.3570640534752415e-05, - "loss": 0.0243, + "epoch": 1.1, + "learning_rate": 0.00013504908446658963, + "loss": 0.0313, "step": 170380 }, { - "epoch": 1.84, - "learning_rate": 2.355441625024336e-05, - "loss": 0.0253, + "epoch": 1.1, + "learning_rate": 0.00013503940311223271, + "loss": 0.0314, "step": 170390 }, { - "epoch": 1.84, - "learning_rate": 2.3538191965734308e-05, - "loss": 0.0309, + "epoch": 1.1, + "learning_rate": 0.00013502972175787577, + "loss": 0.0316, "step": 170400 }, { - "epoch": 1.84, - "learning_rate": 2.3521967681225254e-05, - "loss": 0.0173, + "epoch": 1.1, + "learning_rate": 0.00013502004040351885, + "loss": 0.037, "step": 170410 }, { - "epoch": 1.84, - "learning_rate": 2.3505743396716204e-05, - "loss": 0.0233, + "epoch": 1.1, + "learning_rate": 0.0001350103590491619, + "loss": 0.0292, "step": 170420 }, { - "epoch": 1.84, - "learning_rate": 2.348951911220715e-05, - "loss": 0.0217, + "epoch": 1.1, + "learning_rate": 0.00013500067769480498, + "loss": 0.0303, "step": 170430 }, { - "epoch": 1.84, - "learning_rate": 2.3473294827698097e-05, - "loss": 0.0227, + "epoch": 1.1, + "learning_rate": 0.00013499099634044803, + "loss": 0.0355, "step": 170440 }, { - "epoch": 1.84, - "learning_rate": 2.3457070543189047e-05, - "loss": 0.0212, + "epoch": 1.1, + "learning_rate": 0.0001349813149860911, + "loss": 0.0378, "step": 170450 }, { - "epoch": 1.84, - "learning_rate": 2.3440846258679993e-05, - "loss": 0.0214, + "epoch": 1.1, + "learning_rate": 0.0001349716336317342, + "loss": 0.0345, "step": 170460 }, { - "epoch": 1.84, - "learning_rate": 2.342462197417094e-05, - "loss": 0.0257, + "epoch": 1.1, + "learning_rate": 0.00013496195227737724, + "loss": 0.0375, "step": 170470 }, { - "epoch": 1.84, - "learning_rate": 2.3408397689661886e-05, - "loss": 0.0245, + "epoch": 1.1, + "learning_rate": 0.00013495227092302032, + "loss": 0.0313, "step": 170480 }, { - "epoch": 1.84, - "learning_rate": 2.3392173405152832e-05, - "loss": 0.0272, + "epoch": 1.1, + "learning_rate": 0.00013494258956866338, + "loss": 0.0366, "step": 170490 }, { - "epoch": 1.84, - "learning_rate": 2.337594912064378e-05, - "loss": 0.0263, + "epoch": 1.1, + "learning_rate": 0.00013493290821430643, + "loss": 0.0308, "step": 170500 }, { - "epoch": 1.84, - "learning_rate": 2.3359724836134725e-05, - "loss": 0.0287, + "epoch": 1.1, + "learning_rate": 0.0001349232268599495, + "loss": 0.0323, "step": 170510 }, { - "epoch": 1.84, - "learning_rate": 2.334350055162567e-05, - "loss": 0.0245, + "epoch": 1.1, + "learning_rate": 0.0001349135455055926, + "loss": 0.0302, "step": 170520 }, { - "epoch": 1.84, - "learning_rate": 2.332727626711662e-05, - "loss": 0.0277, + "epoch": 1.1, + "learning_rate": 0.00013490386415123567, + "loss": 0.032, "step": 170530 }, { - "epoch": 1.84, - "learning_rate": 2.3311051982607567e-05, - "loss": 0.0233, + "epoch": 1.1, + "learning_rate": 0.00013489418279687872, + "loss": 0.0295, "step": 170540 }, { - "epoch": 1.84, - "learning_rate": 2.3294827698098514e-05, - "loss": 0.0231, + "epoch": 1.1, + "learning_rate": 0.00013488450144252177, + "loss": 0.0364, "step": 170550 }, { - "epoch": 1.84, - "learning_rate": 2.327860341358946e-05, - "loss": 0.0313, + "epoch": 1.1, + "learning_rate": 0.00013487482008816485, + "loss": 0.0349, "step": 170560 }, { - "epoch": 1.84, - "learning_rate": 2.3262379129080407e-05, - "loss": 0.0189, + "epoch": 1.1, + "learning_rate": 0.0001348651387338079, + "loss": 0.0355, "step": 170570 }, { - "epoch": 1.85, - "learning_rate": 2.3246154844571353e-05, - "loss": 0.0225, + "epoch": 1.1, + "learning_rate": 0.00013485545737945099, + "loss": 0.0314, "step": 170580 }, { - "epoch": 1.85, - "learning_rate": 2.32299305600623e-05, - "loss": 0.0295, + "epoch": 1.1, + "learning_rate": 0.00013484577602509407, + "loss": 0.0389, "step": 170590 }, { - "epoch": 1.85, - "learning_rate": 2.3213706275553246e-05, - "loss": 0.0275, + "epoch": 1.1, + "learning_rate": 0.00013483609467073715, + "loss": 0.0395, "step": 170600 }, { - "epoch": 1.85, - "learning_rate": 2.3197481991044192e-05, - "loss": 0.0227, + "epoch": 1.1, + "learning_rate": 0.0001348264133163802, + "loss": 0.0268, "step": 170610 }, { - "epoch": 1.85, - "learning_rate": 2.3181257706535142e-05, - "loss": 0.0233, + "epoch": 1.1, + "learning_rate": 0.00013481673196202325, + "loss": 0.0331, "step": 170620 }, { - "epoch": 1.85, - "learning_rate": 2.3165033422026088e-05, - "loss": 0.0224, + "epoch": 1.1, + "learning_rate": 0.00013480705060766633, + "loss": 0.0328, "step": 170630 }, { - "epoch": 1.85, - "learning_rate": 2.3148809137517035e-05, - "loss": 0.0232, + "epoch": 1.1, + "learning_rate": 0.00013479736925330938, + "loss": 0.0256, "step": 170640 }, { - "epoch": 1.85, - "learning_rate": 2.313258485300798e-05, - "loss": 0.0236, + "epoch": 1.1, + "learning_rate": 0.00013478768789895246, + "loss": 0.0354, "step": 170650 }, { - "epoch": 1.85, - "learning_rate": 2.3116360568498927e-05, - "loss": 0.0219, + "epoch": 1.1, + "learning_rate": 0.00013477800654459554, + "loss": 0.031, "step": 170660 }, { - "epoch": 1.85, - "learning_rate": 2.3100136283989874e-05, - "loss": 0.0272, + "epoch": 1.1, + "learning_rate": 0.0001347683251902386, + "loss": 0.0314, "step": 170670 }, { - "epoch": 1.85, - "learning_rate": 2.308391199948082e-05, - "loss": 0.0251, + "epoch": 1.1, + "learning_rate": 0.00013475864383588168, + "loss": 0.0315, "step": 170680 }, { - "epoch": 1.85, - "learning_rate": 2.3067687714971767e-05, - "loss": 0.023, + "epoch": 1.1, + "learning_rate": 0.00013474896248152473, + "loss": 0.0344, "step": 170690 }, { - "epoch": 1.85, - "learning_rate": 2.3051463430462716e-05, - "loss": 0.0259, + "epoch": 1.1, + "learning_rate": 0.0001347392811271678, + "loss": 0.0322, "step": 170700 }, { - "epoch": 1.85, - "learning_rate": 2.3035239145953663e-05, - "loss": 0.0292, + "epoch": 1.1, + "learning_rate": 0.00013472959977281086, + "loss": 0.0363, "step": 170710 }, { - "epoch": 1.85, - "learning_rate": 2.301901486144461e-05, - "loss": 0.0225, + "epoch": 1.1, + "learning_rate": 0.00013471991841845394, + "loss": 0.0417, "step": 170720 }, { - "epoch": 1.85, - "learning_rate": 2.3002790576935555e-05, - "loss": 0.0255, + "epoch": 1.1, + "learning_rate": 0.00013471023706409702, + "loss": 0.0351, "step": 170730 }, { - "epoch": 1.85, - "learning_rate": 2.2986566292426502e-05, - "loss": 0.0304, + "epoch": 1.1, + "learning_rate": 0.00013470055570974007, + "loss": 0.0338, "step": 170740 }, { - "epoch": 1.85, - "learning_rate": 2.2970342007917448e-05, - "loss": 0.0277, + "epoch": 1.1, + "learning_rate": 0.00013469087435538313, + "loss": 0.033, "step": 170750 }, { - "epoch": 1.85, - "learning_rate": 2.2954117723408395e-05, - "loss": 0.0328, + "epoch": 1.1, + "learning_rate": 0.0001346811930010262, + "loss": 0.0358, "step": 170760 }, { - "epoch": 1.85, - "learning_rate": 2.293789343889934e-05, - "loss": 0.0253, + "epoch": 1.1, + "learning_rate": 0.00013467151164666929, + "loss": 0.0349, "step": 170770 }, { - "epoch": 1.85, - "learning_rate": 2.2921669154390287e-05, - "loss": 0.0236, + "epoch": 1.1, + "learning_rate": 0.00013466183029231234, + "loss": 0.0316, "step": 170780 }, { - "epoch": 1.85, - "learning_rate": 2.2905444869881237e-05, - "loss": 0.0255, + "epoch": 1.1, + "learning_rate": 0.00013465214893795542, + "loss": 0.0299, "step": 170790 }, { - "epoch": 1.85, - "learning_rate": 2.2889220585372184e-05, - "loss": 0.0223, + "epoch": 1.1, + "learning_rate": 0.0001346424675835985, + "loss": 0.0363, "step": 170800 }, { - "epoch": 1.85, - "learning_rate": 2.287299630086313e-05, - "loss": 0.0266, + "epoch": 1.1, + "learning_rate": 0.00013463278622924155, + "loss": 0.0322, "step": 170810 }, { - "epoch": 1.85, - "learning_rate": 2.2856772016354076e-05, - "loss": 0.0229, + "epoch": 1.1, + "learning_rate": 0.0001346231048748846, + "loss": 0.0375, "step": 170820 }, { - "epoch": 1.85, - "learning_rate": 2.2840547731845023e-05, - "loss": 0.0283, + "epoch": 1.1, + "learning_rate": 0.00013461342352052768, + "loss": 0.0388, "step": 170830 }, { - "epoch": 1.85, - "learning_rate": 2.282432344733597e-05, - "loss": 0.0239, + "epoch": 1.1, + "learning_rate": 0.00013460374216617076, + "loss": 0.0366, "step": 170840 }, { - "epoch": 1.85, - "learning_rate": 2.2808099162826915e-05, - "loss": 0.0246, + "epoch": 1.1, + "learning_rate": 0.00013459406081181382, + "loss": 0.0349, "step": 170850 }, { - "epoch": 1.85, - "learning_rate": 2.2791874878317862e-05, - "loss": 0.0224, + "epoch": 1.1, + "learning_rate": 0.0001345843794574569, + "loss": 0.0353, "step": 170860 }, { - "epoch": 1.85, - "learning_rate": 2.277565059380881e-05, - "loss": 0.02, + "epoch": 1.1, + "learning_rate": 0.00013457469810309995, + "loss": 0.0304, "step": 170870 }, { - "epoch": 1.85, - "learning_rate": 2.2759426309299758e-05, - "loss": 0.0235, + "epoch": 1.1, + "learning_rate": 0.00013456501674874303, + "loss": 0.0347, "step": 170880 }, { - "epoch": 1.85, - "learning_rate": 2.2743202024790704e-05, - "loss": 0.0306, + "epoch": 1.1, + "learning_rate": 0.00013455533539438608, + "loss": 0.0348, "step": 170890 }, { - "epoch": 1.85, - "learning_rate": 2.272697774028165e-05, - "loss": 0.0257, + "epoch": 1.1, + "learning_rate": 0.00013454565404002916, + "loss": 0.035, "step": 170900 }, { - "epoch": 1.85, - "learning_rate": 2.2710753455772597e-05, - "loss": 0.0249, + "epoch": 1.1, + "learning_rate": 0.00013453597268567224, + "loss": 0.036, "step": 170910 }, { - "epoch": 1.85, - "learning_rate": 2.2694529171263543e-05, - "loss": 0.0218, + "epoch": 1.1, + "learning_rate": 0.0001345262913313153, + "loss": 0.029, "step": 170920 }, { - "epoch": 1.85, - "learning_rate": 2.267830488675449e-05, - "loss": 0.0238, + "epoch": 1.1, + "learning_rate": 0.00013451660997695837, + "loss": 0.0285, "step": 170930 }, { - "epoch": 1.85, - "learning_rate": 2.2662080602245436e-05, - "loss": 0.0205, + "epoch": 1.1, + "learning_rate": 0.00013450692862260143, + "loss": 0.0304, "step": 170940 }, { - "epoch": 1.85, - "learning_rate": 2.2645856317736383e-05, - "loss": 0.0256, + "epoch": 1.1, + "learning_rate": 0.0001344972472682445, + "loss": 0.0289, "step": 170950 }, { - "epoch": 1.85, - "learning_rate": 2.2629632033227332e-05, - "loss": 0.0215, + "epoch": 1.1, + "learning_rate": 0.00013448756591388756, + "loss": 0.0368, "step": 170960 }, { - "epoch": 1.85, - "learning_rate": 2.261340774871828e-05, - "loss": 0.0281, + "epoch": 1.1, + "learning_rate": 0.00013447788455953064, + "loss": 0.0324, "step": 170970 }, { - "epoch": 1.85, - "learning_rate": 2.2597183464209225e-05, - "loss": 0.0277, + "epoch": 1.1, + "learning_rate": 0.00013446820320517372, + "loss": 0.0304, "step": 170980 }, { - "epoch": 1.85, - "learning_rate": 2.258095917970017e-05, - "loss": 0.0206, + "epoch": 1.1, + "learning_rate": 0.00013445852185081677, + "loss": 0.0285, "step": 170990 }, { - "epoch": 1.85, - "learning_rate": 2.2564734895191118e-05, - "loss": 0.0258, + "epoch": 1.1, + "learning_rate": 0.00013444884049645985, + "loss": 0.0317, "step": 171000 }, { - "epoch": 1.85, - "eval_cer": 0.9210854134971667, - "eval_loss": 0.02065623179078102, - "eval_runtime": 119.1493, - "eval_samples_per_second": 16.786, - "eval_steps_per_second": 4.196, + "epoch": 1.1, + "eval_cer": 0.9198897299740142, + "eval_loss": 0.02412121742963791, + "eval_runtime": 120.2503, + "eval_samples_per_second": 16.632, + "eval_steps_per_second": 4.158, "step": 171000 }, { - "epoch": 1.85, - "learning_rate": 2.2548510610682068e-05, - "loss": 0.0251, + "epoch": 1.1, + "learning_rate": 0.0001344391591421029, + "loss": 0.0346, "step": 171010 }, { - "epoch": 1.85, - "learning_rate": 2.2532286326173014e-05, - "loss": 0.0262, + "epoch": 1.1, + "learning_rate": 0.00013442947778774598, + "loss": 0.0328, "step": 171020 }, { - "epoch": 1.85, - "learning_rate": 2.2516062041663964e-05, - "loss": 0.0233, + "epoch": 1.1, + "learning_rate": 0.00013441979643338903, + "loss": 0.0325, "step": 171030 }, { - "epoch": 1.85, - "learning_rate": 2.249983775715491e-05, - "loss": 0.0254, + "epoch": 1.1, + "learning_rate": 0.00013441011507903211, + "loss": 0.031, "step": 171040 }, { - "epoch": 1.85, - "learning_rate": 2.2483613472645857e-05, - "loss": 0.033, + "epoch": 1.1, + "learning_rate": 0.0001344004337246752, + "loss": 0.0392, "step": 171050 }, { - "epoch": 1.85, - "learning_rate": 2.2467389188136803e-05, - "loss": 0.0265, + "epoch": 1.1, + "learning_rate": 0.00013439075237031825, + "loss": 0.037, "step": 171060 }, { - "epoch": 1.85, - "learning_rate": 2.245116490362775e-05, - "loss": 0.0293, + "epoch": 1.1, + "learning_rate": 0.0001343810710159613, + "loss": 0.0339, "step": 171070 }, { - "epoch": 1.85, - "learning_rate": 2.2434940619118696e-05, - "loss": 0.0251, + "epoch": 1.1, + "learning_rate": 0.00013437138966160438, + "loss": 0.0384, "step": 171080 }, { - "epoch": 1.85, - "learning_rate": 2.2418716334609642e-05, - "loss": 0.0221, + "epoch": 1.1, + "learning_rate": 0.00013436170830724746, + "loss": 0.0305, "step": 171090 }, { - "epoch": 1.85, - "learning_rate": 2.240249205010059e-05, - "loss": 0.0248, + "epoch": 1.1, + "learning_rate": 0.0001343520269528905, + "loss": 0.0352, "step": 171100 }, { - "epoch": 1.85, - "learning_rate": 2.2386267765591538e-05, - "loss": 0.025, + "epoch": 1.1, + "learning_rate": 0.0001343423455985336, + "loss": 0.0357, "step": 171110 }, { - "epoch": 1.85, - "learning_rate": 2.2370043481082485e-05, - "loss": 0.0234, + "epoch": 1.1, + "learning_rate": 0.00013433266424417664, + "loss": 0.0385, "step": 171120 }, { - "epoch": 1.85, - "learning_rate": 2.235381919657343e-05, - "loss": 0.0349, + "epoch": 1.1, + "learning_rate": 0.00013432298288981972, + "loss": 0.0313, "step": 171130 }, { - "epoch": 1.85, - "learning_rate": 2.2337594912064377e-05, - "loss": 0.0272, + "epoch": 1.1, + "learning_rate": 0.00013431330153546278, + "loss": 0.0324, "step": 171140 }, { - "epoch": 1.85, - "learning_rate": 2.2321370627555324e-05, - "loss": 0.025, + "epoch": 1.1, + "learning_rate": 0.00013430362018110586, + "loss": 0.0349, "step": 171150 }, { - "epoch": 1.85, - "learning_rate": 2.230514634304627e-05, - "loss": 0.0225, + "epoch": 1.1, + "learning_rate": 0.00013429393882674894, + "loss": 0.0312, "step": 171160 }, { - "epoch": 1.85, - "learning_rate": 2.2288922058537217e-05, - "loss": 0.0242, + "epoch": 1.1, + "learning_rate": 0.000134284257472392, + "loss": 0.0311, "step": 171170 }, { - "epoch": 1.85, - "learning_rate": 2.2272697774028163e-05, - "loss": 0.0215, + "epoch": 1.1, + "learning_rate": 0.00013427457611803507, + "loss": 0.0366, "step": 171180 }, { - "epoch": 1.85, - "learning_rate": 2.225647348951911e-05, - "loss": 0.0226, + "epoch": 1.1, + "learning_rate": 0.00013426489476367812, + "loss": 0.0346, "step": 171190 }, { - "epoch": 1.85, - "learning_rate": 2.224024920501006e-05, - "loss": 0.0286, + "epoch": 1.1, + "learning_rate": 0.0001342552134093212, + "loss": 0.0306, "step": 171200 }, { - "epoch": 1.85, - "learning_rate": 2.2224024920501006e-05, - "loss": 0.0256, + "epoch": 1.11, + "learning_rate": 0.00013424553205496425, + "loss": 0.0386, "step": 171210 }, { - "epoch": 1.85, - "learning_rate": 2.2207800635991952e-05, - "loss": 0.0256, + "epoch": 1.11, + "learning_rate": 0.00013423585070060733, + "loss": 0.0331, "step": 171220 }, { - "epoch": 1.85, - "learning_rate": 2.2191576351482898e-05, - "loss": 0.0327, + "epoch": 1.11, + "learning_rate": 0.00013422616934625041, + "loss": 0.0356, "step": 171230 }, { - "epoch": 1.85, - "learning_rate": 2.2175352066973845e-05, - "loss": 0.0221, + "epoch": 1.11, + "learning_rate": 0.00013421648799189347, + "loss": 0.0303, "step": 171240 }, { - "epoch": 1.85, - "learning_rate": 2.215912778246479e-05, - "loss": 0.028, + "epoch": 1.11, + "learning_rate": 0.00013420680663753655, + "loss": 0.0339, "step": 171250 }, { - "epoch": 1.85, - "learning_rate": 2.2142903497955737e-05, - "loss": 0.0275, + "epoch": 1.11, + "learning_rate": 0.0001341971252831796, + "loss": 0.0336, "step": 171260 }, { - "epoch": 1.85, - "learning_rate": 2.2126679213446684e-05, - "loss": 0.0316, + "epoch": 1.11, + "learning_rate": 0.00013418744392882265, + "loss": 0.0356, "step": 171270 }, { - "epoch": 1.85, - "learning_rate": 2.2110454928937634e-05, - "loss": 0.0253, + "epoch": 1.11, + "learning_rate": 0.00013417776257446573, + "loss": 0.0357, "step": 171280 }, { - "epoch": 1.85, - "learning_rate": 2.209423064442858e-05, - "loss": 0.0234, + "epoch": 1.11, + "learning_rate": 0.0001341680812201088, + "loss": 0.0357, "step": 171290 }, { - "epoch": 1.85, - "learning_rate": 2.2078006359919526e-05, - "loss": 0.0233, + "epoch": 1.11, + "learning_rate": 0.0001341583998657519, + "loss": 0.0342, "step": 171300 }, { - "epoch": 1.85, - "learning_rate": 2.2061782075410473e-05, - "loss": 0.0269, + "epoch": 1.11, + "learning_rate": 0.00013414871851139494, + "loss": 0.0335, "step": 171310 }, { - "epoch": 1.85, - "learning_rate": 2.204555779090142e-05, - "loss": 0.0265, + "epoch": 1.11, + "learning_rate": 0.000134139037157038, + "loss": 0.0315, "step": 171320 }, { - "epoch": 1.85, - "learning_rate": 2.2029333506392365e-05, - "loss": 0.0274, + "epoch": 1.11, + "learning_rate": 0.00013412935580268108, + "loss": 0.0331, "step": 171330 }, { - "epoch": 1.85, - "learning_rate": 2.2013109221883312e-05, - "loss": 0.024, + "epoch": 1.11, + "learning_rate": 0.00013411967444832413, + "loss": 0.0269, "step": 171340 }, { - "epoch": 1.85, - "learning_rate": 2.1996884937374258e-05, - "loss": 0.0206, + "epoch": 1.11, + "learning_rate": 0.0001341099930939672, + "loss": 0.0323, "step": 171350 }, { - "epoch": 1.85, - "learning_rate": 2.1980660652865205e-05, - "loss": 0.0241, + "epoch": 1.11, + "learning_rate": 0.0001341003117396103, + "loss": 0.0336, "step": 171360 }, { - "epoch": 1.85, - "learning_rate": 2.1964436368356154e-05, - "loss": 0.0218, + "epoch": 1.11, + "learning_rate": 0.00013409063038525337, + "loss": 0.0312, "step": 171370 }, { - "epoch": 1.85, - "learning_rate": 2.19482120838471e-05, - "loss": 0.0241, + "epoch": 1.11, + "learning_rate": 0.00013408094903089642, + "loss": 0.0338, "step": 171380 }, { - "epoch": 1.85, - "learning_rate": 2.1931987799338047e-05, - "loss": 0.0268, + "epoch": 1.11, + "learning_rate": 0.00013407126767653947, + "loss": 0.0361, "step": 171390 }, { - "epoch": 1.85, - "learning_rate": 2.1915763514828994e-05, - "loss": 0.0225, + "epoch": 1.11, + "learning_rate": 0.00013406158632218255, + "loss": 0.0406, "step": 171400 }, { - "epoch": 1.85, - "learning_rate": 2.189953923031994e-05, - "loss": 0.0312, + "epoch": 1.11, + "learning_rate": 0.0001340519049678256, + "loss": 0.0371, "step": 171410 }, { - "epoch": 1.85, - "learning_rate": 2.1883314945810886e-05, - "loss": 0.0298, + "epoch": 1.11, + "learning_rate": 0.00013404222361346869, + "loss": 0.0377, "step": 171420 }, { - "epoch": 1.85, - "learning_rate": 2.1867090661301833e-05, - "loss": 0.0277, + "epoch": 1.11, + "learning_rate": 0.00013403254225911177, + "loss": 0.0352, "step": 171430 }, { - "epoch": 1.85, - "learning_rate": 2.185086637679278e-05, - "loss": 0.0258, + "epoch": 1.11, + "learning_rate": 0.00013402286090475482, + "loss": 0.0304, "step": 171440 }, { - "epoch": 1.85, - "learning_rate": 2.183464209228373e-05, - "loss": 0.0214, + "epoch": 1.11, + "learning_rate": 0.0001340131795503979, + "loss": 0.0311, "step": 171450 }, { - "epoch": 1.85, - "learning_rate": 2.1818417807774675e-05, - "loss": 0.0272, + "epoch": 1.11, + "learning_rate": 0.00013400349819604095, + "loss": 0.0347, "step": 171460 }, { - "epoch": 1.85, - "learning_rate": 2.180219352326562e-05, - "loss": 0.022, + "epoch": 1.11, + "learning_rate": 0.00013399381684168403, + "loss": 0.0315, "step": 171470 }, { - "epoch": 1.85, - "learning_rate": 2.1785969238756568e-05, - "loss": 0.024, + "epoch": 1.11, + "learning_rate": 0.00013398413548732708, + "loss": 0.0349, "step": 171480 }, { - "epoch": 1.85, - "learning_rate": 2.1769744954247514e-05, - "loss": 0.0268, + "epoch": 1.11, + "learning_rate": 0.00013397445413297016, + "loss": 0.0341, "step": 171490 }, { - "epoch": 1.85, - "learning_rate": 2.175352066973846e-05, - "loss": 0.0282, + "epoch": 1.11, + "learning_rate": 0.00013396477277861324, + "loss": 0.0338, "step": 171500 }, { - "epoch": 1.86, - "learning_rate": 2.1737296385229407e-05, - "loss": 0.0237, + "epoch": 1.11, + "learning_rate": 0.0001339550914242563, + "loss": 0.0307, "step": 171510 }, { - "epoch": 1.86, - "learning_rate": 2.1721072100720354e-05, - "loss": 0.024, + "epoch": 1.11, + "learning_rate": 0.00013394541006989935, + "loss": 0.0377, "step": 171520 }, { - "epoch": 1.86, - "learning_rate": 2.17048478162113e-05, - "loss": 0.0259, + "epoch": 1.11, + "learning_rate": 0.00013393572871554243, + "loss": 0.0287, "step": 171530 }, { - "epoch": 1.86, - "learning_rate": 2.168862353170225e-05, - "loss": 0.0205, + "epoch": 1.11, + "learning_rate": 0.0001339260473611855, + "loss": 0.0287, "step": 171540 }, { - "epoch": 1.86, - "learning_rate": 2.1672399247193196e-05, - "loss": 0.0237, + "epoch": 1.11, + "learning_rate": 0.00013391636600682856, + "loss": 0.0366, "step": 171550 }, { - "epoch": 1.86, - "learning_rate": 2.1656174962684142e-05, - "loss": 0.0209, + "epoch": 1.11, + "learning_rate": 0.00013390668465247164, + "loss": 0.0397, "step": 171560 }, { - "epoch": 1.86, - "learning_rate": 2.163995067817509e-05, - "loss": 0.0228, + "epoch": 1.11, + "learning_rate": 0.00013389700329811472, + "loss": 0.0289, "step": 171570 }, { - "epoch": 1.86, - "learning_rate": 2.1623726393666035e-05, - "loss": 0.021, + "epoch": 1.11, + "learning_rate": 0.00013388732194375777, + "loss": 0.0362, "step": 171580 }, { - "epoch": 1.86, - "learning_rate": 2.160750210915698e-05, - "loss": 0.0245, + "epoch": 1.11, + "learning_rate": 0.00013387764058940083, + "loss": 0.0392, "step": 171590 }, { - "epoch": 1.86, - "learning_rate": 2.1591277824647935e-05, - "loss": 0.0329, + "epoch": 1.11, + "learning_rate": 0.0001338679592350439, + "loss": 0.0339, "step": 171600 }, { - "epoch": 1.86, - "learning_rate": 2.157505354013888e-05, - "loss": 0.0253, + "epoch": 1.11, + "learning_rate": 0.00013385827788068699, + "loss": 0.0328, "step": 171610 }, { - "epoch": 1.86, - "learning_rate": 2.1558829255629828e-05, - "loss": 0.0243, + "epoch": 1.11, + "learning_rate": 0.00013384859652633004, + "loss": 0.0355, "step": 171620 }, { - "epoch": 1.86, - "learning_rate": 2.1542604971120774e-05, - "loss": 0.0257, + "epoch": 1.11, + "learning_rate": 0.00013383891517197312, + "loss": 0.0364, "step": 171630 }, { - "epoch": 1.86, - "learning_rate": 2.152638068661172e-05, - "loss": 0.0277, + "epoch": 1.11, + "learning_rate": 0.00013382923381761617, + "loss": 0.0433, "step": 171640 }, { - "epoch": 1.86, - "learning_rate": 2.1510156402102667e-05, - "loss": 0.0236, + "epoch": 1.11, + "learning_rate": 0.00013381955246325925, + "loss": 0.0342, "step": 171650 }, { - "epoch": 1.86, - "learning_rate": 2.1493932117593613e-05, - "loss": 0.0248, + "epoch": 1.11, + "learning_rate": 0.0001338098711089023, + "loss": 0.0342, "step": 171660 }, { - "epoch": 1.86, - "learning_rate": 2.147770783308456e-05, - "loss": 0.0209, + "epoch": 1.11, + "learning_rate": 0.00013380018975454538, + "loss": 0.0363, "step": 171670 }, { - "epoch": 1.86, - "learning_rate": 2.1461483548575506e-05, - "loss": 0.0213, + "epoch": 1.11, + "learning_rate": 0.00013379050840018846, + "loss": 0.0344, "step": 171680 }, { - "epoch": 1.86, - "learning_rate": 2.1445259264066456e-05, - "loss": 0.0321, + "epoch": 1.11, + "learning_rate": 0.00013378082704583151, + "loss": 0.0301, "step": 171690 }, { - "epoch": 1.86, - "learning_rate": 2.1429034979557402e-05, - "loss": 0.0212, + "epoch": 1.11, + "learning_rate": 0.0001337711456914746, + "loss": 0.0296, "step": 171700 }, { - "epoch": 1.86, - "learning_rate": 2.141281069504835e-05, - "loss": 0.0278, + "epoch": 1.11, + "learning_rate": 0.00013376146433711765, + "loss": 0.0314, "step": 171710 }, { - "epoch": 1.86, - "learning_rate": 2.1396586410539295e-05, - "loss": 0.0193, + "epoch": 1.11, + "learning_rate": 0.00013375178298276073, + "loss": 0.0353, "step": 171720 }, { - "epoch": 1.86, - "learning_rate": 2.138036212603024e-05, - "loss": 0.0263, + "epoch": 1.11, + "learning_rate": 0.00013374210162840378, + "loss": 0.0348, "step": 171730 }, { - "epoch": 1.86, - "learning_rate": 2.1364137841521188e-05, - "loss": 0.0253, + "epoch": 1.11, + "learning_rate": 0.00013373242027404686, + "loss": 0.0299, "step": 171740 }, { - "epoch": 1.86, - "learning_rate": 2.1347913557012134e-05, - "loss": 0.0218, + "epoch": 1.11, + "learning_rate": 0.00013372273891968994, + "loss": 0.0333, "step": 171750 }, { - "epoch": 1.86, - "learning_rate": 2.133168927250308e-05, - "loss": 0.0211, + "epoch": 1.11, + "learning_rate": 0.000133713057565333, + "loss": 0.0342, "step": 171760 }, { - "epoch": 1.86, - "learning_rate": 2.131546498799403e-05, - "loss": 0.0226, + "epoch": 1.11, + "learning_rate": 0.00013370337621097607, + "loss": 0.0338, "step": 171770 }, { - "epoch": 1.86, - "learning_rate": 2.1299240703484976e-05, - "loss": 0.0254, + "epoch": 1.11, + "learning_rate": 0.00013369369485661912, + "loss": 0.0338, "step": 171780 }, { - "epoch": 1.86, - "learning_rate": 2.1283016418975923e-05, - "loss": 0.0259, + "epoch": 1.11, + "learning_rate": 0.0001336840135022622, + "loss": 0.0324, "step": 171790 }, { - "epoch": 1.86, - "learning_rate": 2.126679213446687e-05, - "loss": 0.0246, + "epoch": 1.11, + "learning_rate": 0.00013367433214790526, + "loss": 0.034, "step": 171800 }, { - "epoch": 1.86, - "learning_rate": 2.1250567849957816e-05, - "loss": 0.022, + "epoch": 1.11, + "learning_rate": 0.00013366465079354834, + "loss": 0.0362, "step": 171810 }, { - "epoch": 1.86, - "learning_rate": 2.1234343565448762e-05, - "loss": 0.0238, + "epoch": 1.11, + "learning_rate": 0.00013365496943919142, + "loss": 0.0285, "step": 171820 }, { - "epoch": 1.86, - "learning_rate": 2.121811928093971e-05, - "loss": 0.0255, + "epoch": 1.11, + "learning_rate": 0.00013364528808483447, + "loss": 0.0346, "step": 171830 }, { - "epoch": 1.86, - "learning_rate": 2.1201894996430655e-05, - "loss": 0.0275, + "epoch": 1.11, + "learning_rate": 0.00013363560673047752, + "loss": 0.0357, "step": 171840 }, { - "epoch": 1.86, - "learning_rate": 2.11856707119216e-05, - "loss": 0.0284, + "epoch": 1.11, + "learning_rate": 0.0001336259253761206, + "loss": 0.0297, "step": 171850 }, { - "epoch": 1.86, - "learning_rate": 2.116944642741255e-05, - "loss": 0.0254, + "epoch": 1.11, + "learning_rate": 0.00013361624402176368, + "loss": 0.0335, "step": 171860 }, { - "epoch": 1.86, - "learning_rate": 2.1153222142903497e-05, - "loss": 0.0209, + "epoch": 1.11, + "learning_rate": 0.00013360656266740673, + "loss": 0.032, "step": 171870 }, { - "epoch": 1.86, - "learning_rate": 2.1136997858394444e-05, - "loss": 0.027, + "epoch": 1.11, + "learning_rate": 0.00013359688131304981, + "loss": 0.0346, "step": 171880 }, { - "epoch": 1.86, - "learning_rate": 2.112077357388539e-05, - "loss": 0.0224, + "epoch": 1.11, + "learning_rate": 0.0001335871999586929, + "loss": 0.0335, "step": 171890 }, { - "epoch": 1.86, - "learning_rate": 2.1104549289376336e-05, - "loss": 0.0246, + "epoch": 1.11, + "learning_rate": 0.00013357751860433595, + "loss": 0.0299, "step": 171900 }, { - "epoch": 1.86, - "learning_rate": 2.1088325004867283e-05, - "loss": 0.029, + "epoch": 1.11, + "learning_rate": 0.000133567837249979, + "loss": 0.0322, "step": 171910 }, { - "epoch": 1.86, - "learning_rate": 2.107210072035823e-05, - "loss": 0.0224, + "epoch": 1.11, + "learning_rate": 0.00013355815589562208, + "loss": 0.0313, "step": 171920 }, { - "epoch": 1.86, - "learning_rate": 2.1055876435849176e-05, - "loss": 0.0224, + "epoch": 1.11, + "learning_rate": 0.00013354847454126516, + "loss": 0.0348, "step": 171930 }, { - "epoch": 1.86, - "learning_rate": 2.1039652151340125e-05, - "loss": 0.0243, + "epoch": 1.11, + "learning_rate": 0.0001335387931869082, + "loss": 0.0306, "step": 171940 }, { - "epoch": 1.86, - "learning_rate": 2.1023427866831072e-05, - "loss": 0.0257, + "epoch": 1.11, + "learning_rate": 0.0001335291118325513, + "loss": 0.0323, "step": 171950 }, { - "epoch": 1.86, - "learning_rate": 2.1007203582322018e-05, - "loss": 0.0231, + "epoch": 1.11, + "learning_rate": 0.00013351943047819434, + "loss": 0.03, "step": 171960 }, { - "epoch": 1.86, - "learning_rate": 2.0990979297812964e-05, - "loss": 0.0242, + "epoch": 1.11, + "learning_rate": 0.00013350974912383742, + "loss": 0.031, "step": 171970 }, { - "epoch": 1.86, - "learning_rate": 2.097475501330391e-05, - "loss": 0.0207, + "epoch": 1.11, + "learning_rate": 0.00013350006776948048, + "loss": 0.0367, "step": 171980 }, { - "epoch": 1.86, - "learning_rate": 2.0958530728794857e-05, - "loss": 0.0186, + "epoch": 1.11, + "learning_rate": 0.00013349038641512356, + "loss": 0.0312, "step": 171990 }, { - "epoch": 1.86, - "learning_rate": 2.0942306444285804e-05, - "loss": 0.0282, + "epoch": 1.11, + "learning_rate": 0.00013348070506076664, + "loss": 0.0313, "step": 172000 }, { - "epoch": 1.86, - "eval_cer": 0.9210412392811265, - "eval_loss": 0.02053496427834034, - "eval_runtime": 118.9554, - "eval_samples_per_second": 16.813, - "eval_steps_per_second": 4.203, + "epoch": 1.11, + "eval_cer": 0.9199041916167665, + "eval_loss": 0.02452256716787815, + "eval_runtime": 120.1075, + "eval_samples_per_second": 16.652, + "eval_steps_per_second": 4.163, "step": 172000 }, { - "epoch": 1.86, - "learning_rate": 2.092608215977675e-05, - "loss": 0.0216, + "epoch": 1.11, + "learning_rate": 0.0001334710237064097, + "loss": 0.0282, "step": 172010 }, { - "epoch": 1.86, - "learning_rate": 2.0909857875267696e-05, - "loss": 0.0291, + "epoch": 1.11, + "learning_rate": 0.00013346134235205277, + "loss": 0.0308, "step": 172020 }, { - "epoch": 1.86, - "learning_rate": 2.0893633590758646e-05, - "loss": 0.0255, + "epoch": 1.11, + "learning_rate": 0.00013345166099769582, + "loss": 0.0338, "step": 172030 }, { - "epoch": 1.86, - "learning_rate": 2.0877409306249593e-05, - "loss": 0.0198, + "epoch": 1.11, + "learning_rate": 0.00013344197964333887, + "loss": 0.0327, "step": 172040 }, { - "epoch": 1.86, - "learning_rate": 2.086118502174054e-05, - "loss": 0.0234, + "epoch": 1.11, + "learning_rate": 0.00013343229828898195, + "loss": 0.0342, "step": 172050 }, { - "epoch": 1.86, - "learning_rate": 2.0844960737231485e-05, - "loss": 0.0317, + "epoch": 1.11, + "learning_rate": 0.00013342261693462503, + "loss": 0.0495, "step": 172060 }, { - "epoch": 1.86, - "learning_rate": 2.082873645272243e-05, - "loss": 0.0291, + "epoch": 1.11, + "learning_rate": 0.0001334129355802681, + "loss": 0.0319, "step": 172070 }, { - "epoch": 1.86, - "learning_rate": 2.0812512168213378e-05, - "loss": 0.0237, + "epoch": 1.11, + "learning_rate": 0.00013340325422591117, + "loss": 0.0312, "step": 172080 }, { - "epoch": 1.86, - "learning_rate": 2.0796287883704324e-05, - "loss": 0.0275, + "epoch": 1.11, + "learning_rate": 0.00013339357287155425, + "loss": 0.0295, "step": 172090 }, { - "epoch": 1.86, - "learning_rate": 2.078006359919527e-05, - "loss": 0.0194, + "epoch": 1.11, + "learning_rate": 0.0001333838915171973, + "loss": 0.0353, "step": 172100 }, { - "epoch": 1.86, - "learning_rate": 2.076383931468622e-05, - "loss": 0.0235, + "epoch": 1.11, + "learning_rate": 0.00013337421016284035, + "loss": 0.0354, "step": 172110 }, { - "epoch": 1.86, - "learning_rate": 2.0747615030177167e-05, - "loss": 0.0231, + "epoch": 1.11, + "learning_rate": 0.00013336452880848343, + "loss": 0.0314, "step": 172120 }, { - "epoch": 1.86, - "learning_rate": 2.0731390745668113e-05, - "loss": 0.0249, + "epoch": 1.11, + "learning_rate": 0.0001333548474541265, + "loss": 0.0412, "step": 172130 }, { - "epoch": 1.86, - "learning_rate": 2.071516646115906e-05, - "loss": 0.0265, + "epoch": 1.11, + "learning_rate": 0.0001333451660997696, + "loss": 0.033, "step": 172140 }, { - "epoch": 1.86, - "learning_rate": 2.0698942176650006e-05, - "loss": 0.0209, + "epoch": 1.11, + "learning_rate": 0.00013333548474541264, + "loss": 0.0431, "step": 172150 }, { - "epoch": 1.86, - "learning_rate": 2.0682717892140953e-05, - "loss": 0.0278, + "epoch": 1.11, + "learning_rate": 0.0001333258033910557, + "loss": 0.0381, "step": 172160 }, { - "epoch": 1.86, - "learning_rate": 2.06664936076319e-05, - "loss": 0.0289, + "epoch": 1.11, + "learning_rate": 0.00013331612203669878, + "loss": 0.0331, "step": 172170 }, { - "epoch": 1.86, - "learning_rate": 2.0650269323122852e-05, - "loss": 0.024, + "epoch": 1.11, + "learning_rate": 0.00013330644068234183, + "loss": 0.0387, "step": 172180 }, { - "epoch": 1.86, - "learning_rate": 2.06340450386138e-05, - "loss": 0.0243, + "epoch": 1.11, + "learning_rate": 0.0001332967593279849, + "loss": 0.0359, "step": 172190 }, { - "epoch": 1.86, - "learning_rate": 2.0617820754104745e-05, - "loss": 0.0237, + "epoch": 1.11, + "learning_rate": 0.000133287077973628, + "loss": 0.0362, "step": 172200 }, { - "epoch": 1.86, - "learning_rate": 2.060159646959569e-05, - "loss": 0.0245, + "epoch": 1.11, + "learning_rate": 0.00013327739661927104, + "loss": 0.0367, "step": 172210 }, { - "epoch": 1.86, - "learning_rate": 2.0585372185086638e-05, - "loss": 0.027, + "epoch": 1.11, + "learning_rate": 0.00013326771526491412, + "loss": 0.0325, "step": 172220 }, { - "epoch": 1.86, - "learning_rate": 2.0569147900577584e-05, - "loss": 0.0217, + "epoch": 1.11, + "learning_rate": 0.00013325803391055717, + "loss": 0.0374, "step": 172230 }, { - "epoch": 1.86, - "learning_rate": 2.055292361606853e-05, - "loss": 0.023, + "epoch": 1.11, + "learning_rate": 0.00013324835255620025, + "loss": 0.0324, "step": 172240 }, { - "epoch": 1.86, - "learning_rate": 2.0536699331559477e-05, - "loss": 0.0262, + "epoch": 1.11, + "learning_rate": 0.0001332386712018433, + "loss": 0.0292, "step": 172250 }, { - "epoch": 1.86, - "learning_rate": 2.0520475047050423e-05, - "loss": 0.0253, + "epoch": 1.11, + "learning_rate": 0.00013322898984748639, + "loss": 0.0342, "step": 172260 }, { - "epoch": 1.86, - "learning_rate": 2.0504250762541373e-05, - "loss": 0.0244, + "epoch": 1.11, + "learning_rate": 0.00013321930849312947, + "loss": 0.0329, "step": 172270 }, { - "epoch": 1.86, - "learning_rate": 2.048802647803232e-05, - "loss": 0.0254, + "epoch": 1.11, + "learning_rate": 0.00013320962713877252, + "loss": 0.0325, "step": 172280 }, { - "epoch": 1.86, - "learning_rate": 2.0471802193523266e-05, - "loss": 0.0244, + "epoch": 1.11, + "learning_rate": 0.0001331999457844156, + "loss": 0.0319, "step": 172290 }, { - "epoch": 1.86, - "learning_rate": 2.0455577909014212e-05, - "loss": 0.0265, + "epoch": 1.11, + "learning_rate": 0.00013319026443005865, + "loss": 0.0326, "step": 172300 }, { - "epoch": 1.86, - "learning_rate": 2.043935362450516e-05, - "loss": 0.0227, + "epoch": 1.11, + "learning_rate": 0.00013318058307570173, + "loss": 0.0386, "step": 172310 }, { - "epoch": 1.86, - "learning_rate": 2.0423129339996105e-05, - "loss": 0.0284, + "epoch": 1.11, + "learning_rate": 0.00013317090172134478, + "loss": 0.0399, "step": 172320 }, { - "epoch": 1.86, - "learning_rate": 2.040690505548705e-05, - "loss": 0.0264, + "epoch": 1.11, + "learning_rate": 0.00013316122036698786, + "loss": 0.0324, "step": 172330 }, { - "epoch": 1.86, - "learning_rate": 2.0390680770977998e-05, - "loss": 0.0226, + "epoch": 1.11, + "learning_rate": 0.00013315153901263094, + "loss": 0.0357, "step": 172340 }, { - "epoch": 1.86, - "learning_rate": 2.0374456486468947e-05, - "loss": 0.0252, + "epoch": 1.11, + "learning_rate": 0.000133141857658274, + "loss": 0.0378, "step": 172350 }, { - "epoch": 1.86, - "learning_rate": 2.0358232201959894e-05, - "loss": 0.0246, + "epoch": 1.11, + "learning_rate": 0.00013313217630391705, + "loss": 0.0296, "step": 172360 }, { - "epoch": 1.86, - "learning_rate": 2.034200791745084e-05, - "loss": 0.0241, + "epoch": 1.11, + "learning_rate": 0.00013312249494956013, + "loss": 0.037, "step": 172370 }, { - "epoch": 1.86, - "learning_rate": 2.0325783632941786e-05, - "loss": 0.0304, + "epoch": 1.11, + "learning_rate": 0.0001331128135952032, + "loss": 0.0328, "step": 172380 }, { - "epoch": 1.86, - "learning_rate": 2.0309559348432733e-05, - "loss": 0.0304, + "epoch": 1.11, + "learning_rate": 0.00013310313224084626, + "loss": 0.035, "step": 172390 }, { - "epoch": 1.86, - "learning_rate": 2.029333506392368e-05, - "loss": 0.0193, + "epoch": 1.11, + "learning_rate": 0.00013309345088648934, + "loss": 0.0327, "step": 172400 }, { - "epoch": 1.86, - "learning_rate": 2.0277110779414626e-05, - "loss": 0.0232, + "epoch": 1.11, + "learning_rate": 0.0001330837695321324, + "loss": 0.0289, "step": 172410 }, { - "epoch": 1.86, - "learning_rate": 2.0260886494905572e-05, - "loss": 0.0248, - "step": 172420 + "epoch": 1.11, + "learning_rate": 0.00013307408817777547, + "loss": 0.0346, + "step": 172420 }, { - "epoch": 1.87, - "learning_rate": 2.024466221039652e-05, - "loss": 0.0272, + "epoch": 1.11, + "learning_rate": 0.00013306440682341853, + "loss": 0.0353, "step": 172430 }, { - "epoch": 1.87, - "learning_rate": 2.0228437925887468e-05, - "loss": 0.0237, + "epoch": 1.11, + "learning_rate": 0.0001330547254690616, + "loss": 0.0338, "step": 172440 }, { - "epoch": 1.87, - "learning_rate": 2.0212213641378415e-05, - "loss": 0.0205, + "epoch": 1.11, + "learning_rate": 0.00013304504411470468, + "loss": 0.0339, "step": 172450 }, { - "epoch": 1.87, - "learning_rate": 2.019598935686936e-05, - "loss": 0.0252, + "epoch": 1.11, + "learning_rate": 0.00013303536276034774, + "loss": 0.0337, "step": 172460 }, { - "epoch": 1.87, - "learning_rate": 2.0179765072360307e-05, - "loss": 0.0231, + "epoch": 1.11, + "learning_rate": 0.00013302568140599082, + "loss": 0.0366, "step": 172470 }, { - "epoch": 1.87, - "learning_rate": 2.0163540787851254e-05, - "loss": 0.0209, + "epoch": 1.11, + "learning_rate": 0.00013301600005163387, + "loss": 0.037, "step": 172480 }, { - "epoch": 1.87, - "learning_rate": 2.01473165033422e-05, - "loss": 0.0225, + "epoch": 1.11, + "learning_rate": 0.00013300631869727695, + "loss": 0.029, "step": 172490 }, { - "epoch": 1.87, - "learning_rate": 2.0131092218833146e-05, - "loss": 0.0224, + "epoch": 1.11, + "learning_rate": 0.00013299663734292, + "loss": 0.033, "step": 172500 }, { - "epoch": 1.87, - "learning_rate": 2.0114867934324093e-05, - "loss": 0.0256, + "epoch": 1.11, + "learning_rate": 0.00013298695598856308, + "loss": 0.0299, "step": 172510 }, { - "epoch": 1.87, - "learning_rate": 2.0098643649815043e-05, - "loss": 0.0197, + "epoch": 1.11, + "learning_rate": 0.00013297727463420616, + "loss": 0.0368, "step": 172520 }, { - "epoch": 1.87, - "learning_rate": 2.008241936530599e-05, - "loss": 0.0266, + "epoch": 1.11, + "learning_rate": 0.00013296759327984921, + "loss": 0.0333, "step": 172530 }, { - "epoch": 1.87, - "learning_rate": 2.0066195080796935e-05, - "loss": 0.0179, + "epoch": 1.11, + "learning_rate": 0.0001329579119254923, + "loss": 0.0322, "step": 172540 }, { - "epoch": 1.87, - "learning_rate": 2.0049970796287882e-05, - "loss": 0.0271, + "epoch": 1.11, + "learning_rate": 0.00013294823057113535, + "loss": 0.0424, "step": 172550 }, { - "epoch": 1.87, - "learning_rate": 2.0033746511778828e-05, - "loss": 0.0244, + "epoch": 1.11, + "learning_rate": 0.00013293854921677843, + "loss": 0.0355, "step": 172560 }, { - "epoch": 1.87, - "learning_rate": 2.0017522227269775e-05, - "loss": 0.02, + "epoch": 1.11, + "learning_rate": 0.00013292886786242148, + "loss": 0.032, "step": 172570 }, { - "epoch": 1.87, - "learning_rate": 2.000129794276072e-05, - "loss": 0.0243, + "epoch": 1.11, + "learning_rate": 0.00013291918650806456, + "loss": 0.0361, "step": 172580 }, { - "epoch": 1.87, - "learning_rate": 1.9985073658251667e-05, - "loss": 0.0269, + "epoch": 1.11, + "learning_rate": 0.00013290950515370764, + "loss": 0.0268, "step": 172590 }, { - "epoch": 1.87, - "learning_rate": 1.9968849373742614e-05, - "loss": 0.0234, + "epoch": 1.11, + "learning_rate": 0.0001328998237993507, + "loss": 0.0348, "step": 172600 }, { - "epoch": 1.87, - "learning_rate": 1.9952625089233563e-05, - "loss": 0.0235, + "epoch": 1.11, + "learning_rate": 0.00013289014244499374, + "loss": 0.0307, "step": 172610 }, { - "epoch": 1.87, - "learning_rate": 1.993640080472451e-05, - "loss": 0.0266, + "epoch": 1.11, + "learning_rate": 0.00013288046109063682, + "loss": 0.0349, "step": 172620 }, { - "epoch": 1.87, - "learning_rate": 1.9920176520215456e-05, - "loss": 0.0254, + "epoch": 1.11, + "learning_rate": 0.0001328707797362799, + "loss": 0.0331, "step": 172630 }, { - "epoch": 1.87, - "learning_rate": 1.9903952235706403e-05, - "loss": 0.0223, + "epoch": 1.11, + "learning_rate": 0.00013286109838192296, + "loss": 0.0335, "step": 172640 }, { - "epoch": 1.87, - "learning_rate": 1.988772795119735e-05, - "loss": 0.023, + "epoch": 1.11, + "learning_rate": 0.00013285141702756604, + "loss": 0.0404, "step": 172650 }, { - "epoch": 1.87, - "learning_rate": 1.9871503666688295e-05, - "loss": 0.0232, + "epoch": 1.11, + "learning_rate": 0.00013284173567320912, + "loss": 0.037, "step": 172660 }, { - "epoch": 1.87, - "learning_rate": 1.9855279382179242e-05, - "loss": 0.0276, + "epoch": 1.11, + "learning_rate": 0.00013283205431885217, + "loss": 0.0353, "step": 172670 }, { - "epoch": 1.87, - "learning_rate": 1.9839055097670188e-05, - "loss": 0.0283, + "epoch": 1.11, + "learning_rate": 0.00013282237296449522, + "loss": 0.0416, "step": 172680 }, { - "epoch": 1.87, - "learning_rate": 1.9822830813161138e-05, - "loss": 0.0262, + "epoch": 1.11, + "learning_rate": 0.0001328126916101383, + "loss": 0.0286, "step": 172690 }, { - "epoch": 1.87, - "learning_rate": 1.9806606528652084e-05, - "loss": 0.0282, + "epoch": 1.11, + "learning_rate": 0.00013280301025578138, + "loss": 0.034, "step": 172700 }, { - "epoch": 1.87, - "learning_rate": 1.979038224414303e-05, - "loss": 0.0224, + "epoch": 1.11, + "learning_rate": 0.00013279332890142443, + "loss": 0.0373, "step": 172710 }, { - "epoch": 1.87, - "learning_rate": 1.9774157959633977e-05, - "loss": 0.0214, + "epoch": 1.11, + "learning_rate": 0.00013278364754706751, + "loss": 0.0348, "step": 172720 }, { - "epoch": 1.87, - "learning_rate": 1.9757933675124923e-05, - "loss": 0.0251, + "epoch": 1.11, + "learning_rate": 0.00013277396619271057, + "loss": 0.0323, "step": 172730 }, { - "epoch": 1.87, - "learning_rate": 1.974170939061587e-05, - "loss": 0.022, + "epoch": 1.11, + "learning_rate": 0.00013276428483835365, + "loss": 0.0336, "step": 172740 }, { - "epoch": 1.87, - "learning_rate": 1.9725485106106816e-05, - "loss": 0.0247, + "epoch": 1.11, + "learning_rate": 0.0001327546034839967, + "loss": 0.034, "step": 172750 }, { - "epoch": 1.87, - "learning_rate": 1.9709260821597763e-05, - "loss": 0.0268, + "epoch": 1.12, + "learning_rate": 0.00013274492212963978, + "loss": 0.0408, "step": 172760 }, { - "epoch": 1.87, - "learning_rate": 1.9693036537088716e-05, - "loss": 0.0257, + "epoch": 1.12, + "learning_rate": 0.00013273524077528286, + "loss": 0.0348, "step": 172770 }, { - "epoch": 1.87, - "learning_rate": 1.9676812252579662e-05, - "loss": 0.0223, + "epoch": 1.12, + "learning_rate": 0.0001327255594209259, + "loss": 0.0354, "step": 172780 }, { - "epoch": 1.87, - "learning_rate": 1.966058796807061e-05, - "loss": 0.0268, + "epoch": 1.12, + "learning_rate": 0.000132715878066569, + "loss": 0.0308, "step": 172790 }, { - "epoch": 1.87, - "learning_rate": 1.9644363683561555e-05, - "loss": 0.0329, + "epoch": 1.12, + "learning_rate": 0.00013270619671221204, + "loss": 0.0386, "step": 172800 }, { - "epoch": 1.87, - "learning_rate": 1.96281393990525e-05, - "loss": 0.025, + "epoch": 1.12, + "learning_rate": 0.0001326965153578551, + "loss": 0.0378, "step": 172810 }, { - "epoch": 1.87, - "learning_rate": 1.9611915114543448e-05, - "loss": 0.023, + "epoch": 1.12, + "learning_rate": 0.00013268683400349818, + "loss": 0.0343, "step": 172820 }, { - "epoch": 1.87, - "learning_rate": 1.9595690830034394e-05, - "loss": 0.0226, + "epoch": 1.12, + "learning_rate": 0.00013267715264914126, + "loss": 0.0326, "step": 172830 }, { - "epoch": 1.87, - "learning_rate": 1.9579466545525344e-05, - "loss": 0.0222, + "epoch": 1.12, + "learning_rate": 0.00013266747129478434, + "loss": 0.0382, "step": 172840 }, { - "epoch": 1.87, - "learning_rate": 1.956324226101629e-05, - "loss": 0.0249, + "epoch": 1.12, + "learning_rate": 0.0001326577899404274, + "loss": 0.0342, "step": 172850 }, { - "epoch": 1.87, - "learning_rate": 1.9547017976507237e-05, - "loss": 0.0246, + "epoch": 1.12, + "learning_rate": 0.00013264810858607047, + "loss": 0.0324, "step": 172860 }, { - "epoch": 1.87, - "learning_rate": 1.9530793691998183e-05, - "loss": 0.0223, + "epoch": 1.12, + "learning_rate": 0.00013263842723171352, + "loss": 0.0348, "step": 172870 }, { - "epoch": 1.87, - "learning_rate": 1.951456940748913e-05, - "loss": 0.0282, + "epoch": 1.12, + "learning_rate": 0.00013262874587735657, + "loss": 0.0317, "step": 172880 }, { - "epoch": 1.87, - "learning_rate": 1.9498345122980076e-05, - "loss": 0.0236, + "epoch": 1.12, + "learning_rate": 0.00013261906452299965, + "loss": 0.0353, "step": 172890 }, { - "epoch": 1.87, - "learning_rate": 1.9482120838471022e-05, - "loss": 0.025, + "epoch": 1.12, + "learning_rate": 0.00013260938316864273, + "loss": 0.0375, "step": 172900 }, { - "epoch": 1.87, - "learning_rate": 1.946589655396197e-05, - "loss": 0.0227, + "epoch": 1.12, + "learning_rate": 0.0001325997018142858, + "loss": 0.0394, "step": 172910 }, { - "epoch": 1.87, - "learning_rate": 1.9449672269452915e-05, - "loss": 0.0228, + "epoch": 1.12, + "learning_rate": 0.00013259002045992887, + "loss": 0.0354, "step": 172920 }, { - "epoch": 1.87, - "learning_rate": 1.9433447984943865e-05, - "loss": 0.0271, + "epoch": 1.12, + "learning_rate": 0.00013258033910557192, + "loss": 0.0395, "step": 172930 }, { - "epoch": 1.87, - "learning_rate": 1.941722370043481e-05, - "loss": 0.0257, + "epoch": 1.12, + "learning_rate": 0.000132570657751215, + "loss": 0.0312, "step": 172940 }, { - "epoch": 1.87, - "learning_rate": 1.9400999415925757e-05, - "loss": 0.0218, + "epoch": 1.12, + "learning_rate": 0.00013256097639685805, + "loss": 0.0313, "step": 172950 }, { - "epoch": 1.87, - "learning_rate": 1.9384775131416704e-05, - "loss": 0.0237, + "epoch": 1.12, + "learning_rate": 0.00013255129504250113, + "loss": 0.0334, "step": 172960 }, { - "epoch": 1.87, - "learning_rate": 1.936855084690765e-05, - "loss": 0.0255, + "epoch": 1.12, + "learning_rate": 0.0001325416136881442, + "loss": 0.0323, "step": 172970 }, { - "epoch": 1.87, - "learning_rate": 1.9352326562398597e-05, - "loss": 0.0253, + "epoch": 1.12, + "learning_rate": 0.0001325319323337873, + "loss": 0.0309, "step": 172980 }, { - "epoch": 1.87, - "learning_rate": 1.9336102277889543e-05, - "loss": 0.0224, + "epoch": 1.12, + "learning_rate": 0.00013252225097943034, + "loss": 0.0355, "step": 172990 }, { - "epoch": 1.87, - "learning_rate": 1.931987799338049e-05, - "loss": 0.0282, + "epoch": 1.12, + "learning_rate": 0.0001325125696250734, + "loss": 0.033, "step": 173000 }, { - "epoch": 1.87, - "eval_cer": 0.9210324044379185, - "eval_loss": 0.020626498386263847, - "eval_runtime": 118.8752, - "eval_samples_per_second": 16.824, - "eval_steps_per_second": 4.206, + "epoch": 1.12, + "eval_cer": 0.9199412495763191, + "eval_loss": 0.023672111332416534, + "eval_runtime": 120.0714, + "eval_samples_per_second": 16.657, + "eval_steps_per_second": 4.164, "step": 173000 }, { - "epoch": 1.87, - "learning_rate": 1.930365370887144e-05, - "loss": 0.0275, + "epoch": 1.12, + "learning_rate": 0.00013250288827071648, + "loss": 0.0387, "step": 173010 }, { - "epoch": 1.87, - "learning_rate": 1.9287429424362385e-05, - "loss": 0.0223, + "epoch": 1.12, + "learning_rate": 0.00013249320691635953, + "loss": 0.0389, "step": 173020 }, { - "epoch": 1.87, - "learning_rate": 1.9271205139853332e-05, - "loss": 0.027, + "epoch": 1.12, + "learning_rate": 0.0001324835255620026, + "loss": 0.0371, "step": 173030 }, { - "epoch": 1.87, - "learning_rate": 1.9254980855344278e-05, - "loss": 0.0267, + "epoch": 1.12, + "learning_rate": 0.0001324738442076457, + "loss": 0.0329, "step": 173040 }, { - "epoch": 1.87, - "learning_rate": 1.9238756570835225e-05, - "loss": 0.0286, + "epoch": 1.12, + "learning_rate": 0.00013246416285328874, + "loss": 0.032, "step": 173050 }, { - "epoch": 1.87, - "learning_rate": 1.922253228632617e-05, - "loss": 0.02, + "epoch": 1.12, + "learning_rate": 0.00013245448149893182, + "loss": 0.0347, "step": 173060 }, { - "epoch": 1.87, - "learning_rate": 1.9206308001817117e-05, - "loss": 0.0263, + "epoch": 1.12, + "learning_rate": 0.00013244480014457487, + "loss": 0.0365, "step": 173070 }, { - "epoch": 1.87, - "learning_rate": 1.9190083717308064e-05, - "loss": 0.0224, + "epoch": 1.12, + "learning_rate": 0.00013243511879021795, + "loss": 0.0345, "step": 173080 }, { - "epoch": 1.87, - "learning_rate": 1.917385943279901e-05, - "loss": 0.0262, + "epoch": 1.12, + "learning_rate": 0.000132425437435861, + "loss": 0.0355, "step": 173090 }, { - "epoch": 1.87, - "learning_rate": 1.915763514828996e-05, - "loss": 0.027, + "epoch": 1.12, + "learning_rate": 0.00013241575608150409, + "loss": 0.0356, "step": 173100 }, { - "epoch": 1.87, - "learning_rate": 1.9141410863780906e-05, - "loss": 0.0206, + "epoch": 1.12, + "learning_rate": 0.00013240607472714716, + "loss": 0.0398, "step": 173110 }, { - "epoch": 1.87, - "learning_rate": 1.9125186579271853e-05, - "loss": 0.0237, + "epoch": 1.12, + "learning_rate": 0.00013239639337279022, + "loss": 0.0319, "step": 173120 }, { - "epoch": 1.87, - "learning_rate": 1.91089622947628e-05, - "loss": 0.0241, + "epoch": 1.12, + "learning_rate": 0.00013238671201843327, + "loss": 0.0371, "step": 173130 }, { - "epoch": 1.87, - "learning_rate": 1.9092738010253745e-05, - "loss": 0.0277, + "epoch": 1.12, + "learning_rate": 0.00013237703066407635, + "loss": 0.0308, "step": 173140 }, { - "epoch": 1.87, - "learning_rate": 1.9076513725744692e-05, - "loss": 0.0185, + "epoch": 1.12, + "learning_rate": 0.00013236734930971943, + "loss": 0.0365, "step": 173150 }, { - "epoch": 1.87, - "learning_rate": 1.9060289441235638e-05, - "loss": 0.0199, + "epoch": 1.12, + "learning_rate": 0.00013235766795536248, + "loss": 0.0377, "step": 173160 }, { - "epoch": 1.87, - "learning_rate": 1.9044065156726585e-05, - "loss": 0.029, + "epoch": 1.12, + "learning_rate": 0.00013234798660100556, + "loss": 0.0335, "step": 173170 }, { - "epoch": 1.87, - "learning_rate": 1.9027840872217534e-05, - "loss": 0.024, + "epoch": 1.12, + "learning_rate": 0.00013233830524664864, + "loss": 0.0315, "step": 173180 }, { - "epoch": 1.87, - "learning_rate": 1.901161658770848e-05, - "loss": 0.023, + "epoch": 1.12, + "learning_rate": 0.0001323286238922917, + "loss": 0.0314, "step": 173190 }, { - "epoch": 1.87, - "learning_rate": 1.8995392303199427e-05, - "loss": 0.0276, + "epoch": 1.12, + "learning_rate": 0.00013231894253793475, + "loss": 0.0288, "step": 173200 }, { - "epoch": 1.87, - "learning_rate": 1.8979168018690374e-05, - "loss": 0.0286, + "epoch": 1.12, + "learning_rate": 0.00013230926118357783, + "loss": 0.0351, "step": 173210 }, { - "epoch": 1.87, - "learning_rate": 1.896294373418132e-05, - "loss": 0.0272, + "epoch": 1.12, + "learning_rate": 0.0001322995798292209, + "loss": 0.0331, "step": 173220 }, { - "epoch": 1.87, - "learning_rate": 1.8946719449672266e-05, - "loss": 0.0258, + "epoch": 1.12, + "learning_rate": 0.00013228989847486396, + "loss": 0.0327, "step": 173230 }, { - "epoch": 1.87, - "learning_rate": 1.8930495165163213e-05, - "loss": 0.026, + "epoch": 1.12, + "learning_rate": 0.00013228021712050704, + "loss": 0.0307, "step": 173240 }, { - "epoch": 1.87, - "learning_rate": 1.891427088065416e-05, - "loss": 0.0266, + "epoch": 1.12, + "learning_rate": 0.0001322705357661501, + "loss": 0.0275, "step": 173250 }, { - "epoch": 1.87, - "learning_rate": 1.8898046596145105e-05, - "loss": 0.0214, + "epoch": 1.12, + "learning_rate": 0.00013226085441179317, + "loss": 0.0314, "step": 173260 }, { - "epoch": 1.87, - "learning_rate": 1.8881822311636055e-05, - "loss": 0.0239, + "epoch": 1.12, + "learning_rate": 0.00013225117305743622, + "loss": 0.0328, "step": 173270 }, { - "epoch": 1.87, - "learning_rate": 1.8865598027127e-05, - "loss": 0.0318, + "epoch": 1.12, + "learning_rate": 0.0001322414917030793, + "loss": 0.032, "step": 173280 }, { - "epoch": 1.87, - "learning_rate": 1.8849373742617948e-05, - "loss": 0.0239, + "epoch": 1.12, + "learning_rate": 0.00013223181034872238, + "loss": 0.0373, "step": 173290 }, { - "epoch": 1.87, - "learning_rate": 1.8833149458108894e-05, - "loss": 0.0244, + "epoch": 1.12, + "learning_rate": 0.00013222212899436544, + "loss": 0.0327, "step": 173300 }, { - "epoch": 1.87, - "learning_rate": 1.881692517359984e-05, - "loss": 0.0245, + "epoch": 1.12, + "learning_rate": 0.00013221244764000852, + "loss": 0.0365, "step": 173310 }, { - "epoch": 1.87, - "learning_rate": 1.8800700889090787e-05, - "loss": 0.023, + "epoch": 1.12, + "learning_rate": 0.00013220276628565157, + "loss": 0.0356, "step": 173320 }, { - "epoch": 1.87, - "learning_rate": 1.8784476604581733e-05, - "loss": 0.0216, + "epoch": 1.12, + "learning_rate": 0.00013219308493129465, + "loss": 0.0333, "step": 173330 }, { - "epoch": 1.87, - "learning_rate": 1.876825232007268e-05, - "loss": 0.0254, + "epoch": 1.12, + "learning_rate": 0.0001321834035769377, + "loss": 0.0352, "step": 173340 }, { - "epoch": 1.87, - "learning_rate": 1.8752028035563626e-05, - "loss": 0.0219, + "epoch": 1.12, + "learning_rate": 0.00013217372222258078, + "loss": 0.0323, "step": 173350 }, { - "epoch": 1.88, - "learning_rate": 1.8735803751054576e-05, - "loss": 0.0245, + "epoch": 1.12, + "learning_rate": 0.00013216404086822386, + "loss": 0.0372, "step": 173360 }, { - "epoch": 1.88, - "learning_rate": 1.8719579466545522e-05, - "loss": 0.0201, + "epoch": 1.12, + "learning_rate": 0.00013215435951386691, + "loss": 0.0342, "step": 173370 }, { - "epoch": 1.88, - "learning_rate": 1.870335518203647e-05, - "loss": 0.0256, + "epoch": 1.12, + "learning_rate": 0.00013214467815951, + "loss": 0.0358, "step": 173380 }, { - "epoch": 1.88, - "learning_rate": 1.868713089752742e-05, - "loss": 0.0299, + "epoch": 1.12, + "learning_rate": 0.00013213499680515305, + "loss": 0.0349, "step": 173390 }, { - "epoch": 1.88, - "learning_rate": 1.8670906613018365e-05, - "loss": 0.0187, + "epoch": 1.12, + "learning_rate": 0.00013212531545079613, + "loss": 0.0345, "step": 173400 }, { - "epoch": 1.88, - "learning_rate": 1.865468232850931e-05, - "loss": 0.0218, + "epoch": 1.12, + "learning_rate": 0.00013211563409643918, + "loss": 0.0321, "step": 173410 }, { - "epoch": 1.88, - "learning_rate": 1.8638458044000258e-05, - "loss": 0.0302, + "epoch": 1.12, + "learning_rate": 0.00013210595274208226, + "loss": 0.0299, "step": 173420 }, { - "epoch": 1.88, - "learning_rate": 1.8622233759491204e-05, - "loss": 0.0207, + "epoch": 1.12, + "learning_rate": 0.00013209627138772534, + "loss": 0.0345, "step": 173430 }, { - "epoch": 1.88, - "learning_rate": 1.860600947498215e-05, - "loss": 0.0233, + "epoch": 1.12, + "learning_rate": 0.0001320865900333684, + "loss": 0.0334, "step": 173440 }, { - "epoch": 1.88, - "learning_rate": 1.8589785190473097e-05, - "loss": 0.0234, + "epoch": 1.12, + "learning_rate": 0.00013207690867901144, + "loss": 0.0281, "step": 173450 }, { - "epoch": 1.88, - "learning_rate": 1.8573560905964043e-05, - "loss": 0.0243, + "epoch": 1.12, + "learning_rate": 0.00013206722732465452, + "loss": 0.0302, "step": 173460 }, { - "epoch": 1.88, - "learning_rate": 1.8557336621454993e-05, - "loss": 0.0258, + "epoch": 1.12, + "learning_rate": 0.0001320575459702976, + "loss": 0.0295, "step": 173470 }, { - "epoch": 1.88, - "learning_rate": 1.854111233694594e-05, - "loss": 0.022, + "epoch": 1.12, + "learning_rate": 0.00013204786461594066, + "loss": 0.0344, "step": 173480 }, { - "epoch": 1.88, - "learning_rate": 1.8524888052436886e-05, - "loss": 0.0232, + "epoch": 1.12, + "learning_rate": 0.00013203818326158374, + "loss": 0.0352, "step": 173490 }, { - "epoch": 1.88, - "learning_rate": 1.8508663767927832e-05, - "loss": 0.0261, + "epoch": 1.12, + "learning_rate": 0.00013202850190722682, + "loss": 0.0314, "step": 173500 }, { - "epoch": 1.88, - "learning_rate": 1.8492439483418782e-05, - "loss": 0.0294, + "epoch": 1.12, + "learning_rate": 0.00013201882055286987, + "loss": 0.0426, "step": 173510 }, { - "epoch": 1.88, - "learning_rate": 1.8476215198909728e-05, - "loss": 0.0254, + "epoch": 1.12, + "learning_rate": 0.00013200913919851292, + "loss": 0.033, "step": 173520 }, { - "epoch": 1.88, - "learning_rate": 1.8459990914400675e-05, - "loss": 0.0277, + "epoch": 1.12, + "learning_rate": 0.000131999457844156, + "loss": 0.0363, "step": 173530 }, { - "epoch": 1.88, - "learning_rate": 1.844376662989162e-05, - "loss": 0.0268, + "epoch": 1.12, + "learning_rate": 0.00013198977648979908, + "loss": 0.0371, "step": 173540 }, { - "epoch": 1.88, - "learning_rate": 1.8427542345382567e-05, - "loss": 0.026, + "epoch": 1.12, + "learning_rate": 0.00013198009513544213, + "loss": 0.0359, "step": 173550 }, { - "epoch": 1.88, - "learning_rate": 1.8411318060873514e-05, - "loss": 0.027, + "epoch": 1.12, + "learning_rate": 0.0001319704137810852, + "loss": 0.0368, "step": 173560 }, { - "epoch": 1.88, - "learning_rate": 1.839509377636446e-05, - "loss": 0.0188, + "epoch": 1.12, + "learning_rate": 0.00013196073242672827, + "loss": 0.0345, "step": 173570 }, { - "epoch": 1.88, - "learning_rate": 1.8378869491855407e-05, - "loss": 0.0252, + "epoch": 1.12, + "learning_rate": 0.00013195105107237135, + "loss": 0.0341, "step": 173580 }, { - "epoch": 1.88, - "learning_rate": 1.8362645207346356e-05, - "loss": 0.0264, + "epoch": 1.12, + "learning_rate": 0.0001319413697180144, + "loss": 0.0335, "step": 173590 }, { - "epoch": 1.88, - "learning_rate": 1.8346420922837303e-05, - "loss": 0.027, + "epoch": 1.12, + "learning_rate": 0.00013193168836365748, + "loss": 0.0358, "step": 173600 }, { - "epoch": 1.88, - "learning_rate": 1.833019663832825e-05, - "loss": 0.0182, + "epoch": 1.12, + "learning_rate": 0.00013192200700930056, + "loss": 0.0286, "step": 173610 }, { - "epoch": 1.88, - "learning_rate": 1.8313972353819196e-05, - "loss": 0.0276, + "epoch": 1.12, + "learning_rate": 0.0001319123256549436, + "loss": 0.0321, "step": 173620 }, { - "epoch": 1.88, - "learning_rate": 1.8297748069310142e-05, - "loss": 0.0295, + "epoch": 1.12, + "learning_rate": 0.0001319026443005867, + "loss": 0.0282, "step": 173630 }, { - "epoch": 1.88, - "learning_rate": 1.8281523784801088e-05, - "loss": 0.0247, + "epoch": 1.12, + "learning_rate": 0.00013189296294622974, + "loss": 0.0333, "step": 173640 }, { - "epoch": 1.88, - "learning_rate": 1.8265299500292035e-05, - "loss": 0.0224, + "epoch": 1.12, + "learning_rate": 0.0001318832815918728, + "loss": 0.033, "step": 173650 }, { - "epoch": 1.88, - "learning_rate": 1.824907521578298e-05, - "loss": 0.0292, + "epoch": 1.12, + "learning_rate": 0.00013187360023751588, + "loss": 0.032, "step": 173660 }, { - "epoch": 1.88, - "learning_rate": 1.8232850931273927e-05, - "loss": 0.0258, + "epoch": 1.12, + "learning_rate": 0.00013186391888315896, + "loss": 0.0301, "step": 173670 }, { - "epoch": 1.88, - "learning_rate": 1.8216626646764877e-05, - "loss": 0.0268, + "epoch": 1.12, + "learning_rate": 0.00013185423752880204, + "loss": 0.0303, "step": 173680 }, { - "epoch": 1.88, - "learning_rate": 1.8200402362255824e-05, - "loss": 0.024, - "step": 173690 + "epoch": 1.12, + "learning_rate": 0.0001318445561744451, + "loss": 0.0378, + "step": 173690 }, { - "epoch": 1.88, - "learning_rate": 1.818417807774677e-05, - "loss": 0.0177, + "epoch": 1.12, + "learning_rate": 0.00013183487482008817, + "loss": 0.0328, "step": 173700 }, { - "epoch": 1.88, - "learning_rate": 1.8167953793237716e-05, - "loss": 0.0216, + "epoch": 1.12, + "learning_rate": 0.00013182519346573122, + "loss": 0.0338, "step": 173710 }, { - "epoch": 1.88, - "learning_rate": 1.8151729508728663e-05, - "loss": 0.0252, + "epoch": 1.12, + "learning_rate": 0.00013181551211137427, + "loss": 0.0294, "step": 173720 }, { - "epoch": 1.88, - "learning_rate": 1.813550522421961e-05, - "loss": 0.023, + "epoch": 1.12, + "learning_rate": 0.00013180583075701735, + "loss": 0.0325, "step": 173730 }, { - "epoch": 1.88, - "learning_rate": 1.8119280939710555e-05, - "loss": 0.0254, + "epoch": 1.12, + "learning_rate": 0.00013179614940266043, + "loss": 0.0297, "step": 173740 }, { - "epoch": 1.88, - "learning_rate": 1.8103056655201502e-05, - "loss": 0.0296, + "epoch": 1.12, + "learning_rate": 0.0001317864680483035, + "loss": 0.0367, "step": 173750 }, { - "epoch": 1.88, - "learning_rate": 1.808683237069245e-05, - "loss": 0.0273, + "epoch": 1.12, + "learning_rate": 0.00013177678669394657, + "loss": 0.0339, "step": 173760 }, { - "epoch": 1.88, - "learning_rate": 1.8070608086183398e-05, - "loss": 0.03, + "epoch": 1.12, + "learning_rate": 0.00013176710533958962, + "loss": 0.0341, "step": 173770 }, { - "epoch": 1.88, - "learning_rate": 1.8054383801674344e-05, - "loss": 0.0192, + "epoch": 1.12, + "learning_rate": 0.0001317574239852327, + "loss": 0.0347, "step": 173780 }, { - "epoch": 1.88, - "learning_rate": 1.803815951716529e-05, - "loss": 0.0233, + "epoch": 1.12, + "learning_rate": 0.00013174774263087575, + "loss": 0.0312, "step": 173790 }, { - "epoch": 1.88, - "learning_rate": 1.802193523265624e-05, - "loss": 0.0216, + "epoch": 1.12, + "learning_rate": 0.00013173806127651883, + "loss": 0.0367, "step": 173800 }, { - "epoch": 1.88, - "learning_rate": 1.8005710948147187e-05, - "loss": 0.0262, + "epoch": 1.12, + "learning_rate": 0.0001317283799221619, + "loss": 0.0366, "step": 173810 }, { - "epoch": 1.88, - "learning_rate": 1.7989486663638133e-05, - "loss": 0.0227, + "epoch": 1.12, + "learning_rate": 0.00013171869856780496, + "loss": 0.0316, "step": 173820 }, { - "epoch": 1.88, - "learning_rate": 1.797326237912908e-05, - "loss": 0.0253, + "epoch": 1.12, + "learning_rate": 0.00013170901721344804, + "loss": 0.0329, "step": 173830 }, { - "epoch": 1.88, - "learning_rate": 1.7957038094620026e-05, - "loss": 0.0241, + "epoch": 1.12, + "learning_rate": 0.0001316993358590911, + "loss": 0.0327, "step": 173840 }, { - "epoch": 1.88, - "learning_rate": 1.7940813810110972e-05, - "loss": 0.0256, + "epoch": 1.12, + "learning_rate": 0.00013168965450473417, + "loss": 0.0364, "step": 173850 }, { - "epoch": 1.88, - "learning_rate": 1.792458952560192e-05, - "loss": 0.0258, + "epoch": 1.12, + "learning_rate": 0.00013167997315037723, + "loss": 0.0363, "step": 173860 }, { - "epoch": 1.88, - "learning_rate": 1.7908365241092865e-05, - "loss": 0.0225, + "epoch": 1.12, + "learning_rate": 0.0001316702917960203, + "loss": 0.027, "step": 173870 }, { - "epoch": 1.88, - "learning_rate": 1.7892140956583815e-05, - "loss": 0.0236, + "epoch": 1.12, + "learning_rate": 0.0001316606104416634, + "loss": 0.0358, "step": 173880 }, { - "epoch": 1.88, - "learning_rate": 1.787591667207476e-05, - "loss": 0.024, + "epoch": 1.12, + "learning_rate": 0.00013165092908730644, + "loss": 0.0326, "step": 173890 }, { - "epoch": 1.88, - "learning_rate": 1.7859692387565708e-05, - "loss": 0.0219, + "epoch": 1.12, + "learning_rate": 0.00013164124773294952, + "loss": 0.0351, "step": 173900 }, { - "epoch": 1.88, - "learning_rate": 1.7843468103056654e-05, - "loss": 0.023, + "epoch": 1.12, + "learning_rate": 0.00013163156637859257, + "loss": 0.0355, "step": 173910 }, { - "epoch": 1.88, - "learning_rate": 1.78272438185476e-05, - "loss": 0.0225, + "epoch": 1.12, + "learning_rate": 0.00013162188502423565, + "loss": 0.0325, "step": 173920 }, { - "epoch": 1.88, - "learning_rate": 1.7811019534038547e-05, - "loss": 0.0225, + "epoch": 1.12, + "learning_rate": 0.0001316122036698787, + "loss": 0.0319, "step": 173930 }, { - "epoch": 1.88, - "learning_rate": 1.7794795249529493e-05, - "loss": 0.0237, + "epoch": 1.12, + "learning_rate": 0.00013160252231552178, + "loss": 0.038, "step": 173940 }, { - "epoch": 1.88, - "learning_rate": 1.777857096502044e-05, - "loss": 0.0239, + "epoch": 1.12, + "learning_rate": 0.00013159284096116486, + "loss": 0.0319, "step": 173950 }, { - "epoch": 1.88, - "learning_rate": 1.7762346680511386e-05, - "loss": 0.027, + "epoch": 1.12, + "learning_rate": 0.00013158315960680792, + "loss": 0.0368, "step": 173960 }, { - "epoch": 1.88, - "learning_rate": 1.7746122396002336e-05, - "loss": 0.0244, + "epoch": 1.12, + "learning_rate": 0.00013157347825245097, + "loss": 0.036, "step": 173970 }, { - "epoch": 1.88, - "learning_rate": 1.7729898111493282e-05, - "loss": 0.0209, + "epoch": 1.12, + "learning_rate": 0.00013156379689809405, + "loss": 0.0406, "step": 173980 }, { - "epoch": 1.88, - "learning_rate": 1.771367382698423e-05, - "loss": 0.0221, + "epoch": 1.12, + "learning_rate": 0.00013155411554373713, + "loss": 0.034, "step": 173990 }, { - "epoch": 1.88, - "learning_rate": 1.7697449542475175e-05, - "loss": 0.0234, + "epoch": 1.12, + "learning_rate": 0.00013154443418938018, + "loss": 0.0339, "step": 174000 }, { - "epoch": 1.88, - "eval_cer": 0.9210792291069211, - "eval_loss": 0.020512666553258896, - "eval_runtime": 118.9491, - "eval_samples_per_second": 16.814, - "eval_steps_per_second": 4.203, + "epoch": 1.12, + "eval_cer": 0.9199159417015027, + "eval_loss": 0.0237259678542614, + "eval_runtime": 120.3788, + "eval_samples_per_second": 16.614, + "eval_steps_per_second": 4.154, "step": 174000 }, { - "epoch": 1.88, - "learning_rate": 1.768122525796612e-05, - "loss": 0.0274, + "epoch": 1.12, + "learning_rate": 0.00013153475283502326, + "loss": 0.0352, "step": 174010 }, { - "epoch": 1.88, - "learning_rate": 1.7665000973457068e-05, - "loss": 0.0275, + "epoch": 1.12, + "learning_rate": 0.00013152507148066631, + "loss": 0.034, "step": 174020 }, { - "epoch": 1.88, - "learning_rate": 1.7648776688948014e-05, - "loss": 0.026, + "epoch": 1.12, + "learning_rate": 0.0001315153901263094, + "loss": 0.0366, "step": 174030 }, { - "epoch": 1.88, - "learning_rate": 1.763255240443896e-05, - "loss": 0.0242, + "epoch": 1.12, + "learning_rate": 0.00013150570877195245, + "loss": 0.0344, "step": 174040 }, { - "epoch": 1.88, - "learning_rate": 1.761632811992991e-05, - "loss": 0.0291, + "epoch": 1.12, + "learning_rate": 0.00013149602741759553, + "loss": 0.0332, "step": 174050 }, { - "epoch": 1.88, - "learning_rate": 1.7600103835420857e-05, - "loss": 0.0269, + "epoch": 1.12, + "learning_rate": 0.0001314863460632386, + "loss": 0.0311, "step": 174060 }, { - "epoch": 1.88, - "learning_rate": 1.7583879550911803e-05, - "loss": 0.022, + "epoch": 1.12, + "learning_rate": 0.00013147666470888166, + "loss": 0.0377, "step": 174070 }, { - "epoch": 1.88, - "learning_rate": 1.756765526640275e-05, - "loss": 0.0247, + "epoch": 1.12, + "learning_rate": 0.00013146698335452474, + "loss": 0.034, "step": 174080 }, { - "epoch": 1.88, - "learning_rate": 1.75514309818937e-05, - "loss": 0.0212, + "epoch": 1.12, + "learning_rate": 0.0001314573020001678, + "loss": 0.0359, "step": 174090 }, { - "epoch": 1.88, - "learning_rate": 1.7535206697384646e-05, - "loss": 0.028, + "epoch": 1.12, + "learning_rate": 0.00013144762064581087, + "loss": 0.0361, "step": 174100 }, { - "epoch": 1.88, - "learning_rate": 1.7518982412875592e-05, - "loss": 0.0244, + "epoch": 1.12, + "learning_rate": 0.00013143793929145392, + "loss": 0.0343, "step": 174110 }, { - "epoch": 1.88, - "learning_rate": 1.750275812836654e-05, - "loss": 0.0273, + "epoch": 1.12, + "learning_rate": 0.000131428257937097, + "loss": 0.0348, "step": 174120 }, { - "epoch": 1.88, - "learning_rate": 1.7486533843857485e-05, - "loss": 0.0175, + "epoch": 1.12, + "learning_rate": 0.00013141857658274008, + "loss": 0.0363, "step": 174130 }, { - "epoch": 1.88, - "learning_rate": 1.747030955934843e-05, - "loss": 0.0247, + "epoch": 1.12, + "learning_rate": 0.00013140889522838314, + "loss": 0.0383, "step": 174140 }, { - "epoch": 1.88, - "learning_rate": 1.7454085274839378e-05, - "loss": 0.0261, + "epoch": 1.12, + "learning_rate": 0.00013139921387402622, + "loss": 0.0319, "step": 174150 }, { - "epoch": 1.88, - "learning_rate": 1.7437860990330324e-05, - "loss": 0.0226, + "epoch": 1.12, + "learning_rate": 0.00013138953251966927, + "loss": 0.0326, "step": 174160 }, { - "epoch": 1.88, - "learning_rate": 1.7421636705821274e-05, - "loss": 0.0223, + "epoch": 1.12, + "learning_rate": 0.00013137985116531232, + "loss": 0.0366, "step": 174170 }, { - "epoch": 1.88, - "learning_rate": 1.740541242131222e-05, - "loss": 0.0231, + "epoch": 1.12, + "learning_rate": 0.0001313701698109554, + "loss": 0.0302, "step": 174180 }, { - "epoch": 1.88, - "learning_rate": 1.7389188136803166e-05, - "loss": 0.0256, + "epoch": 1.12, + "learning_rate": 0.00013136048845659848, + "loss": 0.0372, "step": 174190 }, { - "epoch": 1.88, - "learning_rate": 1.7372963852294113e-05, - "loss": 0.0232, + "epoch": 1.12, + "learning_rate": 0.00013135080710224156, + "loss": 0.0339, "step": 174200 }, { - "epoch": 1.88, - "learning_rate": 1.735673956778506e-05, - "loss": 0.0253, + "epoch": 1.12, + "learning_rate": 0.00013134112574788461, + "loss": 0.0316, "step": 174210 }, { - "epoch": 1.88, - "learning_rate": 1.7340515283276006e-05, - "loss": 0.0246, + "epoch": 1.12, + "learning_rate": 0.00013133144439352767, + "loss": 0.0332, "step": 174220 }, { - "epoch": 1.88, - "learning_rate": 1.7324290998766952e-05, - "loss": 0.0256, + "epoch": 1.12, + "learning_rate": 0.00013132176303917075, + "loss": 0.0353, "step": 174230 }, { - "epoch": 1.88, - "learning_rate": 1.73080667142579e-05, - "loss": 0.0218, + "epoch": 1.12, + "learning_rate": 0.0001313120816848138, + "loss": 0.0442, "step": 174240 }, { - "epoch": 1.88, - "learning_rate": 1.7291842429748848e-05, - "loss": 0.0226, + "epoch": 1.12, + "learning_rate": 0.00013130240033045688, + "loss": 0.0302, "step": 174250 }, { - "epoch": 1.88, - "learning_rate": 1.7275618145239794e-05, - "loss": 0.0251, + "epoch": 1.12, + "learning_rate": 0.00013129271897609996, + "loss": 0.0368, "step": 174260 }, { - "epoch": 1.88, - "learning_rate": 1.725939386073074e-05, - "loss": 0.0243, + "epoch": 1.12, + "learning_rate": 0.00013128303762174304, + "loss": 0.0331, "step": 174270 }, { - "epoch": 1.89, - "learning_rate": 1.7243169576221687e-05, - "loss": 0.0251, + "epoch": 1.12, + "learning_rate": 0.0001312733562673861, + "loss": 0.043, "step": 174280 }, { - "epoch": 1.89, - "learning_rate": 1.7226945291712634e-05, - "loss": 0.022, + "epoch": 1.12, + "learning_rate": 0.00013126367491302914, + "loss": 0.0365, "step": 174290 }, { - "epoch": 1.89, - "learning_rate": 1.721072100720358e-05, - "loss": 0.023, + "epoch": 1.12, + "learning_rate": 0.00013125399355867222, + "loss": 0.0367, "step": 174300 }, { - "epoch": 1.89, - "learning_rate": 1.7194496722694526e-05, - "loss": 0.0295, + "epoch": 1.13, + "learning_rate": 0.00013124431220431528, + "loss": 0.0319, "step": 174310 }, { - "epoch": 1.89, - "learning_rate": 1.7178272438185473e-05, - "loss": 0.0241, + "epoch": 1.13, + "learning_rate": 0.00013123463084995836, + "loss": 0.0333, "step": 174320 }, { - "epoch": 1.89, - "learning_rate": 1.716204815367642e-05, - "loss": 0.0311, + "epoch": 1.13, + "learning_rate": 0.00013122494949560144, + "loss": 0.034, "step": 174330 }, { - "epoch": 1.89, - "learning_rate": 1.714582386916737e-05, - "loss": 0.0217, + "epoch": 1.13, + "learning_rate": 0.0001312152681412445, + "loss": 0.0295, "step": 174340 }, { - "epoch": 1.89, - "learning_rate": 1.7129599584658315e-05, - "loss": 0.0259, + "epoch": 1.13, + "learning_rate": 0.00013120558678688757, + "loss": 0.0365, "step": 174350 }, { - "epoch": 1.89, - "learning_rate": 1.7113375300149262e-05, - "loss": 0.0252, + "epoch": 1.13, + "learning_rate": 0.00013119590543253062, + "loss": 0.0343, "step": 174360 }, { - "epoch": 1.89, - "learning_rate": 1.7097151015640208e-05, - "loss": 0.03, + "epoch": 1.13, + "learning_rate": 0.0001311862240781737, + "loss": 0.0302, "step": 174370 }, { - "epoch": 1.89, - "learning_rate": 1.7080926731131158e-05, - "loss": 0.0222, + "epoch": 1.13, + "learning_rate": 0.00013117654272381675, + "loss": 0.0328, "step": 174380 }, { - "epoch": 1.89, - "learning_rate": 1.7064702446622104e-05, - "loss": 0.0252, + "epoch": 1.13, + "learning_rate": 0.00013116686136945983, + "loss": 0.0348, "step": 174390 }, { - "epoch": 1.89, - "learning_rate": 1.704847816211305e-05, - "loss": 0.0285, + "epoch": 1.13, + "learning_rate": 0.0001311571800151029, + "loss": 0.0378, "step": 174400 }, { - "epoch": 1.89, - "learning_rate": 1.7032253877603997e-05, - "loss": 0.0268, + "epoch": 1.13, + "learning_rate": 0.00013114749866074597, + "loss": 0.0356, "step": 174410 }, { - "epoch": 1.89, - "learning_rate": 1.7016029593094943e-05, - "loss": 0.0265, + "epoch": 1.13, + "learning_rate": 0.00013113781730638902, + "loss": 0.0313, "step": 174420 }, { - "epoch": 1.89, - "learning_rate": 1.699980530858589e-05, - "loss": 0.023, + "epoch": 1.13, + "learning_rate": 0.0001311281359520321, + "loss": 0.0357, "step": 174430 }, { - "epoch": 1.89, - "learning_rate": 1.6983581024076836e-05, - "loss": 0.0215, + "epoch": 1.13, + "learning_rate": 0.00013111845459767518, + "loss": 0.0483, "step": 174440 }, { - "epoch": 1.89, - "learning_rate": 1.6967356739567783e-05, - "loss": 0.0269, + "epoch": 1.13, + "learning_rate": 0.00013110877324331823, + "loss": 0.0275, "step": 174450 }, { - "epoch": 1.89, - "learning_rate": 1.6951132455058732e-05, - "loss": 0.031, + "epoch": 1.13, + "learning_rate": 0.0001310990918889613, + "loss": 0.0361, "step": 174460 }, { - "epoch": 1.89, - "learning_rate": 1.693490817054968e-05, - "loss": 0.0247, + "epoch": 1.13, + "learning_rate": 0.0001310894105346044, + "loss": 0.0319, "step": 174470 }, { - "epoch": 1.89, - "learning_rate": 1.6918683886040625e-05, - "loss": 0.0251, + "epoch": 1.13, + "learning_rate": 0.00013107972918024744, + "loss": 0.0294, "step": 174480 }, { - "epoch": 1.89, - "learning_rate": 1.690245960153157e-05, - "loss": 0.0265, + "epoch": 1.13, + "learning_rate": 0.0001310700478258905, + "loss": 0.0392, "step": 174490 }, { - "epoch": 1.89, - "learning_rate": 1.6886235317022518e-05, - "loss": 0.0267, + "epoch": 1.13, + "learning_rate": 0.00013106036647153358, + "loss": 0.0364, "step": 174500 }, { - "epoch": 1.89, - "learning_rate": 1.6870011032513464e-05, - "loss": 0.0265, + "epoch": 1.13, + "learning_rate": 0.00013105068511717666, + "loss": 0.0306, "step": 174510 }, { - "epoch": 1.89, - "learning_rate": 1.685378674800441e-05, - "loss": 0.0287, + "epoch": 1.13, + "learning_rate": 0.0001310410037628197, + "loss": 0.0295, "step": 174520 }, { - "epoch": 1.89, - "learning_rate": 1.6837562463495357e-05, - "loss": 0.0261, + "epoch": 1.13, + "learning_rate": 0.0001310313224084628, + "loss": 0.0345, "step": 174530 }, { - "epoch": 1.89, - "learning_rate": 1.6821338178986307e-05, - "loss": 0.0228, + "epoch": 1.13, + "learning_rate": 0.00013102164105410584, + "loss": 0.0344, "step": 174540 }, { - "epoch": 1.89, - "learning_rate": 1.6805113894477253e-05, - "loss": 0.0269, + "epoch": 1.13, + "learning_rate": 0.00013101195969974892, + "loss": 0.0346, "step": 174550 }, { - "epoch": 1.89, - "learning_rate": 1.67888896099682e-05, - "loss": 0.0203, + "epoch": 1.13, + "learning_rate": 0.00013100227834539197, + "loss": 0.0325, "step": 174560 }, { - "epoch": 1.89, - "learning_rate": 1.6772665325459146e-05, - "loss": 0.0276, + "epoch": 1.13, + "learning_rate": 0.00013099259699103505, + "loss": 0.0334, "step": 174570 }, { - "epoch": 1.89, - "learning_rate": 1.6756441040950092e-05, - "loss": 0.0235, + "epoch": 1.13, + "learning_rate": 0.00013098291563667813, + "loss": 0.0329, "step": 174580 }, { - "epoch": 1.89, - "learning_rate": 1.674021675644104e-05, - "loss": 0.0236, + "epoch": 1.13, + "learning_rate": 0.00013097323428232119, + "loss": 0.0289, "step": 174590 }, { - "epoch": 1.89, - "learning_rate": 1.6723992471931985e-05, - "loss": 0.0251, + "epoch": 1.13, + "learning_rate": 0.00013096355292796426, + "loss": 0.0311, "step": 174600 }, { - "epoch": 1.89, - "learning_rate": 1.670776818742293e-05, - "loss": 0.0259, + "epoch": 1.13, + "learning_rate": 0.00013095387157360732, + "loss": 0.0359, "step": 174610 }, { - "epoch": 1.89, - "learning_rate": 1.6691543902913878e-05, - "loss": 0.0231, + "epoch": 1.13, + "learning_rate": 0.0001309441902192504, + "loss": 0.037, "step": 174620 }, { - "epoch": 1.89, - "learning_rate": 1.6675319618404828e-05, - "loss": 0.0251, + "epoch": 1.13, + "learning_rate": 0.00013093450886489345, + "loss": 0.034, "step": 174630 }, { - "epoch": 1.89, - "learning_rate": 1.6659095333895774e-05, - "loss": 0.0249, + "epoch": 1.13, + "learning_rate": 0.00013092482751053653, + "loss": 0.0352, "step": 174640 }, { - "epoch": 1.89, - "learning_rate": 1.664287104938672e-05, - "loss": 0.0261, + "epoch": 1.13, + "learning_rate": 0.0001309151461561796, + "loss": 0.038, "step": 174650 }, { - "epoch": 1.89, - "learning_rate": 1.6626646764877667e-05, - "loss": 0.0247, + "epoch": 1.13, + "learning_rate": 0.00013090546480182266, + "loss": 0.0338, "step": 174660 }, { - "epoch": 1.89, - "learning_rate": 1.6610422480368613e-05, - "loss": 0.0262, + "epoch": 1.13, + "learning_rate": 0.00013089578344746574, + "loss": 0.0315, "step": 174670 }, { - "epoch": 1.89, - "learning_rate": 1.6594198195859563e-05, - "loss": 0.0232, + "epoch": 1.13, + "learning_rate": 0.0001308861020931088, + "loss": 0.0321, "step": 174680 }, { - "epoch": 1.89, - "learning_rate": 1.657797391135051e-05, - "loss": 0.0273, + "epoch": 1.13, + "learning_rate": 0.00013087642073875187, + "loss": 0.035, "step": 174690 }, { - "epoch": 1.89, - "learning_rate": 1.6561749626841456e-05, - "loss": 0.0226, + "epoch": 1.13, + "learning_rate": 0.00013086673938439493, + "loss": 0.0314, "step": 174700 }, { - "epoch": 1.89, - "learning_rate": 1.6545525342332402e-05, - "loss": 0.0229, + "epoch": 1.13, + "learning_rate": 0.000130857058030038, + "loss": 0.0268, "step": 174710 }, { - "epoch": 1.89, - "learning_rate": 1.652930105782335e-05, - "loss": 0.0321, + "epoch": 1.13, + "learning_rate": 0.0001308473766756811, + "loss": 0.037, "step": 174720 }, { - "epoch": 1.89, - "learning_rate": 1.6513076773314295e-05, - "loss": 0.0259, + "epoch": 1.13, + "learning_rate": 0.00013083769532132414, + "loss": 0.0311, "step": 174730 }, { - "epoch": 1.89, - "learning_rate": 1.649685248880524e-05, - "loss": 0.0196, + "epoch": 1.13, + "learning_rate": 0.0001308280139669672, + "loss": 0.0354, "step": 174740 }, { - "epoch": 1.89, - "learning_rate": 1.648062820429619e-05, - "loss": 0.0204, + "epoch": 1.13, + "learning_rate": 0.00013081833261261027, + "loss": 0.0254, "step": 174750 }, { - "epoch": 1.89, - "learning_rate": 1.6464403919787137e-05, - "loss": 0.0204, + "epoch": 1.13, + "learning_rate": 0.00013080865125825335, + "loss": 0.0355, "step": 174760 }, { - "epoch": 1.89, - "learning_rate": 1.6448179635278084e-05, - "loss": 0.0262, + "epoch": 1.13, + "learning_rate": 0.0001307989699038964, + "loss": 0.0286, "step": 174770 }, { - "epoch": 1.89, - "learning_rate": 1.643195535076903e-05, - "loss": 0.0239, + "epoch": 1.13, + "learning_rate": 0.00013078928854953948, + "loss": 0.0319, "step": 174780 }, { - "epoch": 1.89, - "learning_rate": 1.6415731066259976e-05, - "loss": 0.0265, + "epoch": 1.13, + "learning_rate": 0.00013077960719518256, + "loss": 0.0308, "step": 174790 }, { - "epoch": 1.89, - "learning_rate": 1.6399506781750923e-05, - "loss": 0.0205, + "epoch": 1.13, + "learning_rate": 0.00013076992584082562, + "loss": 0.0341, "step": 174800 }, { - "epoch": 1.89, - "learning_rate": 1.638328249724187e-05, - "loss": 0.0219, + "epoch": 1.13, + "learning_rate": 0.00013076024448646867, + "loss": 0.0301, "step": 174810 }, { - "epoch": 1.89, - "learning_rate": 1.6367058212732816e-05, - "loss": 0.0218, + "epoch": 1.13, + "learning_rate": 0.00013075056313211175, + "loss": 0.0337, "step": 174820 }, { - "epoch": 1.89, - "learning_rate": 1.6350833928223765e-05, - "loss": 0.0212, + "epoch": 1.13, + "learning_rate": 0.00013074088177775483, + "loss": 0.0404, "step": 174830 }, { - "epoch": 1.89, - "learning_rate": 1.6334609643714712e-05, - "loss": 0.0247, + "epoch": 1.13, + "learning_rate": 0.00013073120042339788, + "loss": 0.0337, "step": 174840 }, { - "epoch": 1.89, - "learning_rate": 1.6318385359205658e-05, - "loss": 0.0227, + "epoch": 1.13, + "learning_rate": 0.00013072151906904096, + "loss": 0.043, "step": 174850 }, { - "epoch": 1.89, - "learning_rate": 1.6302161074696605e-05, - "loss": 0.0251, + "epoch": 1.13, + "learning_rate": 0.00013071183771468401, + "loss": 0.0414, "step": 174860 }, { - "epoch": 1.89, - "learning_rate": 1.628593679018755e-05, - "loss": 0.0235, + "epoch": 1.13, + "learning_rate": 0.0001307021563603271, + "loss": 0.0317, "step": 174870 }, { - "epoch": 1.89, - "learning_rate": 1.6269712505678497e-05, - "loss": 0.0241, + "epoch": 1.13, + "learning_rate": 0.00013069247500597015, + "loss": 0.0357, "step": 174880 }, { - "epoch": 1.89, - "learning_rate": 1.6253488221169444e-05, - "loss": 0.0265, + "epoch": 1.13, + "learning_rate": 0.00013068279365161323, + "loss": 0.0308, "step": 174890 }, { - "epoch": 1.89, - "learning_rate": 1.623726393666039e-05, - "loss": 0.0219, + "epoch": 1.13, + "learning_rate": 0.0001306731122972563, + "loss": 0.0335, "step": 174900 }, { - "epoch": 1.89, - "learning_rate": 1.6221039652151336e-05, - "loss": 0.0229, + "epoch": 1.13, + "learning_rate": 0.00013066343094289936, + "loss": 0.0325, "step": 174910 }, { - "epoch": 1.89, - "learning_rate": 1.6204815367642286e-05, - "loss": 0.0233, + "epoch": 1.13, + "learning_rate": 0.00013065374958854244, + "loss": 0.0371, "step": 174920 }, { - "epoch": 1.89, - "learning_rate": 1.6188591083133233e-05, - "loss": 0.0245, + "epoch": 1.13, + "learning_rate": 0.0001306440682341855, + "loss": 0.0341, "step": 174930 }, { - "epoch": 1.89, - "learning_rate": 1.617236679862418e-05, - "loss": 0.0269, + "epoch": 1.13, + "learning_rate": 0.00013063438687982854, + "loss": 0.0352, "step": 174940 }, { - "epoch": 1.89, - "learning_rate": 1.6156142514115125e-05, - "loss": 0.0224, + "epoch": 1.13, + "learning_rate": 0.00013062470552547162, + "loss": 0.0365, "step": 174950 }, { - "epoch": 1.89, - "learning_rate": 1.6139918229606072e-05, - "loss": 0.0234, - "step": 174960 + "epoch": 1.13, + "learning_rate": 0.0001306150241711147, + "loss": 0.0393, + "step": 174960 }, { - "epoch": 1.89, - "learning_rate": 1.612369394509702e-05, - "loss": 0.0236, + "epoch": 1.13, + "learning_rate": 0.00013060534281675778, + "loss": 0.033, "step": 174970 }, { - "epoch": 1.89, - "learning_rate": 1.6107469660587968e-05, - "loss": 0.0237, + "epoch": 1.13, + "learning_rate": 0.00013059566146240084, + "loss": 0.0382, "step": 174980 }, { - "epoch": 1.89, - "learning_rate": 1.6091245376078914e-05, - "loss": 0.0239, + "epoch": 1.13, + "learning_rate": 0.00013058598010804392, + "loss": 0.0389, "step": 174990 }, { - "epoch": 1.89, - "learning_rate": 1.607502109156986e-05, - "loss": 0.0222, + "epoch": 1.13, + "learning_rate": 0.00013057629875368697, + "loss": 0.0319, "step": 175000 }, { - "epoch": 1.89, - "eval_cer": 0.921070394263713, - "eval_loss": 0.020397888496518135, - "eval_runtime": 118.8774, - "eval_samples_per_second": 16.824, - "eval_steps_per_second": 4.206, + "epoch": 1.13, + "eval_cer": 0.919877979889278, + "eval_loss": 0.02397312968969345, + "eval_runtime": 120.0597, + "eval_samples_per_second": 16.658, + "eval_steps_per_second": 4.165, "step": 175000 }, { - "epoch": 1.89, - "learning_rate": 1.6058796807060807e-05, - "loss": 0.0214, + "epoch": 1.13, + "learning_rate": 0.00013056661739933002, + "loss": 0.0353, "step": 175010 }, { - "epoch": 1.89, - "learning_rate": 1.6042572522551753e-05, - "loss": 0.0345, + "epoch": 1.13, + "learning_rate": 0.0001305569360449731, + "loss": 0.0348, "step": 175020 }, { - "epoch": 1.89, - "learning_rate": 1.60263482380427e-05, - "loss": 0.0266, + "epoch": 1.13, + "learning_rate": 0.00013054725469061618, + "loss": 0.033, "step": 175030 }, { - "epoch": 1.89, - "learning_rate": 1.601012395353365e-05, - "loss": 0.0257, + "epoch": 1.13, + "learning_rate": 0.00013053757333625926, + "loss": 0.0311, "step": 175040 }, { - "epoch": 1.89, - "learning_rate": 1.5993899669024596e-05, - "loss": 0.024, + "epoch": 1.13, + "learning_rate": 0.0001305278919819023, + "loss": 0.0347, "step": 175050 }, { - "epoch": 1.89, - "learning_rate": 1.5977675384515542e-05, - "loss": 0.0226, + "epoch": 1.13, + "learning_rate": 0.00013051821062754537, + "loss": 0.0364, "step": 175060 }, { - "epoch": 1.89, - "learning_rate": 1.596145110000649e-05, - "loss": 0.0218, + "epoch": 1.13, + "learning_rate": 0.00013050852927318845, + "loss": 0.0294, "step": 175070 }, { - "epoch": 1.89, - "learning_rate": 1.5945226815497435e-05, - "loss": 0.0231, + "epoch": 1.13, + "learning_rate": 0.0001304988479188315, + "loss": 0.0339, "step": 175080 }, { - "epoch": 1.89, - "learning_rate": 1.592900253098838e-05, - "loss": 0.0277, + "epoch": 1.13, + "learning_rate": 0.00013048916656447458, + "loss": 0.0276, "step": 175090 }, { - "epoch": 1.89, - "learning_rate": 1.5912778246479328e-05, - "loss": 0.0223, + "epoch": 1.13, + "learning_rate": 0.00013047948521011766, + "loss": 0.03, "step": 175100 }, { - "epoch": 1.89, - "learning_rate": 1.5896553961970274e-05, - "loss": 0.0213, + "epoch": 1.13, + "learning_rate": 0.0001304698038557607, + "loss": 0.0315, "step": 175110 }, { - "epoch": 1.89, - "learning_rate": 1.5880329677461224e-05, - "loss": 0.0228, + "epoch": 1.13, + "learning_rate": 0.0001304601225014038, + "loss": 0.0339, "step": 175120 }, { - "epoch": 1.89, - "learning_rate": 1.586410539295217e-05, - "loss": 0.0198, + "epoch": 1.13, + "learning_rate": 0.00013045044114704684, + "loss": 0.0343, "step": 175130 }, { - "epoch": 1.89, - "learning_rate": 1.5847881108443117e-05, - "loss": 0.0227, + "epoch": 1.13, + "learning_rate": 0.00013044075979268992, + "loss": 0.0279, "step": 175140 }, { - "epoch": 1.89, - "learning_rate": 1.5831656823934063e-05, - "loss": 0.0276, + "epoch": 1.13, + "learning_rate": 0.00013043107843833298, + "loss": 0.0371, "step": 175150 }, { - "epoch": 1.89, - "learning_rate": 1.581543253942501e-05, - "loss": 0.0217, + "epoch": 1.13, + "learning_rate": 0.00013042139708397606, + "loss": 0.0344, "step": 175160 }, { - "epoch": 1.89, - "learning_rate": 1.5799208254915956e-05, - "loss": 0.0206, + "epoch": 1.13, + "learning_rate": 0.00013041171572961914, + "loss": 0.0362, "step": 175170 }, { - "epoch": 1.89, - "learning_rate": 1.5782983970406902e-05, - "loss": 0.0258, + "epoch": 1.13, + "learning_rate": 0.0001304020343752622, + "loss": 0.0308, "step": 175180 }, { - "epoch": 1.89, - "learning_rate": 1.576675968589785e-05, - "loss": 0.0226, + "epoch": 1.13, + "learning_rate": 0.00013039235302090527, + "loss": 0.0371, "step": 175190 }, { - "epoch": 1.89, - "learning_rate": 1.5750535401388795e-05, - "loss": 0.0242, + "epoch": 1.13, + "learning_rate": 0.00013038267166654832, + "loss": 0.0369, "step": 175200 }, { - "epoch": 1.9, - "learning_rate": 1.5734311116879745e-05, - "loss": 0.0224, + "epoch": 1.13, + "learning_rate": 0.0001303729903121914, + "loss": 0.0312, "step": 175210 }, { - "epoch": 1.9, - "learning_rate": 1.571808683237069e-05, - "loss": 0.0265, + "epoch": 1.13, + "learning_rate": 0.00013036330895783445, + "loss": 0.0325, "step": 175220 }, { - "epoch": 1.9, - "learning_rate": 1.5701862547861638e-05, - "loss": 0.0265, + "epoch": 1.13, + "learning_rate": 0.00013035362760347753, + "loss": 0.0351, "step": 175230 }, { - "epoch": 1.9, - "learning_rate": 1.5685638263352584e-05, - "loss": 0.0207, + "epoch": 1.13, + "learning_rate": 0.0001303439462491206, + "loss": 0.0323, "step": 175240 }, { - "epoch": 1.9, - "learning_rate": 1.566941397884353e-05, - "loss": 0.0217, + "epoch": 1.13, + "learning_rate": 0.00013033426489476367, + "loss": 0.0375, "step": 175250 }, { - "epoch": 1.9, - "learning_rate": 1.565318969433448e-05, - "loss": 0.027, + "epoch": 1.13, + "learning_rate": 0.00013032458354040672, + "loss": 0.0378, "step": 175260 }, { - "epoch": 1.9, - "learning_rate": 1.5636965409825427e-05, - "loss": 0.0227, + "epoch": 1.13, + "learning_rate": 0.0001303149021860498, + "loss": 0.0388, "step": 175270 }, { - "epoch": 1.9, - "learning_rate": 1.5620741125316373e-05, - "loss": 0.0258, + "epoch": 1.13, + "learning_rate": 0.00013030522083169288, + "loss": 0.0283, "step": 175280 }, { - "epoch": 1.9, - "learning_rate": 1.560451684080732e-05, - "loss": 0.0214, + "epoch": 1.13, + "learning_rate": 0.00013029553947733593, + "loss": 0.0351, "step": 175290 }, { - "epoch": 1.9, - "learning_rate": 1.5588292556298266e-05, - "loss": 0.0257, + "epoch": 1.13, + "learning_rate": 0.000130285858122979, + "loss": 0.0305, "step": 175300 }, { - "epoch": 1.9, - "learning_rate": 1.5572068271789212e-05, - "loss": 0.0217, + "epoch": 1.13, + "learning_rate": 0.00013027617676862206, + "loss": 0.0288, "step": 175310 }, { - "epoch": 1.9, - "learning_rate": 1.5555843987280162e-05, - "loss": 0.0195, + "epoch": 1.13, + "learning_rate": 0.00013026649541426514, + "loss": 0.0328, "step": 175320 }, { - "epoch": 1.9, - "learning_rate": 1.5539619702771108e-05, - "loss": 0.0212, + "epoch": 1.13, + "learning_rate": 0.0001302568140599082, + "loss": 0.0343, "step": 175330 }, { - "epoch": 1.9, - "learning_rate": 1.5523395418262055e-05, - "loss": 0.0196, + "epoch": 1.13, + "learning_rate": 0.00013024713270555128, + "loss": 0.0327, "step": 175340 }, { - "epoch": 1.9, - "learning_rate": 1.5507171133753e-05, + "epoch": 1.13, + "learning_rate": 0.00013023745135119435, "loss": 0.0286, "step": 175350 }, { - "epoch": 1.9, - "learning_rate": 1.5490946849243947e-05, - "loss": 0.0218, + "epoch": 1.13, + "learning_rate": 0.0001302277699968374, + "loss": 0.0326, "step": 175360 }, { - "epoch": 1.9, - "learning_rate": 1.5474722564734894e-05, - "loss": 0.0249, + "epoch": 1.13, + "learning_rate": 0.0001302180886424805, + "loss": 0.0313, "step": 175370 }, { - "epoch": 1.9, - "learning_rate": 1.545849828022584e-05, - "loss": 0.0244, + "epoch": 1.13, + "learning_rate": 0.00013020840728812354, + "loss": 0.037, "step": 175380 }, { - "epoch": 1.9, - "learning_rate": 1.5442273995716787e-05, - "loss": 0.0274, + "epoch": 1.13, + "learning_rate": 0.00013019872593376662, + "loss": 0.0359, "step": 175390 }, { - "epoch": 1.9, - "learning_rate": 1.5426049711207733e-05, - "loss": 0.0217, + "epoch": 1.13, + "learning_rate": 0.00013018904457940967, + "loss": 0.0415, "step": 175400 }, { - "epoch": 1.9, - "learning_rate": 1.5409825426698683e-05, - "loss": 0.0238, + "epoch": 1.13, + "learning_rate": 0.00013017936322505275, + "loss": 0.0319, "step": 175410 }, { - "epoch": 1.9, - "learning_rate": 1.539360114218963e-05, - "loss": 0.0203, + "epoch": 1.13, + "learning_rate": 0.00013016968187069583, + "loss": 0.0282, "step": 175420 }, { - "epoch": 1.9, - "learning_rate": 1.5377376857680575e-05, - "loss": 0.0208, + "epoch": 1.13, + "learning_rate": 0.00013016000051633888, + "loss": 0.0297, "step": 175430 }, { - "epoch": 1.9, - "learning_rate": 1.5361152573171522e-05, - "loss": 0.0251, + "epoch": 1.13, + "learning_rate": 0.00013015031916198196, + "loss": 0.036, "step": 175440 }, { - "epoch": 1.9, - "learning_rate": 1.5344928288662468e-05, - "loss": 0.02, + "epoch": 1.13, + "learning_rate": 0.00013014063780762502, + "loss": 0.0337, "step": 175450 }, { - "epoch": 1.9, - "learning_rate": 1.5328704004153415e-05, - "loss": 0.0278, + "epoch": 1.13, + "learning_rate": 0.0001301309564532681, + "loss": 0.0391, "step": 175460 }, { - "epoch": 1.9, - "learning_rate": 1.531247971964436e-05, - "loss": 0.0267, + "epoch": 1.13, + "learning_rate": 0.00013012127509891115, + "loss": 0.0305, "step": 175470 }, { - "epoch": 1.9, - "learning_rate": 1.5296255435135307e-05, - "loss": 0.028, + "epoch": 1.13, + "learning_rate": 0.00013011159374455423, + "loss": 0.0329, "step": 175480 }, { - "epoch": 1.9, - "learning_rate": 1.5280031150626254e-05, - "loss": 0.0271, + "epoch": 1.13, + "learning_rate": 0.0001301019123901973, + "loss": 0.0361, "step": 175490 }, { - "epoch": 1.9, - "learning_rate": 1.5263806866117204e-05, - "loss": 0.0239, + "epoch": 1.13, + "learning_rate": 0.00013009223103584036, + "loss": 0.0313, "step": 175500 }, { - "epoch": 1.9, - "learning_rate": 1.5247582581608148e-05, - "loss": 0.0268, + "epoch": 1.13, + "learning_rate": 0.00013008254968148341, + "loss": 0.0354, "step": 175510 }, { - "epoch": 1.9, - "learning_rate": 1.5231358297099096e-05, - "loss": 0.0213, + "epoch": 1.13, + "learning_rate": 0.0001300728683271265, + "loss": 0.0278, "step": 175520 }, { - "epoch": 1.9, - "learning_rate": 1.5215134012590043e-05, - "loss": 0.0248, + "epoch": 1.13, + "learning_rate": 0.00013006318697276957, + "loss": 0.0384, "step": 175530 }, { - "epoch": 1.9, - "learning_rate": 1.5198909728080989e-05, - "loss": 0.0227, + "epoch": 1.13, + "learning_rate": 0.00013005350561841263, + "loss": 0.0324, "step": 175540 }, { - "epoch": 1.9, - "learning_rate": 1.5182685443571935e-05, - "loss": 0.0222, + "epoch": 1.13, + "learning_rate": 0.0001300438242640557, + "loss": 0.0398, "step": 175550 }, { - "epoch": 1.9, - "learning_rate": 1.5166461159062885e-05, - "loss": 0.0205, + "epoch": 1.13, + "learning_rate": 0.0001300341429096988, + "loss": 0.0349, "step": 175560 }, { - "epoch": 1.9, - "learning_rate": 1.5150236874553832e-05, - "loss": 0.0267, + "epoch": 1.13, + "learning_rate": 0.00013002446155534184, + "loss": 0.0332, "step": 175570 }, { - "epoch": 1.9, - "learning_rate": 1.5134012590044778e-05, - "loss": 0.0214, + "epoch": 1.13, + "learning_rate": 0.0001300147802009849, + "loss": 0.0267, "step": 175580 }, { - "epoch": 1.9, - "learning_rate": 1.5117788305535726e-05, - "loss": 0.0222, + "epoch": 1.13, + "learning_rate": 0.00013000509884662797, + "loss": 0.0336, "step": 175590 }, { - "epoch": 1.9, - "learning_rate": 1.5101564021026672e-05, - "loss": 0.0272, + "epoch": 1.13, + "learning_rate": 0.00012999541749227105, + "loss": 0.0286, "step": 175600 }, { - "epoch": 1.9, - "learning_rate": 1.5085339736517619e-05, - "loss": 0.0346, + "epoch": 1.13, + "learning_rate": 0.0001299857361379141, + "loss": 0.0293, "step": 175610 }, { - "epoch": 1.9, - "learning_rate": 1.5069115452008565e-05, - "loss": 0.027, + "epoch": 1.13, + "learning_rate": 0.00012997605478355718, + "loss": 0.0324, "step": 175620 }, { - "epoch": 1.9, - "learning_rate": 1.5052891167499513e-05, - "loss": 0.029, + "epoch": 1.13, + "learning_rate": 0.00012996637342920024, + "loss": 0.0304, "step": 175630 }, { - "epoch": 1.9, - "learning_rate": 1.503666688299046e-05, - "loss": 0.0255, + "epoch": 1.13, + "learning_rate": 0.00012995669207484332, + "loss": 0.0337, "step": 175640 }, { - "epoch": 1.9, - "learning_rate": 1.5020442598481406e-05, - "loss": 0.0267, + "epoch": 1.13, + "learning_rate": 0.00012994701072048637, + "loss": 0.0302, "step": 175650 }, { - "epoch": 1.9, - "learning_rate": 1.5004218313972352e-05, - "loss": 0.0269, + "epoch": 1.13, + "learning_rate": 0.00012993732936612945, + "loss": 0.0301, "step": 175660 }, { - "epoch": 1.9, - "learning_rate": 1.4987994029463299e-05, - "loss": 0.0267, + "epoch": 1.13, + "learning_rate": 0.00012992764801177253, + "loss": 0.0327, "step": 175670 }, { - "epoch": 1.9, - "learning_rate": 1.4971769744954247e-05, - "loss": 0.0222, + "epoch": 1.13, + "learning_rate": 0.00012991796665741558, + "loss": 0.0408, "step": 175680 }, { - "epoch": 1.9, - "learning_rate": 1.4955545460445193e-05, - "loss": 0.0226, + "epoch": 1.13, + "learning_rate": 0.00012990828530305866, + "loss": 0.0317, "step": 175690 }, { - "epoch": 1.9, - "learning_rate": 1.493932117593614e-05, - "loss": 0.0278, + "epoch": 1.13, + "learning_rate": 0.00012989860394870171, + "loss": 0.036, "step": 175700 }, { - "epoch": 1.9, - "learning_rate": 1.4923096891427086e-05, - "loss": 0.0248, + "epoch": 1.13, + "learning_rate": 0.00012988892259434477, + "loss": 0.0295, "step": 175710 }, { - "epoch": 1.9, - "learning_rate": 1.4906872606918034e-05, - "loss": 0.0245, + "epoch": 1.13, + "learning_rate": 0.00012987924123998785, + "loss": 0.0311, "step": 175720 }, { - "epoch": 1.9, - "learning_rate": 1.489064832240898e-05, - "loss": 0.0192, + "epoch": 1.13, + "learning_rate": 0.00012986955988563093, + "loss": 0.0295, "step": 175730 }, { - "epoch": 1.9, - "learning_rate": 1.4874424037899927e-05, - "loss": 0.022, + "epoch": 1.13, + "learning_rate": 0.000129859878531274, + "loss": 0.0322, "step": 175740 }, { - "epoch": 1.9, - "learning_rate": 1.4858199753390873e-05, - "loss": 0.0215, + "epoch": 1.13, + "learning_rate": 0.00012985019717691706, + "loss": 0.0348, "step": 175750 }, { - "epoch": 1.9, - "learning_rate": 1.4841975468881821e-05, - "loss": 0.0239, + "epoch": 1.13, + "learning_rate": 0.00012984051582256014, + "loss": 0.0276, "step": 175760 }, { - "epoch": 1.9, - "learning_rate": 1.4825751184372768e-05, - "loss": 0.0306, + "epoch": 1.13, + "learning_rate": 0.0001298308344682032, + "loss": 0.0319, "step": 175770 }, { - "epoch": 1.9, - "learning_rate": 1.4809526899863714e-05, - "loss": 0.0245, + "epoch": 1.13, + "learning_rate": 0.00012982115311384624, + "loss": 0.0343, "step": 175780 }, { - "epoch": 1.9, - "learning_rate": 1.479330261535466e-05, - "loss": 0.0266, + "epoch": 1.13, + "learning_rate": 0.00012981147175948932, + "loss": 0.0313, "step": 175790 }, { - "epoch": 1.9, - "learning_rate": 1.4777078330845607e-05, - "loss": 0.0245, + "epoch": 1.13, + "learning_rate": 0.0001298017904051324, + "loss": 0.0284, "step": 175800 }, { - "epoch": 1.9, - "learning_rate": 1.4760854046336555e-05, - "loss": 0.0249, + "epoch": 1.13, + "learning_rate": 0.00012979210905077548, + "loss": 0.0317, "step": 175810 }, { - "epoch": 1.9, - "learning_rate": 1.4744629761827501e-05, - "loss": 0.0266, + "epoch": 1.13, + "learning_rate": 0.00012978242769641854, + "loss": 0.0316, "step": 175820 }, { - "epoch": 1.9, - "learning_rate": 1.4728405477318448e-05, - "loss": 0.0236, + "epoch": 1.13, + "learning_rate": 0.0001297727463420616, + "loss": 0.0286, "step": 175830 }, { - "epoch": 1.9, - "learning_rate": 1.4712181192809394e-05, - "loss": 0.0314, + "epoch": 1.13, + "learning_rate": 0.00012976306498770467, + "loss": 0.0374, "step": 175840 }, { - "epoch": 1.9, - "learning_rate": 1.4695956908300344e-05, - "loss": 0.0213, + "epoch": 1.13, + "learning_rate": 0.00012975338363334772, + "loss": 0.0368, "step": 175850 }, { - "epoch": 1.9, - "learning_rate": 1.467973262379129e-05, - "loss": 0.0238, + "epoch": 1.14, + "learning_rate": 0.0001297437022789908, + "loss": 0.0359, "step": 175860 }, { - "epoch": 1.9, - "learning_rate": 1.4663508339282237e-05, - "loss": 0.0273, + "epoch": 1.14, + "learning_rate": 0.00012973402092463388, + "loss": 0.0326, "step": 175870 }, { - "epoch": 1.9, - "learning_rate": 1.4647284054773185e-05, - "loss": 0.0306, + "epoch": 1.14, + "learning_rate": 0.00012972433957027696, + "loss": 0.0283, "step": 175880 }, { - "epoch": 1.9, - "learning_rate": 1.4631059770264131e-05, - "loss": 0.0259, + "epoch": 1.14, + "learning_rate": 0.00012971465821592, + "loss": 0.035, "step": 175890 }, { - "epoch": 1.9, - "learning_rate": 1.4614835485755077e-05, - "loss": 0.0248, + "epoch": 1.14, + "learning_rate": 0.00012970497686156307, + "loss": 0.0304, "step": 175900 }, { - "epoch": 1.9, - "learning_rate": 1.4598611201246024e-05, - "loss": 0.0251, + "epoch": 1.14, + "learning_rate": 0.00012969529550720615, + "loss": 0.0334, "step": 175910 }, { - "epoch": 1.9, - "learning_rate": 1.4582386916736972e-05, - "loss": 0.0255, + "epoch": 1.14, + "learning_rate": 0.0001296856141528492, + "loss": 0.034, "step": 175920 }, { - "epoch": 1.9, - "learning_rate": 1.4566162632227918e-05, - "loss": 0.0269, + "epoch": 1.14, + "learning_rate": 0.00012967593279849228, + "loss": 0.0319, "step": 175930 }, { - "epoch": 1.9, - "learning_rate": 1.4549938347718865e-05, - "loss": 0.0297, + "epoch": 1.14, + "learning_rate": 0.00012966625144413536, + "loss": 0.0338, "step": 175940 }, { - "epoch": 1.9, - "learning_rate": 1.4533714063209811e-05, - "loss": 0.0275, + "epoch": 1.14, + "learning_rate": 0.0001296565700897784, + "loss": 0.0277, "step": 175950 }, { - "epoch": 1.9, - "learning_rate": 1.4517489778700757e-05, - "loss": 0.0206, + "epoch": 1.14, + "learning_rate": 0.0001296468887354215, + "loss": 0.0338, "step": 175960 }, { - "epoch": 1.9, - "learning_rate": 1.4501265494191706e-05, - "loss": 0.0247, + "epoch": 1.14, + "learning_rate": 0.00012963720738106454, + "loss": 0.0318, "step": 175970 }, { - "epoch": 1.9, - "learning_rate": 1.4485041209682652e-05, - "loss": 0.0234, + "epoch": 1.14, + "learning_rate": 0.00012962752602670762, + "loss": 0.0329, "step": 175980 }, { - "epoch": 1.9, - "learning_rate": 1.4468816925173598e-05, - "loss": 0.0222, + "epoch": 1.14, + "learning_rate": 0.00012961784467235068, + "loss": 0.0344, "step": 175990 }, { - "epoch": 1.9, - "learning_rate": 1.4452592640664545e-05, - "loss": 0.0237, + "epoch": 1.14, + "learning_rate": 0.00012960816331799376, + "loss": 0.0391, "step": 176000 }, { - "epoch": 1.9, - "eval_cer": 0.9210783456226003, - "eval_loss": 0.02026102878153324, - "eval_runtime": 119.0712, - "eval_samples_per_second": 16.797, - "eval_steps_per_second": 4.199, + "epoch": 1.14, + "eval_cer": 0.919873460625918, + "eval_loss": 0.024145476520061493, + "eval_runtime": 120.3294, + "eval_samples_per_second": 16.621, + "eval_steps_per_second": 4.155, "step": 176000 }, { - "epoch": 1.9, - "learning_rate": 1.4436368356155493e-05, - "loss": 0.0293, + "epoch": 1.14, + "learning_rate": 0.00012959848196363684, + "loss": 0.0324, "step": 176010 }, { - "epoch": 1.9, - "learning_rate": 1.4420144071646439e-05, - "loss": 0.0226, + "epoch": 1.14, + "learning_rate": 0.0001295888006092799, + "loss": 0.0371, "step": 176020 }, { - "epoch": 1.9, - "learning_rate": 1.4403919787137386e-05, - "loss": 0.0236, + "epoch": 1.14, + "learning_rate": 0.00012957911925492294, + "loss": 0.0411, "step": 176030 }, { - "epoch": 1.9, - "learning_rate": 1.4387695502628332e-05, - "loss": 0.0191, + "epoch": 1.14, + "learning_rate": 0.00012956943790056602, + "loss": 0.0299, "step": 176040 }, { - "epoch": 1.9, - "learning_rate": 1.437147121811928e-05, - "loss": 0.0202, + "epoch": 1.14, + "learning_rate": 0.0001295597565462091, + "loss": 0.0317, "step": 176050 }, { - "epoch": 1.9, - "learning_rate": 1.4355246933610226e-05, - "loss": 0.0289, + "epoch": 1.14, + "learning_rate": 0.00012955007519185215, + "loss": 0.0347, "step": 176060 }, { - "epoch": 1.9, - "learning_rate": 1.4339022649101173e-05, - "loss": 0.0193, + "epoch": 1.14, + "learning_rate": 0.00012954039383749523, + "loss": 0.0362, "step": 176070 }, { - "epoch": 1.9, - "learning_rate": 1.4322798364592119e-05, - "loss": 0.0275, + "epoch": 1.14, + "learning_rate": 0.0001295307124831383, + "loss": 0.0379, "step": 176080 }, { - "epoch": 1.9, - "learning_rate": 1.4306574080083067e-05, - "loss": 0.022, + "epoch": 1.14, + "learning_rate": 0.00012952103112878136, + "loss": 0.0341, "step": 176090 }, { - "epoch": 1.9, - "learning_rate": 1.4290349795574014e-05, - "loss": 0.0256, + "epoch": 1.14, + "learning_rate": 0.00012951134977442442, + "loss": 0.0313, "step": 176100 }, { - "epoch": 1.9, - "learning_rate": 1.427412551106496e-05, - "loss": 0.0214, + "epoch": 1.14, + "learning_rate": 0.0001295016684200675, + "loss": 0.0337, "step": 176110 }, { - "epoch": 1.9, - "learning_rate": 1.4257901226555906e-05, - "loss": 0.0257, + "epoch": 1.14, + "learning_rate": 0.00012949198706571058, + "loss": 0.0312, "step": 176120 }, { - "epoch": 1.91, - "learning_rate": 1.4241676942046853e-05, - "loss": 0.0255, + "epoch": 1.14, + "learning_rate": 0.00012948230571135363, + "loss": 0.0362, "step": 176130 }, { - "epoch": 1.91, - "learning_rate": 1.4225452657537803e-05, - "loss": 0.0249, + "epoch": 1.14, + "learning_rate": 0.0001294726243569967, + "loss": 0.033, "step": 176140 }, { - "epoch": 1.91, - "learning_rate": 1.4209228373028749e-05, - "loss": 0.0332, + "epoch": 1.14, + "learning_rate": 0.00012946294300263976, + "loss": 0.0342, "step": 176150 }, { - "epoch": 1.91, - "learning_rate": 1.4193004088519695e-05, - "loss": 0.0276, + "epoch": 1.14, + "learning_rate": 0.00012945326164828284, + "loss": 0.0309, "step": 176160 }, { - "epoch": 1.91, - "learning_rate": 1.4176779804010643e-05, - "loss": 0.0268, + "epoch": 1.14, + "learning_rate": 0.0001294435802939259, + "loss": 0.0338, "step": 176170 }, { - "epoch": 1.91, - "learning_rate": 1.416055551950159e-05, - "loss": 0.0255, + "epoch": 1.14, + "learning_rate": 0.00012943389893956897, + "loss": 0.0345, "step": 176180 }, { - "epoch": 1.91, - "learning_rate": 1.4144331234992536e-05, - "loss": 0.0265, + "epoch": 1.14, + "learning_rate": 0.00012942421758521205, + "loss": 0.0318, "step": 176190 }, { - "epoch": 1.91, - "learning_rate": 1.4128106950483482e-05, - "loss": 0.0208, + "epoch": 1.14, + "learning_rate": 0.0001294145362308551, + "loss": 0.0362, "step": 176200 }, { - "epoch": 1.91, - "learning_rate": 1.411188266597443e-05, - "loss": 0.0231, + "epoch": 1.14, + "learning_rate": 0.0001294048548764982, + "loss": 0.0335, "step": 176210 }, { - "epoch": 1.91, - "learning_rate": 1.4095658381465377e-05, - "loss": 0.0241, + "epoch": 1.14, + "learning_rate": 0.00012939517352214124, + "loss": 0.033, "step": 176220 }, { - "epoch": 1.91, - "learning_rate": 1.4079434096956323e-05, - "loss": 0.0269, - "step": 176230 + "epoch": 1.14, + "learning_rate": 0.00012938549216778432, + "loss": 0.0354, + "step": 176230 }, { - "epoch": 1.91, - "learning_rate": 1.406320981244727e-05, - "loss": 0.0255, + "epoch": 1.14, + "learning_rate": 0.00012937581081342737, + "loss": 0.0346, "step": 176240 }, { - "epoch": 1.91, - "learning_rate": 1.4046985527938216e-05, - "loss": 0.0196, + "epoch": 1.14, + "learning_rate": 0.00012936612945907045, + "loss": 0.0364, "step": 176250 }, { - "epoch": 1.91, - "learning_rate": 1.4030761243429164e-05, - "loss": 0.0239, + "epoch": 1.14, + "learning_rate": 0.00012935644810471353, + "loss": 0.0395, "step": 176260 }, { - "epoch": 1.91, - "learning_rate": 1.401453695892011e-05, - "loss": 0.0236, + "epoch": 1.14, + "learning_rate": 0.00012934676675035658, + "loss": 0.0298, "step": 176270 }, { - "epoch": 1.91, - "learning_rate": 1.3998312674411057e-05, - "loss": 0.0317, + "epoch": 1.14, + "learning_rate": 0.00012933708539599966, + "loss": 0.0289, "step": 176280 }, { - "epoch": 1.91, - "learning_rate": 1.3982088389902003e-05, - "loss": 0.0209, + "epoch": 1.14, + "learning_rate": 0.00012932740404164272, + "loss": 0.0331, "step": 176290 }, { - "epoch": 1.91, - "learning_rate": 1.3965864105392951e-05, - "loss": 0.0264, + "epoch": 1.14, + "learning_rate": 0.0001293177226872858, + "loss": 0.032, "step": 176300 }, { - "epoch": 1.91, - "learning_rate": 1.3949639820883898e-05, - "loss": 0.0235, + "epoch": 1.14, + "learning_rate": 0.00012930804133292885, + "loss": 0.0302, "step": 176310 }, { - "epoch": 1.91, - "learning_rate": 1.3933415536374844e-05, - "loss": 0.0282, + "epoch": 1.14, + "learning_rate": 0.00012929835997857193, + "loss": 0.0326, "step": 176320 }, { - "epoch": 1.91, - "learning_rate": 1.391719125186579e-05, - "loss": 0.0224, + "epoch": 1.14, + "learning_rate": 0.000129288678624215, + "loss": 0.0304, "step": 176330 }, { - "epoch": 1.91, - "learning_rate": 1.3900966967356739e-05, - "loss": 0.0231, + "epoch": 1.14, + "learning_rate": 0.00012927899726985806, + "loss": 0.0303, "step": 176340 }, { - "epoch": 1.91, - "learning_rate": 1.3884742682847685e-05, - "loss": 0.0233, + "epoch": 1.14, + "learning_rate": 0.00012926931591550111, + "loss": 0.0376, "step": 176350 }, { - "epoch": 1.91, - "learning_rate": 1.3868518398338631e-05, - "loss": 0.0316, + "epoch": 1.14, + "learning_rate": 0.0001292596345611442, + "loss": 0.0304, "step": 176360 }, { - "epoch": 1.91, - "learning_rate": 1.3852294113829578e-05, - "loss": 0.026, + "epoch": 1.14, + "learning_rate": 0.00012924995320678727, + "loss": 0.0346, "step": 176370 }, { - "epoch": 1.91, - "learning_rate": 1.3836069829320526e-05, - "loss": 0.0286, + "epoch": 1.14, + "learning_rate": 0.00012924027185243033, + "loss": 0.0335, "step": 176380 }, { - "epoch": 1.91, - "learning_rate": 1.3819845544811472e-05, - "loss": 0.0254, + "epoch": 1.14, + "learning_rate": 0.0001292305904980734, + "loss": 0.0311, "step": 176390 }, { - "epoch": 1.91, - "learning_rate": 1.3803621260302419e-05, - "loss": 0.0196, + "epoch": 1.14, + "learning_rate": 0.00012922090914371646, + "loss": 0.0318, "step": 176400 }, { - "epoch": 1.91, - "learning_rate": 1.3787396975793365e-05, - "loss": 0.0233, + "epoch": 1.14, + "learning_rate": 0.00012921122778935954, + "loss": 0.0396, "step": 176410 }, { - "epoch": 1.91, - "learning_rate": 1.3771172691284311e-05, - "loss": 0.0256, + "epoch": 1.14, + "learning_rate": 0.0001292015464350026, + "loss": 0.0323, "step": 176420 }, { - "epoch": 1.91, - "learning_rate": 1.375494840677526e-05, - "loss": 0.0219, + "epoch": 1.14, + "learning_rate": 0.00012919186508064567, + "loss": 0.0321, "step": 176430 }, { - "epoch": 1.91, - "learning_rate": 1.3738724122266208e-05, - "loss": 0.0255, + "epoch": 1.14, + "learning_rate": 0.00012918218372628875, + "loss": 0.0309, "step": 176440 }, { - "epoch": 1.91, - "learning_rate": 1.3722499837757154e-05, - "loss": 0.0196, + "epoch": 1.14, + "learning_rate": 0.0001291725023719318, + "loss": 0.0313, "step": 176450 }, { - "epoch": 1.91, - "learning_rate": 1.3706275553248102e-05, - "loss": 0.0236, + "epoch": 1.14, + "learning_rate": 0.00012916282101757488, + "loss": 0.0326, "step": 176460 }, { - "epoch": 1.91, - "learning_rate": 1.3690051268739048e-05, - "loss": 0.0207, + "epoch": 1.14, + "learning_rate": 0.00012915313966321794, + "loss": 0.0359, "step": 176470 }, { - "epoch": 1.91, - "learning_rate": 1.3673826984229995e-05, - "loss": 0.0236, + "epoch": 1.14, + "learning_rate": 0.00012914345830886102, + "loss": 0.0332, "step": 176480 }, { - "epoch": 1.91, - "learning_rate": 1.3657602699720941e-05, - "loss": 0.0222, + "epoch": 1.14, + "learning_rate": 0.00012913377695450407, + "loss": 0.035, "step": 176490 }, { - "epoch": 1.91, - "learning_rate": 1.364137841521189e-05, - "loss": 0.0263, + "epoch": 1.14, + "learning_rate": 0.00012912409560014715, + "loss": 0.0386, "step": 176500 }, { - "epoch": 1.91, - "learning_rate": 1.3625154130702836e-05, - "loss": 0.0268, + "epoch": 1.14, + "learning_rate": 0.00012911441424579023, + "loss": 0.0308, "step": 176510 }, { - "epoch": 1.91, - "learning_rate": 1.3608929846193782e-05, - "loss": 0.024, + "epoch": 1.14, + "learning_rate": 0.00012910473289143328, + "loss": 0.0279, "step": 176520 }, { - "epoch": 1.91, - "learning_rate": 1.3592705561684728e-05, - "loss": 0.0279, + "epoch": 1.14, + "learning_rate": 0.00012909505153707636, + "loss": 0.0297, "step": 176530 }, { - "epoch": 1.91, - "learning_rate": 1.3576481277175676e-05, - "loss": 0.0202, + "epoch": 1.14, + "learning_rate": 0.0001290853701827194, + "loss": 0.0397, "step": 176540 }, { - "epoch": 1.91, - "learning_rate": 1.3560256992666623e-05, - "loss": 0.0244, + "epoch": 1.14, + "learning_rate": 0.00012907568882836247, + "loss": 0.0384, "step": 176550 }, { - "epoch": 1.91, - "learning_rate": 1.354403270815757e-05, - "loss": 0.0282, + "epoch": 1.14, + "learning_rate": 0.00012906600747400555, + "loss": 0.0304, "step": 176560 }, { - "epoch": 1.91, - "learning_rate": 1.3527808423648516e-05, - "loss": 0.026, + "epoch": 1.14, + "learning_rate": 0.00012905632611964863, + "loss": 0.0346, "step": 176570 }, { - "epoch": 1.91, - "learning_rate": 1.3511584139139462e-05, - "loss": 0.0233, + "epoch": 1.14, + "learning_rate": 0.0001290466447652917, + "loss": 0.0334, "step": 176580 }, { - "epoch": 1.91, - "learning_rate": 1.349535985463041e-05, - "loss": 0.0307, + "epoch": 1.14, + "learning_rate": 0.00012903696341093476, + "loss": 0.0387, "step": 176590 }, { - "epoch": 1.91, - "learning_rate": 1.3479135570121356e-05, - "loss": 0.0225, + "epoch": 1.14, + "learning_rate": 0.0001290272820565778, + "loss": 0.0328, "step": 176600 }, { - "epoch": 1.91, - "learning_rate": 1.3462911285612303e-05, - "loss": 0.0306, + "epoch": 1.14, + "learning_rate": 0.0001290176007022209, + "loss": 0.0344, "step": 176610 }, { - "epoch": 1.91, - "learning_rate": 1.344668700110325e-05, - "loss": 0.028, + "epoch": 1.14, + "learning_rate": 0.00012900791934786394, + "loss": 0.0396, "step": 176620 }, { - "epoch": 1.91, - "learning_rate": 1.3430462716594197e-05, - "loss": 0.0241, + "epoch": 1.14, + "learning_rate": 0.00012899823799350702, + "loss": 0.0326, "step": 176630 }, { - "epoch": 1.91, - "learning_rate": 1.3414238432085144e-05, - "loss": 0.02, + "epoch": 1.14, + "learning_rate": 0.0001289885566391501, + "loss": 0.0301, "step": 176640 }, { - "epoch": 1.91, - "learning_rate": 1.339801414757609e-05, - "loss": 0.0258, + "epoch": 1.14, + "learning_rate": 0.00012897887528479318, + "loss": 0.0465, "step": 176650 }, { - "epoch": 1.91, - "learning_rate": 1.3381789863067036e-05, - "loss": 0.0219, + "epoch": 1.14, + "learning_rate": 0.00012896919393043624, + "loss": 0.0371, "step": 176660 }, { - "epoch": 1.91, - "learning_rate": 1.3365565578557984e-05, - "loss": 0.0179, + "epoch": 1.14, + "learning_rate": 0.0001289595125760793, + "loss": 0.0412, "step": 176670 }, { - "epoch": 1.91, - "learning_rate": 1.3349341294048931e-05, - "loss": 0.0276, + "epoch": 1.14, + "learning_rate": 0.00012894983122172237, + "loss": 0.0344, "step": 176680 }, { - "epoch": 1.91, - "learning_rate": 1.3333117009539877e-05, - "loss": 0.0227, + "epoch": 1.14, + "learning_rate": 0.00012894014986736542, + "loss": 0.0342, "step": 176690 }, { - "epoch": 1.91, - "learning_rate": 1.3316892725030824e-05, - "loss": 0.0217, + "epoch": 1.14, + "learning_rate": 0.0001289304685130085, + "loss": 0.0394, "step": 176700 }, { - "epoch": 1.91, - "learning_rate": 1.3300668440521772e-05, - "loss": 0.0247, + "epoch": 1.14, + "learning_rate": 0.00012892078715865158, + "loss": 0.0314, "step": 176710 }, { - "epoch": 1.91, - "learning_rate": 1.3284444156012718e-05, - "loss": 0.0192, + "epoch": 1.14, + "learning_rate": 0.00012891110580429463, + "loss": 0.0328, "step": 176720 }, { - "epoch": 1.91, - "learning_rate": 1.3268219871503666e-05, - "loss": 0.0194, + "epoch": 1.14, + "learning_rate": 0.0001289014244499377, + "loss": 0.0313, "step": 176730 }, { - "epoch": 1.91, - "learning_rate": 1.3251995586994613e-05, - "loss": 0.0218, + "epoch": 1.14, + "learning_rate": 0.00012889174309558077, + "loss": 0.0303, "step": 176740 }, { - "epoch": 1.91, - "learning_rate": 1.323577130248556e-05, - "loss": 0.0272, + "epoch": 1.14, + "learning_rate": 0.00012888206174122385, + "loss": 0.0294, "step": 176750 }, { - "epoch": 1.91, - "learning_rate": 1.3219547017976507e-05, - "loss": 0.0309, + "epoch": 1.14, + "learning_rate": 0.0001288723803868669, + "loss": 0.0377, "step": 176760 }, { - "epoch": 1.91, - "learning_rate": 1.3203322733467453e-05, - "loss": 0.0226, + "epoch": 1.14, + "learning_rate": 0.00012886269903250998, + "loss": 0.0285, "step": 176770 }, { - "epoch": 1.91, - "learning_rate": 1.31870984489584e-05, - "loss": 0.0221, + "epoch": 1.14, + "learning_rate": 0.00012885301767815306, + "loss": 0.0316, "step": 176780 }, { - "epoch": 1.91, - "learning_rate": 1.3170874164449348e-05, - "loss": 0.0305, + "epoch": 1.14, + "learning_rate": 0.0001288433363237961, + "loss": 0.0362, "step": 176790 }, { - "epoch": 1.91, - "learning_rate": 1.3154649879940294e-05, - "loss": 0.0236, + "epoch": 1.14, + "learning_rate": 0.00012883365496943916, + "loss": 0.0398, "step": 176800 }, { - "epoch": 1.91, - "learning_rate": 1.313842559543124e-05, - "loss": 0.0216, + "epoch": 1.14, + "learning_rate": 0.00012882397361508224, + "loss": 0.0315, "step": 176810 }, { - "epoch": 1.91, - "learning_rate": 1.3122201310922187e-05, - "loss": 0.0261, + "epoch": 1.14, + "learning_rate": 0.00012881429226072532, + "loss": 0.034, "step": 176820 }, { - "epoch": 1.91, - "learning_rate": 1.3105977026413135e-05, - "loss": 0.0235, + "epoch": 1.14, + "learning_rate": 0.00012880461090636838, + "loss": 0.035, "step": 176830 }, { - "epoch": 1.91, - "learning_rate": 1.3089752741904081e-05, - "loss": 0.0239, + "epoch": 1.14, + "learning_rate": 0.00012879492955201145, + "loss": 0.0297, "step": 176840 }, { - "epoch": 1.91, - "learning_rate": 1.3073528457395028e-05, - "loss": 0.0214, + "epoch": 1.14, + "learning_rate": 0.00012878524819765453, + "loss": 0.031, "step": 176850 }, { - "epoch": 1.91, - "learning_rate": 1.3057304172885974e-05, - "loss": 0.0305, + "epoch": 1.14, + "learning_rate": 0.0001287755668432976, + "loss": 0.0299, "step": 176860 }, { - "epoch": 1.91, - "learning_rate": 1.304107988837692e-05, - "loss": 0.0245, + "epoch": 1.14, + "learning_rate": 0.00012876588548894064, + "loss": 0.0291, "step": 176870 }, { - "epoch": 1.91, - "learning_rate": 1.3024855603867869e-05, - "loss": 0.0245, + "epoch": 1.14, + "learning_rate": 0.00012875620413458372, + "loss": 0.0284, "step": 176880 }, { - "epoch": 1.91, - "learning_rate": 1.3008631319358815e-05, - "loss": 0.0206, + "epoch": 1.14, + "learning_rate": 0.0001287465227802268, + "loss": 0.0324, "step": 176890 }, { - "epoch": 1.91, - "learning_rate": 1.2992407034849761e-05, - "loss": 0.0265, + "epoch": 1.14, + "learning_rate": 0.00012873684142586985, + "loss": 0.0319, "step": 176900 }, { - "epoch": 1.91, - "learning_rate": 1.2976182750340708e-05, - "loss": 0.0213, + "epoch": 1.14, + "learning_rate": 0.00012872716007151293, + "loss": 0.0289, "step": 176910 }, { - "epoch": 1.91, - "learning_rate": 1.2959958465831656e-05, - "loss": 0.0255, + "epoch": 1.14, + "learning_rate": 0.00012871747871715598, + "loss": 0.0324, "step": 176920 }, { - "epoch": 1.91, - "learning_rate": 1.2943734181322602e-05, - "loss": 0.0205, + "epoch": 1.14, + "learning_rate": 0.00012870779736279906, + "loss": 0.0286, "step": 176930 }, { - "epoch": 1.91, - "learning_rate": 1.2927509896813549e-05, - "loss": 0.0246, + "epoch": 1.14, + "learning_rate": 0.00012869811600844212, + "loss": 0.0299, "step": 176940 }, { - "epoch": 1.91, - "learning_rate": 1.2911285612304495e-05, - "loss": 0.0194, + "epoch": 1.14, + "learning_rate": 0.0001286884346540852, + "loss": 0.0372, "step": 176950 }, { - "epoch": 1.91, - "learning_rate": 1.2895061327795443e-05, - "loss": 0.025, + "epoch": 1.14, + "learning_rate": 0.00012867875329972828, + "loss": 0.0301, "step": 176960 }, { - "epoch": 1.91, - "learning_rate": 1.287883704328639e-05, - "loss": 0.0252, + "epoch": 1.14, + "learning_rate": 0.00012866907194537133, + "loss": 0.0335, "step": 176970 }, { - "epoch": 1.91, - "learning_rate": 1.2862612758777336e-05, - "loss": 0.0263, + "epoch": 1.14, + "learning_rate": 0.0001286593905910144, + "loss": 0.0344, "step": 176980 }, { - "epoch": 1.91, - "learning_rate": 1.2846388474268282e-05, - "loss": 0.0215, + "epoch": 1.14, + "learning_rate": 0.00012864970923665746, + "loss": 0.0358, "step": 176990 }, { - "epoch": 1.91, - "learning_rate": 1.283016418975923e-05, - "loss": 0.0299, + "epoch": 1.14, + "learning_rate": 0.00012864002788230054, + "loss": 0.0325, "step": 177000 }, { - "epoch": 1.91, - "eval_cer": 0.921057141998901, - "eval_loss": 0.02032814733684063, - "eval_runtime": 119.0598, - "eval_samples_per_second": 16.798, - "eval_steps_per_second": 4.2, + "epoch": 1.14, + "eval_cer": 0.9199520958083832, + "eval_loss": 0.023923007771372795, + "eval_runtime": 120.1567, + "eval_samples_per_second": 16.645, + "eval_steps_per_second": 4.161, "step": 177000 }, { - "epoch": 1.91, - "learning_rate": 1.2813939905250177e-05, - "loss": 0.0205, + "epoch": 1.14, + "learning_rate": 0.0001286303465279436, + "loss": 0.0333, "step": 177010 }, { - "epoch": 1.91, - "learning_rate": 1.2797715620741125e-05, - "loss": 0.0227, + "epoch": 1.14, + "learning_rate": 0.00012862066517358667, + "loss": 0.0348, "step": 177020 }, { - "epoch": 1.91, - "learning_rate": 1.2781491336232071e-05, - "loss": 0.0238, + "epoch": 1.14, + "learning_rate": 0.00012861098381922975, + "loss": 0.0363, "step": 177030 }, { - "epoch": 1.91, - "learning_rate": 1.276526705172302e-05, - "loss": 0.0247, + "epoch": 1.14, + "learning_rate": 0.0001286013024648728, + "loss": 0.0368, "step": 177040 }, { - "epoch": 1.91, - "learning_rate": 1.2749042767213966e-05, - "loss": 0.0218, + "epoch": 1.14, + "learning_rate": 0.0001285916211105159, + "loss": 0.0334, "step": 177050 }, { - "epoch": 1.92, - "learning_rate": 1.2732818482704912e-05, - "loss": 0.0217, + "epoch": 1.14, + "learning_rate": 0.00012858193975615894, + "loss": 0.0297, "step": 177060 }, { - "epoch": 1.92, - "learning_rate": 1.2716594198195858e-05, - "loss": 0.0248, + "epoch": 1.14, + "learning_rate": 0.00012857225840180202, + "loss": 0.0342, "step": 177070 }, { - "epoch": 1.92, - "learning_rate": 1.2700369913686807e-05, - "loss": 0.0221, + "epoch": 1.14, + "learning_rate": 0.00012856257704744507, + "loss": 0.0317, "step": 177080 }, { - "epoch": 1.92, - "learning_rate": 1.2684145629177753e-05, - "loss": 0.0279, + "epoch": 1.14, + "learning_rate": 0.00012855289569308815, + "loss": 0.0352, "step": 177090 }, { - "epoch": 1.92, - "learning_rate": 1.26679213446687e-05, - "loss": 0.0234, + "epoch": 1.14, + "learning_rate": 0.00012854321433873123, + "loss": 0.0324, "step": 177100 }, { - "epoch": 1.92, - "learning_rate": 1.2651697060159646e-05, - "loss": 0.0235, + "epoch": 1.14, + "learning_rate": 0.00012853353298437428, + "loss": 0.0362, "step": 177110 }, { - "epoch": 1.92, - "learning_rate": 1.2635472775650594e-05, - "loss": 0.0237, + "epoch": 1.14, + "learning_rate": 0.00012852385163001734, + "loss": 0.0274, "step": 177120 }, { - "epoch": 1.92, - "learning_rate": 1.261924849114154e-05, - "loss": 0.029, + "epoch": 1.14, + "learning_rate": 0.00012851417027566042, + "loss": 0.0321, "step": 177130 }, { - "epoch": 1.92, - "learning_rate": 1.2603024206632486e-05, - "loss": 0.0271, + "epoch": 1.14, + "learning_rate": 0.0001285044889213035, + "loss": 0.033, "step": 177140 }, { - "epoch": 1.92, - "learning_rate": 1.2586799922123433e-05, - "loss": 0.0287, + "epoch": 1.14, + "learning_rate": 0.00012849480756694655, + "loss": 0.0288, "step": 177150 }, { - "epoch": 1.92, - "learning_rate": 1.2570575637614381e-05, - "loss": 0.0252, + "epoch": 1.14, + "learning_rate": 0.00012848512621258963, + "loss": 0.0337, "step": 177160 }, { - "epoch": 1.92, - "learning_rate": 1.2554351353105327e-05, - "loss": 0.0248, + "epoch": 1.14, + "learning_rate": 0.0001284754448582327, + "loss": 0.0328, "step": 177170 }, { - "epoch": 1.92, - "learning_rate": 1.2538127068596274e-05, - "loss": 0.0256, + "epoch": 1.14, + "learning_rate": 0.00012846576350387576, + "loss": 0.0343, "step": 177180 }, { - "epoch": 1.92, - "learning_rate": 1.252190278408722e-05, - "loss": 0.0257, + "epoch": 1.14, + "learning_rate": 0.00012845608214951881, + "loss": 0.035, "step": 177190 }, { - "epoch": 1.92, - "learning_rate": 1.2505678499578166e-05, - "loss": 0.0272, + "epoch": 1.14, + "learning_rate": 0.0001284464007951619, + "loss": 0.036, "step": 177200 }, { - "epoch": 1.92, - "learning_rate": 1.2489454215069115e-05, - "loss": 0.025, + "epoch": 1.14, + "learning_rate": 0.00012843671944080497, + "loss": 0.0407, "step": 177210 }, { - "epoch": 1.92, - "learning_rate": 1.2473229930560061e-05, - "loss": 0.0238, + "epoch": 1.14, + "learning_rate": 0.00012842703808644803, + "loss": 0.0376, "step": 177220 }, { - "epoch": 1.92, - "learning_rate": 1.2457005646051007e-05, - "loss": 0.026, + "epoch": 1.14, + "learning_rate": 0.0001284173567320911, + "loss": 0.0297, "step": 177230 }, { - "epoch": 1.92, - "learning_rate": 1.2440781361541954e-05, - "loss": 0.0225, + "epoch": 1.14, + "learning_rate": 0.00012840767537773416, + "loss": 0.0311, "step": 177240 }, { - "epoch": 1.92, - "learning_rate": 1.2424557077032902e-05, - "loss": 0.0229, + "epoch": 1.14, + "learning_rate": 0.00012839799402337724, + "loss": 0.0329, "step": 177250 }, { - "epoch": 1.92, - "learning_rate": 1.2408332792523848e-05, - "loss": 0.0234, + "epoch": 1.14, + "learning_rate": 0.0001283883126690203, + "loss": 0.0411, "step": 177260 }, { - "epoch": 1.92, - "learning_rate": 1.2392108508014795e-05, - "loss": 0.0191, + "epoch": 1.14, + "learning_rate": 0.00012837863131466337, + "loss": 0.0309, "step": 177270 }, { - "epoch": 1.92, - "learning_rate": 1.2375884223505741e-05, - "loss": 0.0211, + "epoch": 1.14, + "learning_rate": 0.00012836894996030645, + "loss": 0.0346, "step": 177280 }, { - "epoch": 1.92, - "learning_rate": 1.2359659938996689e-05, - "loss": 0.0288, + "epoch": 1.14, + "learning_rate": 0.0001283592686059495, + "loss": 0.0346, "step": 177290 }, { - "epoch": 1.92, - "learning_rate": 1.2343435654487635e-05, - "loss": 0.025, + "epoch": 1.14, + "learning_rate": 0.00012834958725159258, + "loss": 0.033, "step": 177300 }, { - "epoch": 1.92, - "learning_rate": 1.2327211369978582e-05, - "loss": 0.0312, + "epoch": 1.14, + "learning_rate": 0.00012833990589723564, + "loss": 0.0335, "step": 177310 }, { - "epoch": 1.92, - "learning_rate": 1.231098708546953e-05, - "loss": 0.0228, + "epoch": 1.14, + "learning_rate": 0.0001283302245428787, + "loss": 0.0329, "step": 177320 }, { - "epoch": 1.92, - "learning_rate": 1.2294762800960478e-05, - "loss": 0.0276, + "epoch": 1.14, + "learning_rate": 0.00012832054318852177, + "loss": 0.0337, "step": 177330 }, { - "epoch": 1.92, - "learning_rate": 1.2278538516451424e-05, - "loss": 0.0238, + "epoch": 1.14, + "learning_rate": 0.00012831086183416485, + "loss": 0.0372, "step": 177340 }, { - "epoch": 1.92, - "learning_rate": 1.226231423194237e-05, - "loss": 0.0232, + "epoch": 1.14, + "learning_rate": 0.0001283011804798079, + "loss": 0.0365, "step": 177350 }, { - "epoch": 1.92, - "learning_rate": 1.2246089947433317e-05, - "loss": 0.0237, + "epoch": 1.14, + "learning_rate": 0.00012829149912545098, + "loss": 0.0384, "step": 177360 }, { - "epoch": 1.92, - "learning_rate": 1.2229865662924265e-05, - "loss": 0.0273, + "epoch": 1.14, + "learning_rate": 0.00012828181777109406, + "loss": 0.0342, "step": 177370 }, { - "epoch": 1.92, - "learning_rate": 1.2213641378415212e-05, - "loss": 0.023, + "epoch": 1.14, + "learning_rate": 0.0001282721364167371, + "loss": 0.0329, "step": 177380 }, { - "epoch": 1.92, - "learning_rate": 1.2197417093906158e-05, - "loss": 0.0229, + "epoch": 1.14, + "learning_rate": 0.00012826245506238017, + "loss": 0.0372, "step": 177390 }, { - "epoch": 1.92, - "learning_rate": 1.2181192809397104e-05, - "loss": 0.0279, + "epoch": 1.14, + "learning_rate": 0.00012825277370802325, + "loss": 0.0352, "step": 177400 }, { - "epoch": 1.92, - "learning_rate": 1.2164968524888052e-05, - "loss": 0.0199, + "epoch": 1.15, + "learning_rate": 0.00012824309235366633, + "loss": 0.032, "step": 177410 }, { - "epoch": 1.92, - "learning_rate": 1.2148744240378999e-05, - "loss": 0.027, + "epoch": 1.15, + "learning_rate": 0.00012823341099930938, + "loss": 0.0348, "step": 177420 }, { - "epoch": 1.92, - "learning_rate": 1.2132519955869945e-05, - "loss": 0.0196, + "epoch": 1.15, + "learning_rate": 0.00012822372964495246, + "loss": 0.0362, "step": 177430 }, { - "epoch": 1.92, - "learning_rate": 1.2116295671360892e-05, - "loss": 0.0231, + "epoch": 1.15, + "learning_rate": 0.0001282140482905955, + "loss": 0.037, "step": 177440 }, { - "epoch": 1.92, - "learning_rate": 1.210007138685184e-05, - "loss": 0.0222, + "epoch": 1.15, + "learning_rate": 0.0001282043669362386, + "loss": 0.0324, "step": 177450 }, { - "epoch": 1.92, - "learning_rate": 1.2083847102342786e-05, - "loss": 0.0235, + "epoch": 1.15, + "learning_rate": 0.00012819468558188164, + "loss": 0.0394, "step": 177460 }, { - "epoch": 1.92, - "learning_rate": 1.2067622817833732e-05, - "loss": 0.0282, + "epoch": 1.15, + "learning_rate": 0.00012818500422752472, + "loss": 0.0372, "step": 177470 }, { - "epoch": 1.92, - "learning_rate": 1.2051398533324679e-05, - "loss": 0.0213, + "epoch": 1.15, + "learning_rate": 0.0001281753228731678, + "loss": 0.0323, "step": 177480 }, { - "epoch": 1.92, - "learning_rate": 1.2035174248815625e-05, - "loss": 0.0224, + "epoch": 1.15, + "learning_rate": 0.00012816564151881086, + "loss": 0.0381, "step": 177490 }, { - "epoch": 1.92, - "learning_rate": 1.2018949964306573e-05, - "loss": 0.0271, - "step": 177500 + "epoch": 1.15, + "learning_rate": 0.00012815596016445394, + "loss": 0.0325, + "step": 177500 }, { - "epoch": 1.92, - "learning_rate": 1.200272567979752e-05, - "loss": 0.0196, + "epoch": 1.15, + "learning_rate": 0.000128146278810097, + "loss": 0.0305, "step": 177510 }, { - "epoch": 1.92, - "learning_rate": 1.1986501395288466e-05, - "loss": 0.0198, + "epoch": 1.15, + "learning_rate": 0.00012813659745574007, + "loss": 0.0347, "step": 177520 }, { - "epoch": 1.92, - "learning_rate": 1.1970277110779412e-05, - "loss": 0.0238, + "epoch": 1.15, + "learning_rate": 0.00012812691610138312, + "loss": 0.0359, "step": 177530 }, { - "epoch": 1.92, - "learning_rate": 1.195405282627036e-05, - "loss": 0.0269, + "epoch": 1.15, + "learning_rate": 0.0001281172347470262, + "loss": 0.0386, "step": 177540 }, { - "epoch": 1.92, - "learning_rate": 1.1937828541761307e-05, - "loss": 0.0248, + "epoch": 1.15, + "learning_rate": 0.00012810755339266928, + "loss": 0.0299, "step": 177550 }, { - "epoch": 1.92, - "learning_rate": 1.1921604257252253e-05, - "loss": 0.0242, + "epoch": 1.15, + "learning_rate": 0.00012809787203831233, + "loss": 0.0352, "step": 177560 }, { - "epoch": 1.92, - "learning_rate": 1.19053799727432e-05, - "loss": 0.0266, + "epoch": 1.15, + "learning_rate": 0.0001280881906839554, + "loss": 0.0324, "step": 177570 }, { - "epoch": 1.92, - "learning_rate": 1.1889155688234148e-05, - "loss": 0.0208, + "epoch": 1.15, + "learning_rate": 0.00012807850932959846, + "loss": 0.0313, "step": 177580 }, { - "epoch": 1.92, - "learning_rate": 1.1872931403725094e-05, - "loss": 0.0232, + "epoch": 1.15, + "learning_rate": 0.00012806882797524154, + "loss": 0.0329, "step": 177590 }, { - "epoch": 1.92, - "learning_rate": 1.185670711921604e-05, - "loss": 0.0261, + "epoch": 1.15, + "learning_rate": 0.0001280591466208846, + "loss": 0.0272, "step": 177600 }, { - "epoch": 1.92, - "learning_rate": 1.184048283470699e-05, - "loss": 0.0266, + "epoch": 1.15, + "learning_rate": 0.00012804946526652768, + "loss": 0.0341, "step": 177610 }, { - "epoch": 1.92, - "learning_rate": 1.1824258550197937e-05, - "loss": 0.0242, + "epoch": 1.15, + "learning_rate": 0.00012803978391217076, + "loss": 0.0311, "step": 177620 }, { - "epoch": 1.92, - "learning_rate": 1.1808034265688883e-05, - "loss": 0.0241, + "epoch": 1.15, + "learning_rate": 0.0001280301025578138, + "loss": 0.0342, "step": 177630 }, { - "epoch": 1.92, - "learning_rate": 1.179180998117983e-05, - "loss": 0.0256, + "epoch": 1.15, + "learning_rate": 0.00012802042120345686, + "loss": 0.0311, "step": 177640 }, { - "epoch": 1.92, - "learning_rate": 1.1775585696670776e-05, - "loss": 0.0229, + "epoch": 1.15, + "learning_rate": 0.00012801073984909994, + "loss": 0.0262, "step": 177650 }, { - "epoch": 1.92, - "learning_rate": 1.1759361412161724e-05, - "loss": 0.0213, + "epoch": 1.15, + "learning_rate": 0.00012800105849474302, + "loss": 0.0367, "step": 177660 }, { - "epoch": 1.92, - "learning_rate": 1.174313712765267e-05, - "loss": 0.0251, + "epoch": 1.15, + "learning_rate": 0.00012799137714038607, + "loss": 0.0326, "step": 177670 }, { - "epoch": 1.92, - "learning_rate": 1.1726912843143617e-05, - "loss": 0.0204, + "epoch": 1.15, + "learning_rate": 0.00012798169578602915, + "loss": 0.0305, "step": 177680 }, { - "epoch": 1.92, - "learning_rate": 1.1710688558634563e-05, - "loss": 0.0227, + "epoch": 1.15, + "learning_rate": 0.0001279720144316722, + "loss": 0.0318, "step": 177690 }, { - "epoch": 1.92, - "learning_rate": 1.1694464274125511e-05, - "loss": 0.0243, + "epoch": 1.15, + "learning_rate": 0.0001279623330773153, + "loss": 0.0381, "step": 177700 }, { - "epoch": 1.92, - "learning_rate": 1.1678239989616457e-05, - "loss": 0.0209, + "epoch": 1.15, + "learning_rate": 0.00012795265172295834, + "loss": 0.0337, "step": 177710 }, { - "epoch": 1.92, - "learning_rate": 1.1662015705107404e-05, - "loss": 0.0327, + "epoch": 1.15, + "learning_rate": 0.00012794297036860142, + "loss": 0.0315, "step": 177720 }, { - "epoch": 1.92, - "learning_rate": 1.164579142059835e-05, - "loss": 0.0275, + "epoch": 1.15, + "learning_rate": 0.0001279332890142445, + "loss": 0.0326, "step": 177730 }, { - "epoch": 1.92, - "learning_rate": 1.1629567136089298e-05, - "loss": 0.0229, + "epoch": 1.15, + "learning_rate": 0.00012792360765988755, + "loss": 0.0327, "step": 177740 }, { - "epoch": 1.92, - "learning_rate": 1.1613342851580245e-05, - "loss": 0.0248, + "epoch": 1.15, + "learning_rate": 0.00012791392630553063, + "loss": 0.0303, "step": 177750 }, { - "epoch": 1.92, - "learning_rate": 1.1597118567071191e-05, - "loss": 0.0216, + "epoch": 1.15, + "learning_rate": 0.00012790424495117368, + "loss": 0.0285, "step": 177760 }, { - "epoch": 1.92, - "learning_rate": 1.1580894282562137e-05, - "loss": 0.0255, + "epoch": 1.15, + "learning_rate": 0.00012789456359681676, + "loss": 0.0361, "step": 177770 }, { - "epoch": 1.92, - "learning_rate": 1.1564669998053085e-05, - "loss": 0.0208, + "epoch": 1.15, + "learning_rate": 0.00012788488224245982, + "loss": 0.0323, "step": 177780 }, { - "epoch": 1.92, - "learning_rate": 1.1548445713544032e-05, - "loss": 0.0232, + "epoch": 1.15, + "learning_rate": 0.0001278752008881029, + "loss": 0.031, "step": 177790 }, { - "epoch": 1.92, - "learning_rate": 1.1532221429034978e-05, - "loss": 0.0263, + "epoch": 1.15, + "learning_rate": 0.00012786551953374598, + "loss": 0.033, "step": 177800 }, { - "epoch": 1.92, - "learning_rate": 1.1515997144525925e-05, - "loss": 0.0263, + "epoch": 1.15, + "learning_rate": 0.00012785583817938903, + "loss": 0.028, "step": 177810 }, { - "epoch": 1.92, - "learning_rate": 1.1499772860016871e-05, - "loss": 0.0265, + "epoch": 1.15, + "learning_rate": 0.0001278461568250321, + "loss": 0.0314, "step": 177820 }, { - "epoch": 1.92, - "learning_rate": 1.1483548575507819e-05, - "loss": 0.023, + "epoch": 1.15, + "learning_rate": 0.00012783647547067516, + "loss": 0.0338, "step": 177830 }, { - "epoch": 1.92, - "learning_rate": 1.1467324290998765e-05, - "loss": 0.0241, + "epoch": 1.15, + "learning_rate": 0.00012782679411631821, + "loss": 0.0291, "step": 177840 }, { - "epoch": 1.92, - "learning_rate": 1.1451100006489712e-05, - "loss": 0.0205, + "epoch": 1.15, + "learning_rate": 0.0001278171127619613, + "loss": 0.0365, "step": 177850 }, { - "epoch": 1.92, - "learning_rate": 1.1434875721980658e-05, - "loss": 0.018, + "epoch": 1.15, + "learning_rate": 0.00012780743140760437, + "loss": 0.0289, "step": 177860 }, { - "epoch": 1.92, - "learning_rate": 1.1418651437471606e-05, - "loss": 0.0284, + "epoch": 1.15, + "learning_rate": 0.00012779775005324745, + "loss": 0.0321, "step": 177870 }, { - "epoch": 1.92, - "learning_rate": 1.1402427152962553e-05, - "loss": 0.0274, + "epoch": 1.15, + "learning_rate": 0.0001277880686988905, + "loss": 0.0279, "step": 177880 }, { - "epoch": 1.92, - "learning_rate": 1.1386202868453499e-05, - "loss": 0.0276, + "epoch": 1.15, + "learning_rate": 0.00012777838734453359, + "loss": 0.0286, "step": 177890 }, { - "epoch": 1.92, - "learning_rate": 1.1369978583944449e-05, - "loss": 0.0235, + "epoch": 1.15, + "learning_rate": 0.00012776870599017664, + "loss": 0.0367, "step": 177900 }, { - "epoch": 1.92, - "learning_rate": 1.1353754299435395e-05, - "loss": 0.03, + "epoch": 1.15, + "learning_rate": 0.0001277590246358197, + "loss": 0.0289, "step": 177910 }, { - "epoch": 1.92, - "learning_rate": 1.1337530014926342e-05, - "loss": 0.0209, + "epoch": 1.15, + "learning_rate": 0.00012774934328146277, + "loss": 0.0301, "step": 177920 }, { - "epoch": 1.92, - "learning_rate": 1.1321305730417288e-05, - "loss": 0.0242, + "epoch": 1.15, + "learning_rate": 0.00012773966192710585, + "loss": 0.0305, "step": 177930 }, { - "epoch": 1.92, - "learning_rate": 1.1305081445908234e-05, - "loss": 0.0206, + "epoch": 1.15, + "learning_rate": 0.00012772998057274893, + "loss": 0.0358, "step": 177940 }, { - "epoch": 1.92, - "learning_rate": 1.1288857161399182e-05, - "loss": 0.023, + "epoch": 1.15, + "learning_rate": 0.00012772029921839198, + "loss": 0.0363, "step": 177950 }, { - "epoch": 1.92, - "learning_rate": 1.1272632876890129e-05, - "loss": 0.024, + "epoch": 1.15, + "learning_rate": 0.00012771061786403504, + "loss": 0.0273, "step": 177960 }, { - "epoch": 1.92, - "learning_rate": 1.1256408592381075e-05, - "loss": 0.021, + "epoch": 1.15, + "learning_rate": 0.00012770093650967812, + "loss": 0.0303, "step": 177970 }, { - "epoch": 1.93, - "learning_rate": 1.1240184307872022e-05, - "loss": 0.0284, + "epoch": 1.15, + "learning_rate": 0.00012769125515532117, + "loss": 0.0346, "step": 177980 }, { - "epoch": 1.93, - "learning_rate": 1.122396002336297e-05, - "loss": 0.0236, + "epoch": 1.15, + "learning_rate": 0.00012768157380096425, + "loss": 0.0322, "step": 177990 }, { - "epoch": 1.93, - "learning_rate": 1.1207735738853916e-05, - "loss": 0.0246, + "epoch": 1.15, + "learning_rate": 0.00012767189244660733, + "loss": 0.0295, "step": 178000 }, { - "epoch": 1.93, - "eval_cer": 0.9210589089675425, - "eval_loss": 0.020328855141997337, - "eval_runtime": 119.0589, - "eval_samples_per_second": 16.798, - "eval_steps_per_second": 4.2, + "epoch": 1.15, + "eval_cer": 0.9198888261213423, + "eval_loss": 0.02403685823082924, + "eval_runtime": 120.1071, + "eval_samples_per_second": 16.652, + "eval_steps_per_second": 4.163, "step": 178000 }, { - "epoch": 1.93, - "learning_rate": 1.1191511454344862e-05, - "loss": 0.0249, + "epoch": 1.15, + "learning_rate": 0.00012766221109225038, + "loss": 0.0355, "step": 178010 }, { - "epoch": 1.93, - "learning_rate": 1.1175287169835809e-05, - "loss": 0.0267, + "epoch": 1.15, + "learning_rate": 0.00012765252973789346, + "loss": 0.0298, "step": 178020 }, { - "epoch": 1.93, - "learning_rate": 1.1159062885326757e-05, - "loss": 0.0232, + "epoch": 1.15, + "learning_rate": 0.0001276428483835365, + "loss": 0.0328, "step": 178030 }, { - "epoch": 1.93, - "learning_rate": 1.1142838600817703e-05, - "loss": 0.0238, + "epoch": 1.15, + "learning_rate": 0.0001276331670291796, + "loss": 0.0325, "step": 178040 }, { - "epoch": 1.93, - "learning_rate": 1.112661431630865e-05, - "loss": 0.0236, + "epoch": 1.15, + "learning_rate": 0.00012762348567482265, + "loss": 0.0347, "step": 178050 }, { - "epoch": 1.93, - "learning_rate": 1.1110390031799596e-05, - "loss": 0.0309, + "epoch": 1.15, + "learning_rate": 0.00012761380432046573, + "loss": 0.0248, "step": 178060 }, { - "epoch": 1.93, - "learning_rate": 1.1094165747290544e-05, - "loss": 0.0232, + "epoch": 1.15, + "learning_rate": 0.0001276041229661088, + "loss": 0.0347, "step": 178070 }, { - "epoch": 1.93, - "learning_rate": 1.107794146278149e-05, - "loss": 0.0192, + "epoch": 1.15, + "learning_rate": 0.00012759444161175186, + "loss": 0.0365, "step": 178080 }, { - "epoch": 1.93, - "learning_rate": 1.1061717178272437e-05, - "loss": 0.0234, + "epoch": 1.15, + "learning_rate": 0.00012758476025739494, + "loss": 0.0323, "step": 178090 }, { - "epoch": 1.93, - "learning_rate": 1.1045492893763383e-05, - "loss": 0.0215, + "epoch": 1.15, + "learning_rate": 0.000127575078903038, + "loss": 0.0311, "step": 178100 }, { - "epoch": 1.93, - "learning_rate": 1.102926860925433e-05, - "loss": 0.0216, + "epoch": 1.15, + "learning_rate": 0.00012756539754868107, + "loss": 0.0311, "step": 178110 }, { - "epoch": 1.93, - "learning_rate": 1.1013044324745278e-05, - "loss": 0.0227, + "epoch": 1.15, + "learning_rate": 0.00012755571619432412, + "loss": 0.0334, "step": 178120 }, { - "epoch": 1.93, - "learning_rate": 1.0996820040236224e-05, - "loss": 0.0255, + "epoch": 1.15, + "learning_rate": 0.0001275460348399672, + "loss": 0.0345, "step": 178130 }, { - "epoch": 1.93, - "learning_rate": 1.098059575572717e-05, - "loss": 0.0257, + "epoch": 1.15, + "learning_rate": 0.00012753635348561028, + "loss": 0.0382, "step": 178140 }, { - "epoch": 1.93, - "learning_rate": 1.0964371471218117e-05, - "loss": 0.0213, + "epoch": 1.15, + "learning_rate": 0.00012752667213125334, + "loss": 0.0345, "step": 178150 }, { - "epoch": 1.93, - "learning_rate": 1.0948147186709065e-05, - "loss": 0.0261, + "epoch": 1.15, + "learning_rate": 0.0001275169907768964, + "loss": 0.0327, "step": 178160 }, { - "epoch": 1.93, - "learning_rate": 1.0931922902200011e-05, - "loss": 0.0214, + "epoch": 1.15, + "learning_rate": 0.00012750730942253947, + "loss": 0.033, "step": 178170 }, { - "epoch": 1.93, - "learning_rate": 1.0915698617690958e-05, - "loss": 0.0216, + "epoch": 1.15, + "learning_rate": 0.00012749762806818255, + "loss": 0.0279, "step": 178180 }, { - "epoch": 1.93, - "learning_rate": 1.0899474333181904e-05, - "loss": 0.0249, + "epoch": 1.15, + "learning_rate": 0.0001274879467138256, + "loss": 0.0326, "step": 178190 }, { - "epoch": 1.93, - "learning_rate": 1.0883250048672854e-05, - "loss": 0.022, + "epoch": 1.15, + "learning_rate": 0.00012747826535946868, + "loss": 0.0272, "step": 178200 }, { - "epoch": 1.93, - "learning_rate": 1.08670257641638e-05, - "loss": 0.0211, + "epoch": 1.15, + "learning_rate": 0.00012746858400511173, + "loss": 0.0344, "step": 178210 }, { - "epoch": 1.93, - "learning_rate": 1.0850801479654747e-05, - "loss": 0.0247, + "epoch": 1.15, + "learning_rate": 0.0001274589026507548, + "loss": 0.0405, "step": 178220 }, { - "epoch": 1.93, - "learning_rate": 1.0834577195145695e-05, - "loss": 0.0243, + "epoch": 1.15, + "learning_rate": 0.00012744922129639787, + "loss": 0.0308, "step": 178230 }, { - "epoch": 1.93, - "learning_rate": 1.0818352910636641e-05, - "loss": 0.023, + "epoch": 1.15, + "learning_rate": 0.00012743953994204095, + "loss": 0.0302, "step": 178240 }, { - "epoch": 1.93, - "learning_rate": 1.0802128626127587e-05, - "loss": 0.022, + "epoch": 1.15, + "learning_rate": 0.00012742985858768402, + "loss": 0.0345, "step": 178250 }, { - "epoch": 1.93, - "learning_rate": 1.0785904341618534e-05, - "loss": 0.0211, + "epoch": 1.15, + "learning_rate": 0.00012742017723332708, + "loss": 0.0335, "step": 178260 }, { - "epoch": 1.93, - "learning_rate": 1.076968005710948e-05, - "loss": 0.0217, + "epoch": 1.15, + "learning_rate": 0.00012741049587897016, + "loss": 0.0405, "step": 178270 }, { - "epoch": 1.93, - "learning_rate": 1.0753455772600428e-05, - "loss": 0.0216, + "epoch": 1.15, + "learning_rate": 0.0001274008145246132, + "loss": 0.0344, "step": 178280 }, { - "epoch": 1.93, - "learning_rate": 1.0737231488091375e-05, - "loss": 0.0211, + "epoch": 1.15, + "learning_rate": 0.0001273911331702563, + "loss": 0.0325, "step": 178290 }, { - "epoch": 1.93, - "learning_rate": 1.0721007203582321e-05, - "loss": 0.0229, + "epoch": 1.15, + "learning_rate": 0.00012738145181589934, + "loss": 0.0311, "step": 178300 }, { - "epoch": 1.93, - "learning_rate": 1.0704782919073267e-05, - "loss": 0.0187, + "epoch": 1.15, + "learning_rate": 0.00012737177046154242, + "loss": 0.035, "step": 178310 }, { - "epoch": 1.93, - "learning_rate": 1.0688558634564216e-05, - "loss": 0.0229, + "epoch": 1.15, + "learning_rate": 0.0001273620891071855, + "loss": 0.0317, "step": 178320 }, { - "epoch": 1.93, - "learning_rate": 1.0672334350055162e-05, - "loss": 0.0178, + "epoch": 1.15, + "learning_rate": 0.00012735240775282855, + "loss": 0.0364, "step": 178330 }, { - "epoch": 1.93, - "learning_rate": 1.0656110065546108e-05, - "loss": 0.0291, + "epoch": 1.15, + "learning_rate": 0.00012734272639847163, + "loss": 0.0356, "step": 178340 }, { - "epoch": 1.93, - "learning_rate": 1.0639885781037055e-05, - "loss": 0.0183, + "epoch": 1.15, + "learning_rate": 0.0001273330450441147, + "loss": 0.0357, "step": 178350 }, { - "epoch": 1.93, - "learning_rate": 1.0623661496528003e-05, - "loss": 0.0236, + "epoch": 1.15, + "learning_rate": 0.00012732336368975777, + "loss": 0.0339, "step": 178360 }, { - "epoch": 1.93, - "learning_rate": 1.0607437212018949e-05, - "loss": 0.0208, + "epoch": 1.15, + "learning_rate": 0.00012731368233540082, + "loss": 0.0346, "step": 178370 }, { - "epoch": 1.93, - "learning_rate": 1.0591212927509896e-05, - "loss": 0.026, + "epoch": 1.15, + "learning_rate": 0.0001273040009810439, + "loss": 0.0333, "step": 178380 }, { - "epoch": 1.93, - "learning_rate": 1.0574988643000842e-05, - "loss": 0.0212, + "epoch": 1.15, + "learning_rate": 0.00012729431962668698, + "loss": 0.039, "step": 178390 }, { - "epoch": 1.93, - "learning_rate": 1.055876435849179e-05, - "loss": 0.0278, + "epoch": 1.15, + "learning_rate": 0.00012728463827233003, + "loss": 0.0374, "step": 178400 }, { - "epoch": 1.93, - "learning_rate": 1.0542540073982736e-05, - "loss": 0.023, + "epoch": 1.15, + "learning_rate": 0.00012727495691797308, + "loss": 0.03, "step": 178410 }, { - "epoch": 1.93, - "learning_rate": 1.0526315789473683e-05, - "loss": 0.0232, + "epoch": 1.15, + "learning_rate": 0.00012726527556361616, + "loss": 0.0338, "step": 178420 }, { - "epoch": 1.93, - "learning_rate": 1.0510091504964629e-05, - "loss": 0.0243, + "epoch": 1.15, + "learning_rate": 0.00012725559420925924, + "loss": 0.0292, "step": 178430 }, { - "epoch": 1.93, - "learning_rate": 1.0493867220455576e-05, - "loss": 0.0233, + "epoch": 1.15, + "learning_rate": 0.0001272459128549023, + "loss": 0.0315, "step": 178440 }, { - "epoch": 1.93, - "learning_rate": 1.0477642935946524e-05, - "loss": 0.0235, + "epoch": 1.15, + "learning_rate": 0.00012723623150054538, + "loss": 0.0375, "step": 178450 }, { - "epoch": 1.93, - "learning_rate": 1.046141865143747e-05, - "loss": 0.0256, + "epoch": 1.15, + "learning_rate": 0.00012722655014618846, + "loss": 0.0349, "step": 178460 }, { - "epoch": 1.93, - "learning_rate": 1.0445194366928416e-05, - "loss": 0.0193, + "epoch": 1.15, + "learning_rate": 0.0001272168687918315, + "loss": 0.0293, "step": 178470 }, { - "epoch": 1.93, - "learning_rate": 1.0428970082419363e-05, - "loss": 0.0213, + "epoch": 1.15, + "learning_rate": 0.00012720718743747456, + "loss": 0.0345, "step": 178480 }, { - "epoch": 1.93, - "learning_rate": 1.0412745797910313e-05, - "loss": 0.0203, + "epoch": 1.15, + "learning_rate": 0.00012719750608311764, + "loss": 0.03, "step": 178490 }, { - "epoch": 1.93, - "learning_rate": 1.0396521513401259e-05, - "loss": 0.0223, + "epoch": 1.15, + "learning_rate": 0.00012718782472876072, + "loss": 0.0304, "step": 178500 }, { - "epoch": 1.93, - "learning_rate": 1.0380297228892205e-05, - "loss": 0.0181, + "epoch": 1.15, + "learning_rate": 0.00012717814337440377, + "loss": 0.0341, "step": 178510 }, { - "epoch": 1.93, - "learning_rate": 1.0364072944383153e-05, - "loss": 0.0205, + "epoch": 1.15, + "learning_rate": 0.00012716846202004685, + "loss": 0.0319, "step": 178520 }, { - "epoch": 1.93, - "learning_rate": 1.03478486598741e-05, - "loss": 0.0253, + "epoch": 1.15, + "learning_rate": 0.0001271587806656899, + "loss": 0.0356, "step": 178530 }, { - "epoch": 1.93, - "learning_rate": 1.0331624375365046e-05, - "loss": 0.0251, + "epoch": 1.15, + "learning_rate": 0.000127149099311333, + "loss": 0.0416, "step": 178540 }, { - "epoch": 1.93, - "learning_rate": 1.0315400090855993e-05, - "loss": 0.0201, + "epoch": 1.15, + "learning_rate": 0.00012713941795697604, + "loss": 0.0327, "step": 178550 }, { - "epoch": 1.93, - "learning_rate": 1.0299175806346939e-05, - "loss": 0.0215, + "epoch": 1.15, + "learning_rate": 0.00012712973660261912, + "loss": 0.0272, "step": 178560 }, { - "epoch": 1.93, - "learning_rate": 1.0282951521837887e-05, - "loss": 0.0245, + "epoch": 1.15, + "learning_rate": 0.0001271200552482622, + "loss": 0.0369, "step": 178570 }, { - "epoch": 1.93, - "learning_rate": 1.0266727237328833e-05, - "loss": 0.0297, + "epoch": 1.15, + "learning_rate": 0.00012711037389390525, + "loss": 0.0346, "step": 178580 }, { - "epoch": 1.93, - "learning_rate": 1.025050295281978e-05, - "loss": 0.0221, + "epoch": 1.15, + "learning_rate": 0.00012710069253954833, + "loss": 0.0354, "step": 178590 }, { - "epoch": 1.93, - "learning_rate": 1.0234278668310726e-05, - "loss": 0.0205, + "epoch": 1.15, + "learning_rate": 0.00012709101118519138, + "loss": 0.0399, "step": 178600 }, { - "epoch": 1.93, - "learning_rate": 1.0218054383801674e-05, - "loss": 0.0233, + "epoch": 1.15, + "learning_rate": 0.00012708132983083444, + "loss": 0.0325, "step": 178610 }, { - "epoch": 1.93, - "learning_rate": 1.020183009929262e-05, - "loss": 0.0198, + "epoch": 1.15, + "learning_rate": 0.00012707164847647752, + "loss": 0.0352, "step": 178620 }, { - "epoch": 1.93, - "learning_rate": 1.0185605814783567e-05, - "loss": 0.0246, + "epoch": 1.15, + "learning_rate": 0.0001270619671221206, + "loss": 0.0325, "step": 178630 }, { - "epoch": 1.93, - "learning_rate": 1.0169381530274513e-05, - "loss": 0.0264, + "epoch": 1.15, + "learning_rate": 0.00012705228576776368, + "loss": 0.0342, "step": 178640 }, { - "epoch": 1.93, - "learning_rate": 1.0153157245765461e-05, - "loss": 0.0212, + "epoch": 1.15, + "learning_rate": 0.00012704260441340673, + "loss": 0.0313, "step": 178650 }, { - "epoch": 1.93, - "learning_rate": 1.0136932961256408e-05, - "loss": 0.0221, + "epoch": 1.15, + "learning_rate": 0.0001270329230590498, + "loss": 0.0369, "step": 178660 }, { - "epoch": 1.93, - "learning_rate": 1.0120708676747354e-05, - "loss": 0.0255, + "epoch": 1.15, + "learning_rate": 0.00012702324170469286, + "loss": 0.036, "step": 178670 }, { - "epoch": 1.93, - "learning_rate": 1.01044843922383e-05, - "loss": 0.0216, + "epoch": 1.15, + "learning_rate": 0.00012701356035033591, + "loss": 0.0286, "step": 178680 }, { - "epoch": 1.93, - "learning_rate": 1.0088260107729249e-05, - "loss": 0.0241, + "epoch": 1.15, + "learning_rate": 0.000127003878995979, + "loss": 0.0347, "step": 178690 }, { - "epoch": 1.93, - "learning_rate": 1.0072035823220195e-05, - "loss": 0.0224, + "epoch": 1.15, + "learning_rate": 0.00012699419764162207, + "loss": 0.0338, "step": 178700 }, { - "epoch": 1.93, - "learning_rate": 1.0055811538711141e-05, - "loss": 0.0231, + "epoch": 1.15, + "learning_rate": 0.00012698451628726515, + "loss": 0.0352, "step": 178710 }, { - "epoch": 1.93, - "learning_rate": 1.0039587254202088e-05, - "loss": 0.0198, + "epoch": 1.15, + "learning_rate": 0.0001269748349329082, + "loss": 0.034, "step": 178720 }, { - "epoch": 1.93, - "learning_rate": 1.0023362969693034e-05, - "loss": 0.0205, + "epoch": 1.15, + "learning_rate": 0.00012696515357855126, + "loss": 0.0304, "step": 178730 }, { - "epoch": 1.93, - "learning_rate": 1.0007138685183982e-05, - "loss": 0.0258, + "epoch": 1.15, + "learning_rate": 0.00012695547222419434, + "loss": 0.0413, "step": 178740 }, { - "epoch": 1.93, - "learning_rate": 9.990914400674929e-06, - "loss": 0.0231, + "epoch": 1.15, + "learning_rate": 0.0001269457908698374, + "loss": 0.033, "step": 178750 }, { - "epoch": 1.93, - "learning_rate": 9.974690116165875e-06, - "loss": 0.0257, + "epoch": 1.15, + "learning_rate": 0.00012693610951548047, + "loss": 0.0334, "step": 178760 }, { - "epoch": 1.93, - "learning_rate": 9.958465831656821e-06, - "loss": 0.023, - "step": 178770 + "epoch": 1.15, + "learning_rate": 0.00012692642816112355, + "loss": 0.034, + "step": 178770 }, { - "epoch": 1.93, - "learning_rate": 9.942241547147771e-06, - "loss": 0.0202, + "epoch": 1.15, + "learning_rate": 0.00012691674680676663, + "loss": 0.0293, "step": 178780 }, { - "epoch": 1.93, - "learning_rate": 9.926017262638718e-06, - "loss": 0.0231, + "epoch": 1.15, + "learning_rate": 0.00012690706545240968, + "loss": 0.0312, "step": 178790 }, { - "epoch": 1.93, - "learning_rate": 9.909792978129664e-06, - "loss": 0.0317, + "epoch": 1.15, + "learning_rate": 0.00012689738409805274, + "loss": 0.0288, "step": 178800 }, { - "epoch": 1.93, - "learning_rate": 9.893568693620612e-06, - "loss": 0.0219, + "epoch": 1.15, + "learning_rate": 0.00012688770274369582, + "loss": 0.0327, "step": 178810 }, { - "epoch": 1.93, - "learning_rate": 9.877344409111558e-06, - "loss": 0.026, + "epoch": 1.15, + "learning_rate": 0.00012687802138933887, + "loss": 0.0316, "step": 178820 }, { - "epoch": 1.93, - "learning_rate": 9.861120124602505e-06, - "loss": 0.0223, + "epoch": 1.15, + "learning_rate": 0.00012686834003498195, + "loss": 0.0347, "step": 178830 }, { - "epoch": 1.93, - "learning_rate": 9.844895840093451e-06, - "loss": 0.0235, + "epoch": 1.15, + "learning_rate": 0.00012685865868062503, + "loss": 0.0337, "step": 178840 }, { - "epoch": 1.93, - "learning_rate": 9.8286715555844e-06, - "loss": 0.0272, + "epoch": 1.15, + "learning_rate": 0.00012684897732626808, + "loss": 0.0276, "step": 178850 }, { - "epoch": 1.93, - "learning_rate": 9.812447271075346e-06, - "loss": 0.0186, + "epoch": 1.15, + "learning_rate": 0.00012683929597191116, + "loss": 0.0339, "step": 178860 }, { - "epoch": 1.93, - "learning_rate": 9.796222986566292e-06, - "loss": 0.0248, + "epoch": 1.15, + "learning_rate": 0.0001268296146175542, + "loss": 0.0312, "step": 178870 }, { - "epoch": 1.93, - "learning_rate": 9.779998702057238e-06, - "loss": 0.0271, + "epoch": 1.15, + "learning_rate": 0.0001268199332631973, + "loss": 0.0261, "step": 178880 }, { - "epoch": 1.93, - "learning_rate": 9.763774417548185e-06, - "loss": 0.0239, + "epoch": 1.15, + "learning_rate": 0.00012681025190884035, + "loss": 0.0316, "step": 178890 }, { - "epoch": 1.93, - "learning_rate": 9.747550133039133e-06, - "loss": 0.0223, + "epoch": 1.15, + "learning_rate": 0.00012680057055448343, + "loss": 0.0291, "step": 178900 }, { - "epoch": 1.94, - "learning_rate": 9.73132584853008e-06, - "loss": 0.0227, + "epoch": 1.15, + "learning_rate": 0.0001267908892001265, + "loss": 0.0307, "step": 178910 }, { - "epoch": 1.94, - "learning_rate": 9.715101564021026e-06, - "loss": 0.0216, + "epoch": 1.15, + "learning_rate": 0.00012678120784576956, + "loss": 0.0325, "step": 178920 }, { - "epoch": 1.94, - "learning_rate": 9.698877279511972e-06, - "loss": 0.0271, + "epoch": 1.15, + "learning_rate": 0.0001267715264914126, + "loss": 0.0375, "step": 178930 }, { - "epoch": 1.94, - "learning_rate": 9.68265299500292e-06, - "loss": 0.0238, + "epoch": 1.15, + "learning_rate": 0.0001267618451370557, + "loss": 0.038, "step": 178940 }, { - "epoch": 1.94, - "learning_rate": 9.666428710493866e-06, - "loss": 0.0234, + "epoch": 1.15, + "learning_rate": 0.00012675216378269877, + "loss": 0.0323, "step": 178950 }, { - "epoch": 1.94, - "learning_rate": 9.650204425984813e-06, - "loss": 0.025, + "epoch": 1.16, + "learning_rate": 0.00012674248242834182, + "loss": 0.0321, "step": 178960 }, { - "epoch": 1.94, - "learning_rate": 9.63398014147576e-06, - "loss": 0.0225, + "epoch": 1.16, + "learning_rate": 0.0001267328010739849, + "loss": 0.0334, "step": 178970 }, { - "epoch": 1.94, - "learning_rate": 9.617755856966707e-06, - "loss": 0.0258, + "epoch": 1.16, + "learning_rate": 0.00012672311971962798, + "loss": 0.0335, "step": 178980 }, { - "epoch": 1.94, - "learning_rate": 9.601531572457654e-06, - "loss": 0.0249, + "epoch": 1.16, + "learning_rate": 0.00012671343836527104, + "loss": 0.0333, "step": 178990 }, { - "epoch": 1.94, - "learning_rate": 9.5853072879486e-06, - "loss": 0.0227, + "epoch": 1.16, + "learning_rate": 0.0001267037570109141, + "loss": 0.0288, "step": 179000 }, { - "epoch": 1.94, - "eval_cer": 0.9210615594205049, - "eval_loss": 0.020359842106699944, - "eval_runtime": 118.929, - "eval_samples_per_second": 16.817, - "eval_steps_per_second": 4.204, + "epoch": 1.16, + "eval_cer": 0.9199475765450231, + "eval_loss": 0.023168489336967468, + "eval_runtime": 120.4946, + "eval_samples_per_second": 16.598, + "eval_steps_per_second": 4.15, "step": 179000 }, { - "epoch": 1.94, - "learning_rate": 9.569083003439546e-06, - "loss": 0.0243, + "epoch": 1.16, + "learning_rate": 0.00012669407565655717, + "loss": 0.0343, "step": 179010 }, { - "epoch": 1.94, - "learning_rate": 9.552858718930493e-06, - "loss": 0.0247, + "epoch": 1.16, + "learning_rate": 0.00012668439430220025, + "loss": 0.0291, "step": 179020 }, { - "epoch": 1.94, - "learning_rate": 9.536634434421441e-06, - "loss": 0.0201, + "epoch": 1.16, + "learning_rate": 0.0001266747129478433, + "loss": 0.0318, "step": 179030 }, { - "epoch": 1.94, - "learning_rate": 9.520410149912387e-06, - "loss": 0.0235, + "epoch": 1.16, + "learning_rate": 0.00012666503159348638, + "loss": 0.0302, "step": 179040 }, { - "epoch": 1.94, - "learning_rate": 9.504185865403334e-06, - "loss": 0.0247, + "epoch": 1.16, + "learning_rate": 0.00012665535023912943, + "loss": 0.0339, "step": 179050 }, { - "epoch": 1.94, - "learning_rate": 9.48796158089428e-06, - "loss": 0.0225, + "epoch": 1.16, + "learning_rate": 0.0001266456688847725, + "loss": 0.0305, "step": 179060 }, { - "epoch": 1.94, - "learning_rate": 9.471737296385228e-06, - "loss": 0.0232, + "epoch": 1.16, + "learning_rate": 0.00012663598753041556, + "loss": 0.0303, "step": 179070 }, { - "epoch": 1.94, - "learning_rate": 9.455513011876176e-06, - "loss": 0.0254, + "epoch": 1.16, + "learning_rate": 0.00012662630617605864, + "loss": 0.0334, "step": 179080 }, { - "epoch": 1.94, - "learning_rate": 9.439288727367123e-06, - "loss": 0.0213, + "epoch": 1.16, + "learning_rate": 0.00012661662482170172, + "loss": 0.0333, "step": 179090 }, { - "epoch": 1.94, - "learning_rate": 9.42306444285807e-06, - "loss": 0.0307, + "epoch": 1.16, + "learning_rate": 0.00012660694346734478, + "loss": 0.0271, "step": 179100 }, { - "epoch": 1.94, - "learning_rate": 9.406840158349017e-06, - "loss": 0.0252, + "epoch": 1.16, + "learning_rate": 0.00012659726211298786, + "loss": 0.0307, "step": 179110 }, { - "epoch": 1.94, - "learning_rate": 9.390615873839963e-06, - "loss": 0.0233, + "epoch": 1.16, + "learning_rate": 0.0001265875807586309, + "loss": 0.0302, "step": 179120 }, { - "epoch": 1.94, - "learning_rate": 9.37439158933091e-06, - "loss": 0.0283, + "epoch": 1.16, + "learning_rate": 0.000126577899404274, + "loss": 0.0338, "step": 179130 }, { - "epoch": 1.94, - "learning_rate": 9.358167304821856e-06, - "loss": 0.0214, + "epoch": 1.16, + "learning_rate": 0.00012656821804991704, + "loss": 0.0276, "step": 179140 }, { - "epoch": 1.94, - "learning_rate": 9.341943020312804e-06, - "loss": 0.0229, + "epoch": 1.16, + "learning_rate": 0.00012655853669556012, + "loss": 0.0359, "step": 179150 }, { - "epoch": 1.94, - "learning_rate": 9.32571873580375e-06, - "loss": 0.0241, + "epoch": 1.16, + "learning_rate": 0.0001265488553412032, + "loss": 0.0343, "step": 179160 }, { - "epoch": 1.94, - "learning_rate": 9.309494451294697e-06, - "loss": 0.0232, + "epoch": 1.16, + "learning_rate": 0.00012653917398684625, + "loss": 0.0316, "step": 179170 }, { - "epoch": 1.94, - "learning_rate": 9.293270166785643e-06, - "loss": 0.021, + "epoch": 1.16, + "learning_rate": 0.00012652949263248933, + "loss": 0.0292, "step": 179180 }, { - "epoch": 1.94, - "learning_rate": 9.277045882276591e-06, - "loss": 0.0245, + "epoch": 1.16, + "learning_rate": 0.0001265198112781324, + "loss": 0.0391, "step": 179190 }, { - "epoch": 1.94, - "learning_rate": 9.260821597767538e-06, - "loss": 0.0235, + "epoch": 1.16, + "learning_rate": 0.00012651012992377547, + "loss": 0.0359, "step": 179200 }, { - "epoch": 1.94, - "learning_rate": 9.244597313258484e-06, - "loss": 0.0251, + "epoch": 1.16, + "learning_rate": 0.00012650044856941852, + "loss": 0.0342, "step": 179210 }, { - "epoch": 1.94, - "learning_rate": 9.22837302874943e-06, - "loss": 0.0211, + "epoch": 1.16, + "learning_rate": 0.0001264907672150616, + "loss": 0.033, "step": 179220 }, { - "epoch": 1.94, - "learning_rate": 9.212148744240379e-06, - "loss": 0.0191, + "epoch": 1.16, + "learning_rate": 0.00012648108586070468, + "loss": 0.0364, "step": 179230 }, { - "epoch": 1.94, - "learning_rate": 9.195924459731325e-06, - "loss": 0.0245, + "epoch": 1.16, + "learning_rate": 0.00012647140450634773, + "loss": 0.0326, "step": 179240 }, { - "epoch": 1.94, - "learning_rate": 9.179700175222271e-06, - "loss": 0.0243, + "epoch": 1.16, + "learning_rate": 0.00012646172315199078, + "loss": 0.0348, "step": 179250 }, { - "epoch": 1.94, - "learning_rate": 9.163475890713218e-06, - "loss": 0.0218, + "epoch": 1.16, + "learning_rate": 0.00012645204179763386, + "loss": 0.0336, "step": 179260 }, { - "epoch": 1.94, - "learning_rate": 9.147251606204166e-06, - "loss": 0.0256, + "epoch": 1.16, + "learning_rate": 0.00012644236044327694, + "loss": 0.036, "step": 179270 }, { - "epoch": 1.94, - "learning_rate": 9.131027321695112e-06, - "loss": 0.0232, + "epoch": 1.16, + "learning_rate": 0.00012643267908892, + "loss": 0.0283, "step": 179280 }, { - "epoch": 1.94, - "learning_rate": 9.114803037186059e-06, - "loss": 0.0277, + "epoch": 1.16, + "learning_rate": 0.00012642299773456308, + "loss": 0.0382, "step": 179290 }, { - "epoch": 1.94, - "learning_rate": 9.098578752677007e-06, - "loss": 0.0215, + "epoch": 1.16, + "learning_rate": 0.00012641331638020613, + "loss": 0.0318, "step": 179300 }, { - "epoch": 1.94, - "learning_rate": 9.082354468167953e-06, - "loss": 0.0259, + "epoch": 1.16, + "learning_rate": 0.0001264036350258492, + "loss": 0.0365, "step": 179310 }, { - "epoch": 1.94, - "learning_rate": 9.0661301836589e-06, - "loss": 0.019, + "epoch": 1.16, + "learning_rate": 0.00012639395367149226, + "loss": 0.0293, "step": 179320 }, { - "epoch": 1.94, - "learning_rate": 9.049905899149848e-06, - "loss": 0.0198, + "epoch": 1.16, + "learning_rate": 0.00012638427231713534, + "loss": 0.0368, "step": 179330 }, { - "epoch": 1.94, - "learning_rate": 9.033681614640794e-06, - "loss": 0.0248, + "epoch": 1.16, + "learning_rate": 0.00012637459096277842, + "loss": 0.0306, "step": 179340 }, { - "epoch": 1.94, - "learning_rate": 9.01745733013174e-06, - "loss": 0.025, + "epoch": 1.16, + "learning_rate": 0.00012636490960842147, + "loss": 0.0303, "step": 179350 }, { - "epoch": 1.94, - "learning_rate": 9.001233045622687e-06, - "loss": 0.0241, + "epoch": 1.16, + "learning_rate": 0.00012635522825406455, + "loss": 0.0296, "step": 179360 }, { - "epoch": 1.94, - "learning_rate": 8.985008761113635e-06, - "loss": 0.0256, + "epoch": 1.16, + "learning_rate": 0.0001263455468997076, + "loss": 0.0362, "step": 179370 }, { - "epoch": 1.94, - "learning_rate": 8.968784476604581e-06, - "loss": 0.0247, + "epoch": 1.16, + "learning_rate": 0.00012633586554535069, + "loss": 0.0345, "step": 179380 }, { - "epoch": 1.94, - "learning_rate": 8.952560192095528e-06, - "loss": 0.0256, + "epoch": 1.16, + "learning_rate": 0.00012632618419099374, + "loss": 0.0306, "step": 179390 }, { - "epoch": 1.94, - "learning_rate": 8.936335907586474e-06, - "loss": 0.023, + "epoch": 1.16, + "learning_rate": 0.00012631650283663682, + "loss": 0.0333, "step": 179400 }, { - "epoch": 1.94, - "learning_rate": 8.92011162307742e-06, - "loss": 0.0244, + "epoch": 1.16, + "learning_rate": 0.0001263068214822799, + "loss": 0.0316, "step": 179410 }, { - "epoch": 1.94, - "learning_rate": 8.903887338568368e-06, - "loss": 0.0234, + "epoch": 1.16, + "learning_rate": 0.00012629714012792295, + "loss": 0.0304, "step": 179420 }, { - "epoch": 1.94, - "learning_rate": 8.887663054059315e-06, - "loss": 0.0241, + "epoch": 1.16, + "learning_rate": 0.00012628745877356603, + "loss": 0.0318, "step": 179430 }, { - "epoch": 1.94, - "learning_rate": 8.871438769550263e-06, - "loss": 0.0284, + "epoch": 1.16, + "learning_rate": 0.00012627777741920908, + "loss": 0.0317, "step": 179440 }, { - "epoch": 1.94, - "learning_rate": 8.85521448504121e-06, - "loss": 0.0265, + "epoch": 1.16, + "learning_rate": 0.00012626809606485214, + "loss": 0.0359, "step": 179450 }, { - "epoch": 1.94, - "learning_rate": 8.838990200532156e-06, - "loss": 0.0224, + "epoch": 1.16, + "learning_rate": 0.00012625841471049522, + "loss": 0.0343, "step": 179460 }, { - "epoch": 1.94, - "learning_rate": 8.822765916023104e-06, - "loss": 0.0234, + "epoch": 1.16, + "learning_rate": 0.0001262487333561383, + "loss": 0.0366, "step": 179470 }, { - "epoch": 1.94, - "learning_rate": 8.80654163151405e-06, - "loss": 0.0212, + "epoch": 1.16, + "learning_rate": 0.00012623905200178138, + "loss": 0.0307, "step": 179480 }, { - "epoch": 1.94, - "learning_rate": 8.790317347004997e-06, - "loss": 0.0247, + "epoch": 1.16, + "learning_rate": 0.00012622937064742443, + "loss": 0.0361, "step": 179490 }, { - "epoch": 1.94, - "learning_rate": 8.774093062495943e-06, - "loss": 0.0239, + "epoch": 1.16, + "learning_rate": 0.00012621968929306748, + "loss": 0.0324, "step": 179500 }, { - "epoch": 1.94, - "learning_rate": 8.75786877798689e-06, - "loss": 0.0216, + "epoch": 1.16, + "learning_rate": 0.00012621000793871056, + "loss": 0.035, "step": 179510 }, { - "epoch": 1.94, - "learning_rate": 8.741644493477837e-06, - "loss": 0.0279, + "epoch": 1.16, + "learning_rate": 0.0001262003265843536, + "loss": 0.0405, "step": 179520 }, { - "epoch": 1.94, - "learning_rate": 8.725420208968784e-06, - "loss": 0.025, + "epoch": 1.16, + "learning_rate": 0.0001261906452299967, + "loss": 0.0441, "step": 179530 }, { - "epoch": 1.94, - "learning_rate": 8.70919592445973e-06, - "loss": 0.0192, + "epoch": 1.16, + "learning_rate": 0.00012618096387563977, + "loss": 0.0379, "step": 179540 }, { - "epoch": 1.94, - "learning_rate": 8.692971639950676e-06, - "loss": 0.0201, + "epoch": 1.16, + "learning_rate": 0.00012617128252128285, + "loss": 0.031, "step": 179550 }, { - "epoch": 1.94, - "learning_rate": 8.676747355441625e-06, - "loss": 0.0206, + "epoch": 1.16, + "learning_rate": 0.0001261616011669259, + "loss": 0.0281, "step": 179560 }, { - "epoch": 1.94, - "learning_rate": 8.660523070932571e-06, - "loss": 0.0246, + "epoch": 1.16, + "learning_rate": 0.00012615191981256896, + "loss": 0.0274, "step": 179570 }, { - "epoch": 1.94, - "learning_rate": 8.644298786423517e-06, - "loss": 0.0244, + "epoch": 1.16, + "learning_rate": 0.00012614223845821204, + "loss": 0.0312, "step": 179580 }, { - "epoch": 1.94, - "learning_rate": 8.628074501914465e-06, - "loss": 0.0265, + "epoch": 1.16, + "learning_rate": 0.0001261325571038551, + "loss": 0.0372, "step": 179590 }, { - "epoch": 1.94, - "learning_rate": 8.611850217405412e-06, - "loss": 0.025, + "epoch": 1.16, + "learning_rate": 0.00012612287574949817, + "loss": 0.0311, "step": 179600 }, { - "epoch": 1.94, - "learning_rate": 8.595625932896358e-06, - "loss": 0.0211, + "epoch": 1.16, + "learning_rate": 0.00012611319439514125, + "loss": 0.0317, "step": 179610 }, { - "epoch": 1.94, - "learning_rate": 8.579401648387306e-06, - "loss": 0.022, + "epoch": 1.16, + "learning_rate": 0.0001261035130407843, + "loss": 0.0286, "step": 179620 }, { - "epoch": 1.94, - "learning_rate": 8.563177363878253e-06, - "loss": 0.0226, + "epoch": 1.16, + "learning_rate": 0.00012609383168642738, + "loss": 0.0376, "step": 179630 }, { - "epoch": 1.94, - "learning_rate": 8.546953079369199e-06, - "loss": 0.0258, + "epoch": 1.16, + "learning_rate": 0.00012608415033207044, + "loss": 0.0339, "step": 179640 }, { - "epoch": 1.94, - "learning_rate": 8.530728794860145e-06, - "loss": 0.0212, + "epoch": 1.16, + "learning_rate": 0.00012607446897771352, + "loss": 0.0324, "step": 179650 }, { - "epoch": 1.94, - "learning_rate": 8.514504510351093e-06, - "loss": 0.0254, + "epoch": 1.16, + "learning_rate": 0.00012606478762335657, + "loss": 0.0346, "step": 179660 }, { - "epoch": 1.94, - "learning_rate": 8.49828022584204e-06, - "loss": 0.0268, + "epoch": 1.16, + "learning_rate": 0.00012605510626899965, + "loss": 0.0366, "step": 179670 }, { - "epoch": 1.94, - "learning_rate": 8.482055941332986e-06, - "loss": 0.0213, + "epoch": 1.16, + "learning_rate": 0.00012604542491464273, + "loss": 0.0291, "step": 179680 }, { - "epoch": 1.94, - "learning_rate": 8.465831656823933e-06, - "loss": 0.022, + "epoch": 1.16, + "learning_rate": 0.00012603574356028578, + "loss": 0.0303, "step": 179690 }, { - "epoch": 1.94, - "learning_rate": 8.44960737231488e-06, - "loss": 0.0236, + "epoch": 1.16, + "learning_rate": 0.00012602606220592883, + "loss": 0.0351, "step": 179700 }, { - "epoch": 1.94, - "learning_rate": 8.433383087805827e-06, - "loss": 0.0266, + "epoch": 1.16, + "learning_rate": 0.0001260163808515719, + "loss": 0.0298, "step": 179710 }, { - "epoch": 1.94, - "learning_rate": 8.417158803296773e-06, - "loss": 0.0393, + "epoch": 1.16, + "learning_rate": 0.000126006699497215, + "loss": 0.0374, "step": 179720 }, { - "epoch": 1.94, - "learning_rate": 8.40093451878772e-06, - "loss": 0.0209, + "epoch": 1.16, + "learning_rate": 0.00012599701814285805, + "loss": 0.0258, "step": 179730 }, { - "epoch": 1.94, - "learning_rate": 8.384710234278668e-06, - "loss": 0.0213, + "epoch": 1.16, + "learning_rate": 0.00012598733678850112, + "loss": 0.0305, "step": 179740 }, { - "epoch": 1.94, - "learning_rate": 8.368485949769614e-06, - "loss": 0.0244, + "epoch": 1.16, + "learning_rate": 0.0001259776554341442, + "loss": 0.0374, "step": 179750 }, { - "epoch": 1.94, - "learning_rate": 8.352261665260562e-06, - "loss": 0.02, + "epoch": 1.16, + "learning_rate": 0.00012596797407978726, + "loss": 0.0385, "step": 179760 }, { - "epoch": 1.94, - "learning_rate": 8.336037380751509e-06, - "loss": 0.0271, + "epoch": 1.16, + "learning_rate": 0.0001259582927254303, + "loss": 0.039, "step": 179770 }, { - "epoch": 1.94, - "learning_rate": 8.319813096242455e-06, - "loss": 0.0263, + "epoch": 1.16, + "learning_rate": 0.0001259486113710734, + "loss": 0.0348, "step": 179780 }, { - "epoch": 1.94, - "learning_rate": 8.303588811733402e-06, - "loss": 0.0237, + "epoch": 1.16, + "learning_rate": 0.00012593893001671647, + "loss": 0.0336, "step": 179790 }, { - "epoch": 1.94, - "learning_rate": 8.287364527224348e-06, - "loss": 0.0183, + "epoch": 1.16, + "learning_rate": 0.00012592924866235952, + "loss": 0.0302, "step": 179800 }, { - "epoch": 1.94, - "learning_rate": 8.271140242715296e-06, - "loss": 0.0221, + "epoch": 1.16, + "learning_rate": 0.0001259195673080026, + "loss": 0.0297, "step": 179810 }, { - "epoch": 1.94, - "learning_rate": 8.254915958206242e-06, - "loss": 0.0236, + "epoch": 1.16, + "learning_rate": 0.00012590988595364565, + "loss": 0.0305, "step": 179820 }, { - "epoch": 1.95, - "learning_rate": 8.238691673697189e-06, - "loss": 0.0291, + "epoch": 1.16, + "learning_rate": 0.00012590020459928873, + "loss": 0.0394, "step": 179830 }, { - "epoch": 1.95, - "learning_rate": 8.222467389188135e-06, - "loss": 0.0304, + "epoch": 1.16, + "learning_rate": 0.0001258905232449318, + "loss": 0.0309, "step": 179840 }, { - "epoch": 1.95, - "learning_rate": 8.206243104679083e-06, - "loss": 0.0284, + "epoch": 1.16, + "learning_rate": 0.00012588084189057487, + "loss": 0.0342, "step": 179850 }, { - "epoch": 1.95, - "learning_rate": 8.19001882017003e-06, - "loss": 0.0304, + "epoch": 1.16, + "learning_rate": 0.00012587116053621795, + "loss": 0.0303, "step": 179860 }, { - "epoch": 1.95, - "learning_rate": 8.173794535660976e-06, - "loss": 0.022, + "epoch": 1.16, + "learning_rate": 0.000125861479181861, + "loss": 0.0337, "step": 179870 }, { - "epoch": 1.95, - "learning_rate": 8.157570251151924e-06, - "loss": 0.0275, + "epoch": 1.16, + "learning_rate": 0.00012585179782750408, + "loss": 0.0285, "step": 179880 }, { - "epoch": 1.95, - "learning_rate": 8.14134596664287e-06, - "loss": 0.0212, + "epoch": 1.16, + "learning_rate": 0.00012584211647314713, + "loss": 0.0342, "step": 179890 }, { - "epoch": 1.95, - "learning_rate": 8.125121682133817e-06, - "loss": 0.0222, + "epoch": 1.16, + "learning_rate": 0.0001258324351187902, + "loss": 0.0282, "step": 179900 }, { - "epoch": 1.95, - "learning_rate": 8.108897397624765e-06, - "loss": 0.0242, + "epoch": 1.16, + "learning_rate": 0.00012582275376443326, + "loss": 0.0333, "step": 179910 }, { - "epoch": 1.95, - "learning_rate": 8.092673113115711e-06, - "loss": 0.0192, + "epoch": 1.16, + "learning_rate": 0.00012581307241007634, + "loss": 0.0336, "step": 179920 }, { - "epoch": 1.95, - "learning_rate": 8.076448828606658e-06, - "loss": 0.0244, + "epoch": 1.16, + "learning_rate": 0.00012580339105571942, + "loss": 0.0346, "step": 179930 }, { - "epoch": 1.95, - "learning_rate": 8.060224544097604e-06, - "loss": 0.0228, + "epoch": 1.16, + "learning_rate": 0.00012579370970136248, + "loss": 0.0358, "step": 179940 }, { - "epoch": 1.95, - "learning_rate": 8.044000259588552e-06, - "loss": 0.0254, + "epoch": 1.16, + "learning_rate": 0.00012578402834700556, + "loss": 0.032, "step": 179950 }, { - "epoch": 1.95, - "learning_rate": 8.027775975079499e-06, - "loss": 0.0282, + "epoch": 1.16, + "learning_rate": 0.0001257743469926486, + "loss": 0.0328, "step": 179960 }, { - "epoch": 1.95, - "learning_rate": 8.011551690570445e-06, - "loss": 0.0246, + "epoch": 1.16, + "learning_rate": 0.0001257646656382917, + "loss": 0.0302, "step": 179970 }, { - "epoch": 1.95, - "learning_rate": 7.995327406061391e-06, - "loss": 0.0243, + "epoch": 1.16, + "learning_rate": 0.00012575498428393474, + "loss": 0.0298, "step": 179980 }, { - "epoch": 1.95, - "learning_rate": 7.97910312155234e-06, - "loss": 0.0242, + "epoch": 1.16, + "learning_rate": 0.00012574530292957782, + "loss": 0.0314, "step": 179990 }, { - "epoch": 1.95, - "learning_rate": 7.962878837043286e-06, - "loss": 0.0253, + "epoch": 1.16, + "learning_rate": 0.0001257356215752209, + "loss": 0.0347, "step": 180000 }, { - "epoch": 1.95, - "eval_cer": 0.9210765786539586, - "eval_loss": 0.020238224416971207, - "eval_runtime": 119.0708, - "eval_samples_per_second": 16.797, - "eval_steps_per_second": 4.199, + "epoch": 1.16, + "eval_cer": 0.91986984521523, + "eval_loss": 0.023445699363946915, + "eval_runtime": 120.1491, + "eval_samples_per_second": 16.646, + "eval_steps_per_second": 4.161, "step": 180000 }, { - "epoch": 1.95, - "learning_rate": 7.946654552534232e-06, - "loss": 0.0234, + "epoch": 1.16, + "learning_rate": 0.00012572594022086395, + "loss": 0.0369, "step": 180010 }, { - "epoch": 1.95, - "learning_rate": 7.930430268025178e-06, - "loss": 0.0201, + "epoch": 1.16, + "learning_rate": 0.000125716258866507, + "loss": 0.0321, "step": 180020 }, { - "epoch": 1.95, - "learning_rate": 7.914205983516127e-06, - "loss": 0.0265, + "epoch": 1.16, + "learning_rate": 0.0001257065775121501, + "loss": 0.0381, "step": 180030 }, { - "epoch": 1.95, - "learning_rate": 7.897981699007073e-06, - "loss": 0.0234, + "epoch": 1.16, + "learning_rate": 0.00012569689615779317, + "loss": 0.0293, "step": 180040 }, { - "epoch": 1.95, - "learning_rate": 7.881757414498021e-06, - "loss": 0.0243, + "epoch": 1.16, + "learning_rate": 0.00012568721480343622, + "loss": 0.0329, "step": 180050 }, { - "epoch": 1.95, - "learning_rate": 7.865533129988967e-06, - "loss": 0.0256, + "epoch": 1.16, + "learning_rate": 0.0001256775334490793, + "loss": 0.0317, "step": 180060 }, { - "epoch": 1.95, - "learning_rate": 7.849308845479914e-06, - "loss": 0.0193, + "epoch": 1.16, + "learning_rate": 0.00012566785209472238, + "loss": 0.0315, "step": 180070 }, { - "epoch": 1.95, - "learning_rate": 7.83308456097086e-06, - "loss": 0.0271, + "epoch": 1.16, + "learning_rate": 0.00012565817074036543, + "loss": 0.0343, "step": 180080 }, { - "epoch": 1.95, - "learning_rate": 7.816860276461807e-06, - "loss": 0.0198, + "epoch": 1.16, + "learning_rate": 0.00012564848938600848, + "loss": 0.0353, "step": 180090 }, { - "epoch": 1.95, - "learning_rate": 7.800635991952755e-06, - "loss": 0.0221, + "epoch": 1.16, + "learning_rate": 0.00012563880803165156, + "loss": 0.0315, "step": 180100 }, { - "epoch": 1.95, - "learning_rate": 7.784411707443701e-06, - "loss": 0.024, + "epoch": 1.16, + "learning_rate": 0.00012562912667729464, + "loss": 0.0347, "step": 180110 }, { - "epoch": 1.95, - "learning_rate": 7.768187422934647e-06, - "loss": 0.0249, + "epoch": 1.16, + "learning_rate": 0.0001256194453229377, + "loss": 0.0293, "step": 180120 }, { - "epoch": 1.95, - "learning_rate": 7.751963138425594e-06, - "loss": 0.0209, + "epoch": 1.16, + "learning_rate": 0.00012560976396858078, + "loss": 0.0307, "step": 180130 }, { - "epoch": 1.95, - "learning_rate": 7.735738853916542e-06, - "loss": 0.0231, + "epoch": 1.16, + "learning_rate": 0.00012560008261422383, + "loss": 0.0324, "step": 180140 }, { - "epoch": 1.95, - "learning_rate": 7.719514569407488e-06, - "loss": 0.0231, + "epoch": 1.16, + "learning_rate": 0.0001255904012598669, + "loss": 0.036, "step": 180150 }, { - "epoch": 1.95, - "learning_rate": 7.703290284898435e-06, - "loss": 0.0201, + "epoch": 1.16, + "learning_rate": 0.00012558071990550996, + "loss": 0.0346, "step": 180160 }, { - "epoch": 1.95, - "learning_rate": 7.687066000389381e-06, - "loss": 0.024, + "epoch": 1.16, + "learning_rate": 0.00012557103855115304, + "loss": 0.0372, "step": 180170 }, { - "epoch": 1.95, - "learning_rate": 7.670841715880329e-06, - "loss": 0.0279, + "epoch": 1.16, + "learning_rate": 0.00012556135719679612, + "loss": 0.036, "step": 180180 }, { - "epoch": 1.95, - "learning_rate": 7.654617431371275e-06, - "loss": 0.022, + "epoch": 1.16, + "learning_rate": 0.00012555167584243917, + "loss": 0.0353, "step": 180190 }, { - "epoch": 1.95, - "learning_rate": 7.638393146862224e-06, - "loss": 0.0248, + "epoch": 1.16, + "learning_rate": 0.00012554199448808225, + "loss": 0.0279, "step": 180200 }, { - "epoch": 1.95, - "learning_rate": 7.62216886235317e-06, - "loss": 0.0221, + "epoch": 1.16, + "learning_rate": 0.0001255323131337253, + "loss": 0.0296, "step": 180210 }, { - "epoch": 1.95, - "learning_rate": 7.605944577844116e-06, - "loss": 0.0243, + "epoch": 1.16, + "learning_rate": 0.00012552263177936836, + "loss": 0.0374, "step": 180220 }, { - "epoch": 1.95, - "learning_rate": 7.5897202933350635e-06, - "loss": 0.028, + "epoch": 1.16, + "learning_rate": 0.00012551295042501144, + "loss": 0.0308, "step": 180230 }, { - "epoch": 1.95, - "learning_rate": 7.57349600882601e-06, - "loss": 0.0263, + "epoch": 1.16, + "learning_rate": 0.00012550326907065452, + "loss": 0.0323, "step": 180240 }, { - "epoch": 1.95, - "learning_rate": 7.557271724316957e-06, - "loss": 0.0252, + "epoch": 1.16, + "learning_rate": 0.0001254935877162976, + "loss": 0.0335, "step": 180250 }, { - "epoch": 1.95, - "learning_rate": 7.5410474398079035e-06, - "loss": 0.0214, + "epoch": 1.16, + "learning_rate": 0.00012548390636194065, + "loss": 0.037, "step": 180260 }, { - "epoch": 1.95, - "learning_rate": 7.524823155298851e-06, - "loss": 0.0256, + "epoch": 1.16, + "learning_rate": 0.00012547422500758373, + "loss": 0.0328, "step": 180270 }, { - "epoch": 1.95, - "learning_rate": 7.508598870789797e-06, - "loss": 0.0215, + "epoch": 1.16, + "learning_rate": 0.00012546454365322678, + "loss": 0.0342, "step": 180280 }, { - "epoch": 1.95, - "learning_rate": 7.492374586280744e-06, - "loss": 0.0175, + "epoch": 1.16, + "learning_rate": 0.00012545486229886984, + "loss": 0.0323, "step": 180290 }, { - "epoch": 1.95, - "learning_rate": 7.476150301771691e-06, - "loss": 0.03, + "epoch": 1.16, + "learning_rate": 0.00012544518094451292, + "loss": 0.0323, "step": 180300 }, { - "epoch": 1.95, - "learning_rate": 7.459926017262638e-06, - "loss": 0.0211, + "epoch": 1.16, + "learning_rate": 0.000125435499590156, + "loss": 0.0295, "step": 180310 }, { - "epoch": 1.95, - "learning_rate": 7.443701732753585e-06, - "loss": 0.021, + "epoch": 1.16, + "learning_rate": 0.00012542581823579908, + "loss": 0.0319, "step": 180320 }, { - "epoch": 1.95, - "learning_rate": 7.4274774482445325e-06, - "loss": 0.0208, + "epoch": 1.16, + "learning_rate": 0.00012541613688144213, + "loss": 0.0383, "step": 180330 }, { - "epoch": 1.95, - "learning_rate": 7.411253163735479e-06, - "loss": 0.0238, + "epoch": 1.16, + "learning_rate": 0.00012540645552708518, + "loss": 0.0332, "step": 180340 }, { - "epoch": 1.95, - "learning_rate": 7.395028879226426e-06, - "loss": 0.0261, + "epoch": 1.16, + "learning_rate": 0.00012539677417272826, + "loss": 0.0291, "step": 180350 }, { - "epoch": 1.95, - "learning_rate": 7.3788045947173724e-06, - "loss": 0.031, + "epoch": 1.16, + "learning_rate": 0.0001253870928183713, + "loss": 0.0367, "step": 180360 }, { - "epoch": 1.95, - "learning_rate": 7.36258031020832e-06, - "loss": 0.0254, + "epoch": 1.16, + "learning_rate": 0.0001253774114640144, + "loss": 0.0302, "step": 180370 }, { - "epoch": 1.95, - "learning_rate": 7.346356025699266e-06, - "loss": 0.019, + "epoch": 1.16, + "learning_rate": 0.00012536773010965747, + "loss": 0.0335, "step": 180380 }, { - "epoch": 1.95, - "learning_rate": 7.330131741190213e-06, - "loss": 0.0268, + "epoch": 1.16, + "learning_rate": 0.00012535804875530053, + "loss": 0.0343, "step": 180390 }, { - "epoch": 1.95, - "learning_rate": 7.31390745668116e-06, - "loss": 0.0266, + "epoch": 1.16, + "learning_rate": 0.0001253483674009436, + "loss": 0.0345, "step": 180400 }, { - "epoch": 1.95, - "learning_rate": 7.297683172172106e-06, - "loss": 0.0262, + "epoch": 1.16, + "learning_rate": 0.00012533868604658666, + "loss": 0.0305, "step": 180410 }, { - "epoch": 1.95, - "learning_rate": 7.281458887663053e-06, - "loss": 0.0219, + "epoch": 1.16, + "learning_rate": 0.00012532900469222974, + "loss": 0.0329, "step": 180420 }, { - "epoch": 1.95, - "learning_rate": 7.265234603154e-06, - "loss": 0.0241, + "epoch": 1.16, + "learning_rate": 0.0001253193233378728, + "loss": 0.0403, "step": 180430 }, { - "epoch": 1.95, - "learning_rate": 7.249010318644947e-06, - "loss": 0.0293, + "epoch": 1.16, + "learning_rate": 0.00012530964198351587, + "loss": 0.0335, "step": 180440 }, { - "epoch": 1.95, - "learning_rate": 7.232786034135893e-06, - "loss": 0.0246, + "epoch": 1.16, + "learning_rate": 0.00012529996062915895, + "loss": 0.031, "step": 180450 }, { - "epoch": 1.95, - "learning_rate": 7.2165617496268405e-06, - "loss": 0.0207, + "epoch": 1.16, + "learning_rate": 0.000125290279274802, + "loss": 0.032, "step": 180460 }, { - "epoch": 1.95, - "learning_rate": 7.200337465117788e-06, - "loss": 0.0244, + "epoch": 1.16, + "learning_rate": 0.00012528059792044508, + "loss": 0.0373, "step": 180470 }, { - "epoch": 1.95, - "learning_rate": 7.184113180608735e-06, - "loss": 0.0232, + "epoch": 1.16, + "learning_rate": 0.00012527091656608814, + "loss": 0.0295, "step": 180480 }, { - "epoch": 1.95, - "learning_rate": 7.167888896099681e-06, - "loss": 0.0219, + "epoch": 1.16, + "learning_rate": 0.00012526123521173121, + "loss": 0.0334, "step": 180490 }, { - "epoch": 1.95, - "learning_rate": 7.151664611590629e-06, - "loss": 0.0281, + "epoch": 1.16, + "learning_rate": 0.00012525155385737427, + "loss": 0.0334, "step": 180500 }, { - "epoch": 1.95, - "learning_rate": 7.135440327081575e-06, - "loss": 0.0287, + "epoch": 1.17, + "learning_rate": 0.00012524187250301735, + "loss": 0.0289, "step": 180510 }, { - "epoch": 1.95, - "learning_rate": 7.119216042572522e-06, - "loss": 0.0218, + "epoch": 1.17, + "learning_rate": 0.00012523219114866043, + "loss": 0.0369, "step": 180520 }, { - "epoch": 1.95, - "learning_rate": 7.1029917580634686e-06, - "loss": 0.0246, + "epoch": 1.17, + "learning_rate": 0.00012522250979430348, + "loss": 0.0345, "step": 180530 }, { - "epoch": 1.95, - "learning_rate": 7.086767473554416e-06, - "loss": 0.0228, + "epoch": 1.17, + "learning_rate": 0.00012521282843994653, + "loss": 0.0291, "step": 180540 }, { - "epoch": 1.95, - "learning_rate": 7.070543189045362e-06, - "loss": 0.0199, + "epoch": 1.17, + "learning_rate": 0.0001252031470855896, + "loss": 0.0367, "step": 180550 }, { - "epoch": 1.95, - "learning_rate": 7.054318904536309e-06, - "loss": 0.0192, + "epoch": 1.17, + "learning_rate": 0.0001251934657312327, + "loss": 0.0335, "step": 180560 }, { - "epoch": 1.95, - "learning_rate": 7.038094620027256e-06, - "loss": 0.0292, + "epoch": 1.17, + "learning_rate": 0.00012518378437687574, + "loss": 0.033, "step": 180570 }, { - "epoch": 1.95, - "learning_rate": 7.021870335518203e-06, - "loss": 0.0222, + "epoch": 1.17, + "learning_rate": 0.00012517410302251882, + "loss": 0.0344, "step": 180580 }, { - "epoch": 1.95, - "learning_rate": 7.005646051009149e-06, - "loss": 0.0275, + "epoch": 1.17, + "learning_rate": 0.00012516442166816188, + "loss": 0.0392, "step": 180590 }, { - "epoch": 1.95, - "learning_rate": 6.989421766500097e-06, - "loss": 0.0276, + "epoch": 1.17, + "learning_rate": 0.00012515474031380496, + "loss": 0.043, "step": 180600 }, { - "epoch": 1.95, - "learning_rate": 6.973197481991043e-06, - "loss": 0.0236, + "epoch": 1.17, + "learning_rate": 0.000125145058959448, + "loss": 0.0286, "step": 180610 }, { - "epoch": 1.95, - "learning_rate": 6.956973197481991e-06, - "loss": 0.0236, + "epoch": 1.17, + "learning_rate": 0.0001251353776050911, + "loss": 0.0332, "step": 180620 }, { - "epoch": 1.95, - "learning_rate": 6.9407489129729375e-06, - "loss": 0.0258, + "epoch": 1.17, + "learning_rate": 0.00012512569625073417, + "loss": 0.0282, "step": 180630 }, { - "epoch": 1.95, - "learning_rate": 6.924524628463885e-06, - "loss": 0.0231, + "epoch": 1.17, + "learning_rate": 0.00012511601489637722, + "loss": 0.0336, "step": 180640 }, { - "epoch": 1.95, - "learning_rate": 6.908300343954831e-06, - "loss": 0.02, + "epoch": 1.17, + "learning_rate": 0.0001251063335420203, + "loss": 0.0359, "step": 180650 }, { - "epoch": 1.95, - "learning_rate": 6.892076059445778e-06, - "loss": 0.0246, + "epoch": 1.17, + "learning_rate": 0.00012509665218766335, + "loss": 0.0342, "step": 180660 }, { - "epoch": 1.95, - "learning_rate": 6.875851774936725e-06, - "loss": 0.0234, + "epoch": 1.17, + "learning_rate": 0.00012508697083330643, + "loss": 0.03, "step": 180670 }, { - "epoch": 1.95, - "learning_rate": 6.859627490427672e-06, - "loss": 0.0248, + "epoch": 1.17, + "learning_rate": 0.0001250772894789495, + "loss": 0.0318, "step": 180680 }, { - "epoch": 1.95, - "learning_rate": 6.843403205918618e-06, - "loss": 0.0241, + "epoch": 1.17, + "learning_rate": 0.00012506760812459257, + "loss": 0.0311, "step": 180690 }, { - "epoch": 1.95, - "learning_rate": 6.8271789214095655e-06, - "loss": 0.0268, + "epoch": 1.17, + "learning_rate": 0.00012505792677023565, + "loss": 0.0315, "step": 180700 }, { - "epoch": 1.95, - "learning_rate": 6.810954636900512e-06, - "loss": 0.0223, + "epoch": 1.17, + "learning_rate": 0.0001250482454158787, + "loss": 0.0339, "step": 180710 }, { - "epoch": 1.95, - "learning_rate": 6.794730352391458e-06, - "loss": 0.0229, + "epoch": 1.17, + "learning_rate": 0.00012503856406152178, + "loss": 0.0346, "step": 180720 }, { - "epoch": 1.95, - "learning_rate": 6.7785060678824055e-06, - "loss": 0.0235, + "epoch": 1.17, + "learning_rate": 0.00012502888270716483, + "loss": 0.0356, "step": 180730 }, { - "epoch": 1.95, - "learning_rate": 6.762281783373352e-06, - "loss": 0.0223, + "epoch": 1.17, + "learning_rate": 0.0001250192013528079, + "loss": 0.0362, "step": 180740 }, { - "epoch": 1.96, - "learning_rate": 6.746057498864299e-06, - "loss": 0.0297, + "epoch": 1.17, + "learning_rate": 0.00012500951999845096, + "loss": 0.0355, "step": 180750 }, { - "epoch": 1.96, - "learning_rate": 6.729833214355247e-06, - "loss": 0.027, + "epoch": 1.17, + "learning_rate": 0.00012499983864409404, + "loss": 0.0292, "step": 180760 }, { - "epoch": 1.96, - "learning_rate": 6.713608929846194e-06, - "loss": 0.0196, + "epoch": 1.17, + "learning_rate": 0.00012499015728973712, + "loss": 0.0347, "step": 180770 }, { - "epoch": 1.96, - "learning_rate": 6.69738464533714e-06, - "loss": 0.0229, + "epoch": 1.17, + "learning_rate": 0.00012498047593538018, + "loss": 0.0355, "step": 180780 }, { - "epoch": 1.96, - "learning_rate": 6.681160360828087e-06, - "loss": 0.0242, + "epoch": 1.17, + "learning_rate": 0.00012497079458102323, + "loss": 0.0277, "step": 180790 }, { - "epoch": 1.96, - "learning_rate": 6.664936076319034e-06, - "loss": 0.0246, + "epoch": 1.17, + "learning_rate": 0.0001249611132266663, + "loss": 0.0342, "step": 180800 }, { - "epoch": 1.96, - "learning_rate": 6.648711791809981e-06, - "loss": 0.0226, + "epoch": 1.17, + "learning_rate": 0.00012495143187230936, + "loss": 0.0338, "step": 180810 }, { - "epoch": 1.96, - "learning_rate": 6.632487507300927e-06, - "loss": 0.0231, + "epoch": 1.17, + "learning_rate": 0.00012494175051795244, + "loss": 0.0288, "step": 180820 }, { - "epoch": 1.96, - "learning_rate": 6.6162632227918744e-06, - "loss": 0.02, + "epoch": 1.17, + "learning_rate": 0.00012493206916359552, + "loss": 0.0355, "step": 180830 }, { - "epoch": 1.96, - "learning_rate": 6.600038938282821e-06, - "loss": 0.0227, + "epoch": 1.17, + "learning_rate": 0.0001249223878092386, + "loss": 0.0318, "step": 180840 }, { - "epoch": 1.96, - "learning_rate": 6.583814653773768e-06, - "loss": 0.0244, + "epoch": 1.17, + "learning_rate": 0.00012491270645488165, + "loss": 0.0326, "step": 180850 }, { - "epoch": 1.96, - "learning_rate": 6.5675903692647144e-06, - "loss": 0.025, + "epoch": 1.17, + "learning_rate": 0.0001249030251005247, + "loss": 0.029, "step": 180860 }, { - "epoch": 1.96, - "learning_rate": 6.551366084755662e-06, - "loss": 0.0241, + "epoch": 1.17, + "learning_rate": 0.00012489334374616779, + "loss": 0.0317, "step": 180870 }, { - "epoch": 1.96, - "learning_rate": 6.535141800246608e-06, - "loss": 0.0194, + "epoch": 1.17, + "learning_rate": 0.00012488366239181084, + "loss": 0.0332, "step": 180880 }, { - "epoch": 1.96, - "learning_rate": 6.518917515737555e-06, - "loss": 0.0232, + "epoch": 1.17, + "learning_rate": 0.00012487398103745392, + "loss": 0.0326, "step": 180890 }, { - "epoch": 1.96, - "learning_rate": 6.502693231228502e-06, - "loss": 0.0201, + "epoch": 1.17, + "learning_rate": 0.000124864299683097, + "loss": 0.0311, "step": 180900 }, { - "epoch": 1.96, - "learning_rate": 6.48646894671945e-06, - "loss": 0.0273, + "epoch": 1.17, + "learning_rate": 0.00012485461832874005, + "loss": 0.0429, "step": 180910 }, { - "epoch": 1.96, - "learning_rate": 6.470244662210396e-06, - "loss": 0.0221, + "epoch": 1.17, + "learning_rate": 0.00012484493697438313, + "loss": 0.0318, "step": 180920 }, { - "epoch": 1.96, - "learning_rate": 6.454020377701343e-06, - "loss": 0.0248, + "epoch": 1.17, + "learning_rate": 0.00012483525562002618, + "loss": 0.0345, "step": 180930 }, { - "epoch": 1.96, - "learning_rate": 6.43779609319229e-06, - "loss": 0.0263, + "epoch": 1.17, + "learning_rate": 0.00012482557426566926, + "loss": 0.0316, "step": 180940 }, { - "epoch": 1.96, - "learning_rate": 6.421571808683237e-06, - "loss": 0.0213, + "epoch": 1.17, + "learning_rate": 0.00012481589291131232, + "loss": 0.0304, "step": 180950 }, { - "epoch": 1.96, - "learning_rate": 6.405347524174183e-06, - "loss": 0.0241, + "epoch": 1.17, + "learning_rate": 0.0001248062115569554, + "loss": 0.0357, "step": 180960 }, { - "epoch": 1.96, - "learning_rate": 6.389123239665131e-06, - "loss": 0.0219, + "epoch": 1.17, + "learning_rate": 0.00012479653020259848, + "loss": 0.0336, "step": 180970 }, { - "epoch": 1.96, - "learning_rate": 6.372898955156077e-06, - "loss": 0.0254, + "epoch": 1.17, + "learning_rate": 0.00012478684884824153, + "loss": 0.0355, "step": 180980 }, { - "epoch": 1.96, - "learning_rate": 6.356674670647024e-06, - "loss": 0.0262, + "epoch": 1.17, + "learning_rate": 0.00012477716749388458, + "loss": 0.0291, "step": 180990 }, { - "epoch": 1.96, - "learning_rate": 6.3404503861379706e-06, - "loss": 0.0197, + "epoch": 1.17, + "learning_rate": 0.00012476748613952766, + "loss": 0.029, "step": 181000 }, { - "epoch": 1.96, - "eval_cer": 0.9210739282009962, - "eval_loss": 0.020191214978694916, - "eval_runtime": 118.9516, - "eval_samples_per_second": 16.814, - "eval_steps_per_second": 4.203, + "epoch": 1.17, + "eval_cer": 0.9198345949610214, + "eval_loss": 0.02338983491063118, + "eval_runtime": 120.1574, + "eval_samples_per_second": 16.645, + "eval_steps_per_second": 4.161, "step": 181000 }, { - "epoch": 1.96, - "learning_rate": 6.324226101628917e-06, - "loss": 0.0202, + "epoch": 1.17, + "learning_rate": 0.00012475780478517074, + "loss": 0.0365, "step": 181010 }, { - "epoch": 1.96, - "learning_rate": 6.308001817119864e-06, - "loss": 0.0275, + "epoch": 1.17, + "learning_rate": 0.0001247481234308138, + "loss": 0.0356, "step": 181020 }, { - "epoch": 1.96, - "learning_rate": 6.2917775326108106e-06, - "loss": 0.0266, + "epoch": 1.17, + "learning_rate": 0.00012473844207645687, + "loss": 0.0287, "step": 181030 }, { - "epoch": 1.96, - "learning_rate": 6.275553248101758e-06, - "loss": 0.0229, + "epoch": 1.17, + "learning_rate": 0.00012472876072209995, + "loss": 0.0354, "step": 181040 }, { - "epoch": 1.96, - "learning_rate": 6.259328963592704e-06, - "loss": 0.0268, + "epoch": 1.17, + "learning_rate": 0.000124719079367743, + "loss": 0.0289, "step": 181050 }, { - "epoch": 1.96, - "learning_rate": 6.243104679083652e-06, - "loss": 0.0183, + "epoch": 1.17, + "learning_rate": 0.00012470939801338606, + "loss": 0.0305, "step": 181060 }, { - "epoch": 1.96, - "learning_rate": 6.2268803945745995e-06, - "loss": 0.0232, + "epoch": 1.17, + "learning_rate": 0.00012469971665902914, + "loss": 0.028, "step": 181070 }, { - "epoch": 1.96, - "learning_rate": 6.210656110065546e-06, - "loss": 0.0211, + "epoch": 1.17, + "learning_rate": 0.00012469003530467222, + "loss": 0.0341, "step": 181080 }, { - "epoch": 1.96, - "learning_rate": 6.194431825556492e-06, - "loss": 0.0296, + "epoch": 1.17, + "learning_rate": 0.00012468035395031527, + "loss": 0.028, "step": 181090 }, { - "epoch": 1.96, - "learning_rate": 6.1782075410474395e-06, - "loss": 0.0227, + "epoch": 1.17, + "learning_rate": 0.00012467067259595835, + "loss": 0.0359, "step": 181100 }, { - "epoch": 1.96, - "learning_rate": 6.161983256538386e-06, - "loss": 0.022, + "epoch": 1.17, + "learning_rate": 0.0001246609912416014, + "loss": 0.0402, "step": 181110 }, { - "epoch": 1.96, - "learning_rate": 6.145758972029333e-06, - "loss": 0.0262, + "epoch": 1.17, + "learning_rate": 0.00012465130988724448, + "loss": 0.0369, "step": 181120 }, { - "epoch": 1.96, - "learning_rate": 6.1295346875202795e-06, - "loss": 0.0248, + "epoch": 1.17, + "learning_rate": 0.00012464162853288754, + "loss": 0.0368, "step": 181130 }, { - "epoch": 1.96, - "learning_rate": 6.113310403011227e-06, - "loss": 0.0248, + "epoch": 1.17, + "learning_rate": 0.00012463194717853062, + "loss": 0.0335, "step": 181140 }, { - "epoch": 1.96, - "learning_rate": 6.097086118502173e-06, - "loss": 0.0191, + "epoch": 1.17, + "learning_rate": 0.0001246222658241737, + "loss": 0.0302, "step": 181150 }, { - "epoch": 1.96, - "learning_rate": 6.08086183399312e-06, - "loss": 0.0215, + "epoch": 1.17, + "learning_rate": 0.00012461258446981675, + "loss": 0.0292, "step": 181160 }, { - "epoch": 1.96, - "learning_rate": 6.064637549484067e-06, - "loss": 0.0223, + "epoch": 1.17, + "learning_rate": 0.00012460290311545983, + "loss": 0.0304, "step": 181170 }, { - "epoch": 1.96, - "learning_rate": 6.048413264975014e-06, - "loss": 0.0226, + "epoch": 1.17, + "learning_rate": 0.00012459322176110288, + "loss": 0.0323, "step": 181180 }, { - "epoch": 1.96, - "learning_rate": 6.03218898046596e-06, - "loss": 0.0231, + "epoch": 1.17, + "learning_rate": 0.00012458354040674596, + "loss": 0.0336, "step": 181190 }, { - "epoch": 1.96, - "learning_rate": 6.015964695956908e-06, - "loss": 0.0206, + "epoch": 1.17, + "learning_rate": 0.000124573859052389, + "loss": 0.0329, "step": 181200 }, { - "epoch": 1.96, - "learning_rate": 5.999740411447855e-06, - "loss": 0.0239, + "epoch": 1.17, + "learning_rate": 0.0001245641776980321, + "loss": 0.0334, "step": 181210 }, { - "epoch": 1.96, - "learning_rate": 5.983516126938802e-06, - "loss": 0.023, + "epoch": 1.17, + "learning_rate": 0.00012455449634367517, + "loss": 0.0368, "step": 181220 }, { - "epoch": 1.96, - "learning_rate": 5.967291842429748e-06, - "loss": 0.0267, + "epoch": 1.17, + "learning_rate": 0.00012454481498931822, + "loss": 0.0307, "step": 181230 }, { - "epoch": 1.96, - "learning_rate": 5.951067557920696e-06, - "loss": 0.0232, + "epoch": 1.17, + "learning_rate": 0.0001245351336349613, + "loss": 0.0275, "step": 181240 }, { - "epoch": 1.96, - "learning_rate": 5.934843273411642e-06, - "loss": 0.0257, + "epoch": 1.17, + "learning_rate": 0.00012452545228060436, + "loss": 0.0282, "step": 181250 }, { - "epoch": 1.96, - "learning_rate": 5.918618988902589e-06, - "loss": 0.0222, + "epoch": 1.17, + "learning_rate": 0.00012451577092624744, + "loss": 0.0459, "step": 181260 }, { - "epoch": 1.96, - "learning_rate": 5.902394704393536e-06, - "loss": 0.0251, + "epoch": 1.17, + "learning_rate": 0.0001245060895718905, + "loss": 0.0361, "step": 181270 }, { - "epoch": 1.96, - "learning_rate": 5.886170419884483e-06, - "loss": 0.0233, + "epoch": 1.17, + "learning_rate": 0.00012449640821753357, + "loss": 0.0338, "step": 181280 }, { - "epoch": 1.96, - "learning_rate": 5.869946135375429e-06, - "loss": 0.0194, + "epoch": 1.17, + "learning_rate": 0.00012448672686317665, + "loss": 0.0325, "step": 181290 }, { - "epoch": 1.96, - "learning_rate": 5.8537218508663765e-06, - "loss": 0.0211, + "epoch": 1.17, + "learning_rate": 0.0001244770455088197, + "loss": 0.0362, "step": 181300 }, { - "epoch": 1.96, - "learning_rate": 5.837497566357323e-06, - "loss": 0.0221, - "step": 181310 + "epoch": 1.17, + "learning_rate": 0.00012446736415446275, + "loss": 0.0313, + "step": 181310 }, { - "epoch": 1.96, - "learning_rate": 5.821273281848269e-06, - "loss": 0.0204, + "epoch": 1.17, + "learning_rate": 0.00012445768280010583, + "loss": 0.0316, "step": 181320 }, { - "epoch": 1.96, - "learning_rate": 5.8050489973392164e-06, - "loss": 0.0292, + "epoch": 1.17, + "learning_rate": 0.00012444800144574891, + "loss": 0.0294, "step": 181330 }, { - "epoch": 1.96, - "learning_rate": 5.788824712830163e-06, - "loss": 0.0244, + "epoch": 1.17, + "learning_rate": 0.00012443832009139197, + "loss": 0.0332, "step": 181340 }, { - "epoch": 1.96, - "learning_rate": 5.772600428321111e-06, - "loss": 0.0238, + "epoch": 1.17, + "learning_rate": 0.00012442863873703505, + "loss": 0.028, "step": 181350 }, { - "epoch": 1.96, - "learning_rate": 5.756376143812058e-06, - "loss": 0.0197, + "epoch": 1.17, + "learning_rate": 0.00012441895738267813, + "loss": 0.0326, "step": 181360 }, { - "epoch": 1.96, - "learning_rate": 5.7401518593030045e-06, - "loss": 0.0279, + "epoch": 1.17, + "learning_rate": 0.00012440927602832118, + "loss": 0.0445, "step": 181370 }, { - "epoch": 1.96, - "learning_rate": 5.723927574793952e-06, - "loss": 0.0205, + "epoch": 1.17, + "learning_rate": 0.00012439959467396423, + "loss": 0.0319, "step": 181380 }, { - "epoch": 1.96, - "learning_rate": 5.707703290284898e-06, - "loss": 0.0222, + "epoch": 1.17, + "learning_rate": 0.0001243899133196073, + "loss": 0.0336, "step": 181390 }, { - "epoch": 1.96, - "learning_rate": 5.6914790057758445e-06, - "loss": 0.0226, + "epoch": 1.17, + "learning_rate": 0.0001243802319652504, + "loss": 0.0356, "step": 181400 }, { - "epoch": 1.96, - "learning_rate": 5.675254721266792e-06, - "loss": 0.023, + "epoch": 1.17, + "learning_rate": 0.00012437055061089344, + "loss": 0.0308, "step": 181410 }, { - "epoch": 1.96, - "learning_rate": 5.659030436757738e-06, - "loss": 0.0234, + "epoch": 1.17, + "learning_rate": 0.00012436086925653652, + "loss": 0.0335, "step": 181420 }, { - "epoch": 1.96, - "learning_rate": 5.642806152248685e-06, - "loss": 0.0281, + "epoch": 1.17, + "learning_rate": 0.00012435118790217958, + "loss": 0.0306, "step": 181430 }, { - "epoch": 1.96, - "learning_rate": 5.626581867739632e-06, - "loss": 0.0247, + "epoch": 1.17, + "learning_rate": 0.00012434150654782266, + "loss": 0.0259, "step": 181440 }, { - "epoch": 1.96, - "learning_rate": 5.610357583230579e-06, - "loss": 0.0224, + "epoch": 1.17, + "learning_rate": 0.0001243318251934657, + "loss": 0.0335, "step": 181450 }, { - "epoch": 1.96, - "learning_rate": 5.594133298721525e-06, - "loss": 0.0222, + "epoch": 1.17, + "learning_rate": 0.0001243221438391088, + "loss": 0.0293, "step": 181460 }, { - "epoch": 1.96, - "learning_rate": 5.577909014212473e-06, - "loss": 0.0234, + "epoch": 1.17, + "learning_rate": 0.00012431246248475187, + "loss": 0.0404, "step": 181470 }, { - "epoch": 1.96, - "learning_rate": 5.561684729703419e-06, - "loss": 0.0207, + "epoch": 1.17, + "learning_rate": 0.00012430278113039492, + "loss": 0.0277, "step": 181480 }, { - "epoch": 1.96, - "learning_rate": 5.545460445194366e-06, - "loss": 0.0258, + "epoch": 1.17, + "learning_rate": 0.000124293099776038, + "loss": 0.0286, "step": 181490 }, { - "epoch": 1.96, - "learning_rate": 5.529236160685313e-06, - "loss": 0.0243, + "epoch": 1.17, + "learning_rate": 0.00012428341842168105, + "loss": 0.0431, "step": 181500 }, { - "epoch": 1.96, - "learning_rate": 5.513011876176261e-06, - "loss": 0.0247, + "epoch": 1.17, + "learning_rate": 0.0001242737370673241, + "loss": 0.0359, "step": 181510 }, { - "epoch": 1.96, - "learning_rate": 5.496787591667207e-06, - "loss": 0.0225, + "epoch": 1.17, + "learning_rate": 0.0001242640557129672, + "loss": 0.0404, "step": 181520 }, { - "epoch": 1.96, - "learning_rate": 5.480563307158154e-06, - "loss": 0.0252, + "epoch": 1.17, + "learning_rate": 0.00012425437435861027, + "loss": 0.0326, "step": 181530 }, { - "epoch": 1.96, - "learning_rate": 5.464339022649101e-06, - "loss": 0.0222, + "epoch": 1.17, + "learning_rate": 0.00012424469300425335, + "loss": 0.0338, "step": 181540 }, { - "epoch": 1.96, - "learning_rate": 5.448114738140048e-06, - "loss": 0.0176, + "epoch": 1.17, + "learning_rate": 0.0001242350116498964, + "loss": 0.0398, "step": 181550 }, { - "epoch": 1.96, - "learning_rate": 5.431890453630994e-06, - "loss": 0.0215, + "epoch": 1.17, + "learning_rate": 0.00012422533029553948, + "loss": 0.0346, "step": 181560 }, { - "epoch": 1.96, - "learning_rate": 5.4156661691219415e-06, - "loss": 0.0243, + "epoch": 1.17, + "learning_rate": 0.00012421564894118253, + "loss": 0.0343, "step": 181570 }, { - "epoch": 1.96, - "learning_rate": 5.399441884612888e-06, - "loss": 0.0185, + "epoch": 1.17, + "learning_rate": 0.00012420596758682558, + "loss": 0.0318, "step": 181580 }, { - "epoch": 1.96, - "learning_rate": 5.383217600103835e-06, - "loss": 0.0259, + "epoch": 1.17, + "learning_rate": 0.00012419628623246866, + "loss": 0.0314, "step": 181590 }, { - "epoch": 1.96, - "learning_rate": 5.3669933155947815e-06, - "loss": 0.0296, + "epoch": 1.17, + "learning_rate": 0.00012418660487811174, + "loss": 0.0319, "step": 181600 }, { - "epoch": 1.96, - "learning_rate": 5.350769031085729e-06, - "loss": 0.0239, + "epoch": 1.17, + "learning_rate": 0.00012417692352375482, + "loss": 0.0342, "step": 181610 }, { - "epoch": 1.96, - "learning_rate": 5.334544746576675e-06, - "loss": 0.0254, + "epoch": 1.17, + "learning_rate": 0.00012416724216939788, + "loss": 0.0326, "step": 181620 }, { - "epoch": 1.96, - "learning_rate": 5.3183204620676215e-06, - "loss": 0.0263, + "epoch": 1.17, + "learning_rate": 0.00012415756081504093, + "loss": 0.0354, "step": 181630 }, { - "epoch": 1.96, - "learning_rate": 5.3020961775585696e-06, - "loss": 0.023, + "epoch": 1.17, + "learning_rate": 0.000124147879460684, + "loss": 0.0375, "step": 181640 }, { - "epoch": 1.96, - "learning_rate": 5.285871893049517e-06, - "loss": 0.0199, + "epoch": 1.17, + "learning_rate": 0.00012413819810632706, + "loss": 0.0311, "step": 181650 }, { - "epoch": 1.96, - "learning_rate": 5.269647608540463e-06, - "loss": 0.0216, + "epoch": 1.17, + "learning_rate": 0.00012412851675197014, + "loss": 0.0352, "step": 181660 }, { - "epoch": 1.96, - "learning_rate": 5.25342332403141e-06, - "loss": 0.0204, + "epoch": 1.17, + "learning_rate": 0.00012411883539761322, + "loss": 0.0304, "step": 181670 }, { - "epoch": 1.97, - "learning_rate": 5.237199039522357e-06, - "loss": 0.0242, + "epoch": 1.17, + "learning_rate": 0.00012410915404325627, + "loss": 0.0291, "step": 181680 }, { - "epoch": 1.97, - "learning_rate": 5.220974755013304e-06, - "loss": 0.0214, + "epoch": 1.17, + "learning_rate": 0.00012409947268889935, + "loss": 0.0294, "step": 181690 }, { - "epoch": 1.97, - "learning_rate": 5.20475047050425e-06, - "loss": 0.0204, + "epoch": 1.17, + "learning_rate": 0.0001240897913345424, + "loss": 0.0349, "step": 181700 }, { - "epoch": 1.97, - "learning_rate": 5.188526185995197e-06, - "loss": 0.0258, + "epoch": 1.17, + "learning_rate": 0.00012408010998018549, + "loss": 0.0331, "step": 181710 }, { - "epoch": 1.97, - "learning_rate": 5.172301901486144e-06, - "loss": 0.0249, + "epoch": 1.17, + "learning_rate": 0.00012407042862582854, + "loss": 0.0323, "step": 181720 }, { - "epoch": 1.97, - "learning_rate": 5.15607761697709e-06, - "loss": 0.0264, + "epoch": 1.17, + "learning_rate": 0.00012406074727147162, + "loss": 0.0359, "step": 181730 }, { - "epoch": 1.97, - "learning_rate": 5.139853332468038e-06, - "loss": 0.0296, + "epoch": 1.17, + "learning_rate": 0.0001240510659171147, + "loss": 0.03, "step": 181740 }, { - "epoch": 1.97, - "learning_rate": 5.123629047958984e-06, - "loss": 0.0217, + "epoch": 1.17, + "learning_rate": 0.00012404138456275775, + "loss": 0.0302, "step": 181750 }, { - "epoch": 1.97, - "learning_rate": 5.107404763449931e-06, - "loss": 0.0251, + "epoch": 1.17, + "learning_rate": 0.00012403170320840083, + "loss": 0.0325, "step": 181760 }, { - "epoch": 1.97, - "learning_rate": 5.091180478940878e-06, - "loss": 0.0208, + "epoch": 1.17, + "learning_rate": 0.00012402202185404388, + "loss": 0.0326, "step": 181770 }, { - "epoch": 1.97, - "learning_rate": 5.074956194431825e-06, - "loss": 0.0245, + "epoch": 1.17, + "learning_rate": 0.00012401234049968696, + "loss": 0.0332, "step": 181780 }, { - "epoch": 1.97, - "learning_rate": 5.058731909922772e-06, - "loss": 0.0254, + "epoch": 1.17, + "learning_rate": 0.00012400265914533002, + "loss": 0.0308, "step": 181790 }, { - "epoch": 1.97, - "learning_rate": 5.042507625413719e-06, - "loss": 0.0262, + "epoch": 1.17, + "learning_rate": 0.0001239929777909731, + "loss": 0.0327, "step": 181800 }, { - "epoch": 1.97, - "learning_rate": 5.026283340904666e-06, - "loss": 0.0231, + "epoch": 1.17, + "learning_rate": 0.00012398329643661618, + "loss": 0.0322, "step": 181810 }, { - "epoch": 1.97, - "learning_rate": 5.010059056395613e-06, - "loss": 0.0247, + "epoch": 1.17, + "learning_rate": 0.00012397361508225923, + "loss": 0.032, "step": 181820 }, { - "epoch": 1.97, - "learning_rate": 4.993834771886559e-06, - "loss": 0.0215, + "epoch": 1.17, + "learning_rate": 0.00012396393372790228, + "loss": 0.0289, "step": 181830 }, { - "epoch": 1.97, - "learning_rate": 4.9776104873775065e-06, - "loss": 0.025, + "epoch": 1.17, + "learning_rate": 0.00012395425237354536, + "loss": 0.0296, "step": 181840 }, { - "epoch": 1.97, - "learning_rate": 4.961386202868453e-06, - "loss": 0.0264, + "epoch": 1.17, + "learning_rate": 0.00012394457101918844, + "loss": 0.043, "step": 181850 }, { - "epoch": 1.97, - "learning_rate": 4.9451619183594e-06, - "loss": 0.0221, + "epoch": 1.17, + "learning_rate": 0.0001239348896648315, + "loss": 0.0327, "step": 181860 }, { - "epoch": 1.97, - "learning_rate": 4.9289376338503465e-06, - "loss": 0.0223, + "epoch": 1.17, + "learning_rate": 0.00012392520831047457, + "loss": 0.0313, "step": 181870 }, { - "epoch": 1.97, - "learning_rate": 4.912713349341294e-06, - "loss": 0.0249, + "epoch": 1.17, + "learning_rate": 0.00012391552695611763, + "loss": 0.0386, "step": 181880 }, { - "epoch": 1.97, - "learning_rate": 4.89648906483224e-06, - "loss": 0.0301, + "epoch": 1.17, + "learning_rate": 0.0001239058456017607, + "loss": 0.0358, "step": 181890 }, { - "epoch": 1.97, - "learning_rate": 4.880264780323187e-06, - "loss": 0.0257, + "epoch": 1.17, + "learning_rate": 0.00012389616424740376, + "loss": 0.0313, "step": 181900 }, { - "epoch": 1.97, - "learning_rate": 4.864040495814134e-06, - "loss": 0.0236, + "epoch": 1.17, + "learning_rate": 0.00012388648289304684, + "loss": 0.0317, "step": 181910 }, { - "epoch": 1.97, - "learning_rate": 4.847816211305081e-06, - "loss": 0.026, + "epoch": 1.17, + "learning_rate": 0.00012387680153868992, + "loss": 0.0347, "step": 181920 }, { - "epoch": 1.97, - "learning_rate": 4.831591926796027e-06, - "loss": 0.0227, + "epoch": 1.17, + "learning_rate": 0.00012386712018433297, + "loss": 0.0327, "step": 181930 }, { - "epoch": 1.97, - "learning_rate": 4.8153676422869754e-06, - "loss": 0.0175, + "epoch": 1.17, + "learning_rate": 0.00012385743882997605, + "loss": 0.0405, "step": 181940 }, { - "epoch": 1.97, - "learning_rate": 4.799143357777922e-06, - "loss": 0.0273, + "epoch": 1.17, + "learning_rate": 0.0001238477574756191, + "loss": 0.0301, "step": 181950 }, { - "epoch": 1.97, - "learning_rate": 4.782919073268869e-06, - "loss": 0.023, + "epoch": 1.17, + "learning_rate": 0.00012383807612126218, + "loss": 0.028, "step": 181960 }, { - "epoch": 1.97, - "learning_rate": 4.766694788759815e-06, - "loss": 0.0286, + "epoch": 1.17, + "learning_rate": 0.00012382839476690524, + "loss": 0.0276, "step": 181970 }, { - "epoch": 1.97, - "learning_rate": 4.750470504250763e-06, - "loss": 0.0312, + "epoch": 1.17, + "learning_rate": 0.00012381871341254831, + "loss": 0.0332, "step": 181980 }, { - "epoch": 1.97, - "learning_rate": 4.734246219741709e-06, - "loss": 0.0271, + "epoch": 1.17, + "learning_rate": 0.0001238090320581914, + "loss": 0.0268, "step": 181990 }, { - "epoch": 1.97, - "learning_rate": 4.718021935232656e-06, - "loss": 0.0231, + "epoch": 1.17, + "learning_rate": 0.00012379935070383445, + "loss": 0.0305, "step": 182000 }, { - "epoch": 1.97, - "eval_cer": 0.9210650933577882, - "eval_loss": 0.020048491656780243, - "eval_runtime": 119.2292, - "eval_samples_per_second": 16.774, - "eval_steps_per_second": 4.194, + "epoch": 1.17, + "eval_cer": 0.9198861145633261, + "eval_loss": 0.0231363195925951, + "eval_runtime": 120.0639, + "eval_samples_per_second": 16.658, + "eval_steps_per_second": 4.164, "step": 182000 }, { - "epoch": 1.97, - "learning_rate": 4.701797650723603e-06, - "loss": 0.0271, + "epoch": 1.17, + "learning_rate": 0.00012378966934947753, + "loss": 0.0339, "step": 182010 }, { - "epoch": 1.97, - "learning_rate": 4.685573366214549e-06, - "loss": 0.0244, + "epoch": 1.17, + "learning_rate": 0.00012377998799512058, + "loss": 0.033, "step": 182020 }, { - "epoch": 1.97, - "learning_rate": 4.669349081705496e-06, - "loss": 0.0251, + "epoch": 1.17, + "learning_rate": 0.00012377030664076366, + "loss": 0.0328, "step": 182030 }, { - "epoch": 1.97, - "learning_rate": 4.653124797196443e-06, - "loss": 0.0276, + "epoch": 1.17, + "learning_rate": 0.0001237606252864067, + "loss": 0.0302, "step": 182040 }, { - "epoch": 1.97, - "learning_rate": 4.63690051268739e-06, - "loss": 0.0285, + "epoch": 1.17, + "learning_rate": 0.0001237509439320498, + "loss": 0.0301, "step": 182050 }, { - "epoch": 1.97, - "learning_rate": 4.620676228178337e-06, - "loss": 0.0233, + "epoch": 1.18, + "learning_rate": 0.00012374126257769287, + "loss": 0.033, "step": 182060 }, { - "epoch": 1.97, - "learning_rate": 4.6044519436692835e-06, - "loss": 0.0245, + "epoch": 1.18, + "learning_rate": 0.00012373158122333592, + "loss": 0.0315, "step": 182070 }, { - "epoch": 1.97, - "learning_rate": 4.588227659160231e-06, - "loss": 0.0278, + "epoch": 1.18, + "learning_rate": 0.000123721899868979, + "loss": 0.0368, "step": 182080 }, { - "epoch": 1.97, - "learning_rate": 4.572003374651177e-06, - "loss": 0.0237, + "epoch": 1.18, + "learning_rate": 0.00012371221851462206, + "loss": 0.0333, "step": 182090 }, { - "epoch": 1.97, - "learning_rate": 4.555779090142124e-06, - "loss": 0.0248, + "epoch": 1.18, + "learning_rate": 0.00012370253716026514, + "loss": 0.0337, "step": 182100 }, { - "epoch": 1.97, - "learning_rate": 4.539554805633071e-06, - "loss": 0.0228, + "epoch": 1.18, + "learning_rate": 0.0001236928558059082, + "loss": 0.0315, "step": 182110 }, { - "epoch": 1.97, - "learning_rate": 4.523330521124018e-06, - "loss": 0.0234, + "epoch": 1.18, + "learning_rate": 0.00012368317445155127, + "loss": 0.0301, "step": 182120 }, { - "epoch": 1.97, - "learning_rate": 4.507106236614965e-06, - "loss": 0.0237, + "epoch": 1.18, + "learning_rate": 0.00012367349309719435, + "loss": 0.0307, "step": 182130 }, { - "epoch": 1.97, - "learning_rate": 4.4908819521059115e-06, - "loss": 0.0259, + "epoch": 1.18, + "learning_rate": 0.0001236638117428374, + "loss": 0.0319, "step": 182140 }, { - "epoch": 1.97, - "learning_rate": 4.474657667596859e-06, - "loss": 0.0272, + "epoch": 1.18, + "learning_rate": 0.00012365413038848045, + "loss": 0.0291, "step": 182150 }, { - "epoch": 1.97, - "learning_rate": 4.458433383087805e-06, - "loss": 0.0246, + "epoch": 1.18, + "learning_rate": 0.00012364444903412353, + "loss": 0.0308, "step": 182160 }, { - "epoch": 1.97, - "learning_rate": 4.442209098578752e-06, - "loss": 0.0219, + "epoch": 1.18, + "learning_rate": 0.00012363476767976661, + "loss": 0.0283, "step": 182170 }, { - "epoch": 1.97, - "learning_rate": 4.425984814069699e-06, - "loss": 0.0249, + "epoch": 1.18, + "learning_rate": 0.00012362508632540967, + "loss": 0.0339, "step": 182180 }, { - "epoch": 1.97, - "learning_rate": 4.409760529560646e-06, - "loss": 0.0204, + "epoch": 1.18, + "learning_rate": 0.00012361540497105275, + "loss": 0.0286, "step": 182190 }, { - "epoch": 1.97, - "learning_rate": 4.393536245051593e-06, - "loss": 0.0212, + "epoch": 1.18, + "learning_rate": 0.0001236057236166958, + "loss": 0.0293, "step": 182200 }, { - "epoch": 1.97, - "learning_rate": 4.37731196054254e-06, - "loss": 0.0205, + "epoch": 1.18, + "learning_rate": 0.00012359604226233888, + "loss": 0.0306, "step": 182210 }, { - "epoch": 1.97, - "learning_rate": 4.361087676033487e-06, - "loss": 0.0193, + "epoch": 1.18, + "learning_rate": 0.00012358636090798193, + "loss": 0.0314, "step": 182220 }, { - "epoch": 1.97, - "learning_rate": 4.344863391524433e-06, - "loss": 0.0235, + "epoch": 1.18, + "learning_rate": 0.000123576679553625, + "loss": 0.0319, "step": 182230 }, { - "epoch": 1.97, - "learning_rate": 4.3286391070153805e-06, - "loss": 0.0235, + "epoch": 1.18, + "learning_rate": 0.0001235669981992681, + "loss": 0.0409, "step": 182240 }, { - "epoch": 1.97, - "learning_rate": 4.312414822506327e-06, - "loss": 0.024, + "epoch": 1.18, + "learning_rate": 0.00012355731684491114, + "loss": 0.0335, "step": 182250 }, { - "epoch": 1.97, - "learning_rate": 4.296190537997274e-06, - "loss": 0.0232, + "epoch": 1.18, + "learning_rate": 0.00012354763549055422, + "loss": 0.0414, "step": 182260 }, { - "epoch": 1.97, - "learning_rate": 4.279966253488221e-06, - "loss": 0.0244, + "epoch": 1.18, + "learning_rate": 0.00012353795413619728, + "loss": 0.0286, "step": 182270 }, { - "epoch": 1.97, - "learning_rate": 4.263741968979168e-06, - "loss": 0.0209, + "epoch": 1.18, + "learning_rate": 0.00012352827278184036, + "loss": 0.0279, "step": 182280 }, { - "epoch": 1.97, - "learning_rate": 4.247517684470115e-06, - "loss": 0.0227, + "epoch": 1.18, + "learning_rate": 0.0001235185914274834, + "loss": 0.0348, "step": 182290 }, { - "epoch": 1.97, - "learning_rate": 4.231293399961061e-06, - "loss": 0.0224, + "epoch": 1.18, + "learning_rate": 0.0001235089100731265, + "loss": 0.0302, "step": 182300 }, { - "epoch": 1.97, - "learning_rate": 4.2150691154520085e-06, - "loss": 0.0283, + "epoch": 1.18, + "learning_rate": 0.00012349922871876957, + "loss": 0.0289, "step": 182310 }, { - "epoch": 1.97, - "learning_rate": 4.198844830942955e-06, - "loss": 0.0227, + "epoch": 1.18, + "learning_rate": 0.00012348954736441262, + "loss": 0.0292, "step": 182320 }, { - "epoch": 1.97, - "learning_rate": 4.182620546433901e-06, - "loss": 0.0291, + "epoch": 1.18, + "learning_rate": 0.0001234798660100557, + "loss": 0.0348, "step": 182330 }, { - "epoch": 1.97, - "learning_rate": 4.166396261924849e-06, - "loss": 0.0246, + "epoch": 1.18, + "learning_rate": 0.00012347018465569875, + "loss": 0.034, "step": 182340 }, { - "epoch": 1.97, - "learning_rate": 4.150171977415796e-06, - "loss": 0.0203, + "epoch": 1.18, + "learning_rate": 0.0001234605033013418, + "loss": 0.0262, "step": 182350 }, { - "epoch": 1.97, - "learning_rate": 4.133947692906742e-06, - "loss": 0.0218, + "epoch": 1.18, + "learning_rate": 0.00012345082194698489, + "loss": 0.0263, "step": 182360 }, { - "epoch": 1.97, - "learning_rate": 4.117723408397689e-06, - "loss": 0.0219, + "epoch": 1.18, + "learning_rate": 0.00012344114059262797, + "loss": 0.0368, "step": 182370 }, { - "epoch": 1.97, - "learning_rate": 4.101499123888636e-06, - "loss": 0.0216, + "epoch": 1.18, + "learning_rate": 0.00012343145923827105, + "loss": 0.0377, "step": 182380 }, { - "epoch": 1.97, - "learning_rate": 4.085274839379583e-06, - "loss": 0.0227, + "epoch": 1.18, + "learning_rate": 0.0001234217778839141, + "loss": 0.0289, "step": 182390 }, { - "epoch": 1.97, - "learning_rate": 4.069050554870529e-06, - "loss": 0.0212, + "epoch": 1.18, + "learning_rate": 0.00012341209652955715, + "loss": 0.0343, "step": 182400 }, { - "epoch": 1.97, - "learning_rate": 4.052826270361477e-06, - "loss": 0.0219, + "epoch": 1.18, + "learning_rate": 0.00012340241517520023, + "loss": 0.036, "step": 182410 }, { - "epoch": 1.97, - "learning_rate": 4.036601985852424e-06, - "loss": 0.0206, + "epoch": 1.18, + "learning_rate": 0.00012339273382084328, + "loss": 0.0291, "step": 182420 }, { - "epoch": 1.97, - "learning_rate": 4.02037770134337e-06, - "loss": 0.0245, + "epoch": 1.18, + "learning_rate": 0.00012338305246648636, + "loss": 0.0292, "step": 182430 }, { - "epoch": 1.97, - "learning_rate": 4.004153416834317e-06, - "loss": 0.021, + "epoch": 1.18, + "learning_rate": 0.00012337337111212944, + "loss": 0.0343, "step": 182440 }, { - "epoch": 1.97, - "learning_rate": 3.987929132325264e-06, - "loss": 0.0228, + "epoch": 1.18, + "learning_rate": 0.00012336368975777252, + "loss": 0.0324, "step": 182450 }, { - "epoch": 1.97, - "learning_rate": 3.971704847816211e-06, - "loss": 0.0266, + "epoch": 1.18, + "learning_rate": 0.00012335400840341558, + "loss": 0.0286, "step": 182460 }, { - "epoch": 1.97, - "learning_rate": 3.955480563307157e-06, - "loss": 0.0243, + "epoch": 1.18, + "learning_rate": 0.00012334432704905863, + "loss": 0.0339, "step": 182470 }, { - "epoch": 1.97, - "learning_rate": 3.939256278798105e-06, - "loss": 0.0225, + "epoch": 1.18, + "learning_rate": 0.0001233346456947017, + "loss": 0.0302, "step": 182480 }, { - "epoch": 1.97, - "learning_rate": 3.923031994289052e-06, - "loss": 0.026, + "epoch": 1.18, + "learning_rate": 0.00012332496434034476, + "loss": 0.0371, "step": 182490 }, { - "epoch": 1.97, - "learning_rate": 3.906807709779998e-06, - "loss": 0.0219, + "epoch": 1.18, + "learning_rate": 0.00012331528298598784, + "loss": 0.0391, "step": 182500 }, { - "epoch": 1.97, - "learning_rate": 3.8905834252709455e-06, - "loss": 0.0221, + "epoch": 1.18, + "learning_rate": 0.00012330560163163092, + "loss": 0.0336, "step": 182510 }, { - "epoch": 1.97, - "learning_rate": 3.874359140761892e-06, - "loss": 0.0268, + "epoch": 1.18, + "learning_rate": 0.00012329592027727397, + "loss": 0.0301, "step": 182520 }, { - "epoch": 1.97, - "learning_rate": 3.858134856252839e-06, - "loss": 0.0222, + "epoch": 1.18, + "learning_rate": 0.00012328623892291705, + "loss": 0.0311, "step": 182530 }, { - "epoch": 1.97, - "learning_rate": 3.8419105717437855e-06, - "loss": 0.0268, + "epoch": 1.18, + "learning_rate": 0.0001232765575685601, + "loss": 0.0273, "step": 182540 }, { - "epoch": 1.97, - "learning_rate": 3.825686287234733e-06, - "loss": 0.0234, + "epoch": 1.18, + "learning_rate": 0.00012326687621420319, + "loss": 0.032, "step": 182550 }, { - "epoch": 1.97, - "learning_rate": 3.8094620027256795e-06, - "loss": 0.0247, + "epoch": 1.18, + "learning_rate": 0.00012325719485984624, + "loss": 0.0364, "step": 182560 }, { - "epoch": 1.97, - "learning_rate": 3.7932377182166263e-06, - "loss": 0.022, + "epoch": 1.18, + "learning_rate": 0.00012324751350548932, + "loss": 0.032, "step": 182570 }, { - "epoch": 1.97, - "learning_rate": 3.777013433707573e-06, - "loss": 0.0223, - "step": 182580 + "epoch": 1.18, + "learning_rate": 0.0001232378321511324, + "loss": 0.0307, + "step": 182580 }, { - "epoch": 1.97, - "learning_rate": 3.76078914919852e-06, - "loss": 0.0217, + "epoch": 1.18, + "learning_rate": 0.00012322815079677545, + "loss": 0.0315, "step": 182590 }, { - "epoch": 1.98, - "learning_rate": 3.7445648646894667e-06, - "loss": 0.0203, + "epoch": 1.18, + "learning_rate": 0.0001232184694424185, + "loss": 0.0304, "step": 182600 }, { - "epoch": 1.98, - "learning_rate": 3.7283405801804135e-06, - "loss": 0.0213, + "epoch": 1.18, + "learning_rate": 0.00012320878808806158, + "loss": 0.0328, "step": 182610 }, { - "epoch": 1.98, - "learning_rate": 3.7121162956713604e-06, - "loss": 0.0204, + "epoch": 1.18, + "learning_rate": 0.00012319910673370466, + "loss": 0.0389, "step": 182620 }, { - "epoch": 1.98, - "learning_rate": 3.6958920111623076e-06, - "loss": 0.0264, + "epoch": 1.18, + "learning_rate": 0.00012318942537934772, + "loss": 0.0304, "step": 182630 }, { - "epoch": 1.98, - "learning_rate": 3.6796677266532544e-06, - "loss": 0.0207, + "epoch": 1.18, + "learning_rate": 0.0001231797440249908, + "loss": 0.0317, "step": 182640 }, { - "epoch": 1.98, - "learning_rate": 3.663443442144201e-06, - "loss": 0.0229, + "epoch": 1.18, + "learning_rate": 0.00012317006267063387, + "loss": 0.0329, "step": 182650 }, { - "epoch": 1.98, - "learning_rate": 3.647219157635148e-06, - "loss": 0.0256, + "epoch": 1.18, + "learning_rate": 0.00012316038131627693, + "loss": 0.033, "step": 182660 }, { - "epoch": 1.98, - "learning_rate": 3.630994873126095e-06, - "loss": 0.0257, + "epoch": 1.18, + "learning_rate": 0.00012315069996191998, + "loss": 0.0375, "step": 182670 }, { - "epoch": 1.98, - "learning_rate": 3.6147705886170416e-06, - "loss": 0.0244, + "epoch": 1.18, + "learning_rate": 0.00012314101860756306, + "loss": 0.036, "step": 182680 }, { - "epoch": 1.98, - "learning_rate": 3.5985463041079884e-06, - "loss": 0.0239, + "epoch": 1.18, + "learning_rate": 0.00012313133725320614, + "loss": 0.0351, "step": 182690 }, { - "epoch": 1.98, - "learning_rate": 3.5823220195989352e-06, - "loss": 0.0222, + "epoch": 1.18, + "learning_rate": 0.0001231216558988492, + "loss": 0.0379, "step": 182700 }, { - "epoch": 1.98, - "learning_rate": 3.5660977350898825e-06, - "loss": 0.0307, + "epoch": 1.18, + "learning_rate": 0.00012311197454449227, + "loss": 0.0362, "step": 182710 }, { - "epoch": 1.98, - "learning_rate": 3.5498734505808293e-06, - "loss": 0.025, + "epoch": 1.18, + "learning_rate": 0.00012310229319013533, + "loss": 0.0295, "step": 182720 }, { - "epoch": 1.98, - "learning_rate": 3.533649166071776e-06, - "loss": 0.0239, + "epoch": 1.18, + "learning_rate": 0.0001230926118357784, + "loss": 0.031, "step": 182730 }, { - "epoch": 1.98, - "learning_rate": 3.517424881562723e-06, - "loss": 0.0232, + "epoch": 1.18, + "learning_rate": 0.00012308293048142146, + "loss": 0.0327, "step": 182740 }, { - "epoch": 1.98, - "learning_rate": 3.5012005970536697e-06, - "loss": 0.0208, + "epoch": 1.18, + "learning_rate": 0.00012307324912706454, + "loss": 0.0357, "step": 182750 }, { - "epoch": 1.98, - "learning_rate": 3.4849763125446165e-06, - "loss": 0.0204, + "epoch": 1.18, + "learning_rate": 0.00012306356777270762, + "loss": 0.0357, "step": 182760 }, { - "epoch": 1.98, - "learning_rate": 3.4687520280355633e-06, - "loss": 0.023, + "epoch": 1.18, + "learning_rate": 0.00012305388641835067, + "loss": 0.0283, "step": 182770 }, { - "epoch": 1.98, - "learning_rate": 3.4525277435265105e-06, - "loss": 0.0261, + "epoch": 1.18, + "learning_rate": 0.00012304420506399375, + "loss": 0.0405, "step": 182780 }, { - "epoch": 1.98, - "learning_rate": 3.4363034590174573e-06, - "loss": 0.0267, + "epoch": 1.18, + "learning_rate": 0.0001230345237096368, + "loss": 0.0323, "step": 182790 }, { - "epoch": 1.98, - "learning_rate": 3.420079174508404e-06, - "loss": 0.0193, + "epoch": 1.18, + "learning_rate": 0.00012302484235527988, + "loss": 0.0311, "step": 182800 }, { - "epoch": 1.98, - "learning_rate": 3.403854889999351e-06, - "loss": 0.0239, + "epoch": 1.18, + "learning_rate": 0.00012301516100092293, + "loss": 0.0302, "step": 182810 }, { - "epoch": 1.98, - "learning_rate": 3.3876306054902973e-06, - "loss": 0.0272, + "epoch": 1.18, + "learning_rate": 0.00012300547964656601, + "loss": 0.0381, "step": 182820 }, { - "epoch": 1.98, - "learning_rate": 3.371406320981244e-06, - "loss": 0.024, + "epoch": 1.18, + "learning_rate": 0.0001229957982922091, + "loss": 0.0282, "step": 182830 }, { - "epoch": 1.98, - "learning_rate": 3.355182036472191e-06, - "loss": 0.0262, + "epoch": 1.18, + "learning_rate": 0.00012298611693785215, + "loss": 0.0353, "step": 182840 }, { - "epoch": 1.98, - "learning_rate": 3.338957751963138e-06, - "loss": 0.0226, + "epoch": 1.18, + "learning_rate": 0.00012297643558349523, + "loss": 0.0373, "step": 182850 }, { - "epoch": 1.98, - "learning_rate": 3.322733467454085e-06, - "loss": 0.0229, + "epoch": 1.18, + "learning_rate": 0.00012296675422913828, + "loss": 0.0317, "step": 182860 }, { - "epoch": 1.98, - "learning_rate": 3.3065091829450318e-06, - "loss": 0.0232, + "epoch": 1.18, + "learning_rate": 0.00012295707287478136, + "loss": 0.0343, "step": 182870 }, { - "epoch": 1.98, - "learning_rate": 3.2902848984359786e-06, - "loss": 0.0224, + "epoch": 1.18, + "learning_rate": 0.0001229473915204244, + "loss": 0.0267, "step": 182880 }, { - "epoch": 1.98, - "learning_rate": 3.2740606139269254e-06, - "loss": 0.0212, + "epoch": 1.18, + "learning_rate": 0.0001229377101660675, + "loss": 0.0396, "step": 182890 }, { - "epoch": 1.98, - "learning_rate": 3.257836329417872e-06, - "loss": 0.0221, + "epoch": 1.18, + "learning_rate": 0.00012292802881171057, + "loss": 0.0345, "step": 182900 }, { - "epoch": 1.98, - "learning_rate": 3.241612044908819e-06, - "loss": 0.0216, + "epoch": 1.18, + "learning_rate": 0.00012291834745735362, + "loss": 0.0337, "step": 182910 }, { - "epoch": 1.98, - "learning_rate": 3.225387760399766e-06, - "loss": 0.0274, + "epoch": 1.18, + "learning_rate": 0.00012290866610299668, + "loss": 0.0292, "step": 182920 }, { - "epoch": 1.98, - "learning_rate": 3.209163475890713e-06, - "loss": 0.0216, + "epoch": 1.18, + "learning_rate": 0.00012289898474863976, + "loss": 0.0362, "step": 182930 }, { - "epoch": 1.98, - "learning_rate": 3.19293919138166e-06, - "loss": 0.0254, + "epoch": 1.18, + "learning_rate": 0.00012288930339428284, + "loss": 0.0334, "step": 182940 }, { - "epoch": 1.98, - "learning_rate": 3.1767149068726066e-06, - "loss": 0.0241, + "epoch": 1.18, + "learning_rate": 0.0001228796220399259, + "loss": 0.0372, "step": 182950 }, { - "epoch": 1.98, - "learning_rate": 3.1604906223635535e-06, - "loss": 0.0203, + "epoch": 1.18, + "learning_rate": 0.00012286994068556897, + "loss": 0.0303, "step": 182960 }, { - "epoch": 1.98, - "learning_rate": 3.1442663378545003e-06, - "loss": 0.021, + "epoch": 1.18, + "learning_rate": 0.00012286025933121205, + "loss": 0.0385, "step": 182970 }, { - "epoch": 1.98, - "learning_rate": 3.128042053345447e-06, - "loss": 0.021, + "epoch": 1.18, + "learning_rate": 0.0001228505779768551, + "loss": 0.0367, "step": 182980 }, { - "epoch": 1.98, - "learning_rate": 3.111817768836394e-06, - "loss": 0.0222, + "epoch": 1.18, + "learning_rate": 0.00012284089662249815, + "loss": 0.0338, "step": 182990 }, { - "epoch": 1.98, - "learning_rate": 3.095593484327341e-06, - "loss": 0.0244, + "epoch": 1.18, + "learning_rate": 0.00012283121526814123, + "loss": 0.0454, "step": 183000 }, { - "epoch": 1.98, - "eval_cer": 0.9210721612323546, - "eval_loss": 0.020101139321923256, - "eval_runtime": 118.9914, - "eval_samples_per_second": 16.808, - "eval_steps_per_second": 4.202, + "epoch": 1.18, + "eval_cer": 0.9199674613038075, + "eval_loss": 0.023103881627321243, + "eval_runtime": 120.0626, + "eval_samples_per_second": 16.658, + "eval_steps_per_second": 4.164, "step": 183000 }, { - "epoch": 1.98, - "learning_rate": 3.079369199818288e-06, - "loss": 0.0233, + "epoch": 1.18, + "learning_rate": 0.00012282153391378431, + "loss": 0.0339, "step": 183010 }, { - "epoch": 1.98, - "learning_rate": 3.0631449153092347e-06, - "loss": 0.0292, + "epoch": 1.18, + "learning_rate": 0.00012281185255942737, + "loss": 0.0299, "step": 183020 }, { - "epoch": 1.98, - "learning_rate": 3.0469206308001815e-06, - "loss": 0.0244, + "epoch": 1.18, + "learning_rate": 0.00012280217120507045, + "loss": 0.0337, "step": 183030 }, { - "epoch": 1.98, - "learning_rate": 3.0306963462911283e-06, - "loss": 0.02, + "epoch": 1.18, + "learning_rate": 0.0001227924898507135, + "loss": 0.0272, "step": 183040 }, { - "epoch": 1.98, - "learning_rate": 3.014472061782075e-06, - "loss": 0.0227, + "epoch": 1.18, + "learning_rate": 0.00012278280849635658, + "loss": 0.0322, "step": 183050 }, { - "epoch": 1.98, - "learning_rate": 2.998247777273022e-06, - "loss": 0.028, + "epoch": 1.18, + "learning_rate": 0.00012277312714199963, + "loss": 0.0301, "step": 183060 }, { - "epoch": 1.98, - "learning_rate": 2.982023492763969e-06, - "loss": 0.0238, + "epoch": 1.18, + "learning_rate": 0.0001227634457876427, + "loss": 0.0366, "step": 183070 }, { - "epoch": 1.98, - "learning_rate": 2.965799208254916e-06, - "loss": 0.0244, + "epoch": 1.18, + "learning_rate": 0.0001227537644332858, + "loss": 0.0266, "step": 183080 }, { - "epoch": 1.98, - "learning_rate": 2.9495749237458628e-06, - "loss": 0.0234, + "epoch": 1.18, + "learning_rate": 0.00012274408307892884, + "loss": 0.0324, "step": 183090 }, { - "epoch": 1.98, - "learning_rate": 2.9333506392368096e-06, - "loss": 0.0252, + "epoch": 1.18, + "learning_rate": 0.00012273440172457192, + "loss": 0.0306, "step": 183100 }, { - "epoch": 1.98, - "learning_rate": 2.9171263547277564e-06, - "loss": 0.0237, + "epoch": 1.18, + "learning_rate": 0.00012272472037021498, + "loss": 0.0308, "step": 183110 }, { - "epoch": 1.98, - "learning_rate": 2.900902070218703e-06, - "loss": 0.0257, + "epoch": 1.18, + "learning_rate": 0.00012271503901585803, + "loss": 0.0324, "step": 183120 }, { - "epoch": 1.98, - "learning_rate": 2.8846777857096496e-06, - "loss": 0.0224, + "epoch": 1.18, + "learning_rate": 0.0001227053576615011, + "loss": 0.0339, "step": 183130 }, { - "epoch": 1.98, - "learning_rate": 2.8684535012005964e-06, - "loss": 0.0246, + "epoch": 1.18, + "learning_rate": 0.0001226956763071442, + "loss": 0.0385, "step": 183140 }, { - "epoch": 1.98, - "learning_rate": 2.852229216691544e-06, - "loss": 0.0201, + "epoch": 1.18, + "learning_rate": 0.00012268599495278727, + "loss": 0.0426, "step": 183150 }, { - "epoch": 1.98, - "learning_rate": 2.8360049321824904e-06, - "loss": 0.0231, + "epoch": 1.18, + "learning_rate": 0.00012267631359843032, + "loss": 0.0336, "step": 183160 }, { - "epoch": 1.98, - "learning_rate": 2.8197806476734372e-06, - "loss": 0.0238, + "epoch": 1.18, + "learning_rate": 0.0001226666322440734, + "loss": 0.0323, "step": 183170 }, { - "epoch": 1.98, - "learning_rate": 2.803556363164384e-06, - "loss": 0.0191, + "epoch": 1.18, + "learning_rate": 0.00012265695088971645, + "loss": 0.0343, "step": 183180 }, { - "epoch": 1.98, - "learning_rate": 2.787332078655331e-06, - "loss": 0.0253, + "epoch": 1.18, + "learning_rate": 0.0001226472695353595, + "loss": 0.0303, "step": 183190 }, { - "epoch": 1.98, - "learning_rate": 2.7711077941462776e-06, - "loss": 0.025, + "epoch": 1.18, + "learning_rate": 0.00012263758818100259, + "loss": 0.0312, "step": 183200 }, { - "epoch": 1.98, - "learning_rate": 2.7548835096372245e-06, - "loss": 0.0238, + "epoch": 1.18, + "learning_rate": 0.00012262790682664567, + "loss": 0.0271, "step": 183210 }, { - "epoch": 1.98, - "learning_rate": 2.7386592251281717e-06, - "loss": 0.0229, + "epoch": 1.18, + "learning_rate": 0.00012261822547228875, + "loss": 0.0356, "step": 183220 }, { - "epoch": 1.98, - "learning_rate": 2.7224349406191185e-06, - "loss": 0.0239, + "epoch": 1.18, + "learning_rate": 0.0001226085441179318, + "loss": 0.0387, "step": 183230 }, { - "epoch": 1.98, - "learning_rate": 2.7062106561100653e-06, - "loss": 0.021, + "epoch": 1.18, + "learning_rate": 0.00012259886276357485, + "loss": 0.0379, "step": 183240 }, { - "epoch": 1.98, - "learning_rate": 2.689986371601012e-06, - "loss": 0.0228, + "epoch": 1.18, + "learning_rate": 0.00012258918140921793, + "loss": 0.0358, "step": 183250 }, { - "epoch": 1.98, - "learning_rate": 2.673762087091959e-06, - "loss": 0.0226, + "epoch": 1.18, + "learning_rate": 0.00012257950005486098, + "loss": 0.0363, "step": 183260 }, { - "epoch": 1.98, - "learning_rate": 2.6575378025829057e-06, - "loss": 0.024, + "epoch": 1.18, + "learning_rate": 0.00012256981870050406, + "loss": 0.0361, "step": 183270 }, { - "epoch": 1.98, - "learning_rate": 2.6413135180738525e-06, - "loss": 0.0251, + "epoch": 1.18, + "learning_rate": 0.00012256013734614714, + "loss": 0.0309, "step": 183280 }, { - "epoch": 1.98, - "learning_rate": 2.6250892335647997e-06, - "loss": 0.027, + "epoch": 1.18, + "learning_rate": 0.0001225504559917902, + "loss": 0.0335, "step": 183290 }, { - "epoch": 1.98, - "learning_rate": 2.6088649490557466e-06, - "loss": 0.02, + "epoch": 1.18, + "learning_rate": 0.00012254077463743328, + "loss": 0.0308, "step": 183300 }, { - "epoch": 1.98, - "learning_rate": 2.5926406645466934e-06, - "loss": 0.0204, + "epoch": 1.18, + "learning_rate": 0.00012253109328307633, + "loss": 0.0338, "step": 183310 }, { - "epoch": 1.98, - "learning_rate": 2.57641638003764e-06, - "loss": 0.0186, + "epoch": 1.18, + "learning_rate": 0.0001225214119287194, + "loss": 0.0265, "step": 183320 }, { - "epoch": 1.98, - "learning_rate": 2.560192095528587e-06, - "loss": 0.0274, + "epoch": 1.18, + "learning_rate": 0.00012251173057436246, + "loss": 0.0357, "step": 183330 }, { - "epoch": 1.98, - "learning_rate": 2.5439678110195338e-06, - "loss": 0.0281, + "epoch": 1.18, + "learning_rate": 0.00012250204922000554, + "loss": 0.0381, "step": 183340 }, { - "epoch": 1.98, - "learning_rate": 2.5277435265104806e-06, - "loss": 0.0208, + "epoch": 1.18, + "learning_rate": 0.00012249236786564862, + "loss": 0.0319, "step": 183350 }, { - "epoch": 1.98, - "learning_rate": 2.5115192420014274e-06, - "loss": 0.0208, + "epoch": 1.18, + "learning_rate": 0.00012248268651129167, + "loss": 0.0297, "step": 183360 }, { - "epoch": 1.98, - "learning_rate": 2.4952949574923746e-06, - "loss": 0.0232, + "epoch": 1.18, + "learning_rate": 0.00012247300515693475, + "loss": 0.0423, "step": 183370 }, { - "epoch": 1.98, - "learning_rate": 2.4790706729833214e-06, - "loss": 0.0214, + "epoch": 1.18, + "learning_rate": 0.0001224633238025778, + "loss": 0.0384, "step": 183380 }, { - "epoch": 1.98, - "learning_rate": 2.4628463884742682e-06, - "loss": 0.0212, + "epoch": 1.18, + "learning_rate": 0.00012245364244822089, + "loss": 0.0337, "step": 183390 }, { - "epoch": 1.98, - "learning_rate": 2.446622103965215e-06, - "loss": 0.0296, + "epoch": 1.18, + "learning_rate": 0.00012244396109386394, + "loss": 0.0339, "step": 183400 }, { - "epoch": 1.98, - "learning_rate": 2.430397819456162e-06, - "loss": 0.0281, + "epoch": 1.18, + "learning_rate": 0.00012243427973950702, + "loss": 0.0293, "step": 183410 }, { - "epoch": 1.98, - "learning_rate": 2.4141735349471087e-06, - "loss": 0.0197, + "epoch": 1.18, + "learning_rate": 0.0001224245983851501, + "loss": 0.0309, "step": 183420 }, { - "epoch": 1.98, - "learning_rate": 2.397949250438055e-06, - "loss": 0.0321, + "epoch": 1.18, + "learning_rate": 0.00012241491703079315, + "loss": 0.0298, "step": 183430 }, { - "epoch": 1.98, - "learning_rate": 2.3817249659290027e-06, - "loss": 0.0225, + "epoch": 1.18, + "learning_rate": 0.0001224052356764362, + "loss": 0.0351, "step": 183440 }, { - "epoch": 1.98, - "learning_rate": 2.3655006814199495e-06, - "loss": 0.0329, + "epoch": 1.18, + "learning_rate": 0.00012239555432207928, + "loss": 0.0298, "step": 183450 }, { - "epoch": 1.98, - "learning_rate": 2.3492763969108963e-06, - "loss": 0.0186, + "epoch": 1.18, + "learning_rate": 0.00012238587296772236, + "loss": 0.033, "step": 183460 }, { - "epoch": 1.98, - "learning_rate": 2.3330521124018427e-06, - "loss": 0.0245, + "epoch": 1.18, + "learning_rate": 0.00012237619161336541, + "loss": 0.0331, "step": 183470 }, { - "epoch": 1.98, - "learning_rate": 2.3168278278927895e-06, - "loss": 0.0231, + "epoch": 1.18, + "learning_rate": 0.0001223665102590085, + "loss": 0.0304, "step": 183480 }, { - "epoch": 1.98, - "learning_rate": 2.3006035433837367e-06, - "loss": 0.0262, + "epoch": 1.18, + "learning_rate": 0.00012235682890465155, + "loss": 0.0333, "step": 183490 }, { - "epoch": 1.98, - "learning_rate": 2.2843792588746835e-06, - "loss": 0.0219, + "epoch": 1.18, + "learning_rate": 0.00012234714755029463, + "loss": 0.0327, "step": 183500 }, { - "epoch": 1.98, - "learning_rate": 2.2681549743656303e-06, - "loss": 0.0287, + "epoch": 1.18, + "learning_rate": 0.00012233746619593768, + "loss": 0.0296, "step": 183510 }, { - "epoch": 1.98, - "learning_rate": 2.251930689856577e-06, - "loss": 0.0235, + "epoch": 1.18, + "learning_rate": 0.00012232778484158076, + "loss": 0.0332, "step": 183520 }, + { + "epoch": 1.18, + "learning_rate": 0.00012231810348722384, + "loss": 0.0311, + "step": 183530 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001223084221328669, + "loss": 0.0398, + "step": 183540 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012229874077850997, + "loss": 0.0344, + "step": 183550 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012228905942415302, + "loss": 0.0286, + "step": 183560 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001222793780697961, + "loss": 0.0281, + "step": 183570 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012226969671543916, + "loss": 0.0354, + "step": 183580 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012226001536108224, + "loss": 0.0329, + "step": 183590 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012225033400672532, + "loss": 0.0283, + "step": 183600 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012224065265236837, + "loss": 0.0296, + "step": 183610 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012223097129801145, + "loss": 0.0281, + "step": 183620 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001222212899436545, + "loss": 0.0326, + "step": 183630 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012221160858929758, + "loss": 0.0309, + "step": 183640 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012220192723494063, + "loss": 0.0353, + "step": 183650 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012219224588058371, + "loss": 0.0343, + "step": 183660 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001221825645262268, + "loss": 0.0331, + "step": 183670 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012217288317186985, + "loss": 0.0338, + "step": 183680 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001221632018175129, + "loss": 0.0388, + "step": 183690 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012215352046315598, + "loss": 0.0338, + "step": 183700 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012214383910879906, + "loss": 0.0331, + "step": 183710 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001221341577544421, + "loss": 0.0309, + "step": 183720 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001221244764000852, + "loss": 0.0346, + "step": 183730 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012211479504572827, + "loss": 0.0321, + "step": 183740 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012210511369137132, + "loss": 0.0265, + "step": 183750 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012209543233701438, + "loss": 0.0331, + "step": 183760 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012208575098265746, + "loss": 0.0342, + "step": 183770 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012207606962830054, + "loss": 0.0261, + "step": 183780 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012206638827394359, + "loss": 0.0333, + "step": 183790 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012205670691958666, + "loss": 0.0359, + "step": 183800 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012204702556522973, + "loss": 0.0364, + "step": 183810 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012203734421087279, + "loss": 0.0352, + "step": 183820 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012202766285651587, + "loss": 0.0357, + "step": 183830 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012201798150215893, + "loss": 0.0314, + "step": 183840 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012200830014780201, + "loss": 0.0386, + "step": 183850 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012199861879344507, + "loss": 0.0325, + "step": 183860 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012198893743908813, + "loss": 0.0376, + "step": 183870 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012197925608473121, + "loss": 0.037, + "step": 183880 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012196957473037426, + "loss": 0.0342, + "step": 183890 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012195989337601733, + "loss": 0.0351, + "step": 183900 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012195021202166041, + "loss": 0.03, + "step": 183910 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012194053066730348, + "loss": 0.029, + "step": 183920 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012193084931294654, + "loss": 0.0296, + "step": 183930 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012192116795858961, + "loss": 0.0317, + "step": 183940 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012191148660423269, + "loss": 0.0399, + "step": 183950 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012190180524987574, + "loss": 0.033, + "step": 183960 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012189212389551881, + "loss": 0.0319, + "step": 183970 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012188244254116189, + "loss": 0.0357, + "step": 183980 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012187276118680495, + "loss": 0.028, + "step": 183990 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012186307983244801, + "loss": 0.0339, + "step": 184000 + }, + { + "epoch": 1.19, + "eval_cer": 0.9198978646480623, + "eval_loss": 0.023351291194558144, + "eval_runtime": 120.0133, + "eval_samples_per_second": 16.665, + "eval_steps_per_second": 4.166, + "step": 184000 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012185339847809109, + "loss": 0.0279, + "step": 184010 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012184371712373415, + "loss": 0.0329, + "step": 184020 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012183403576937722, + "loss": 0.0363, + "step": 184030 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012182435441502029, + "loss": 0.0325, + "step": 184040 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012181467306066337, + "loss": 0.0309, + "step": 184050 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012180499170630643, + "loss": 0.0312, + "step": 184060 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012179531035194948, + "loss": 0.0269, + "step": 184070 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012178562899759256, + "loss": 0.0297, + "step": 184080 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012177594764323563, + "loss": 0.0302, + "step": 184090 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012176626628887868, + "loss": 0.0286, + "step": 184100 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012175658493452176, + "loss": 0.0365, + "step": 184110 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012174690358016483, + "loss": 0.0311, + "step": 184120 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012173722222580791, + "loss": 0.0385, + "step": 184130 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012172754087145096, + "loss": 0.0381, + "step": 184140 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012171785951709404, + "loss": 0.0319, + "step": 184150 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012170817816273711, + "loss": 0.0342, + "step": 184160 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012169849680838016, + "loss": 0.029, + "step": 184170 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012168881545402324, + "loss": 0.0324, + "step": 184180 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001216791340996663, + "loss": 0.0339, + "step": 184190 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012166945274530939, + "loss": 0.0298, + "step": 184200 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012165977139095244, + "loss": 0.0287, + "step": 184210 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001216500900365955, + "loss": 0.0302, + "step": 184220 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012164040868223858, + "loss": 0.0292, + "step": 184230 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012163072732788164, + "loss": 0.03, + "step": 184240 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012162104597352472, + "loss": 0.03, + "step": 184250 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012161136461916778, + "loss": 0.0262, + "step": 184260 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012160168326481084, + "loss": 0.0329, + "step": 184270 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012159200191045392, + "loss": 0.0296, + "step": 184280 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012158232055609698, + "loss": 0.0374, + "step": 184290 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012157263920174006, + "loss": 0.0328, + "step": 184300 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012156295784738311, + "loss": 0.0335, + "step": 184310 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012155327649302618, + "loss": 0.0324, + "step": 184320 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012154359513866926, + "loss": 0.0284, + "step": 184330 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012153391378431231, + "loss": 0.0251, + "step": 184340 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012152423242995539, + "loss": 0.0296, + "step": 184350 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012151455107559846, + "loss": 0.0361, + "step": 184360 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012150486972124153, + "loss": 0.0329, + "step": 184370 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012149518836688459, + "loss": 0.027, + "step": 184380 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012148550701252766, + "loss": 0.0308, + "step": 184390 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012147582565817074, + "loss": 0.0307, + "step": 184400 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012146614430381379, + "loss": 0.0347, + "step": 184410 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012145646294945686, + "loss": 0.0295, + "step": 184420 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012144678159509994, + "loss": 0.0301, + "step": 184430 + }, + { + "epoch": 1.19, + "learning_rate": 0.000121437100240743, + "loss": 0.0375, + "step": 184440 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012142741888638607, + "loss": 0.0302, + "step": 184450 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012141773753202914, + "loss": 0.031, + "step": 184460 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012140805617767222, + "loss": 0.0323, + "step": 184470 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012139837482331527, + "loss": 0.0285, + "step": 184480 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012138869346895833, + "loss": 0.0288, + "step": 184490 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012137901211460141, + "loss": 0.0377, + "step": 184500 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012136933076024448, + "loss": 0.0298, + "step": 184510 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012135964940588753, + "loss": 0.032, + "step": 184520 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012134996805153061, + "loss": 0.034, + "step": 184530 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012134028669717368, + "loss": 0.0333, + "step": 184540 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012133060534281674, + "loss": 0.0372, + "step": 184550 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012132092398845981, + "loss": 0.0302, + "step": 184560 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012131124263410289, + "loss": 0.0315, + "step": 184570 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012130156127974596, + "loss": 0.0408, + "step": 184580 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012129187992538901, + "loss": 0.0363, + "step": 184590 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012128219857103209, + "loss": 0.0328, + "step": 184600 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012127251721667516, + "loss": 0.032, + "step": 184610 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012126283586231821, + "loss": 0.0303, + "step": 184620 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012125315450796129, + "loss": 0.0277, + "step": 184630 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012124347315360435, + "loss": 0.0262, + "step": 184640 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012123379179924743, + "loss": 0.0383, + "step": 184650 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012122411044489049, + "loss": 0.0346, + "step": 184660 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012121442909053357, + "loss": 0.0369, + "step": 184670 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012120474773617663, + "loss": 0.0345, + "step": 184680 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012119506638181969, + "loss": 0.0325, + "step": 184690 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012118538502746277, + "loss": 0.0354, + "step": 184700 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012117570367310583, + "loss": 0.0316, + "step": 184710 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012116602231874891, + "loss": 0.0414, + "step": 184720 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012115634096439196, + "loss": 0.0296, + "step": 184730 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012114665961003503, + "loss": 0.0351, + "step": 184740 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012113697825567811, + "loss": 0.0338, + "step": 184750 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012112729690132116, + "loss": 0.0289, + "step": 184760 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012111761554696424, + "loss": 0.0327, + "step": 184770 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012110793419260731, + "loss": 0.0328, + "step": 184780 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012109825283825038, + "loss": 0.0322, + "step": 184790 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012108857148389344, + "loss": 0.0325, + "step": 184800 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012107889012953651, + "loss": 0.0356, + "step": 184810 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012106920877517959, + "loss": 0.0332, + "step": 184820 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012105952742082264, + "loss": 0.0255, + "step": 184830 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001210498460664657, + "loss": 0.0318, + "step": 184840 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012104016471210879, + "loss": 0.0276, + "step": 184850 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012103048335775185, + "loss": 0.0326, + "step": 184860 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012102080200339492, + "loss": 0.0429, + "step": 184870 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012101112064903799, + "loss": 0.0294, + "step": 184880 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012100143929468105, + "loss": 0.0303, + "step": 184890 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012099175794032412, + "loss": 0.0264, + "step": 184900 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012098207658596718, + "loss": 0.0295, + "step": 184910 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012097239523161026, + "loss": 0.0324, + "step": 184920 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012096271387725333, + "loss": 0.0338, + "step": 184930 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012095303252289638, + "loss": 0.0291, + "step": 184940 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012094335116853946, + "loss": 0.0293, + "step": 184950 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012093366981418253, + "loss": 0.0323, + "step": 184960 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001209239884598256, + "loss": 0.0329, + "step": 184970 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012091430710546866, + "loss": 0.0278, + "step": 184980 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012090462575111173, + "loss": 0.0255, + "step": 184990 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012089494439675481, + "loss": 0.0375, + "step": 185000 + }, + { + "epoch": 1.19, + "eval_cer": 0.9199150378488307, + "eval_loss": 0.022892048582434654, + "eval_runtime": 120.0905, + "eval_samples_per_second": 16.654, + "eval_steps_per_second": 4.164, + "step": 185000 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012088526304239786, + "loss": 0.0303, + "step": 185010 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012087558168804094, + "loss": 0.0331, + "step": 185020 + }, + { + "epoch": 1.19, + "learning_rate": 0.000120865900333684, + "loss": 0.0302, + "step": 185030 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012085621897932706, + "loss": 0.0281, + "step": 185040 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012084653762497014, + "loss": 0.0306, + "step": 185050 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001208368562706132, + "loss": 0.0306, + "step": 185060 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012082717491625628, + "loss": 0.0304, + "step": 185070 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012081749356189934, + "loss": 0.0281, + "step": 185080 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001208078122075424, + "loss": 0.0385, + "step": 185090 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012079813085318548, + "loss": 0.0352, + "step": 185100 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012078844949882854, + "loss": 0.0364, + "step": 185110 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012077876814447162, + "loss": 0.0312, + "step": 185120 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012076908679011468, + "loss": 0.0322, + "step": 185130 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012075940543575776, + "loss": 0.0318, + "step": 185140 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012074972408140081, + "loss": 0.0299, + "step": 185150 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012074004272704388, + "loss": 0.035, + "step": 185160 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012073036137268696, + "loss": 0.0365, + "step": 185170 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012072068001833001, + "loss": 0.0332, + "step": 185180 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012071099866397308, + "loss": 0.035, + "step": 185190 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012070131730961616, + "loss": 0.0333, + "step": 185200 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012069163595525923, + "loss": 0.029, + "step": 185210 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012068195460090229, + "loss": 0.0367, + "step": 185220 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012067227324654536, + "loss": 0.0396, + "step": 185230 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012066259189218844, + "loss": 0.0288, + "step": 185240 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012065291053783149, + "loss": 0.0343, + "step": 185250 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012064322918347456, + "loss": 0.0305, + "step": 185260 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012063354782911764, + "loss": 0.0373, + "step": 185270 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001206238664747607, + "loss": 0.0336, + "step": 185280 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012061418512040376, + "loss": 0.0284, + "step": 185290 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012060450376604683, + "loss": 0.0332, + "step": 185300 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001205948224116899, + "loss": 0.029, + "step": 185310 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012058514105733297, + "loss": 0.0331, + "step": 185320 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012057545970297603, + "loss": 0.0334, + "step": 185330 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012056577834861911, + "loss": 0.0274, + "step": 185340 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012055609699426218, + "loss": 0.0324, + "step": 185350 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012054641563990523, + "loss": 0.0366, + "step": 185360 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012053673428554831, + "loss": 0.0293, + "step": 185370 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012052705293119138, + "loss": 0.0262, + "step": 185380 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012051737157683443, + "loss": 0.03, + "step": 185390 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012050769022247751, + "loss": 0.0319, + "step": 185400 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012049800886812058, + "loss": 0.0299, + "step": 185410 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012048832751376366, + "loss": 0.0361, + "step": 185420 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012047864615940671, + "loss": 0.0258, + "step": 185430 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012046896480504979, + "loss": 0.0378, + "step": 185440 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012045928345069286, + "loss": 0.0317, + "step": 185450 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012044960209633591, + "loss": 0.0286, + "step": 185460 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012043992074197899, + "loss": 0.0272, + "step": 185470 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012043023938762205, + "loss": 0.0341, + "step": 185480 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012042055803326513, + "loss": 0.0302, + "step": 185490 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012041087667890819, + "loss": 0.0305, + "step": 185500 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012040119532455125, + "loss": 0.03, + "step": 185510 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012039151397019433, + "loss": 0.0359, + "step": 185520 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012038183261583739, + "loss": 0.0354, + "step": 185530 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012037215126148047, + "loss": 0.0395, + "step": 185540 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012036246990712353, + "loss": 0.0295, + "step": 185550 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012035278855276661, + "loss": 0.0339, + "step": 185560 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012034310719840966, + "loss": 0.0361, + "step": 185570 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012033342584405273, + "loss": 0.0279, + "step": 185580 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012032374448969581, + "loss": 0.0321, + "step": 185590 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012031406313533886, + "loss": 0.0353, + "step": 185600 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012030438178098193, + "loss": 0.0342, + "step": 185610 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012029470042662501, + "loss": 0.0345, + "step": 185620 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012028501907226807, + "loss": 0.031, + "step": 185630 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012027533771791114, + "loss": 0.0371, + "step": 185640 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012026565636355421, + "loss": 0.0292, + "step": 185650 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012025597500919729, + "loss": 0.033, + "step": 185660 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012024629365484034, + "loss": 0.0355, + "step": 185670 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001202366123004834, + "loss": 0.029, + "step": 185680 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012022693094612649, + "loss": 0.0293, + "step": 185690 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012021724959176955, + "loss": 0.0335, + "step": 185700 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001202075682374126, + "loss": 0.032, + "step": 185710 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012019788688305568, + "loss": 0.029, + "step": 185720 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012018820552869875, + "loss": 0.0324, + "step": 185730 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012017852417434182, + "loss": 0.0353, + "step": 185740 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012016884281998488, + "loss": 0.03, + "step": 185750 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012015916146562796, + "loss": 0.0275, + "step": 185760 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012014948011127103, + "loss": 0.0318, + "step": 185770 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012013979875691408, + "loss": 0.0255, + "step": 185780 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012013011740255716, + "loss": 0.0315, + "step": 185790 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012012043604820023, + "loss": 0.0369, + "step": 185800 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012011075469384328, + "loss": 0.0325, + "step": 185810 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012010107333948636, + "loss": 0.0378, + "step": 185820 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012009139198512943, + "loss": 0.0307, + "step": 185830 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001200817106307725, + "loss": 0.0297, + "step": 185840 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012007202927641556, + "loss": 0.0338, + "step": 185850 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012006234792205864, + "loss": 0.0344, + "step": 185860 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001200526665677017, + "loss": 0.0308, + "step": 185870 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012004298521334476, + "loss": 0.0346, + "step": 185880 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012003330385898784, + "loss": 0.0343, + "step": 185890 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001200236225046309, + "loss": 0.0318, + "step": 185900 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012001394115027398, + "loss": 0.027, + "step": 185910 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012000425979591704, + "loss": 0.0302, + "step": 185920 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001199945784415601, + "loss": 0.0304, + "step": 185930 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011998489708720318, + "loss": 0.0303, + "step": 185940 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011997521573284624, + "loss": 0.0323, + "step": 185950 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011996553437848932, + "loss": 0.0336, + "step": 185960 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011995585302413238, + "loss": 0.0344, + "step": 185970 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011994617166977545, + "loss": 0.0369, + "step": 185980 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011993649031541851, + "loss": 0.0323, + "step": 185990 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011992680896106158, + "loss": 0.0351, + "step": 186000 + }, + { + "epoch": 1.2, + "eval_cer": 0.9198815952999662, + "eval_loss": 0.022712325677275658, + "eval_runtime": 120.0277, + "eval_samples_per_second": 16.663, + "eval_steps_per_second": 4.166, + "step": 186000 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011991712760670466, + "loss": 0.0321, + "step": 186010 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011990744625234771, + "loss": 0.0325, + "step": 186020 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011989776489799078, + "loss": 0.0341, + "step": 186030 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011988808354363386, + "loss": 0.0283, + "step": 186040 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011987840218927692, + "loss": 0.0304, + "step": 186050 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011986872083491999, + "loss": 0.038, + "step": 186060 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011985903948056306, + "loss": 0.0335, + "step": 186070 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011984935812620612, + "loss": 0.0361, + "step": 186080 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011983967677184919, + "loss": 0.0357, + "step": 186090 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011982999541749226, + "loss": 0.03, + "step": 186100 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011982031406313534, + "loss": 0.0304, + "step": 186110 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001198106327087784, + "loss": 0.031, + "step": 186120 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011980095135442145, + "loss": 0.0323, + "step": 186130 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011979127000006453, + "loss": 0.0331, + "step": 186140 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001197815886457076, + "loss": 0.0254, + "step": 186150 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011977190729135067, + "loss": 0.0328, + "step": 186160 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011976222593699373, + "loss": 0.0325, + "step": 186170 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001197525445826368, + "loss": 0.0356, + "step": 186180 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011974286322827988, + "loss": 0.0321, + "step": 186190 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011973318187392293, + "loss": 0.0319, + "step": 186200 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011972350051956601, + "loss": 0.0314, + "step": 186210 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011971381916520908, + "loss": 0.0353, + "step": 186220 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011970413781085213, + "loss": 0.0267, + "step": 186230 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011969445645649521, + "loss": 0.0323, + "step": 186240 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011968477510213828, + "loss": 0.0291, + "step": 186250 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011967509374778136, + "loss": 0.0293, + "step": 186260 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011966541239342441, + "loss": 0.0331, + "step": 186270 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011965573103906748, + "loss": 0.0354, + "step": 186280 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011964604968471056, + "loss": 0.0278, + "step": 186290 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011963636833035361, + "loss": 0.0403, + "step": 186300 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011962668697599669, + "loss": 0.0322, + "step": 186310 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011961700562163975, + "loss": 0.0316, + "step": 186320 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011960732426728283, + "loss": 0.0331, + "step": 186330 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011959764291292589, + "loss": 0.028, + "step": 186340 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011958796155856895, + "loss": 0.0326, + "step": 186350 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011957828020421203, + "loss": 0.0283, + "step": 186360 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011956859884985509, + "loss": 0.0337, + "step": 186370 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011955891749549815, + "loss": 0.0319, + "step": 186380 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011954923614114123, + "loss": 0.0338, + "step": 186390 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001195395547867843, + "loss": 0.0272, + "step": 186400 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011952987343242736, + "loss": 0.0386, + "step": 186410 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011952019207807043, + "loss": 0.0298, + "step": 186420 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011951051072371351, + "loss": 0.0319, + "step": 186430 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011950082936935656, + "loss": 0.0388, + "step": 186440 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011949114801499963, + "loss": 0.0322, + "step": 186450 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011948146666064271, + "loss": 0.0327, + "step": 186460 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011947178530628577, + "loss": 0.0415, + "step": 186470 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011946210395192883, + "loss": 0.0302, + "step": 186480 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011945242259757191, + "loss": 0.0292, + "step": 186490 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011944274124321497, + "loss": 0.0284, + "step": 186500 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011943305988885804, + "loss": 0.031, + "step": 186510 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001194233785345011, + "loss": 0.0364, + "step": 186520 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011941369718014419, + "loss": 0.0361, + "step": 186530 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011940401582578725, + "loss": 0.0367, + "step": 186540 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001193943344714303, + "loss": 0.0315, + "step": 186550 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011938465311707338, + "loss": 0.0348, + "step": 186560 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011937497176271645, + "loss": 0.0352, + "step": 186570 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001193652904083595, + "loss": 0.039, + "step": 186580 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011935560905400258, + "loss": 0.0324, + "step": 186590 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011934592769964565, + "loss": 0.0279, + "step": 186600 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011933624634528873, + "loss": 0.0329, + "step": 186610 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011932656499093178, + "loss": 0.0351, + "step": 186620 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011931688363657486, + "loss": 0.0299, + "step": 186630 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011930720228221793, + "loss": 0.0322, + "step": 186640 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011929752092786098, + "loss": 0.0291, + "step": 186650 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011928783957350406, + "loss": 0.0374, + "step": 186660 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011927815821914713, + "loss": 0.035, + "step": 186670 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001192684768647902, + "loss": 0.0298, + "step": 186680 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011925879551043326, + "loss": 0.0306, + "step": 186690 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011924911415607633, + "loss": 0.0281, + "step": 186700 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001192394328017194, + "loss": 0.0321, + "step": 186710 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011922975144736246, + "loss": 0.0386, + "step": 186720 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011922007009300554, + "loss": 0.0346, + "step": 186730 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001192103887386486, + "loss": 0.0302, + "step": 186740 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011920070738429168, + "loss": 0.0317, + "step": 186750 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011919102602993474, + "loss": 0.0317, + "step": 186760 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001191813446755778, + "loss": 0.0324, + "step": 186770 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011917166332122088, + "loss": 0.0301, + "step": 186780 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011916198196686393, + "loss": 0.0299, + "step": 186790 + }, + { + "epoch": 1.21, + "learning_rate": 0.000119152300612507, + "loss": 0.0299, + "step": 186800 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011914261925815008, + "loss": 0.0371, + "step": 186810 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011913293790379315, + "loss": 0.0305, + "step": 186820 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011912325654943621, + "loss": 0.0269, + "step": 186830 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011911357519507928, + "loss": 0.0346, + "step": 186840 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011910389384072236, + "loss": 0.0322, + "step": 186850 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011909421248636541, + "loss": 0.0298, + "step": 186860 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011908453113200848, + "loss": 0.0289, + "step": 186870 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011907484977765156, + "loss": 0.0306, + "step": 186880 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011906516842329462, + "loss": 0.0387, + "step": 186890 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011905548706893768, + "loss": 0.034, + "step": 186900 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011904580571458076, + "loss": 0.0293, + "step": 186910 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011903612436022382, + "loss": 0.0292, + "step": 186920 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011902644300586689, + "loss": 0.0311, + "step": 186930 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011901676165150996, + "loss": 0.0328, + "step": 186940 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011900708029715304, + "loss": 0.0312, + "step": 186950 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001189973989427961, + "loss": 0.0337, + "step": 186960 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011898771758843915, + "loss": 0.0291, + "step": 186970 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011897803623408223, + "loss": 0.0285, + "step": 186980 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001189683548797253, + "loss": 0.0328, + "step": 186990 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011895867352536835, + "loss": 0.0305, + "step": 187000 + }, + { + "epoch": 1.21, + "eval_cer": 0.9199005762060785, + "eval_loss": 0.022978171706199646, + "eval_runtime": 120.5367, + "eval_samples_per_second": 16.592, + "eval_steps_per_second": 4.148, + "step": 187000 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011894899217101143, + "loss": 0.032, + "step": 187010 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001189393108166545, + "loss": 0.03, + "step": 187020 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011892962946229758, + "loss": 0.0314, + "step": 187030 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011891994810794063, + "loss": 0.032, + "step": 187040 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011891026675358371, + "loss": 0.0337, + "step": 187050 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011890058539922678, + "loss": 0.0295, + "step": 187060 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011889090404486983, + "loss": 0.0301, + "step": 187070 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011888122269051291, + "loss": 0.0365, + "step": 187080 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011887154133615598, + "loss": 0.0293, + "step": 187090 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011886185998179906, + "loss": 0.0329, + "step": 187100 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011885217862744211, + "loss": 0.0341, + "step": 187110 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011884249727308517, + "loss": 0.0353, + "step": 187120 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011883281591872825, + "loss": 0.0413, + "step": 187130 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011882313456437131, + "loss": 0.0292, + "step": 187140 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011881345321001439, + "loss": 0.0378, + "step": 187150 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011880377185565745, + "loss": 0.0304, + "step": 187160 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011879409050130052, + "loss": 0.0306, + "step": 187170 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011878440914694359, + "loss": 0.0327, + "step": 187180 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011877472779258665, + "loss": 0.0355, + "step": 187190 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011876504643822973, + "loss": 0.0312, + "step": 187200 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011875536508387278, + "loss": 0.0302, + "step": 187210 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011874568372951585, + "loss": 0.0293, + "step": 187220 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011873600237515893, + "loss": 0.0271, + "step": 187230 + }, + { + "epoch": 1.21, + "learning_rate": 0.000118726321020802, + "loss": 0.0285, + "step": 187240 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011871663966644506, + "loss": 0.0345, + "step": 187250 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011870695831208813, + "loss": 0.0289, + "step": 187260 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001186972769577312, + "loss": 0.032, + "step": 187270 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011868759560337426, + "loss": 0.0318, + "step": 187280 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011867791424901733, + "loss": 0.0303, + "step": 187290 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011866823289466041, + "loss": 0.0281, + "step": 187300 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011865855154030347, + "loss": 0.0318, + "step": 187310 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011864887018594653, + "loss": 0.0291, + "step": 187320 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001186391888315896, + "loss": 0.0374, + "step": 187330 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011862950747723267, + "loss": 0.0318, + "step": 187340 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011861982612287574, + "loss": 0.0295, + "step": 187350 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001186101447685188, + "loss": 0.0311, + "step": 187360 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011860046341416187, + "loss": 0.0315, + "step": 187370 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011859078205980495, + "loss": 0.0301, + "step": 187380 + }, + { + "epoch": 1.21, + "learning_rate": 0.000118581100705448, + "loss": 0.0306, + "step": 187390 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011857141935109108, + "loss": 0.031, + "step": 187400 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011856173799673415, + "loss": 0.0319, + "step": 187410 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001185520566423772, + "loss": 0.0328, + "step": 187420 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011854237528802028, + "loss": 0.0308, + "step": 187430 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011853269393366335, + "loss": 0.028, + "step": 187440 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011852301257930643, + "loss": 0.0365, + "step": 187450 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011851333122494948, + "loss": 0.0295, + "step": 187460 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011850364987059255, + "loss": 0.0292, + "step": 187470 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011849396851623563, + "loss": 0.0331, + "step": 187480 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011848428716187868, + "loss": 0.0343, + "step": 187490 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011847460580752176, + "loss": 0.0362, + "step": 187500 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011846492445316483, + "loss": 0.0317, + "step": 187510 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001184552430988079, + "loss": 0.036, + "step": 187520 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011844556174445096, + "loss": 0.0354, + "step": 187530 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011843588039009402, + "loss": 0.0262, + "step": 187540 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001184261990357371, + "loss": 0.0395, + "step": 187550 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011841651768138016, + "loss": 0.0259, + "step": 187560 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011840683632702322, + "loss": 0.0347, + "step": 187570 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001183971549726663, + "loss": 0.0322, + "step": 187580 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011838747361830937, + "loss": 0.0336, + "step": 187590 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011837779226395244, + "loss": 0.0297, + "step": 187600 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001183681109095955, + "loss": 0.0346, + "step": 187610 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011835842955523858, + "loss": 0.0322, + "step": 187620 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011834874820088163, + "loss": 0.0362, + "step": 187630 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001183390668465247, + "loss": 0.0392, + "step": 187640 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011832938549216778, + "loss": 0.0327, + "step": 187650 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011831970413781083, + "loss": 0.0291, + "step": 187660 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001183100227834539, + "loss": 0.037, + "step": 187670 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011830034142909698, + "loss": 0.0371, + "step": 187680 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011829066007474005, + "loss": 0.0346, + "step": 187690 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011828097872038311, + "loss": 0.0324, + "step": 187700 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011827129736602618, + "loss": 0.0315, + "step": 187710 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011826161601166926, + "loss": 0.034, + "step": 187720 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011825193465731231, + "loss": 0.0331, + "step": 187730 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011824225330295538, + "loss": 0.032, + "step": 187740 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011823257194859846, + "loss": 0.0246, + "step": 187750 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011822289059424152, + "loss": 0.0339, + "step": 187760 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011821320923988458, + "loss": 0.0356, + "step": 187770 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011820352788552766, + "loss": 0.0318, + "step": 187780 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011819384653117072, + "loss": 0.0319, + "step": 187790 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011818416517681379, + "loss": 0.0333, + "step": 187800 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011817448382245685, + "loss": 0.0373, + "step": 187810 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011816480246809993, + "loss": 0.0285, + "step": 187820 + }, + { + "epoch": 1.21, + "learning_rate": 0.000118155121113743, + "loss": 0.0344, + "step": 187830 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011814543975938605, + "loss": 0.0305, + "step": 187840 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011813575840502913, + "loss": 0.0311, + "step": 187850 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001181260770506722, + "loss": 0.0328, + "step": 187860 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011811639569631525, + "loss": 0.0329, + "step": 187870 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011810671434195833, + "loss": 0.0296, + "step": 187880 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001180970329876014, + "loss": 0.0322, + "step": 187890 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011808735163324448, + "loss": 0.0362, + "step": 187900 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011807767027888753, + "loss": 0.0363, + "step": 187910 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011806798892453061, + "loss": 0.0314, + "step": 187920 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011805830757017368, + "loss": 0.0317, + "step": 187930 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011804862621581673, + "loss": 0.0288, + "step": 187940 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011803894486145981, + "loss": 0.0295, + "step": 187950 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011802926350710287, + "loss": 0.0305, + "step": 187960 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011801958215274595, + "loss": 0.0346, + "step": 187970 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011800990079838901, + "loss": 0.0318, + "step": 187980 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011800021944403207, + "loss": 0.0301, + "step": 187990 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011799053808967515, + "loss": 0.0376, + "step": 188000 + }, + { + "epoch": 1.21, + "eval_cer": 0.9199258840808948, + "eval_loss": 0.022766409441828728, + "eval_runtime": 120.0519, + "eval_samples_per_second": 16.659, + "eval_steps_per_second": 4.165, + "step": 188000 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001179808567353182, + "loss": 0.0315, + "step": 188010 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011797117538096129, + "loss": 0.0358, + "step": 188020 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011796149402660435, + "loss": 0.0336, + "step": 188030 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011795181267224743, + "loss": 0.0348, + "step": 188040 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011794213131789048, + "loss": 0.0289, + "step": 188050 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011793244996353355, + "loss": 0.0286, + "step": 188060 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011792276860917663, + "loss": 0.0313, + "step": 188070 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011791308725481968, + "loss": 0.03, + "step": 188080 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011790340590046275, + "loss": 0.0362, + "step": 188090 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011789372454610583, + "loss": 0.0354, + "step": 188100 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001178840431917489, + "loss": 0.0331, + "step": 188110 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011787436183739196, + "loss": 0.0279, + "step": 188120 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011786468048303503, + "loss": 0.0334, + "step": 188130 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011785499912867811, + "loss": 0.0354, + "step": 188140 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011784531777432116, + "loss": 0.0314, + "step": 188150 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011783563641996423, + "loss": 0.0332, + "step": 188160 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001178259550656073, + "loss": 0.0364, + "step": 188170 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011781627371125037, + "loss": 0.0289, + "step": 188180 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011780659235689343, + "loss": 0.0305, + "step": 188190 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001177969110025365, + "loss": 0.0285, + "step": 188200 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011778722964817957, + "loss": 0.0306, + "step": 188210 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011777754829382264, + "loss": 0.0303, + "step": 188220 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001177678669394657, + "loss": 0.0353, + "step": 188230 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011775818558510878, + "loss": 0.0282, + "step": 188240 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011774850423075185, + "loss": 0.0334, + "step": 188250 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001177388228763949, + "loss": 0.0308, + "step": 188260 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011772914152203798, + "loss": 0.0302, + "step": 188270 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011771946016768105, + "loss": 0.0296, + "step": 188280 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001177097788133241, + "loss": 0.0301, + "step": 188290 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011770009745896718, + "loss": 0.0328, + "step": 188300 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011769041610461025, + "loss": 0.0325, + "step": 188310 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011768073475025333, + "loss": 0.0297, + "step": 188320 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011767105339589638, + "loss": 0.0341, + "step": 188330 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011766137204153946, + "loss": 0.0299, + "step": 188340 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011765169068718253, + "loss": 0.0347, + "step": 188350 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011764200933282558, + "loss": 0.033, + "step": 188360 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011763232797846866, + "loss": 0.0292, + "step": 188370 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011762264662411172, + "loss": 0.0309, + "step": 188380 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001176129652697548, + "loss": 0.0299, + "step": 188390 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011760328391539786, + "loss": 0.0385, + "step": 188400 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011759360256104092, + "loss": 0.0317, + "step": 188410 + }, + { + "epoch": 1.22, + "learning_rate": 0.000117583921206684, + "loss": 0.0332, + "step": 188420 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011757423985232706, + "loss": 0.0263, + "step": 188430 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011756455849797014, + "loss": 0.0341, + "step": 188440 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001175548771436132, + "loss": 0.0313, + "step": 188450 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011754519578925627, + "loss": 0.0258, + "step": 188460 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011753551443489933, + "loss": 0.0297, + "step": 188470 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001175258330805424, + "loss": 0.0309, + "step": 188480 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011751615172618548, + "loss": 0.0284, + "step": 188490 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011750647037182853, + "loss": 0.0296, + "step": 188500 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001174967890174716, + "loss": 0.033, + "step": 188510 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011748710766311468, + "loss": 0.029, + "step": 188520 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011747742630875775, + "loss": 0.0327, + "step": 188530 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011746774495440081, + "loss": 0.031, + "step": 188540 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011745806360004388, + "loss": 0.0331, + "step": 188550 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011744838224568694, + "loss": 0.0315, + "step": 188560 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011743870089133001, + "loss": 0.0288, + "step": 188570 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011742901953697308, + "loss": 0.0347, + "step": 188580 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011741933818261616, + "loss": 0.0345, + "step": 188590 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011740965682825922, + "loss": 0.034, + "step": 188600 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011739997547390228, + "loss": 0.0291, + "step": 188610 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011739029411954535, + "loss": 0.0347, + "step": 188620 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011738061276518842, + "loss": 0.0285, + "step": 188630 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011737093141083149, + "loss": 0.0361, + "step": 188640 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011736125005647455, + "loss": 0.0358, + "step": 188650 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011735156870211762, + "loss": 0.0298, + "step": 188660 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001173418873477607, + "loss": 0.0311, + "step": 188670 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011733220599340375, + "loss": 0.0274, + "step": 188680 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011732252463904683, + "loss": 0.037, + "step": 188690 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001173128432846899, + "loss": 0.0329, + "step": 188700 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011730316193033295, + "loss": 0.0321, + "step": 188710 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011729348057597603, + "loss": 0.0312, + "step": 188720 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001172837992216191, + "loss": 0.0331, + "step": 188730 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011727411786726218, + "loss": 0.0331, + "step": 188740 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011726443651290523, + "loss": 0.037, + "step": 188750 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011725475515854831, + "loss": 0.0368, + "step": 188760 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011724507380419138, + "loss": 0.0305, + "step": 188770 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011723539244983443, + "loss": 0.0361, + "step": 188780 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011722571109547751, + "loss": 0.0255, + "step": 188790 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011721602974112057, + "loss": 0.039, + "step": 188800 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011720634838676365, + "loss": 0.0334, + "step": 188810 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001171966670324067, + "loss": 0.0359, + "step": 188820 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011718698567804977, + "loss": 0.0302, + "step": 188830 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011717730432369285, + "loss": 0.0276, + "step": 188840 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001171676229693359, + "loss": 0.0349, + "step": 188850 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011715794161497899, + "loss": 0.0358, + "step": 188860 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011714826026062205, + "loss": 0.0313, + "step": 188870 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011713857890626512, + "loss": 0.0342, + "step": 188880 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011712889755190818, + "loss": 0.0257, + "step": 188890 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011711921619755125, + "loss": 0.031, + "step": 188900 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011710953484319433, + "loss": 0.031, + "step": 188910 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011709985348883738, + "loss": 0.0251, + "step": 188920 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011709017213448045, + "loss": 0.0294, + "step": 188930 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011708049078012353, + "loss": 0.0326, + "step": 188940 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001170708094257666, + "loss": 0.0333, + "step": 188950 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011706112807140966, + "loss": 0.0319, + "step": 188960 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011705144671705273, + "loss": 0.026, + "step": 188970 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001170417653626958, + "loss": 0.0325, + "step": 188980 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011703208400833886, + "loss": 0.0325, + "step": 188990 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011702240265398193, + "loss": 0.0338, + "step": 189000 + }, + { + "epoch": 1.22, + "eval_cer": 0.9199575189244154, + "eval_loss": 0.02248038910329342, + "eval_runtime": 120.1814, + "eval_samples_per_second": 16.642, + "eval_steps_per_second": 4.16, + "step": 189000 + }, + { + "epoch": 1.22, + "learning_rate": 0.000117012721299625, + "loss": 0.0337, + "step": 189010 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011700303994526807, + "loss": 0.0304, + "step": 189020 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011699335859091112, + "loss": 0.0317, + "step": 189030 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001169836772365542, + "loss": 0.0345, + "step": 189040 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011697399588219727, + "loss": 0.0378, + "step": 189050 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011696431452784034, + "loss": 0.0291, + "step": 189060 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001169546331734834, + "loss": 0.0362, + "step": 189070 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011694495181912647, + "loss": 0.0331, + "step": 189080 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011693527046476955, + "loss": 0.0343, + "step": 189090 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001169255891104126, + "loss": 0.0334, + "step": 189100 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011691590775605568, + "loss": 0.0376, + "step": 189110 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011690622640169875, + "loss": 0.031, + "step": 189120 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001168965450473418, + "loss": 0.0347, + "step": 189130 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011688686369298488, + "loss": 0.0268, + "step": 189140 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011687718233862795, + "loss": 0.0298, + "step": 189150 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011686750098427103, + "loss": 0.0329, + "step": 189160 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011685781962991408, + "loss": 0.0338, + "step": 189170 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011684813827555715, + "loss": 0.0336, + "step": 189180 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011683845692120023, + "loss": 0.0338, + "step": 189190 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011682877556684328, + "loss": 0.0298, + "step": 189200 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011681909421248636, + "loss": 0.0252, + "step": 189210 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011680941285812942, + "loss": 0.0349, + "step": 189220 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001167997315037725, + "loss": 0.0306, + "step": 189230 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011679005014941556, + "loss": 0.0293, + "step": 189240 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011678036879505862, + "loss": 0.029, + "step": 189250 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001167706874407017, + "loss": 0.0261, + "step": 189260 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011676100608634476, + "loss": 0.028, + "step": 189270 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011675132473198782, + "loss": 0.0272, + "step": 189280 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001167416433776309, + "loss": 0.0305, + "step": 189290 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011673196202327397, + "loss": 0.0314, + "step": 189300 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011672228066891703, + "loss": 0.0278, + "step": 189310 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001167125993145601, + "loss": 0.0285, + "step": 189320 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011670291796020318, + "loss": 0.0351, + "step": 189330 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011669323660584623, + "loss": 0.031, + "step": 189340 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001166835552514893, + "loss": 0.0306, + "step": 189350 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011667387389713238, + "loss": 0.029, + "step": 189360 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011666419254277544, + "loss": 0.0303, + "step": 189370 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001166545111884185, + "loss": 0.0286, + "step": 189380 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011664482983406158, + "loss": 0.0327, + "step": 189390 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011663514847970464, + "loss": 0.0302, + "step": 189400 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011662546712534771, + "loss": 0.0346, + "step": 189410 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011661578577099078, + "loss": 0.029, + "step": 189420 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011660610441663386, + "loss": 0.0311, + "step": 189430 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011659642306227692, + "loss": 0.0278, + "step": 189440 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011658674170791997, + "loss": 0.0364, + "step": 189450 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011657706035356305, + "loss": 0.0292, + "step": 189460 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011656737899920612, + "loss": 0.0288, + "step": 189470 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011655769764484917, + "loss": 0.0257, + "step": 189480 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011654801629049225, + "loss": 0.0292, + "step": 189490 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011653833493613532, + "loss": 0.0333, + "step": 189500 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001165286535817784, + "loss": 0.0262, + "step": 189510 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011651897222742145, + "loss": 0.0319, + "step": 189520 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011650929087306453, + "loss": 0.0311, + "step": 189530 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001164996095187076, + "loss": 0.0356, + "step": 189540 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011648992816435065, + "loss": 0.0348, + "step": 189550 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011648024680999373, + "loss": 0.0348, + "step": 189560 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001164705654556368, + "loss": 0.0348, + "step": 189570 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011646088410127988, + "loss": 0.0281, + "step": 189580 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011645120274692293, + "loss": 0.0332, + "step": 189590 + }, + { + "epoch": 1.22, + "learning_rate": 0.000116441521392566, + "loss": 0.0315, + "step": 189600 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011643184003820908, + "loss": 0.0273, + "step": 189610 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011642215868385213, + "loss": 0.0365, + "step": 189620 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011641247732949521, + "loss": 0.037, + "step": 189630 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011640279597513827, + "loss": 0.0307, + "step": 189640 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011639311462078135, + "loss": 0.0256, + "step": 189650 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001163834332664244, + "loss": 0.0275, + "step": 189660 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011637375191206747, + "loss": 0.0319, + "step": 189670 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011636407055771055, + "loss": 0.0325, + "step": 189680 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001163543892033536, + "loss": 0.0401, + "step": 189690 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011634470784899667, + "loss": 0.0311, + "step": 189700 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011633502649463975, + "loss": 0.0332, + "step": 189710 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011632534514028282, + "loss": 0.031, + "step": 189720 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011631566378592588, + "loss": 0.0307, + "step": 189730 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011630598243156895, + "loss": 0.025, + "step": 189740 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011629630107721203, + "loss": 0.0318, + "step": 189750 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011628661972285508, + "loss": 0.0338, + "step": 189760 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011627693836849815, + "loss": 0.0318, + "step": 189770 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011626725701414123, + "loss": 0.0332, + "step": 189780 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001162575756597843, + "loss": 0.0262, + "step": 189790 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011624789430542735, + "loss": 0.032, + "step": 189800 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011623821295107043, + "loss": 0.0337, + "step": 189810 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001162285315967135, + "loss": 0.0263, + "step": 189820 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011621885024235656, + "loss": 0.0325, + "step": 189830 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011620916888799963, + "loss": 0.0377, + "step": 189840 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001161994875336427, + "loss": 0.0291, + "step": 189850 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011618980617928577, + "loss": 0.0298, + "step": 189860 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011618012482492882, + "loss": 0.0301, + "step": 189870 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001161704434705719, + "loss": 0.034, + "step": 189880 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011616076211621497, + "loss": 0.0293, + "step": 189890 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011615108076185802, + "loss": 0.0327, + "step": 189900 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001161413994075011, + "loss": 0.0305, + "step": 189910 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011613171805314417, + "loss": 0.0283, + "step": 189920 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011612203669878725, + "loss": 0.0279, + "step": 189930 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001161123553444303, + "loss": 0.0287, + "step": 189940 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011610267399007338, + "loss": 0.0286, + "step": 189950 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011609299263571645, + "loss": 0.0336, + "step": 189960 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001160833112813595, + "loss": 0.0389, + "step": 189970 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011607362992700258, + "loss": 0.0419, + "step": 189980 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011606394857264565, + "loss": 0.0321, + "step": 189990 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011605426721828873, + "loss": 0.0315, + "step": 190000 + }, + { + "epoch": 1.23, + "eval_cer": 0.9198580951304938, + "eval_loss": 0.02292782999575138, + "eval_runtime": 120.2546, + "eval_samples_per_second": 16.631, + "eval_steps_per_second": 4.158, + "step": 190000 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011604458586393178, + "loss": 0.0329, + "step": 190010 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011603490450957485, + "loss": 0.0348, + "step": 190020 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011602522315521792, + "loss": 0.0299, + "step": 190030 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011601554180086098, + "loss": 0.0266, + "step": 190040 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011600586044650406, + "loss": 0.0321, + "step": 190050 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011599617909214712, + "loss": 0.0321, + "step": 190060 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011598649773779019, + "loss": 0.0311, + "step": 190070 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011597681638343326, + "loss": 0.0321, + "step": 190080 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011596713502907632, + "loss": 0.0325, + "step": 190090 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001159574536747194, + "loss": 0.0327, + "step": 190100 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011594777232036245, + "loss": 0.0339, + "step": 190110 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011593809096600552, + "loss": 0.0298, + "step": 190120 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001159284096116486, + "loss": 0.0303, + "step": 190130 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011591872825729167, + "loss": 0.0373, + "step": 190140 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011590904690293473, + "loss": 0.0275, + "step": 190150 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001158993655485778, + "loss": 0.0303, + "step": 190160 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011588968419422087, + "loss": 0.0295, + "step": 190170 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011588000283986393, + "loss": 0.0323, + "step": 190180 + }, + { + "epoch": 1.23, + "learning_rate": 0.000115870321485507, + "loss": 0.0301, + "step": 190190 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011586064013115008, + "loss": 0.0276, + "step": 190200 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011585095877679314, + "loss": 0.03, + "step": 190210 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001158412774224362, + "loss": 0.0302, + "step": 190220 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011583159606807928, + "loss": 0.0286, + "step": 190230 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011582191471372234, + "loss": 0.0362, + "step": 190240 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011581223335936541, + "loss": 0.0326, + "step": 190250 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011580255200500848, + "loss": 0.0277, + "step": 190260 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011579287065065154, + "loss": 0.0333, + "step": 190270 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011578318929629462, + "loss": 0.0263, + "step": 190280 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011577350794193767, + "loss": 0.0313, + "step": 190290 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011576382658758075, + "loss": 0.0327, + "step": 190300 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011575414523322382, + "loss": 0.0304, + "step": 190310 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011574446387886687, + "loss": 0.0294, + "step": 190320 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011573478252450995, + "loss": 0.0331, + "step": 190330 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011572510117015302, + "loss": 0.0312, + "step": 190340 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001157154198157961, + "loss": 0.0313, + "step": 190350 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011570573846143915, + "loss": 0.0276, + "step": 190360 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011569605710708222, + "loss": 0.036, + "step": 190370 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001156863757527253, + "loss": 0.03, + "step": 190380 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011567669439836835, + "loss": 0.0372, + "step": 190390 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011566701304401143, + "loss": 0.0311, + "step": 190400 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001156573316896545, + "loss": 0.0343, + "step": 190410 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011564765033529758, + "loss": 0.0321, + "step": 190420 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011563796898094063, + "loss": 0.0268, + "step": 190430 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001156282876265837, + "loss": 0.0314, + "step": 190440 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011561860627222677, + "loss": 0.0317, + "step": 190450 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011560892491786983, + "loss": 0.0358, + "step": 190460 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001155992435635129, + "loss": 0.0299, + "step": 190470 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011558956220915597, + "loss": 0.0321, + "step": 190480 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011557988085479904, + "loss": 0.0276, + "step": 190490 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001155701995004421, + "loss": 0.0286, + "step": 190500 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011556051814608517, + "loss": 0.0311, + "step": 190510 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011555083679172825, + "loss": 0.0261, + "step": 190520 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001155411554373713, + "loss": 0.0327, + "step": 190530 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011553147408301437, + "loss": 0.0291, + "step": 190540 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011552179272865745, + "loss": 0.0328, + "step": 190550 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011551211137430052, + "loss": 0.0327, + "step": 190560 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011550243001994357, + "loss": 0.0308, + "step": 190570 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011549274866558665, + "loss": 0.032, + "step": 190580 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011548306731122972, + "loss": 0.0323, + "step": 190590 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011547338595687278, + "loss": 0.0329, + "step": 190600 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011546370460251585, + "loss": 0.0349, + "step": 190610 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011545402324815893, + "loss": 0.0326, + "step": 190620 + }, + { + "epoch": 1.23, + "learning_rate": 0.000115444341893802, + "loss": 0.03, + "step": 190630 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011543466053944505, + "loss": 0.0305, + "step": 190640 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011542497918508813, + "loss": 0.0373, + "step": 190650 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011541529783073119, + "loss": 0.0313, + "step": 190660 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011540561647637425, + "loss": 0.0316, + "step": 190670 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011539593512201733, + "loss": 0.0304, + "step": 190680 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011538625376766039, + "loss": 0.0322, + "step": 190690 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011537657241330347, + "loss": 0.029, + "step": 190700 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011536689105894652, + "loss": 0.0319, + "step": 190710 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001153572097045896, + "loss": 0.0318, + "step": 190720 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011534752835023267, + "loss": 0.0295, + "step": 190730 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011533784699587572, + "loss": 0.0319, + "step": 190740 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001153281656415188, + "loss": 0.0308, + "step": 190750 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011531848428716187, + "loss": 0.0298, + "step": 190760 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011530880293280495, + "loss": 0.0313, + "step": 190770 + }, + { + "epoch": 1.23, + "learning_rate": 0.000115299121578448, + "loss": 0.0338, + "step": 190780 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011528944022409107, + "loss": 0.0387, + "step": 190790 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011527975886973415, + "loss": 0.0272, + "step": 190800 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001152700775153772, + "loss": 0.035, + "step": 190810 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011526039616102028, + "loss": 0.0305, + "step": 190820 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011525071480666335, + "loss": 0.0367, + "step": 190830 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011524103345230643, + "loss": 0.0319, + "step": 190840 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011523135209794948, + "loss": 0.0307, + "step": 190850 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011522167074359254, + "loss": 0.0308, + "step": 190860 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011521198938923562, + "loss": 0.0362, + "step": 190870 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011520230803487868, + "loss": 0.0278, + "step": 190880 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011519262668052174, + "loss": 0.0344, + "step": 190890 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011518294532616482, + "loss": 0.0307, + "step": 190900 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011517326397180789, + "loss": 0.0312, + "step": 190910 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011516358261745096, + "loss": 0.0318, + "step": 190920 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011515390126309402, + "loss": 0.0324, + "step": 190930 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001151442199087371, + "loss": 0.0362, + "step": 190940 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011513453855438015, + "loss": 0.0316, + "step": 190950 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011512485720002322, + "loss": 0.0275, + "step": 190960 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001151151758456663, + "loss": 0.0259, + "step": 190970 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011510549449130937, + "loss": 0.0332, + "step": 190980 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011509581313695242, + "loss": 0.0322, + "step": 190990 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001150861317825955, + "loss": 0.0369, + "step": 191000 + }, + { + "epoch": 1.23, + "eval_cer": 0.9199421534289911, + "eval_loss": 0.022925306111574173, + "eval_runtime": 120.1456, + "eval_samples_per_second": 16.646, + "eval_steps_per_second": 4.162, + "step": 191000 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011507645042823857, + "loss": 0.0278, + "step": 191010 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011506676907388163, + "loss": 0.0316, + "step": 191020 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001150570877195247, + "loss": 0.0279, + "step": 191030 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011504740636516778, + "loss": 0.0319, + "step": 191040 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011503772501081084, + "loss": 0.0293, + "step": 191050 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001150280436564539, + "loss": 0.0337, + "step": 191060 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011501836230209698, + "loss": 0.0307, + "step": 191070 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011500868094774004, + "loss": 0.0276, + "step": 191080 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001149989995933831, + "loss": 0.0281, + "step": 191090 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011498931823902618, + "loss": 0.0303, + "step": 191100 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011497963688466924, + "loss": 0.0333, + "step": 191110 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011496995553031231, + "loss": 0.0311, + "step": 191120 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011496027417595537, + "loss": 0.0264, + "step": 191130 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011495059282159845, + "loss": 0.0343, + "step": 191140 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011494091146724152, + "loss": 0.0326, + "step": 191150 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011493123011288457, + "loss": 0.0276, + "step": 191160 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011492154875852765, + "loss": 0.0376, + "step": 191170 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011491186740417072, + "loss": 0.0362, + "step": 191180 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011490218604981377, + "loss": 0.032, + "step": 191190 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011489250469545685, + "loss": 0.0307, + "step": 191200 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011488282334109992, + "loss": 0.0332, + "step": 191210 + }, + { + "epoch": 1.23, + "learning_rate": 0.000114873141986743, + "loss": 0.042, + "step": 191220 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011486346063238605, + "loss": 0.0345, + "step": 191230 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011485377927802913, + "loss": 0.0305, + "step": 191240 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001148440979236722, + "loss": 0.032, + "step": 191250 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011483441656931525, + "loss": 0.0356, + "step": 191260 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011482473521495833, + "loss": 0.0324, + "step": 191270 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001148150538606014, + "loss": 0.0306, + "step": 191280 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011480537250624447, + "loss": 0.0278, + "step": 191290 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011479569115188753, + "loss": 0.028, + "step": 191300 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001147860097975306, + "loss": 0.0312, + "step": 191310 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011477632844317367, + "loss": 0.0326, + "step": 191320 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011476664708881673, + "loss": 0.0324, + "step": 191330 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001147569657344598, + "loss": 0.0306, + "step": 191340 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011474728438010287, + "loss": 0.0259, + "step": 191350 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011473760302574594, + "loss": 0.025, + "step": 191360 + }, + { + "epoch": 1.24, + "learning_rate": 0.000114727921671389, + "loss": 0.0343, + "step": 191370 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011471824031703207, + "loss": 0.0361, + "step": 191380 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011470855896267515, + "loss": 0.0345, + "step": 191390 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001146988776083182, + "loss": 0.0338, + "step": 191400 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011468919625396127, + "loss": 0.0328, + "step": 191410 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011467951489960435, + "loss": 0.0284, + "step": 191420 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011466983354524742, + "loss": 0.0317, + "step": 191430 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011466015219089048, + "loss": 0.0269, + "step": 191440 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011465047083653355, + "loss": 0.0347, + "step": 191450 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011464078948217661, + "loss": 0.0349, + "step": 191460 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011463110812781968, + "loss": 0.0329, + "step": 191470 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011462142677346275, + "loss": 0.0385, + "step": 191480 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011461174541910583, + "loss": 0.0316, + "step": 191490 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011460206406474889, + "loss": 0.0388, + "step": 191500 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011459238271039195, + "loss": 0.0277, + "step": 191510 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011458270135603502, + "loss": 0.033, + "step": 191520 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011457302000167809, + "loss": 0.0264, + "step": 191530 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011456333864732116, + "loss": 0.0358, + "step": 191540 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011455365729296422, + "loss": 0.0299, + "step": 191550 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011454397593860729, + "loss": 0.0286, + "step": 191560 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011453429458425037, + "loss": 0.0311, + "step": 191570 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011452461322989342, + "loss": 0.0304, + "step": 191580 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001145149318755365, + "loss": 0.0374, + "step": 191590 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011450525052117957, + "loss": 0.0308, + "step": 191600 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011449556916682262, + "loss": 0.0283, + "step": 191610 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001144858878124657, + "loss": 0.0285, + "step": 191620 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011447620645810877, + "loss": 0.0295, + "step": 191630 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011446652510375185, + "loss": 0.0315, + "step": 191640 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001144568437493949, + "loss": 0.0293, + "step": 191650 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011444716239503797, + "loss": 0.0299, + "step": 191660 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011443748104068105, + "loss": 0.0325, + "step": 191670 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001144277996863241, + "loss": 0.0298, + "step": 191680 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011441811833196718, + "loss": 0.0262, + "step": 191690 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011440843697761024, + "loss": 0.0334, + "step": 191700 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011439875562325332, + "loss": 0.0292, + "step": 191710 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011438907426889638, + "loss": 0.0294, + "step": 191720 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011437939291453944, + "loss": 0.0412, + "step": 191730 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011436971156018252, + "loss": 0.0295, + "step": 191740 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011436003020582558, + "loss": 0.0367, + "step": 191750 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011435034885146864, + "loss": 0.0315, + "step": 191760 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011434066749711172, + "loss": 0.0297, + "step": 191770 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011433098614275479, + "loss": 0.032, + "step": 191780 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011432130478839785, + "loss": 0.0304, + "step": 191790 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011431162343404092, + "loss": 0.0297, + "step": 191800 + }, + { + "epoch": 1.24, + "learning_rate": 0.000114301942079684, + "loss": 0.0259, + "step": 191810 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011429226072532705, + "loss": 0.0304, + "step": 191820 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011428257937097012, + "loss": 0.0318, + "step": 191830 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001142728980166132, + "loss": 0.0331, + "step": 191840 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011426321666225627, + "loss": 0.0298, + "step": 191850 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011425353530789932, + "loss": 0.0286, + "step": 191860 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001142438539535424, + "loss": 0.0275, + "step": 191870 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011423417259918546, + "loss": 0.0257, + "step": 191880 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011422449124482853, + "loss": 0.0272, + "step": 191890 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001142148098904716, + "loss": 0.031, + "step": 191900 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011420512853611468, + "loss": 0.0342, + "step": 191910 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011419544718175774, + "loss": 0.0271, + "step": 191920 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001141857658274008, + "loss": 0.033, + "step": 191930 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011417608447304387, + "loss": 0.0278, + "step": 191940 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011416640311868694, + "loss": 0.0374, + "step": 191950 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011415672176433, + "loss": 0.03, + "step": 191960 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011414704040997307, + "loss": 0.031, + "step": 191970 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011413735905561614, + "loss": 0.0376, + "step": 191980 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011412767770125922, + "loss": 0.0343, + "step": 191990 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011411799634690227, + "loss": 0.0288, + "step": 192000 + }, + { + "epoch": 1.24, + "eval_cer": 0.919876172183934, + "eval_loss": 0.022667761892080307, + "eval_runtime": 120.1644, + "eval_samples_per_second": 16.644, + "eval_steps_per_second": 4.161, + "step": 192000 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011410831499254535, + "loss": 0.0354, + "step": 192010 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011409863363818842, + "loss": 0.0436, + "step": 192020 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011408895228383147, + "loss": 0.0312, + "step": 192030 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011407927092947455, + "loss": 0.0304, + "step": 192040 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011406958957511762, + "loss": 0.0317, + "step": 192050 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001140599082207607, + "loss": 0.0326, + "step": 192060 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011405022686640375, + "loss": 0.0348, + "step": 192070 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011404054551204682, + "loss": 0.0379, + "step": 192080 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001140308641576899, + "loss": 0.0286, + "step": 192090 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011402118280333295, + "loss": 0.0367, + "step": 192100 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011401150144897603, + "loss": 0.0296, + "step": 192110 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001140018200946191, + "loss": 0.0297, + "step": 192120 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011399213874026217, + "loss": 0.032, + "step": 192130 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011398245738590523, + "loss": 0.0348, + "step": 192140 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011397277603154829, + "loss": 0.0309, + "step": 192150 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011396309467719137, + "loss": 0.0322, + "step": 192160 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011395341332283443, + "loss": 0.0335, + "step": 192170 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011394373196847749, + "loss": 0.0296, + "step": 192180 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011393405061412057, + "loss": 0.0346, + "step": 192190 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011392436925976364, + "loss": 0.0367, + "step": 192200 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001139146879054067, + "loss": 0.0334, + "step": 192210 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011390500655104977, + "loss": 0.0307, + "step": 192220 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011389532519669285, + "loss": 0.0351, + "step": 192230 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001138856438423359, + "loss": 0.027, + "step": 192240 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011387596248797897, + "loss": 0.0323, + "step": 192250 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011386628113362205, + "loss": 0.0302, + "step": 192260 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011385659977926511, + "loss": 0.0369, + "step": 192270 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011384691842490817, + "loss": 0.0244, + "step": 192280 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011383723707055125, + "loss": 0.0279, + "step": 192290 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011382755571619431, + "loss": 0.0266, + "step": 192300 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011381787436183738, + "loss": 0.0308, + "step": 192310 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011380819300748045, + "loss": 0.0332, + "step": 192320 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011379851165312353, + "loss": 0.0272, + "step": 192330 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011378883029876659, + "loss": 0.0361, + "step": 192340 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011377914894440964, + "loss": 0.0287, + "step": 192350 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011376946759005272, + "loss": 0.0294, + "step": 192360 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011375978623569579, + "loss": 0.0321, + "step": 192370 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011375010488133884, + "loss": 0.0317, + "step": 192380 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011374042352698192, + "loss": 0.0287, + "step": 192390 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011373074217262499, + "loss": 0.0293, + "step": 192400 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011372106081826807, + "loss": 0.0316, + "step": 192410 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011371137946391112, + "loss": 0.032, + "step": 192420 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001137016981095542, + "loss": 0.0333, + "step": 192430 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011369201675519727, + "loss": 0.0299, + "step": 192440 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011368233540084032, + "loss": 0.0334, + "step": 192450 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001136726540464834, + "loss": 0.0298, + "step": 192460 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011366297269212647, + "loss": 0.0319, + "step": 192470 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011365329133776955, + "loss": 0.0365, + "step": 192480 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001136436099834126, + "loss": 0.0322, + "step": 192490 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011363392862905567, + "loss": 0.0355, + "step": 192500 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011362424727469875, + "loss": 0.0326, + "step": 192510 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001136145659203418, + "loss": 0.0352, + "step": 192520 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011360488456598488, + "loss": 0.0347, + "step": 192530 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011359520321162794, + "loss": 0.0297, + "step": 192540 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011358552185727101, + "loss": 0.0284, + "step": 192550 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011357584050291408, + "loss": 0.0282, + "step": 192560 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011356615914855714, + "loss": 0.029, + "step": 192570 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011355647779420022, + "loss": 0.0259, + "step": 192580 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011354679643984328, + "loss": 0.032, + "step": 192590 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011353711508548634, + "loss": 0.0341, + "step": 192600 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011352743373112942, + "loss": 0.0326, + "step": 192610 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011351775237677249, + "loss": 0.0309, + "step": 192620 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011350807102241555, + "loss": 0.0291, + "step": 192630 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011349838966805862, + "loss": 0.0345, + "step": 192640 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011348870831370169, + "loss": 0.0326, + "step": 192650 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011347902695934475, + "loss": 0.0333, + "step": 192660 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011346934560498782, + "loss": 0.03, + "step": 192670 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001134596642506309, + "loss": 0.0273, + "step": 192680 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011344998289627396, + "loss": 0.0274, + "step": 192690 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011344030154191702, + "loss": 0.0288, + "step": 192700 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001134306201875601, + "loss": 0.024, + "step": 192710 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011342093883320316, + "loss": 0.0298, + "step": 192720 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011341125747884623, + "loss": 0.034, + "step": 192730 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001134015761244893, + "loss": 0.029, + "step": 192740 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011339189477013236, + "loss": 0.0326, + "step": 192750 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011338221341577544, + "loss": 0.031, + "step": 192760 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001133725320614185, + "loss": 0.0262, + "step": 192770 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011336285070706157, + "loss": 0.0386, + "step": 192780 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011335316935270464, + "loss": 0.0325, + "step": 192790 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001133434879983477, + "loss": 0.0313, + "step": 192800 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011333380664399077, + "loss": 0.0314, + "step": 192810 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011332412528963384, + "loss": 0.0287, + "step": 192820 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011331444393527692, + "loss": 0.0316, + "step": 192830 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011330476258091997, + "loss": 0.0371, + "step": 192840 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011329508122656304, + "loss": 0.0322, + "step": 192850 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011328539987220612, + "loss": 0.0316, + "step": 192860 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011327571851784917, + "loss": 0.0327, + "step": 192870 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011326603716349225, + "loss": 0.0351, + "step": 192880 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011325635580913532, + "loss": 0.0263, + "step": 192890 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001132466744547784, + "loss": 0.0273, + "step": 192900 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011323699310042145, + "loss": 0.0283, + "step": 192910 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011322731174606452, + "loss": 0.0299, + "step": 192920 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001132176303917076, + "loss": 0.0263, + "step": 192930 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011320794903735065, + "loss": 0.0311, + "step": 192940 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011319826768299371, + "loss": 0.0304, + "step": 192950 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001131885863286368, + "loss": 0.0293, + "step": 192960 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011317890497427986, + "loss": 0.0375, + "step": 192970 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011316922361992293, + "loss": 0.0302, + "step": 192980 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011315954226556599, + "loss": 0.0303, + "step": 192990 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011314986091120907, + "loss": 0.0344, + "step": 193000 + }, + { + "epoch": 1.25, + "eval_cer": 0.9198716529205739, + "eval_loss": 0.022520260885357857, + "eval_runtime": 120.1842, + "eval_samples_per_second": 16.641, + "eval_steps_per_second": 4.16, + "step": 193000 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011314017955685212, + "loss": 0.0279, + "step": 193010 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011313049820249519, + "loss": 0.0348, + "step": 193020 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011312081684813827, + "loss": 0.0312, + "step": 193030 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011311113549378134, + "loss": 0.029, + "step": 193040 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001131014541394244, + "loss": 0.0353, + "step": 193050 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011309177278506747, + "loss": 0.0343, + "step": 193060 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011308209143071054, + "loss": 0.0286, + "step": 193070 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001130724100763536, + "loss": 0.0294, + "step": 193080 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011306272872199667, + "loss": 0.0328, + "step": 193090 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011305304736763975, + "loss": 0.0326, + "step": 193100 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011304336601328281, + "loss": 0.0283, + "step": 193110 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011303368465892587, + "loss": 0.0255, + "step": 193120 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011302400330456895, + "loss": 0.0353, + "step": 193130 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011301432195021201, + "loss": 0.0302, + "step": 193140 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011300464059585508, + "loss": 0.0267, + "step": 193150 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011299495924149815, + "loss": 0.0316, + "step": 193160 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011298527788714121, + "loss": 0.0304, + "step": 193170 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011297559653278429, + "loss": 0.0344, + "step": 193180 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011296591517842734, + "loss": 0.0339, + "step": 193190 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011295623382407042, + "loss": 0.0311, + "step": 193200 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011294655246971349, + "loss": 0.0292, + "step": 193210 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011293687111535654, + "loss": 0.0264, + "step": 193220 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011292718976099962, + "loss": 0.0355, + "step": 193230 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011291750840664269, + "loss": 0.0326, + "step": 193240 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011290782705228577, + "loss": 0.0242, + "step": 193250 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011289814569792882, + "loss": 0.0309, + "step": 193260 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011288846434357189, + "loss": 0.0293, + "step": 193270 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011287878298921497, + "loss": 0.0309, + "step": 193280 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011286910163485802, + "loss": 0.0323, + "step": 193290 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001128594202805011, + "loss": 0.0303, + "step": 193300 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011284973892614417, + "loss": 0.0332, + "step": 193310 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011284005757178725, + "loss": 0.0302, + "step": 193320 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001128303762174303, + "loss": 0.0304, + "step": 193330 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011282069486307337, + "loss": 0.0328, + "step": 193340 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011281101350871644, + "loss": 0.0302, + "step": 193350 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001128013321543595, + "loss": 0.0402, + "step": 193360 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011279165080000256, + "loss": 0.0293, + "step": 193370 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011278196944564564, + "loss": 0.0355, + "step": 193380 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011277228809128871, + "loss": 0.0268, + "step": 193390 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011276260673693178, + "loss": 0.0293, + "step": 193400 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011275292538257484, + "loss": 0.0342, + "step": 193410 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011274324402821792, + "loss": 0.0313, + "step": 193420 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011273356267386097, + "loss": 0.027, + "step": 193430 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011272388131950404, + "loss": 0.0329, + "step": 193440 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011271419996514712, + "loss": 0.035, + "step": 193450 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011270451861079019, + "loss": 0.033, + "step": 193460 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011269483725643324, + "loss": 0.0353, + "step": 193470 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011268515590207632, + "loss": 0.0332, + "step": 193480 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011267547454771939, + "loss": 0.033, + "step": 193490 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011266579319336245, + "loss": 0.031, + "step": 193500 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011265611183900552, + "loss": 0.027, + "step": 193510 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001126464304846486, + "loss": 0.032, + "step": 193520 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011263674913029166, + "loss": 0.0346, + "step": 193530 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011262706777593472, + "loss": 0.0286, + "step": 193540 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001126173864215778, + "loss": 0.0303, + "step": 193550 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011260770506722086, + "loss": 0.03, + "step": 193560 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011259802371286392, + "loss": 0.0273, + "step": 193570 + }, + { + "epoch": 1.25, + "learning_rate": 0.000112588342358507, + "loss": 0.029, + "step": 193580 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011257866100415006, + "loss": 0.031, + "step": 193590 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011256897964979314, + "loss": 0.0335, + "step": 193600 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001125592982954362, + "loss": 0.0356, + "step": 193610 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011254961694107927, + "loss": 0.0305, + "step": 193620 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011253993558672234, + "loss": 0.0284, + "step": 193630 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011253025423236539, + "loss": 0.033, + "step": 193640 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011252057287800847, + "loss": 0.032, + "step": 193650 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011251089152365154, + "loss": 0.0291, + "step": 193660 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011250121016929462, + "loss": 0.0272, + "step": 193670 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011249152881493767, + "loss": 0.0288, + "step": 193680 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011248184746058074, + "loss": 0.0303, + "step": 193690 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011247216610622382, + "loss": 0.029, + "step": 193700 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011246248475186687, + "loss": 0.0263, + "step": 193710 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011245280339750995, + "loss": 0.0328, + "step": 193720 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011244312204315302, + "loss": 0.0314, + "step": 193730 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001124334406887961, + "loss": 0.0381, + "step": 193740 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011242375933443915, + "loss": 0.0297, + "step": 193750 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011241407798008221, + "loss": 0.0281, + "step": 193760 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001124043966257253, + "loss": 0.0252, + "step": 193770 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011239471527136835, + "loss": 0.0303, + "step": 193780 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011238503391701141, + "loss": 0.0322, + "step": 193790 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001123753525626545, + "loss": 0.037, + "step": 193800 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011236567120829756, + "loss": 0.0343, + "step": 193810 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011235598985394063, + "loss": 0.0336, + "step": 193820 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011234630849958369, + "loss": 0.0352, + "step": 193830 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011233662714522677, + "loss": 0.0303, + "step": 193840 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011232694579086982, + "loss": 0.0322, + "step": 193850 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011231726443651289, + "loss": 0.0327, + "step": 193860 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011230758308215597, + "loss": 0.03, + "step": 193870 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011229790172779904, + "loss": 0.0299, + "step": 193880 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011228822037344209, + "loss": 0.0366, + "step": 193890 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011227853901908517, + "loss": 0.0279, + "step": 193900 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011226885766472824, + "loss": 0.0335, + "step": 193910 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001122591763103713, + "loss": 0.0281, + "step": 193920 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011224949495601437, + "loss": 0.0348, + "step": 193930 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011223981360165745, + "loss": 0.0342, + "step": 193940 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011223013224730051, + "loss": 0.0396, + "step": 193950 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011222045089294357, + "loss": 0.0315, + "step": 193960 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011221076953858665, + "loss": 0.0292, + "step": 193970 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011220108818422971, + "loss": 0.0317, + "step": 193980 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011219140682987277, + "loss": 0.0346, + "step": 193990 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011218172547551585, + "loss": 0.0283, + "step": 194000 + }, + { + "epoch": 1.25, + "eval_cer": 0.91987436447859, + "eval_loss": 0.022109534591436386, + "eval_runtime": 120.1821, + "eval_samples_per_second": 16.641, + "eval_steps_per_second": 4.16, + "step": 194000 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011217204412115891, + "loss": 0.0379, + "step": 194010 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011216236276680199, + "loss": 0.0315, + "step": 194020 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011215268141244504, + "loss": 0.0361, + "step": 194030 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011214300005808812, + "loss": 0.0365, + "step": 194040 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011213331870373119, + "loss": 0.0301, + "step": 194050 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011212363734937424, + "loss": 0.0329, + "step": 194060 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011211395599501732, + "loss": 0.0312, + "step": 194070 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011210427464066039, + "loss": 0.0357, + "step": 194080 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011209459328630347, + "loss": 0.0286, + "step": 194090 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011208491193194652, + "loss": 0.0273, + "step": 194100 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011207523057758959, + "loss": 0.0322, + "step": 194110 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011206554922323267, + "loss": 0.028, + "step": 194120 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011205586786887572, + "loss": 0.034, + "step": 194130 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001120461865145188, + "loss": 0.0278, + "step": 194140 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011203650516016187, + "loss": 0.028, + "step": 194150 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011202682380580493, + "loss": 0.0314, + "step": 194160 + }, + { + "epoch": 1.25, + "learning_rate": 0.000112017142451448, + "loss": 0.0344, + "step": 194170 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011200746109709106, + "loss": 0.0321, + "step": 194180 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011199777974273414, + "loss": 0.032, + "step": 194190 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001119880983883772, + "loss": 0.0359, + "step": 194200 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011197841703402026, + "loss": 0.0273, + "step": 194210 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011196873567966334, + "loss": 0.0301, + "step": 194220 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011195905432530641, + "loss": 0.0283, + "step": 194230 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011194937297094948, + "loss": 0.0307, + "step": 194240 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011193969161659254, + "loss": 0.0349, + "step": 194250 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011193001026223561, + "loss": 0.0347, + "step": 194260 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011192032890787867, + "loss": 0.0284, + "step": 194270 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011191064755352174, + "loss": 0.0296, + "step": 194280 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011190096619916482, + "loss": 0.028, + "step": 194290 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011189128484480789, + "loss": 0.0305, + "step": 194300 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011188160349045094, + "loss": 0.0307, + "step": 194310 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011187192213609402, + "loss": 0.0275, + "step": 194320 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011186224078173709, + "loss": 0.0368, + "step": 194330 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011185255942738015, + "loss": 0.0307, + "step": 194340 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011184287807302322, + "loss": 0.0303, + "step": 194350 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011183319671866628, + "loss": 0.0327, + "step": 194360 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011182351536430936, + "loss": 0.0291, + "step": 194370 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011181383400995242, + "loss": 0.034, + "step": 194380 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001118041526555955, + "loss": 0.0298, + "step": 194390 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011179447130123856, + "loss": 0.0391, + "step": 194400 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011178478994688162, + "loss": 0.0288, + "step": 194410 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001117751085925247, + "loss": 0.0326, + "step": 194420 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011176542723816776, + "loss": 0.025, + "step": 194430 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011175574588381084, + "loss": 0.0362, + "step": 194440 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001117460645294539, + "loss": 0.0351, + "step": 194450 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011173638317509696, + "loss": 0.0297, + "step": 194460 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011172670182074004, + "loss": 0.0338, + "step": 194470 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011171702046638309, + "loss": 0.0334, + "step": 194480 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011170733911202617, + "loss": 0.0338, + "step": 194490 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011169765775766924, + "loss": 0.0299, + "step": 194500 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011168797640331232, + "loss": 0.0293, + "step": 194510 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011167829504895537, + "loss": 0.0293, + "step": 194520 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011166861369459844, + "loss": 0.0298, + "step": 194530 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011165893234024152, + "loss": 0.0339, + "step": 194540 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011164925098588457, + "loss": 0.0304, + "step": 194550 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011163956963152764, + "loss": 0.0374, + "step": 194560 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011162988827717072, + "loss": 0.0312, + "step": 194570 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011162020692281377, + "loss": 0.0298, + "step": 194580 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011161052556845685, + "loss": 0.0379, + "step": 194590 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011160084421409991, + "loss": 0.0327, + "step": 194600 + }, + { + "epoch": 1.26, + "learning_rate": 0.000111591162859743, + "loss": 0.0315, + "step": 194610 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011158148150538605, + "loss": 0.0276, + "step": 194620 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011157180015102911, + "loss": 0.0408, + "step": 194630 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011156211879667219, + "loss": 0.0329, + "step": 194640 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011155243744231525, + "loss": 0.0318, + "step": 194650 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011154275608795831, + "loss": 0.0331, + "step": 194660 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011153307473360139, + "loss": 0.0269, + "step": 194670 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011152339337924446, + "loss": 0.0274, + "step": 194680 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011151371202488752, + "loss": 0.0291, + "step": 194690 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011150403067053059, + "loss": 0.0296, + "step": 194700 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011149434931617367, + "loss": 0.039, + "step": 194710 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011148466796181672, + "loss": 0.0339, + "step": 194720 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011147498660745979, + "loss": 0.0263, + "step": 194730 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011146530525310287, + "loss": 0.031, + "step": 194740 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011145562389874594, + "loss": 0.0369, + "step": 194750 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011144594254438899, + "loss": 0.0364, + "step": 194760 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011143626119003207, + "loss": 0.028, + "step": 194770 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011142657983567513, + "loss": 0.0291, + "step": 194780 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001114168984813182, + "loss": 0.0341, + "step": 194790 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011140721712696127, + "loss": 0.0282, + "step": 194800 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011139753577260435, + "loss": 0.0347, + "step": 194810 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011138785441824741, + "loss": 0.032, + "step": 194820 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011137817306389047, + "loss": 0.033, + "step": 194830 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011136849170953354, + "loss": 0.0328, + "step": 194840 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011135881035517661, + "loss": 0.0329, + "step": 194850 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011134912900081966, + "loss": 0.0348, + "step": 194860 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011133944764646274, + "loss": 0.0313, + "step": 194870 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011132976629210581, + "loss": 0.0339, + "step": 194880 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011132008493774889, + "loss": 0.0319, + "step": 194890 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011131040358339194, + "loss": 0.0328, + "step": 194900 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011130072222903502, + "loss": 0.0305, + "step": 194910 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011129104087467809, + "loss": 0.0273, + "step": 194920 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011128135952032114, + "loss": 0.0312, + "step": 194930 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011127167816596422, + "loss": 0.0271, + "step": 194940 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011126199681160729, + "loss": 0.029, + "step": 194950 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011125231545725037, + "loss": 0.0308, + "step": 194960 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011124263410289342, + "loss": 0.0296, + "step": 194970 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011123295274853649, + "loss": 0.0385, + "step": 194980 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011122327139417957, + "loss": 0.0269, + "step": 194990 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011121359003982262, + "loss": 0.0377, + "step": 195000 + }, + { + "epoch": 1.26, + "eval_cer": 0.9198336911083493, + "eval_loss": 0.022459572181105614, + "eval_runtime": 120.3875, + "eval_samples_per_second": 16.613, + "eval_steps_per_second": 4.153, + "step": 195000 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001112039086854657, + "loss": 0.0366, + "step": 195010 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011119422733110876, + "loss": 0.0376, + "step": 195020 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011118454597675184, + "loss": 0.0343, + "step": 195030 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001111748646223949, + "loss": 0.0326, + "step": 195040 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011116518326803796, + "loss": 0.0319, + "step": 195050 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011115550191368104, + "loss": 0.03, + "step": 195060 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001111458205593241, + "loss": 0.0323, + "step": 195070 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011113613920496716, + "loss": 0.0299, + "step": 195080 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011112645785061024, + "loss": 0.0343, + "step": 195090 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011111677649625331, + "loss": 0.0304, + "step": 195100 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011110709514189637, + "loss": 0.0339, + "step": 195110 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011109741378753944, + "loss": 0.0282, + "step": 195120 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011108773243318252, + "loss": 0.0297, + "step": 195130 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011107805107882557, + "loss": 0.0273, + "step": 195140 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011106836972446864, + "loss": 0.0277, + "step": 195150 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011105868837011172, + "loss": 0.0366, + "step": 195160 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011104900701575478, + "loss": 0.0285, + "step": 195170 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011103932566139784, + "loss": 0.0302, + "step": 195180 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011102964430704092, + "loss": 0.0305, + "step": 195190 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011101996295268398, + "loss": 0.0314, + "step": 195200 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011101028159832705, + "loss": 0.029, + "step": 195210 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011100060024397012, + "loss": 0.0316, + "step": 195220 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001109909188896132, + "loss": 0.0316, + "step": 195230 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011098123753525626, + "loss": 0.035, + "step": 195240 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011097155618089931, + "loss": 0.0318, + "step": 195250 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001109618748265424, + "loss": 0.0358, + "step": 195260 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011095219347218546, + "loss": 0.0279, + "step": 195270 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011094251211782851, + "loss": 0.0313, + "step": 195280 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001109328307634716, + "loss": 0.0354, + "step": 195290 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011092314940911466, + "loss": 0.0275, + "step": 195300 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011091346805475774, + "loss": 0.0314, + "step": 195310 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011090378670040079, + "loss": 0.0279, + "step": 195320 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011089410534604387, + "loss": 0.032, + "step": 195330 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011088442399168694, + "loss": 0.0346, + "step": 195340 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011087474263732999, + "loss": 0.0329, + "step": 195350 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011086506128297307, + "loss": 0.0306, + "step": 195360 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011085537992861614, + "loss": 0.0279, + "step": 195370 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011084569857425922, + "loss": 0.0311, + "step": 195380 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011083601721990227, + "loss": 0.0302, + "step": 195390 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011082633586554534, + "loss": 0.0329, + "step": 195400 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011081665451118842, + "loss": 0.0297, + "step": 195410 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011080697315683147, + "loss": 0.0293, + "step": 195420 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011079729180247455, + "loss": 0.0331, + "step": 195430 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011078761044811761, + "loss": 0.0331, + "step": 195440 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011077792909376068, + "loss": 0.0316, + "step": 195450 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011076824773940375, + "loss": 0.0234, + "step": 195460 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011075856638504681, + "loss": 0.0288, + "step": 195470 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011074888503068989, + "loss": 0.0339, + "step": 195480 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011073920367633295, + "loss": 0.0286, + "step": 195490 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011072952232197601, + "loss": 0.0294, + "step": 195500 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011071984096761909, + "loss": 0.0369, + "step": 195510 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011071015961326216, + "loss": 0.0283, + "step": 195520 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011070047825890522, + "loss": 0.034, + "step": 195530 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011069079690454829, + "loss": 0.0275, + "step": 195540 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011068111555019136, + "loss": 0.0297, + "step": 195550 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011067143419583442, + "loss": 0.0318, + "step": 195560 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011066175284147749, + "loss": 0.0291, + "step": 195570 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011065207148712057, + "loss": 0.0289, + "step": 195580 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011064239013276363, + "loss": 0.028, + "step": 195590 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011063270877840669, + "loss": 0.0295, + "step": 195600 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011062302742404977, + "loss": 0.0346, + "step": 195610 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011061334606969283, + "loss": 0.0298, + "step": 195620 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001106036647153359, + "loss": 0.0295, + "step": 195630 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011059398336097897, + "loss": 0.0325, + "step": 195640 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011058430200662203, + "loss": 0.0329, + "step": 195650 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011057462065226511, + "loss": 0.0292, + "step": 195660 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011056493929790816, + "loss": 0.03, + "step": 195670 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011055525794355124, + "loss": 0.0368, + "step": 195680 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011054557658919431, + "loss": 0.0314, + "step": 195690 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011053589523483736, + "loss": 0.0328, + "step": 195700 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011052621388048044, + "loss": 0.0324, + "step": 195710 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011051653252612351, + "loss": 0.0317, + "step": 195720 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011050685117176659, + "loss": 0.0333, + "step": 195730 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011049716981740964, + "loss": 0.0316, + "step": 195740 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011048748846305271, + "loss": 0.0381, + "step": 195750 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011047780710869579, + "loss": 0.0326, + "step": 195760 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011046812575433884, + "loss": 0.032, + "step": 195770 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011045844439998192, + "loss": 0.0328, + "step": 195780 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011044876304562499, + "loss": 0.0338, + "step": 195790 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011043908169126807, + "loss": 0.0349, + "step": 195800 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011042940033691112, + "loss": 0.0285, + "step": 195810 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011041971898255419, + "loss": 0.027, + "step": 195820 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011041003762819727, + "loss": 0.0342, + "step": 195830 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011040035627384032, + "loss": 0.0263, + "step": 195840 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011039067491948338, + "loss": 0.0341, + "step": 195850 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011038099356512646, + "loss": 0.0402, + "step": 195860 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011037131221076953, + "loss": 0.0289, + "step": 195870 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001103616308564126, + "loss": 0.0279, + "step": 195880 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011035194950205566, + "loss": 0.028, + "step": 195890 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011034226814769874, + "loss": 0.0282, + "step": 195900 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001103325867933418, + "loss": 0.0261, + "step": 195910 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011032290543898486, + "loss": 0.0304, + "step": 195920 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011031322408462794, + "loss": 0.0308, + "step": 195930 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011030354273027101, + "loss": 0.0313, + "step": 195940 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011029386137591406, + "loss": 0.037, + "step": 195950 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011028418002155714, + "loss": 0.0287, + "step": 195960 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001102744986672002, + "loss": 0.0373, + "step": 195970 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011026481731284327, + "loss": 0.0303, + "step": 195980 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011025513595848634, + "loss": 0.0312, + "step": 195990 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011024545460412942, + "loss": 0.0395, + "step": 196000 + }, + { + "epoch": 1.27, + "eval_cer": 0.9198987685007344, + "eval_loss": 0.022464269772171974, + "eval_runtime": 120.2, + "eval_samples_per_second": 16.639, + "eval_steps_per_second": 4.16, + "step": 196000 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011023577324977248, + "loss": 0.0302, + "step": 196010 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011022609189541554, + "loss": 0.0254, + "step": 196020 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011021641054105862, + "loss": 0.0367, + "step": 196030 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011020672918670168, + "loss": 0.0304, + "step": 196040 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011019704783234474, + "loss": 0.0324, + "step": 196050 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011018736647798782, + "loss": 0.0333, + "step": 196060 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011017768512363088, + "loss": 0.0355, + "step": 196070 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011016800376927396, + "loss": 0.0341, + "step": 196080 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011015832241491701, + "loss": 0.0261, + "step": 196090 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001101486410605601, + "loss": 0.0288, + "step": 196100 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011013895970620316, + "loss": 0.0319, + "step": 196110 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011012927835184621, + "loss": 0.0264, + "step": 196120 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011011959699748929, + "loss": 0.0246, + "step": 196130 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011010991564313236, + "loss": 0.0307, + "step": 196140 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011010023428877544, + "loss": 0.0316, + "step": 196150 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011009055293441849, + "loss": 0.0281, + "step": 196160 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011008087158006156, + "loss": 0.0329, + "step": 196170 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011007119022570464, + "loss": 0.0336, + "step": 196180 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011006150887134769, + "loss": 0.0285, + "step": 196190 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011005182751699077, + "loss": 0.0302, + "step": 196200 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011004214616263384, + "loss": 0.0343, + "step": 196210 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011003246480827692, + "loss": 0.0327, + "step": 196220 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011002278345391997, + "loss": 0.0278, + "step": 196230 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011001310209956304, + "loss": 0.0264, + "step": 196240 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011000342074520612, + "loss": 0.0335, + "step": 196250 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010999373939084917, + "loss": 0.0311, + "step": 196260 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010998405803649223, + "loss": 0.0284, + "step": 196270 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010997437668213531, + "loss": 0.0341, + "step": 196280 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010996469532777838, + "loss": 0.0324, + "step": 196290 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010995501397342145, + "loss": 0.0272, + "step": 196300 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010994533261906451, + "loss": 0.0281, + "step": 196310 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010993565126470759, + "loss": 0.0296, + "step": 196320 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010992596991035064, + "loss": 0.0267, + "step": 196330 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010991628855599371, + "loss": 0.0254, + "step": 196340 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010990660720163679, + "loss": 0.032, + "step": 196350 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010989692584727986, + "loss": 0.0296, + "step": 196360 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010988724449292291, + "loss": 0.0272, + "step": 196370 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010987756313856599, + "loss": 0.03, + "step": 196380 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010986788178420906, + "loss": 0.0257, + "step": 196390 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010985820042985212, + "loss": 0.0324, + "step": 196400 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010984851907549519, + "loss": 0.0323, + "step": 196410 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010983883772113827, + "loss": 0.0279, + "step": 196420 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010982915636678133, + "loss": 0.0357, + "step": 196430 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010981947501242439, + "loss": 0.0305, + "step": 196440 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010980979365806747, + "loss": 0.0281, + "step": 196450 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010980011230371053, + "loss": 0.0333, + "step": 196460 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010979043094935359, + "loss": 0.0281, + "step": 196470 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010978074959499667, + "loss": 0.0263, + "step": 196480 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010977106824063973, + "loss": 0.0278, + "step": 196490 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010976138688628281, + "loss": 0.0284, + "step": 196500 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010975170553192586, + "loss": 0.0284, + "step": 196510 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010974202417756894, + "loss": 0.0314, + "step": 196520 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010973234282321201, + "loss": 0.0306, + "step": 196530 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010972266146885506, + "loss": 0.026, + "step": 196540 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010971298011449814, + "loss": 0.0262, + "step": 196550 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010970329876014121, + "loss": 0.0296, + "step": 196560 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010969361740578429, + "loss": 0.0374, + "step": 196570 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010968393605142734, + "loss": 0.0263, + "step": 196580 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010967425469707041, + "loss": 0.0328, + "step": 196590 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010966457334271349, + "loss": 0.0335, + "step": 196600 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010965489198835654, + "loss": 0.0354, + "step": 196610 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010964521063399962, + "loss": 0.0292, + "step": 196620 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010963552927964269, + "loss": 0.0404, + "step": 196630 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010962584792528575, + "loss": 0.0311, + "step": 196640 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010961616657092882, + "loss": 0.0334, + "step": 196650 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010960648521657189, + "loss": 0.0289, + "step": 196660 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010959680386221496, + "loss": 0.0363, + "step": 196670 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010958712250785802, + "loss": 0.029, + "step": 196680 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010957744115350108, + "loss": 0.0268, + "step": 196690 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010956775979914416, + "loss": 0.0322, + "step": 196700 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010955807844478723, + "loss": 0.0322, + "step": 196710 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001095483970904303, + "loss": 0.0245, + "step": 196720 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010953871573607336, + "loss": 0.0335, + "step": 196730 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010952903438171643, + "loss": 0.0291, + "step": 196740 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001095193530273595, + "loss": 0.0298, + "step": 196750 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010950967167300256, + "loss": 0.0257, + "step": 196760 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010949999031864564, + "loss": 0.0312, + "step": 196770 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010949030896428871, + "loss": 0.0323, + "step": 196780 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010948062760993176, + "loss": 0.027, + "step": 196790 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010947094625557484, + "loss": 0.034, + "step": 196800 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001094612649012179, + "loss": 0.0299, + "step": 196810 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010945158354686097, + "loss": 0.0258, + "step": 196820 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010944190219250404, + "loss": 0.0292, + "step": 196830 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001094322208381471, + "loss": 0.0276, + "step": 196840 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010942253948379018, + "loss": 0.0303, + "step": 196850 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010941285812943324, + "loss": 0.0371, + "step": 196860 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010940317677507632, + "loss": 0.0298, + "step": 196870 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010939349542071938, + "loss": 0.0339, + "step": 196880 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010938381406636244, + "loss": 0.0312, + "step": 196890 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010937413271200552, + "loss": 0.0336, + "step": 196900 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010936445135764858, + "loss": 0.0261, + "step": 196910 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010935477000329166, + "loss": 0.0277, + "step": 196920 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010934508864893471, + "loss": 0.0331, + "step": 196930 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010933540729457778, + "loss": 0.0302, + "step": 196940 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010932572594022086, + "loss": 0.029, + "step": 196950 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010931604458586391, + "loss": 0.032, + "step": 196960 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010930636323150699, + "loss": 0.0341, + "step": 196970 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010929668187715006, + "loss": 0.0323, + "step": 196980 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010928700052279314, + "loss": 0.0309, + "step": 196990 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010927731916843619, + "loss": 0.0268, + "step": 197000 + }, + { + "epoch": 1.27, + "eval_cer": 0.919872556773246, + "eval_loss": 0.022425523027777672, + "eval_runtime": 120.1817, + "eval_samples_per_second": 16.641, + "eval_steps_per_second": 4.16, + "step": 197000 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010926763781407926, + "loss": 0.0271, + "step": 197010 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010925795645972234, + "loss": 0.0324, + "step": 197020 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010924827510536539, + "loss": 0.0242, + "step": 197030 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010923859375100846, + "loss": 0.028, + "step": 197040 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010922891239665154, + "loss": 0.0284, + "step": 197050 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001092192310422946, + "loss": 0.0314, + "step": 197060 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010920954968793767, + "loss": 0.0307, + "step": 197070 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010919986833358073, + "loss": 0.0383, + "step": 197080 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010919018697922381, + "loss": 0.0278, + "step": 197090 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010918050562486687, + "loss": 0.0288, + "step": 197100 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010917082427050993, + "loss": 0.0321, + "step": 197110 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010916114291615301, + "loss": 0.0314, + "step": 197120 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010915146156179608, + "loss": 0.025, + "step": 197130 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010914178020743913, + "loss": 0.0322, + "step": 197140 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010913209885308221, + "loss": 0.0395, + "step": 197150 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010912241749872528, + "loss": 0.0284, + "step": 197160 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010911273614436834, + "loss": 0.0293, + "step": 197170 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010910305479001141, + "loss": 0.0377, + "step": 197180 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010909337343565449, + "loss": 0.0319, + "step": 197190 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010908369208129756, + "loss": 0.036, + "step": 197200 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010907401072694061, + "loss": 0.0279, + "step": 197210 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010906432937258369, + "loss": 0.0303, + "step": 197220 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010905464801822676, + "loss": 0.0292, + "step": 197230 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010904496666386981, + "loss": 0.0285, + "step": 197240 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010903528530951289, + "loss": 0.0392, + "step": 197250 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010902560395515595, + "loss": 0.0299, + "step": 197260 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010901592260079903, + "loss": 0.0263, + "step": 197270 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010900624124644209, + "loss": 0.0244, + "step": 197280 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010899655989208517, + "loss": 0.0294, + "step": 197290 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010898687853772823, + "loss": 0.0325, + "step": 197300 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010897719718337129, + "loss": 0.0322, + "step": 197310 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010896751582901437, + "loss": 0.0257, + "step": 197320 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010895783447465743, + "loss": 0.0341, + "step": 197330 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010894815312030051, + "loss": 0.0326, + "step": 197340 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010893847176594356, + "loss": 0.0308, + "step": 197350 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010892879041158663, + "loss": 0.0295, + "step": 197360 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010891910905722971, + "loss": 0.0274, + "step": 197370 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010890942770287276, + "loss": 0.0298, + "step": 197380 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010889974634851584, + "loss": 0.0302, + "step": 197390 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010889006499415891, + "loss": 0.0281, + "step": 197400 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010888038363980199, + "loss": 0.0292, + "step": 197410 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010887070228544504, + "loss": 0.0295, + "step": 197420 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010886102093108811, + "loss": 0.0343, + "step": 197430 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010885133957673119, + "loss": 0.0295, + "step": 197440 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010884165822237424, + "loss": 0.0308, + "step": 197450 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001088319768680173, + "loss": 0.0315, + "step": 197460 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010882229551366039, + "loss": 0.0307, + "step": 197470 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010881261415930345, + "loss": 0.0275, + "step": 197480 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010880293280494652, + "loss": 0.0257, + "step": 197490 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010879325145058958, + "loss": 0.0293, + "step": 197500 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010878357009623266, + "loss": 0.0336, + "step": 197510 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010877388874187572, + "loss": 0.0306, + "step": 197520 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010876420738751878, + "loss": 0.0338, + "step": 197530 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010875452603316186, + "loss": 0.0299, + "step": 197540 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010874484467880493, + "loss": 0.0314, + "step": 197550 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010873516332444798, + "loss": 0.027, + "step": 197560 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010872548197009106, + "loss": 0.0338, + "step": 197570 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010871580061573413, + "loss": 0.031, + "step": 197580 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001087061192613772, + "loss": 0.0318, + "step": 197590 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010869643790702026, + "loss": 0.0297, + "step": 197600 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010868675655266334, + "loss": 0.0316, + "step": 197610 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001086770751983064, + "loss": 0.0335, + "step": 197620 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010866739384394946, + "loss": 0.0308, + "step": 197630 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010865771248959254, + "loss": 0.029, + "step": 197640 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001086480311352356, + "loss": 0.0299, + "step": 197650 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010863834978087866, + "loss": 0.0298, + "step": 197660 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010862866842652174, + "loss": 0.0266, + "step": 197670 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001086189870721648, + "loss": 0.0351, + "step": 197680 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010860930571780788, + "loss": 0.0337, + "step": 197690 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010859962436345094, + "loss": 0.0284, + "step": 197700 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010858994300909402, + "loss": 0.0278, + "step": 197710 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010858026165473708, + "loss": 0.0283, + "step": 197720 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010857058030038014, + "loss": 0.0342, + "step": 197730 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010856089894602322, + "loss": 0.0282, + "step": 197740 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010855121759166628, + "loss": 0.0296, + "step": 197750 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010854153623730936, + "loss": 0.0258, + "step": 197760 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010853185488295241, + "loss": 0.0281, + "step": 197770 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010852217352859548, + "loss": 0.0322, + "step": 197780 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010851249217423856, + "loss": 0.0327, + "step": 197790 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010850281081988161, + "loss": 0.0359, + "step": 197800 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010849312946552469, + "loss": 0.0266, + "step": 197810 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010848344811116776, + "loss": 0.0316, + "step": 197820 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010847376675681084, + "loss": 0.0269, + "step": 197830 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010846408540245389, + "loss": 0.0316, + "step": 197840 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010845440404809696, + "loss": 0.0309, + "step": 197850 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010844472269374004, + "loss": 0.0282, + "step": 197860 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010843504133938309, + "loss": 0.0333, + "step": 197870 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010842535998502616, + "loss": 0.028, + "step": 197880 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010841567863066924, + "loss": 0.0287, + "step": 197890 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001084059972763123, + "loss": 0.0336, + "step": 197900 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010839631592195537, + "loss": 0.0306, + "step": 197910 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010838663456759843, + "loss": 0.0245, + "step": 197920 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010837695321324151, + "loss": 0.0295, + "step": 197930 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010836727185888457, + "loss": 0.0267, + "step": 197940 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010835759050452763, + "loss": 0.034, + "step": 197950 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010834790915017071, + "loss": 0.0288, + "step": 197960 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010833822779581378, + "loss": 0.0308, + "step": 197970 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010832854644145683, + "loss": 0.029, + "step": 197980 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010831886508709991, + "loss": 0.0287, + "step": 197990 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010830918373274298, + "loss": 0.032, + "step": 198000 + }, + { + "epoch": 1.28, + "eval_cer": 0.919873460625918, + "eval_loss": 0.022191094234585762, + "eval_runtime": 120.0906, + "eval_samples_per_second": 16.654, + "eval_steps_per_second": 4.164, + "step": 198000 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010829950237838604, + "loss": 0.0277, + "step": 198010 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010828982102402911, + "loss": 0.0295, + "step": 198020 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010828013966967219, + "loss": 0.0316, + "step": 198030 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010827045831531524, + "loss": 0.0327, + "step": 198040 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010826077696095831, + "loss": 0.0337, + "step": 198050 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010825109560660139, + "loss": 0.028, + "step": 198060 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010824141425224446, + "loss": 0.0297, + "step": 198070 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010823173289788751, + "loss": 0.0287, + "step": 198080 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010822205154353059, + "loss": 0.0271, + "step": 198090 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010821237018917365, + "loss": 0.0304, + "step": 198100 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010820268883481672, + "loss": 0.0285, + "step": 198110 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010819300748045979, + "loss": 0.0319, + "step": 198120 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010818332612610287, + "loss": 0.0264, + "step": 198130 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010817364477174593, + "loss": 0.0388, + "step": 198140 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010816396341738899, + "loss": 0.0354, + "step": 198150 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010815428206303206, + "loss": 0.0355, + "step": 198160 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010814460070867513, + "loss": 0.0324, + "step": 198170 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010813491935431818, + "loss": 0.0315, + "step": 198180 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010812523799996126, + "loss": 0.0294, + "step": 198190 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010811555664560433, + "loss": 0.0317, + "step": 198200 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010810587529124741, + "loss": 0.028, + "step": 198210 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010809619393689046, + "loss": 0.0267, + "step": 198220 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010808651258253354, + "loss": 0.0317, + "step": 198230 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010807683122817661, + "loss": 0.0355, + "step": 198240 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010806714987381966, + "loss": 0.0304, + "step": 198250 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010805746851946274, + "loss": 0.0298, + "step": 198260 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010804778716510581, + "loss": 0.0322, + "step": 198270 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010803810581074889, + "loss": 0.0278, + "step": 198280 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010802842445639194, + "loss": 0.0326, + "step": 198290 + }, + { + "epoch": 1.28, + "learning_rate": 0.000108018743102035, + "loss": 0.0332, + "step": 198300 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010800906174767809, + "loss": 0.0291, + "step": 198310 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010799938039332114, + "loss": 0.027, + "step": 198320 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010798969903896422, + "loss": 0.0318, + "step": 198330 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010798001768460728, + "loss": 0.0329, + "step": 198340 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010797033633025035, + "loss": 0.0279, + "step": 198350 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010796065497589342, + "loss": 0.0329, + "step": 198360 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010795097362153648, + "loss": 0.0263, + "step": 198370 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010794129226717956, + "loss": 0.0342, + "step": 198380 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010793161091282262, + "loss": 0.0313, + "step": 198390 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010792192955846568, + "loss": 0.0332, + "step": 198400 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010791224820410876, + "loss": 0.0359, + "step": 198410 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010790256684975183, + "loss": 0.0267, + "step": 198420 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001078928854953949, + "loss": 0.0341, + "step": 198430 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010788320414103796, + "loss": 0.0292, + "step": 198440 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010787352278668103, + "loss": 0.0329, + "step": 198450 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010786384143232409, + "loss": 0.0326, + "step": 198460 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010785416007796716, + "loss": 0.0319, + "step": 198470 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010784447872361024, + "loss": 0.0262, + "step": 198480 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001078347973692533, + "loss": 0.0277, + "step": 198490 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010782511601489636, + "loss": 0.028, + "step": 198500 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010781543466053944, + "loss": 0.0404, + "step": 198510 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001078057533061825, + "loss": 0.0357, + "step": 198520 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010779607195182557, + "loss": 0.0304, + "step": 198530 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010778639059746864, + "loss": 0.0374, + "step": 198540 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001077767092431117, + "loss": 0.0316, + "step": 198550 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010776702788875478, + "loss": 0.038, + "step": 198560 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010775734653439783, + "loss": 0.0295, + "step": 198570 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010774766518004091, + "loss": 0.0325, + "step": 198580 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010773798382568398, + "loss": 0.0309, + "step": 198590 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010772830247132703, + "loss": 0.036, + "step": 198600 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010771862111697011, + "loss": 0.0308, + "step": 198610 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010770893976261318, + "loss": 0.0301, + "step": 198620 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010769925840825626, + "loss": 0.0275, + "step": 198630 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010768957705389931, + "loss": 0.0302, + "step": 198640 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010767989569954238, + "loss": 0.0295, + "step": 198650 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010767021434518546, + "loss": 0.0283, + "step": 198660 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010766053299082851, + "loss": 0.029, + "step": 198670 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010765085163647159, + "loss": 0.0323, + "step": 198680 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010764117028211466, + "loss": 0.029, + "step": 198690 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010763148892775774, + "loss": 0.0326, + "step": 198700 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010762180757340079, + "loss": 0.0287, + "step": 198710 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010761212621904386, + "loss": 0.025, + "step": 198720 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010760244486468694, + "loss": 0.0319, + "step": 198730 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010759276351032999, + "loss": 0.0274, + "step": 198740 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010758308215597305, + "loss": 0.0266, + "step": 198750 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010757340080161613, + "loss": 0.0331, + "step": 198760 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001075637194472592, + "loss": 0.03, + "step": 198770 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010755403809290227, + "loss": 0.0368, + "step": 198780 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010754435673854533, + "loss": 0.0272, + "step": 198790 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010753467538418841, + "loss": 0.0296, + "step": 198800 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010752499402983147, + "loss": 0.033, + "step": 198810 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010751531267547453, + "loss": 0.0282, + "step": 198820 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010750563132111761, + "loss": 0.0303, + "step": 198830 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010749594996676068, + "loss": 0.0276, + "step": 198840 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010748626861240373, + "loss": 0.0277, + "step": 198850 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010747658725804681, + "loss": 0.029, + "step": 198860 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010746690590368988, + "loss": 0.0311, + "step": 198870 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010745722454933294, + "loss": 0.0343, + "step": 198880 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010744754319497601, + "loss": 0.0326, + "step": 198890 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010743786184061909, + "loss": 0.0288, + "step": 198900 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010742818048626215, + "loss": 0.0359, + "step": 198910 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010741849913190521, + "loss": 0.0324, + "step": 198920 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010740881777754829, + "loss": 0.0278, + "step": 198930 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010739913642319135, + "loss": 0.0272, + "step": 198940 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001073894550688344, + "loss": 0.0246, + "step": 198950 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010737977371447749, + "loss": 0.035, + "step": 198960 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010737009236012055, + "loss": 0.0303, + "step": 198970 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010736041100576363, + "loss": 0.0431, + "step": 198980 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010735072965140668, + "loss": 0.0306, + "step": 198990 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010734104829704976, + "loss": 0.0328, + "step": 199000 + }, + { + "epoch": 1.28, + "eval_cer": 0.9199132301434866, + "eval_loss": 0.0220940038561821, + "eval_runtime": 120.1709, + "eval_samples_per_second": 16.643, + "eval_steps_per_second": 4.161, + "step": 199000 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010733136694269283, + "loss": 0.0302, + "step": 199010 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010732168558833588, + "loss": 0.0261, + "step": 199020 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010731200423397896, + "loss": 0.0289, + "step": 199030 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010730232287962203, + "loss": 0.0292, + "step": 199040 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010729264152526511, + "loss": 0.0308, + "step": 199050 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010728296017090816, + "loss": 0.0337, + "step": 199060 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010727327881655123, + "loss": 0.026, + "step": 199070 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010726359746219431, + "loss": 0.0302, + "step": 199080 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010725391610783736, + "loss": 0.0311, + "step": 199090 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010724423475348044, + "loss": 0.0297, + "step": 199100 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001072345533991235, + "loss": 0.0344, + "step": 199110 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010722487204476659, + "loss": 0.0288, + "step": 199120 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010721519069040964, + "loss": 0.035, + "step": 199130 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001072055093360527, + "loss": 0.0294, + "step": 199140 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010719582798169579, + "loss": 0.0269, + "step": 199150 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010718614662733884, + "loss": 0.029, + "step": 199160 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001071764652729819, + "loss": 0.0298, + "step": 199170 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010716678391862498, + "loss": 0.0355, + "step": 199180 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010715710256426805, + "loss": 0.0338, + "step": 199190 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010714742120991112, + "loss": 0.0315, + "step": 199200 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010713773985555418, + "loss": 0.0379, + "step": 199210 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010712805850119726, + "loss": 0.0433, + "step": 199220 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010711837714684032, + "loss": 0.0281, + "step": 199230 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010710869579248338, + "loss": 0.0283, + "step": 199240 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010709901443812646, + "loss": 0.0324, + "step": 199250 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010708933308376953, + "loss": 0.0263, + "step": 199260 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010707965172941258, + "loss": 0.0291, + "step": 199270 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010706997037505566, + "loss": 0.0307, + "step": 199280 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010706028902069873, + "loss": 0.0316, + "step": 199290 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010705060766634179, + "loss": 0.0293, + "step": 199300 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010704092631198486, + "loss": 0.0397, + "step": 199310 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010703124495762794, + "loss": 0.0334, + "step": 199320 + }, + { + "epoch": 1.29, + "learning_rate": 0.000107021563603271, + "loss": 0.0329, + "step": 199330 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010701188224891406, + "loss": 0.0296, + "step": 199340 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010700220089455714, + "loss": 0.0345, + "step": 199350 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001069925195402002, + "loss": 0.0348, + "step": 199360 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010698283818584326, + "loss": 0.0292, + "step": 199370 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010697315683148634, + "loss": 0.0279, + "step": 199380 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001069634754771294, + "loss": 0.0306, + "step": 199390 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010695379412277248, + "loss": 0.0302, + "step": 199400 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010694411276841553, + "loss": 0.0339, + "step": 199410 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010693443141405861, + "loss": 0.0295, + "step": 199420 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010692475005970168, + "loss": 0.0305, + "step": 199430 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010691506870534473, + "loss": 0.0298, + "step": 199440 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010690538735098781, + "loss": 0.0328, + "step": 199450 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010689570599663088, + "loss": 0.0317, + "step": 199460 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010688602464227396, + "loss": 0.0312, + "step": 199470 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010687634328791701, + "loss": 0.032, + "step": 199480 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010686666193356008, + "loss": 0.0293, + "step": 199490 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010685698057920316, + "loss": 0.0383, + "step": 199500 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010684729922484621, + "loss": 0.0341, + "step": 199510 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010683761787048929, + "loss": 0.0316, + "step": 199520 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010682793651613236, + "loss": 0.0372, + "step": 199530 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010681825516177542, + "loss": 0.0263, + "step": 199540 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010680857380741849, + "loss": 0.0378, + "step": 199550 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010679889245306156, + "loss": 0.0277, + "step": 199560 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010678921109870463, + "loss": 0.031, + "step": 199570 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010677952974434769, + "loss": 0.0288, + "step": 199580 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010676984838999075, + "loss": 0.0316, + "step": 199590 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010676016703563383, + "loss": 0.0304, + "step": 199600 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001067504856812769, + "loss": 0.0302, + "step": 199610 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010674080432691997, + "loss": 0.0332, + "step": 199620 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010673112297256303, + "loss": 0.0293, + "step": 199630 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001067214416182061, + "loss": 0.0337, + "step": 199640 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010671176026384916, + "loss": 0.034, + "step": 199650 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010670207890949223, + "loss": 0.0306, + "step": 199660 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010669239755513531, + "loss": 0.0292, + "step": 199670 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010668271620077838, + "loss": 0.0311, + "step": 199680 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010667303484642143, + "loss": 0.0344, + "step": 199690 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010666335349206451, + "loss": 0.0283, + "step": 199700 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010665367213770758, + "loss": 0.0321, + "step": 199710 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010664399078335064, + "loss": 0.0316, + "step": 199720 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010663430942899371, + "loss": 0.0342, + "step": 199730 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010662462807463677, + "loss": 0.0303, + "step": 199740 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010661494672027985, + "loss": 0.0272, + "step": 199750 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010660526536592291, + "loss": 0.0325, + "step": 199760 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010659558401156599, + "loss": 0.0317, + "step": 199770 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010658590265720905, + "loss": 0.0366, + "step": 199780 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001065762213028521, + "loss": 0.0341, + "step": 199790 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010656653994849519, + "loss": 0.0258, + "step": 199800 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010655685859413825, + "loss": 0.0294, + "step": 199810 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010654717723978133, + "loss": 0.0249, + "step": 199820 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010653749588542438, + "loss": 0.0339, + "step": 199830 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010652781453106745, + "loss": 0.0336, + "step": 199840 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010651813317671053, + "loss": 0.0324, + "step": 199850 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010650845182235358, + "loss": 0.0342, + "step": 199860 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010649877046799666, + "loss": 0.0317, + "step": 199870 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010648908911363973, + "loss": 0.0289, + "step": 199880 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010647940775928281, + "loss": 0.0345, + "step": 199890 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010646972640492586, + "loss": 0.0298, + "step": 199900 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010646004505056893, + "loss": 0.0345, + "step": 199910 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010645036369621201, + "loss": 0.0302, + "step": 199920 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010644068234185506, + "loss": 0.0309, + "step": 199930 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010643100098749813, + "loss": 0.0319, + "step": 199940 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001064213196331412, + "loss": 0.0338, + "step": 199950 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010641163827878427, + "loss": 0.031, + "step": 199960 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010640195692442734, + "loss": 0.0279, + "step": 199970 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001063922755700704, + "loss": 0.0289, + "step": 199980 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010638259421571348, + "loss": 0.0311, + "step": 199990 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010637291286135654, + "loss": 0.0278, + "step": 200000 + }, + { + "epoch": 1.29, + "eval_cer": 0.9198264602869732, + "eval_loss": 0.02203773520886898, + "eval_runtime": 120.2041, + "eval_samples_per_second": 16.638, + "eval_steps_per_second": 4.16, + "step": 200000 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001063632315069996, + "loss": 0.0299, + "step": 200010 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010635355015264268, + "loss": 0.0331, + "step": 200020 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010634386879828575, + "loss": 0.0334, + "step": 200030 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001063341874439288, + "loss": 0.0365, + "step": 200040 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010632450608957188, + "loss": 0.0291, + "step": 200050 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010631482473521495, + "loss": 0.0294, + "step": 200060 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010630514338085801, + "loss": 0.0349, + "step": 200070 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010629546202650108, + "loss": 0.0325, + "step": 200080 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010628578067214416, + "loss": 0.0291, + "step": 200090 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010627609931778723, + "loss": 0.034, + "step": 200100 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010626641796343028, + "loss": 0.0294, + "step": 200110 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010625673660907336, + "loss": 0.0351, + "step": 200120 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010624705525471643, + "loss": 0.0309, + "step": 200130 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010623737390035948, + "loss": 0.0313, + "step": 200140 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010622769254600256, + "loss": 0.0281, + "step": 200150 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010621801119164562, + "loss": 0.0307, + "step": 200160 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001062083298372887, + "loss": 0.032, + "step": 200170 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010619864848293176, + "loss": 0.0313, + "step": 200180 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010618896712857484, + "loss": 0.0351, + "step": 200190 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001061792857742179, + "loss": 0.0314, + "step": 200200 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010616960441986096, + "loss": 0.0461, + "step": 200210 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010615992306550404, + "loss": 0.0269, + "step": 200220 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001061502417111471, + "loss": 0.0349, + "step": 200230 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010614056035679018, + "loss": 0.0294, + "step": 200240 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010613087900243323, + "loss": 0.0244, + "step": 200250 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001061211976480763, + "loss": 0.0282, + "step": 200260 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010611151629371938, + "loss": 0.0297, + "step": 200270 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010610183493936243, + "loss": 0.0319, + "step": 200280 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010609215358500551, + "loss": 0.0272, + "step": 200290 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010608247223064858, + "loss": 0.0311, + "step": 200300 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010607279087629166, + "loss": 0.0334, + "step": 200310 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010606310952193471, + "loss": 0.0279, + "step": 200320 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010605342816757778, + "loss": 0.0292, + "step": 200330 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010604374681322086, + "loss": 0.0302, + "step": 200340 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010603406545886391, + "loss": 0.0289, + "step": 200350 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010602438410450698, + "loss": 0.0309, + "step": 200360 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010601470275015006, + "loss": 0.0297, + "step": 200370 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010600502139579312, + "loss": 0.0327, + "step": 200380 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010599534004143619, + "loss": 0.0236, + "step": 200390 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010598565868707925, + "loss": 0.0266, + "step": 200400 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010597597733272233, + "loss": 0.0299, + "step": 200410 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010596629597836539, + "loss": 0.0334, + "step": 200420 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010595661462400845, + "loss": 0.0266, + "step": 200430 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010594693326965153, + "loss": 0.0324, + "step": 200440 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001059372519152946, + "loss": 0.0303, + "step": 200450 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010592757056093765, + "loss": 0.0316, + "step": 200460 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010591788920658073, + "loss": 0.0305, + "step": 200470 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001059082078522238, + "loss": 0.0318, + "step": 200480 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010589852649786686, + "loss": 0.0303, + "step": 200490 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010588884514350993, + "loss": 0.035, + "step": 200500 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010587916378915301, + "loss": 0.031, + "step": 200510 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010586948243479608, + "loss": 0.027, + "step": 200520 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010585980108043913, + "loss": 0.0294, + "step": 200530 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010585011972608221, + "loss": 0.0293, + "step": 200540 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010584043837172528, + "loss": 0.0349, + "step": 200550 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010583075701736833, + "loss": 0.0342, + "step": 200560 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010582107566301141, + "loss": 0.0273, + "step": 200570 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010581139430865447, + "loss": 0.0289, + "step": 200580 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010580171295429755, + "loss": 0.0304, + "step": 200590 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001057920315999406, + "loss": 0.0271, + "step": 200600 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010578235024558369, + "loss": 0.0357, + "step": 200610 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010577266889122675, + "loss": 0.0342, + "step": 200620 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001057629875368698, + "loss": 0.0334, + "step": 200630 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010575330618251289, + "loss": 0.029, + "step": 200640 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010574362482815595, + "loss": 0.0276, + "step": 200650 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010573394347379903, + "loss": 0.0235, + "step": 200660 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010572426211944208, + "loss": 0.0314, + "step": 200670 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010571458076508515, + "loss": 0.0304, + "step": 200680 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010570489941072823, + "loss": 0.0348, + "step": 200690 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010569521805637128, + "loss": 0.0248, + "step": 200700 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010568553670201436, + "loss": 0.0307, + "step": 200710 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010567585534765743, + "loss": 0.0309, + "step": 200720 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001056661739933005, + "loss": 0.0269, + "step": 200730 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010565649263894356, + "loss": 0.0287, + "step": 200740 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010564681128458663, + "loss": 0.0283, + "step": 200750 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010563712993022971, + "loss": 0.0338, + "step": 200760 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010562744857587276, + "loss": 0.0282, + "step": 200770 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010561776722151583, + "loss": 0.0295, + "step": 200780 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001056080858671589, + "loss": 0.0258, + "step": 200790 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010559840451280197, + "loss": 0.0262, + "step": 200800 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010558872315844504, + "loss": 0.0276, + "step": 200810 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001055790418040881, + "loss": 0.0288, + "step": 200820 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010556936044973117, + "loss": 0.035, + "step": 200830 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010555967909537424, + "loss": 0.031, + "step": 200840 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001055499977410173, + "loss": 0.0341, + "step": 200850 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010554031638666038, + "loss": 0.0319, + "step": 200860 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010553063503230345, + "loss": 0.0339, + "step": 200870 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001055209536779465, + "loss": 0.0269, + "step": 200880 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010551127232358958, + "loss": 0.0365, + "step": 200890 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010550159096923265, + "loss": 0.0312, + "step": 200900 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010549190961487571, + "loss": 0.0327, + "step": 200910 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010548222826051878, + "loss": 0.0308, + "step": 200920 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010547254690616185, + "loss": 0.031, + "step": 200930 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010546286555180493, + "loss": 0.0332, + "step": 200940 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010545318419744798, + "loss": 0.0291, + "step": 200950 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010544350284309106, + "loss": 0.0245, + "step": 200960 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010543382148873413, + "loss": 0.0292, + "step": 200970 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010542414013437718, + "loss": 0.0294, + "step": 200980 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010541445878002026, + "loss": 0.0319, + "step": 200990 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010540477742566332, + "loss": 0.029, + "step": 201000 + }, + { + "epoch": 1.3, + "eval_cer": 0.9199159417015027, + "eval_loss": 0.02207825891673565, + "eval_runtime": 120.2757, + "eval_samples_per_second": 16.628, + "eval_steps_per_second": 4.157, + "step": 201000 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001053950960713064, + "loss": 0.0365, + "step": 201010 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010538541471694946, + "loss": 0.0312, + "step": 201020 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010537573336259252, + "loss": 0.0304, + "step": 201030 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001053660520082356, + "loss": 0.0306, + "step": 201040 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010535637065387866, + "loss": 0.0321, + "step": 201050 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010534668929952173, + "loss": 0.0307, + "step": 201060 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001053370079451648, + "loss": 0.031, + "step": 201070 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010532732659080788, + "loss": 0.0326, + "step": 201080 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010531764523645093, + "loss": 0.0332, + "step": 201090 + }, + { + "epoch": 1.3, + "learning_rate": 0.000105307963882094, + "loss": 0.032, + "step": 201100 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010529828252773708, + "loss": 0.0297, + "step": 201110 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010528860117338013, + "loss": 0.0321, + "step": 201120 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001052789198190232, + "loss": 0.0275, + "step": 201130 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010526923846466628, + "loss": 0.0324, + "step": 201140 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010525955711030934, + "loss": 0.0317, + "step": 201150 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010524987575595241, + "loss": 0.0311, + "step": 201160 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010524019440159548, + "loss": 0.0313, + "step": 201170 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010523051304723856, + "loss": 0.0324, + "step": 201180 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010522083169288161, + "loss": 0.0275, + "step": 201190 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010521115033852468, + "loss": 0.0277, + "step": 201200 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010520146898416776, + "loss": 0.0342, + "step": 201210 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010519178762981082, + "loss": 0.0356, + "step": 201220 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010518210627545387, + "loss": 0.0275, + "step": 201230 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010517242492109695, + "loss": 0.0358, + "step": 201240 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010516274356674002, + "loss": 0.0342, + "step": 201250 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010515306221238309, + "loss": 0.0285, + "step": 201260 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010514338085802615, + "loss": 0.0321, + "step": 201270 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010513369950366923, + "loss": 0.0349, + "step": 201280 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001051240181493123, + "loss": 0.0333, + "step": 201290 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010511433679495535, + "loss": 0.0389, + "step": 201300 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010510465544059843, + "loss": 0.029, + "step": 201310 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001050949740862415, + "loss": 0.0231, + "step": 201320 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010508529273188455, + "loss": 0.0262, + "step": 201330 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010507561137752763, + "loss": 0.0328, + "step": 201340 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001050659300231707, + "loss": 0.0298, + "step": 201350 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010505624866881378, + "loss": 0.0342, + "step": 201360 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010504656731445683, + "loss": 0.0334, + "step": 201370 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010503688596009991, + "loss": 0.0281, + "step": 201380 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010502720460574298, + "loss": 0.0283, + "step": 201390 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010501752325138603, + "loss": 0.0315, + "step": 201400 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010500784189702911, + "loss": 0.0245, + "step": 201410 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010499816054267217, + "loss": 0.029, + "step": 201420 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010498847918831523, + "loss": 0.0312, + "step": 201430 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001049787978339583, + "loss": 0.0267, + "step": 201440 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010496911647960137, + "loss": 0.0245, + "step": 201450 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010495943512524445, + "loss": 0.0322, + "step": 201460 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001049497537708875, + "loss": 0.034, + "step": 201470 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010494007241653058, + "loss": 0.0266, + "step": 201480 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010493039106217365, + "loss": 0.0323, + "step": 201490 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001049207097078167, + "loss": 0.035, + "step": 201500 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010491102835345978, + "loss": 0.0343, + "step": 201510 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010490134699910285, + "loss": 0.0351, + "step": 201520 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010489166564474593, + "loss": 0.0339, + "step": 201530 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010488198429038898, + "loss": 0.0292, + "step": 201540 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010487230293603205, + "loss": 0.03, + "step": 201550 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010486262158167513, + "loss": 0.0324, + "step": 201560 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010485294022731818, + "loss": 0.0314, + "step": 201570 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010484325887296126, + "loss": 0.0255, + "step": 201580 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010483357751860433, + "loss": 0.0296, + "step": 201590 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001048238961642474, + "loss": 0.0275, + "step": 201600 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010481421480989046, + "loss": 0.0309, + "step": 201610 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010480453345553353, + "loss": 0.0286, + "step": 201620 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001047948521011766, + "loss": 0.0344, + "step": 201630 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010478517074681966, + "loss": 0.0235, + "step": 201640 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010477548939246272, + "loss": 0.0303, + "step": 201650 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001047658080381058, + "loss": 0.0318, + "step": 201660 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010475612668374887, + "loss": 0.0371, + "step": 201670 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010474644532939194, + "loss": 0.0257, + "step": 201680 + }, + { + "epoch": 1.3, + "learning_rate": 0.000104736763975035, + "loss": 0.0278, + "step": 201690 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010472708262067808, + "loss": 0.0273, + "step": 201700 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010471740126632114, + "loss": 0.0307, + "step": 201710 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001047077199119642, + "loss": 0.0294, + "step": 201720 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010469803855760728, + "loss": 0.0291, + "step": 201730 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010468835720325035, + "loss": 0.0276, + "step": 201740 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001046786758488934, + "loss": 0.0299, + "step": 201750 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010466899449453648, + "loss": 0.0311, + "step": 201760 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010465931314017955, + "loss": 0.0366, + "step": 201770 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010464963178582261, + "loss": 0.0266, + "step": 201780 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010463995043146568, + "loss": 0.0292, + "step": 201790 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010463026907710876, + "loss": 0.0331, + "step": 201800 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010462058772275182, + "loss": 0.0289, + "step": 201810 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010461090636839488, + "loss": 0.0272, + "step": 201820 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010460122501403796, + "loss": 0.0334, + "step": 201830 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010459154365968102, + "loss": 0.0308, + "step": 201840 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010458186230532408, + "loss": 0.0236, + "step": 201850 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010457218095096716, + "loss": 0.0289, + "step": 201860 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010456249959661022, + "loss": 0.0264, + "step": 201870 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001045528182422533, + "loss": 0.026, + "step": 201880 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010454313688789635, + "loss": 0.0375, + "step": 201890 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010453345553353943, + "loss": 0.0372, + "step": 201900 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001045237741791825, + "loss": 0.0309, + "step": 201910 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010451409282482555, + "loss": 0.0264, + "step": 201920 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010450441147046863, + "loss": 0.0307, + "step": 201930 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001044947301161117, + "loss": 0.029, + "step": 201940 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010448504876175478, + "loss": 0.0314, + "step": 201950 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010447536740739783, + "loss": 0.0331, + "step": 201960 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001044656860530409, + "loss": 0.0265, + "step": 201970 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010445600469868398, + "loss": 0.0289, + "step": 201980 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010444632334432703, + "loss": 0.0267, + "step": 201990 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010443664198997011, + "loss": 0.0319, + "step": 202000 + }, + { + "epoch": 1.3, + "eval_cer": 0.9198861145633261, + "eval_loss": 0.02179008163511753, + "eval_runtime": 120.2378, + "eval_samples_per_second": 16.634, + "eval_steps_per_second": 4.158, + "step": 202000 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010442696063561318, + "loss": 0.0331, + "step": 202010 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010441727928125624, + "loss": 0.0294, + "step": 202020 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010440759792689931, + "loss": 0.0315, + "step": 202030 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010439791657254238, + "loss": 0.0305, + "step": 202040 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010438823521818546, + "loss": 0.0318, + "step": 202050 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010437855386382851, + "loss": 0.0247, + "step": 202060 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010436887250947157, + "loss": 0.0336, + "step": 202070 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010435919115511465, + "loss": 0.0297, + "step": 202080 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010434950980075772, + "loss": 0.0308, + "step": 202090 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010433982844640079, + "loss": 0.0277, + "step": 202100 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010433014709204385, + "loss": 0.0285, + "step": 202110 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010432046573768693, + "loss": 0.0324, + "step": 202120 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010431078438332999, + "loss": 0.0258, + "step": 202130 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010430110302897305, + "loss": 0.04, + "step": 202140 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010429142167461613, + "loss": 0.0281, + "step": 202150 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001042817403202592, + "loss": 0.0359, + "step": 202160 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010427205896590225, + "loss": 0.0375, + "step": 202170 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010426237761154533, + "loss": 0.0358, + "step": 202180 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001042526962571884, + "loss": 0.0351, + "step": 202190 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010424301490283146, + "loss": 0.0262, + "step": 202200 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010423333354847453, + "loss": 0.034, + "step": 202210 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010422365219411761, + "loss": 0.0306, + "step": 202220 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010421397083976067, + "loss": 0.0352, + "step": 202230 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010420428948540373, + "loss": 0.03, + "step": 202240 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010419460813104681, + "loss": 0.0331, + "step": 202250 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010418492677668987, + "loss": 0.0396, + "step": 202260 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010417524542233293, + "loss": 0.0328, + "step": 202270 + }, + { + "epoch": 1.31, + "learning_rate": 0.000104165564067976, + "loss": 0.0306, + "step": 202280 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010415588271361907, + "loss": 0.0309, + "step": 202290 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010414620135926215, + "loss": 0.0314, + "step": 202300 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001041365200049052, + "loss": 0.0365, + "step": 202310 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010412683865054828, + "loss": 0.0294, + "step": 202320 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010411715729619135, + "loss": 0.0367, + "step": 202330 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001041074759418344, + "loss": 0.0298, + "step": 202340 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010409779458747748, + "loss": 0.0283, + "step": 202350 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010408811323312055, + "loss": 0.0325, + "step": 202360 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010407843187876363, + "loss": 0.029, + "step": 202370 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010406875052440668, + "loss": 0.0302, + "step": 202380 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010405906917004975, + "loss": 0.0307, + "step": 202390 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010404938781569283, + "loss": 0.0317, + "step": 202400 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010403970646133588, + "loss": 0.0337, + "step": 202410 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010403002510697896, + "loss": 0.0258, + "step": 202420 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010402034375262203, + "loss": 0.0329, + "step": 202430 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010401066239826509, + "loss": 0.0317, + "step": 202440 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010400098104390816, + "loss": 0.0347, + "step": 202450 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010399129968955123, + "loss": 0.0288, + "step": 202460 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001039816183351943, + "loss": 0.0335, + "step": 202470 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010397193698083736, + "loss": 0.0275, + "step": 202480 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010396225562648042, + "loss": 0.0291, + "step": 202490 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001039525742721235, + "loss": 0.0243, + "step": 202500 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010394289291776657, + "loss": 0.0367, + "step": 202510 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010393321156340964, + "loss": 0.0258, + "step": 202520 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001039235302090527, + "loss": 0.0343, + "step": 202530 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010391384885469577, + "loss": 0.0252, + "step": 202540 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010390416750033884, + "loss": 0.0324, + "step": 202550 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001038944861459819, + "loss": 0.0312, + "step": 202560 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010388480479162498, + "loss": 0.0299, + "step": 202570 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010387512343726805, + "loss": 0.0314, + "step": 202580 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001038654420829111, + "loss": 0.0357, + "step": 202590 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010385576072855418, + "loss": 0.026, + "step": 202600 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010384607937419725, + "loss": 0.0304, + "step": 202610 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010383639801984031, + "loss": 0.0304, + "step": 202620 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010382671666548338, + "loss": 0.0293, + "step": 202630 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010381703531112644, + "loss": 0.0338, + "step": 202640 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010380735395676952, + "loss": 0.0284, + "step": 202650 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010379767260241258, + "loss": 0.0257, + "step": 202660 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010378799124805566, + "loss": 0.0302, + "step": 202670 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010377830989369872, + "loss": 0.0281, + "step": 202680 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010376862853934178, + "loss": 0.0253, + "step": 202690 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010375894718498486, + "loss": 0.0339, + "step": 202700 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010374926583062792, + "loss": 0.0348, + "step": 202710 + }, + { + "epoch": 1.31, + "learning_rate": 0.000103739584476271, + "loss": 0.032, + "step": 202720 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010372990312191405, + "loss": 0.0311, + "step": 202730 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010372022176755712, + "loss": 0.031, + "step": 202740 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001037105404132002, + "loss": 0.0345, + "step": 202750 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010370085905884325, + "loss": 0.0333, + "step": 202760 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010369117770448633, + "loss": 0.028, + "step": 202770 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001036814963501294, + "loss": 0.0359, + "step": 202780 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010367181499577248, + "loss": 0.0301, + "step": 202790 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010366213364141553, + "loss": 0.0269, + "step": 202800 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001036524522870586, + "loss": 0.0322, + "step": 202810 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010364277093270168, + "loss": 0.0245, + "step": 202820 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010363308957834473, + "loss": 0.0281, + "step": 202830 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001036234082239878, + "loss": 0.0324, + "step": 202840 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010361372686963088, + "loss": 0.0285, + "step": 202850 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010360404551527394, + "loss": 0.027, + "step": 202860 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010359436416091701, + "loss": 0.0284, + "step": 202870 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010358468280656008, + "loss": 0.0298, + "step": 202880 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010357500145220315, + "loss": 0.0315, + "step": 202890 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010356532009784621, + "loss": 0.0263, + "step": 202900 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010355563874348927, + "loss": 0.0337, + "step": 202910 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010354595738913235, + "loss": 0.0371, + "step": 202920 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010353627603477542, + "loss": 0.0265, + "step": 202930 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010352659468041847, + "loss": 0.0316, + "step": 202940 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010351691332606155, + "loss": 0.0297, + "step": 202950 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010350723197170462, + "loss": 0.0298, + "step": 202960 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010349755061734768, + "loss": 0.0289, + "step": 202970 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010348786926299075, + "loss": 0.0251, + "step": 202980 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010347818790863383, + "loss": 0.0316, + "step": 202990 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001034685065542769, + "loss": 0.0422, + "step": 203000 + }, + { + "epoch": 1.31, + "eval_cer": 0.9198933453847022, + "eval_loss": 0.022010989487171173, + "eval_runtime": 120.2296, + "eval_samples_per_second": 16.635, + "eval_steps_per_second": 4.159, + "step": 203000 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010345882519991995, + "loss": 0.0289, + "step": 203010 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010344914384556303, + "loss": 0.0281, + "step": 203020 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001034394624912061, + "loss": 0.0341, + "step": 203030 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010342978113684915, + "loss": 0.0366, + "step": 203040 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010342009978249223, + "loss": 0.0303, + "step": 203050 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001034104184281353, + "loss": 0.0316, + "step": 203060 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010340073707377837, + "loss": 0.0306, + "step": 203070 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010339105571942143, + "loss": 0.0312, + "step": 203080 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010338137436506451, + "loss": 0.0304, + "step": 203090 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010337169301070757, + "loss": 0.0294, + "step": 203100 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010336201165635063, + "loss": 0.0317, + "step": 203110 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001033523303019937, + "loss": 0.0397, + "step": 203120 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010334264894763677, + "loss": 0.0279, + "step": 203130 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010333296759327985, + "loss": 0.0306, + "step": 203140 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001033232862389229, + "loss": 0.0312, + "step": 203150 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010331360488456597, + "loss": 0.0279, + "step": 203160 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010330392353020905, + "loss": 0.0278, + "step": 203170 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001032942421758521, + "loss": 0.032, + "step": 203180 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010328456082149518, + "loss": 0.0308, + "step": 203190 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010327487946713825, + "loss": 0.0269, + "step": 203200 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010326519811278133, + "loss": 0.024, + "step": 203210 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010325551675842438, + "loss": 0.0278, + "step": 203220 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010324583540406745, + "loss": 0.0312, + "step": 203230 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010323615404971053, + "loss": 0.0347, + "step": 203240 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010322647269535358, + "loss": 0.0272, + "step": 203250 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010321679134099665, + "loss": 0.03, + "step": 203260 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010320710998663973, + "loss": 0.0272, + "step": 203270 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010319742863228279, + "loss": 0.0306, + "step": 203280 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010318774727792586, + "loss": 0.0331, + "step": 203290 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010317806592356892, + "loss": 0.0351, + "step": 203300 + }, + { + "epoch": 1.31, + "learning_rate": 0.000103168384569212, + "loss": 0.0375, + "step": 203310 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010315870321485506, + "loss": 0.0282, + "step": 203320 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010314902186049812, + "loss": 0.0313, + "step": 203330 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001031393405061412, + "loss": 0.0281, + "step": 203340 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010312965915178427, + "loss": 0.0308, + "step": 203350 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010311997779742732, + "loss": 0.0323, + "step": 203360 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001031102964430704, + "loss": 0.029, + "step": 203370 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010310061508871347, + "loss": 0.0341, + "step": 203380 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010309093373435653, + "loss": 0.0331, + "step": 203390 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001030812523799996, + "loss": 0.0402, + "step": 203400 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010307157102564268, + "loss": 0.0295, + "step": 203410 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010306188967128575, + "loss": 0.0314, + "step": 203420 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001030522083169288, + "loss": 0.0339, + "step": 203430 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010304252696257188, + "loss": 0.0412, + "step": 203440 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010303284560821495, + "loss": 0.0338, + "step": 203450 + }, + { + "epoch": 1.31, + "learning_rate": 0.000103023164253858, + "loss": 0.0313, + "step": 203460 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010301348289950108, + "loss": 0.0405, + "step": 203470 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010300380154514414, + "loss": 0.0283, + "step": 203480 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010299412019078722, + "loss": 0.0276, + "step": 203490 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010298443883643028, + "loss": 0.0325, + "step": 203500 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010297475748207336, + "loss": 0.0306, + "step": 203510 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010296507612771642, + "loss": 0.0306, + "step": 203520 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010295539477335948, + "loss": 0.0307, + "step": 203530 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010294571341900256, + "loss": 0.0267, + "step": 203540 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010293603206464562, + "loss": 0.0337, + "step": 203550 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001029263507102887, + "loss": 0.0418, + "step": 203560 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010291666935593175, + "loss": 0.0313, + "step": 203570 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010290698800157482, + "loss": 0.0301, + "step": 203580 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001028973066472179, + "loss": 0.0327, + "step": 203590 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010288762529286095, + "loss": 0.0273, + "step": 203600 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010287794393850403, + "loss": 0.0298, + "step": 203610 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001028682625841471, + "loss": 0.027, + "step": 203620 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010285858122979017, + "loss": 0.0322, + "step": 203630 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010284889987543323, + "loss": 0.0344, + "step": 203640 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001028392185210763, + "loss": 0.0313, + "step": 203650 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010282953716671938, + "loss": 0.029, + "step": 203660 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010281985581236243, + "loss": 0.0294, + "step": 203670 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001028101744580055, + "loss": 0.0293, + "step": 203680 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010280049310364858, + "loss": 0.0287, + "step": 203690 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010279081174929164, + "loss": 0.0327, + "step": 203700 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010278113039493471, + "loss": 0.0345, + "step": 203710 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010277144904057777, + "loss": 0.0303, + "step": 203720 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010276176768622084, + "loss": 0.0257, + "step": 203730 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010275208633186391, + "loss": 0.0256, + "step": 203740 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010274240497750697, + "loss": 0.0309, + "step": 203750 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010273272362315005, + "loss": 0.028, + "step": 203760 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010272304226879312, + "loss": 0.0328, + "step": 203770 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010271336091443617, + "loss": 0.026, + "step": 203780 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010270367956007925, + "loss": 0.0273, + "step": 203790 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010269399820572232, + "loss": 0.0287, + "step": 203800 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010268431685136538, + "loss": 0.0348, + "step": 203810 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010267463549700845, + "loss": 0.031, + "step": 203820 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010266495414265152, + "loss": 0.0268, + "step": 203830 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001026552727882946, + "loss": 0.0338, + "step": 203840 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010264559143393765, + "loss": 0.0338, + "step": 203850 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010263591007958073, + "loss": 0.0264, + "step": 203860 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001026262287252238, + "loss": 0.0265, + "step": 203870 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010261654737086685, + "loss": 0.0276, + "step": 203880 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010260686601650993, + "loss": 0.0279, + "step": 203890 + }, + { + "epoch": 1.32, + "learning_rate": 0.000102597184662153, + "loss": 0.0284, + "step": 203900 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010258750330779607, + "loss": 0.034, + "step": 203910 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010257782195343913, + "loss": 0.0344, + "step": 203920 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010256814059908219, + "loss": 0.0318, + "step": 203930 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010255845924472527, + "loss": 0.028, + "step": 203940 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010254877789036833, + "loss": 0.03, + "step": 203950 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001025390965360114, + "loss": 0.0297, + "step": 203960 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010252941518165447, + "loss": 0.0344, + "step": 203970 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010251973382729755, + "loss": 0.0328, + "step": 203980 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001025100524729406, + "loss": 0.0294, + "step": 203990 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010250037111858367, + "loss": 0.0301, + "step": 204000 + }, + { + "epoch": 1.32, + "eval_cer": 0.9198237487289572, + "eval_loss": 0.02146965079009533, + "eval_runtime": 120.4063, + "eval_samples_per_second": 16.61, + "eval_steps_per_second": 4.153, + "step": 204000 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010249068976422675, + "loss": 0.0301, + "step": 204010 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001024810084098698, + "loss": 0.0315, + "step": 204020 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010247132705551287, + "loss": 0.0307, + "step": 204030 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010246164570115595, + "loss": 0.0366, + "step": 204040 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010245196434679901, + "loss": 0.0315, + "step": 204050 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010244228299244208, + "loss": 0.034, + "step": 204060 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010243260163808515, + "loss": 0.0307, + "step": 204070 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010242292028372823, + "loss": 0.0268, + "step": 204080 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010241323892937128, + "loss": 0.0338, + "step": 204090 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010240355757501435, + "loss": 0.0332, + "step": 204100 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010239387622065743, + "loss": 0.0247, + "step": 204110 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010238419486630049, + "loss": 0.0291, + "step": 204120 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010237451351194354, + "loss": 0.0308, + "step": 204130 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010236483215758662, + "loss": 0.0298, + "step": 204140 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010235515080322969, + "loss": 0.0313, + "step": 204150 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010234546944887276, + "loss": 0.0344, + "step": 204160 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010233578809451582, + "loss": 0.0324, + "step": 204170 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001023261067401589, + "loss": 0.0386, + "step": 204180 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010231642538580197, + "loss": 0.0308, + "step": 204190 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010230674403144502, + "loss": 0.0298, + "step": 204200 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001022970626770881, + "loss": 0.0377, + "step": 204210 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010228738132273117, + "loss": 0.034, + "step": 204220 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010227769996837422, + "loss": 0.03, + "step": 204230 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001022680186140173, + "loss": 0.0297, + "step": 204240 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010225833725966037, + "loss": 0.0363, + "step": 204250 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010224865590530345, + "loss": 0.0292, + "step": 204260 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001022389745509465, + "loss": 0.025, + "step": 204270 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010222929319658958, + "loss": 0.0277, + "step": 204280 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010221961184223265, + "loss": 0.0302, + "step": 204290 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001022099304878757, + "loss": 0.0296, + "step": 204300 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010220024913351878, + "loss": 0.0282, + "step": 204310 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010219056777916184, + "loss": 0.0317, + "step": 204320 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010218088642480492, + "loss": 0.0264, + "step": 204330 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010217120507044798, + "loss": 0.0363, + "step": 204340 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010216152371609104, + "loss": 0.0279, + "step": 204350 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010215184236173412, + "loss": 0.0264, + "step": 204360 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010214216100737718, + "loss": 0.0241, + "step": 204370 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010213247965302025, + "loss": 0.0331, + "step": 204380 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010212279829866332, + "loss": 0.0335, + "step": 204390 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001021131169443064, + "loss": 0.0305, + "step": 204400 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010210343558994945, + "loss": 0.0389, + "step": 204410 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010209375423559252, + "loss": 0.0278, + "step": 204420 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001020840728812356, + "loss": 0.031, + "step": 204430 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010207439152687865, + "loss": 0.034, + "step": 204440 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010206471017252172, + "loss": 0.0324, + "step": 204450 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001020550288181648, + "loss": 0.027, + "step": 204460 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010204534746380786, + "loss": 0.029, + "step": 204470 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010203566610945093, + "loss": 0.0296, + "step": 204480 + }, + { + "epoch": 1.32, + "learning_rate": 0.000102025984755094, + "loss": 0.0254, + "step": 204490 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010201630340073708, + "loss": 0.0319, + "step": 204500 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010200662204638013, + "loss": 0.0239, + "step": 204510 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001019969406920232, + "loss": 0.0307, + "step": 204520 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010198725933766628, + "loss": 0.0271, + "step": 204530 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010197757798330934, + "loss": 0.0345, + "step": 204540 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001019678966289524, + "loss": 0.0346, + "step": 204550 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010195821527459547, + "loss": 0.0348, + "step": 204560 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010194853392023854, + "loss": 0.0278, + "step": 204570 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010193885256588161, + "loss": 0.032, + "step": 204580 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010192917121152467, + "loss": 0.0312, + "step": 204590 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010191948985716775, + "loss": 0.029, + "step": 204600 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010190980850281082, + "loss": 0.0282, + "step": 204610 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010190012714845387, + "loss": 0.0255, + "step": 204620 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010189044579409695, + "loss": 0.0335, + "step": 204630 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010188076443974002, + "loss": 0.0318, + "step": 204640 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010187108308538307, + "loss": 0.0296, + "step": 204650 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010186140173102615, + "loss": 0.0315, + "step": 204660 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010185172037666922, + "loss": 0.0329, + "step": 204670 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001018420390223123, + "loss": 0.0268, + "step": 204680 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010183235766795535, + "loss": 0.0374, + "step": 204690 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010182267631359843, + "loss": 0.032, + "step": 204700 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001018129949592415, + "loss": 0.0347, + "step": 204710 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010180331360488455, + "loss": 0.03, + "step": 204720 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010179363225052763, + "loss": 0.0291, + "step": 204730 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001017839508961707, + "loss": 0.0288, + "step": 204740 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010177426954181377, + "loss": 0.0273, + "step": 204750 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010176458818745683, + "loss": 0.0294, + "step": 204760 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010175490683309989, + "loss": 0.0354, + "step": 204770 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010174522547874297, + "loss": 0.0328, + "step": 204780 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010173554412438602, + "loss": 0.0301, + "step": 204790 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001017258627700291, + "loss": 0.029, + "step": 204800 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010171618141567217, + "loss": 0.0333, + "step": 204810 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010170650006131524, + "loss": 0.028, + "step": 204820 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001016968187069583, + "loss": 0.0321, + "step": 204830 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010168713735260137, + "loss": 0.0351, + "step": 204840 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010167745599824445, + "loss": 0.0329, + "step": 204850 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001016677746438875, + "loss": 0.0263, + "step": 204860 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010165809328953057, + "loss": 0.0336, + "step": 204870 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010164841193517365, + "loss": 0.0262, + "step": 204880 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001016387305808167, + "loss": 0.0304, + "step": 204890 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010162904922645978, + "loss": 0.0338, + "step": 204900 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010161936787210285, + "loss": 0.0259, + "step": 204910 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010160968651774591, + "loss": 0.0281, + "step": 204920 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010160000516338898, + "loss": 0.025, + "step": 204930 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010159032380903205, + "loss": 0.0303, + "step": 204940 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010158064245467513, + "loss": 0.0287, + "step": 204950 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010157096110031818, + "loss": 0.0304, + "step": 204960 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010156127974596124, + "loss": 0.0308, + "step": 204970 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010155159839160432, + "loss": 0.0253, + "step": 204980 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010154191703724739, + "loss": 0.0236, + "step": 204990 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010153223568289046, + "loss": 0.0293, + "step": 205000 + }, + { + "epoch": 1.32, + "eval_cer": 0.9198472488984295, + "eval_loss": 0.021727943792939186, + "eval_runtime": 120.2177, + "eval_samples_per_second": 16.636, + "eval_steps_per_second": 4.159, + "step": 205000 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010152255432853352, + "loss": 0.0271, + "step": 205010 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010151287297417659, + "loss": 0.0265, + "step": 205020 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010150319161981966, + "loss": 0.0303, + "step": 205030 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010149351026546272, + "loss": 0.027, + "step": 205040 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001014838289111058, + "loss": 0.0293, + "step": 205050 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010147414755674887, + "loss": 0.0351, + "step": 205060 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010146446620239192, + "loss": 0.0244, + "step": 205070 + }, + { + "epoch": 1.32, + "learning_rate": 0.000101454784848035, + "loss": 0.0343, + "step": 205080 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010144510349367807, + "loss": 0.028, + "step": 205090 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010143542213932113, + "loss": 0.0276, + "step": 205100 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001014257407849642, + "loss": 0.0294, + "step": 205110 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010141605943060727, + "loss": 0.0325, + "step": 205120 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010140637807625034, + "loss": 0.0301, + "step": 205130 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001013966967218934, + "loss": 0.0309, + "step": 205140 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010138701536753648, + "loss": 0.0337, + "step": 205150 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010137733401317954, + "loss": 0.0316, + "step": 205160 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001013676526588226, + "loss": 0.0289, + "step": 205170 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010135797130446568, + "loss": 0.0301, + "step": 205180 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010134828995010874, + "loss": 0.0284, + "step": 205190 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010133860859575182, + "loss": 0.0298, + "step": 205200 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010132892724139487, + "loss": 0.0285, + "step": 205210 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010131924588703794, + "loss": 0.025, + "step": 205220 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010130956453268102, + "loss": 0.0295, + "step": 205230 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010129988317832407, + "loss": 0.0292, + "step": 205240 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010129020182396715, + "loss": 0.0275, + "step": 205250 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010128052046961022, + "loss": 0.0406, + "step": 205260 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001012708391152533, + "loss": 0.0274, + "step": 205270 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010126115776089635, + "loss": 0.0284, + "step": 205280 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010125147640653942, + "loss": 0.0269, + "step": 205290 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001012417950521825, + "loss": 0.0342, + "step": 205300 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010123211369782555, + "loss": 0.0375, + "step": 205310 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010122243234346862, + "loss": 0.0268, + "step": 205320 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001012127509891117, + "loss": 0.032, + "step": 205330 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010120306963475476, + "loss": 0.0287, + "step": 205340 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010119338828039783, + "loss": 0.0261, + "step": 205350 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001011837069260409, + "loss": 0.0328, + "step": 205360 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010117402557168398, + "loss": 0.0337, + "step": 205370 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010116434421732703, + "loss": 0.0274, + "step": 205380 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001011546628629701, + "loss": 0.0313, + "step": 205390 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010114498150861317, + "loss": 0.0301, + "step": 205400 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010113530015425624, + "loss": 0.0377, + "step": 205410 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010112561879989929, + "loss": 0.0305, + "step": 205420 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010111593744554237, + "loss": 0.026, + "step": 205430 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010110625609118544, + "loss": 0.0296, + "step": 205440 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001010965747368285, + "loss": 0.0318, + "step": 205450 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010108689338247157, + "loss": 0.0328, + "step": 205460 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010107721202811465, + "loss": 0.0317, + "step": 205470 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010106753067375772, + "loss": 0.027, + "step": 205480 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010105784931940077, + "loss": 0.0279, + "step": 205490 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010104816796504385, + "loss": 0.0324, + "step": 205500 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010103848661068692, + "loss": 0.0278, + "step": 205510 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010102880525632997, + "loss": 0.0287, + "step": 205520 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010101912390197305, + "loss": 0.0351, + "step": 205530 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010100944254761611, + "loss": 0.0328, + "step": 205540 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001009997611932592, + "loss": 0.0289, + "step": 205550 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010099007983890225, + "loss": 0.0286, + "step": 205560 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010098039848454533, + "loss": 0.031, + "step": 205570 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001009707171301884, + "loss": 0.0244, + "step": 205580 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010096103577583145, + "loss": 0.0257, + "step": 205590 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010095135442147453, + "loss": 0.0343, + "step": 205600 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010094167306711759, + "loss": 0.0286, + "step": 205610 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010093199171276067, + "loss": 0.0309, + "step": 205620 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010092231035840372, + "loss": 0.0293, + "step": 205630 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010091262900404679, + "loss": 0.0282, + "step": 205640 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010090294764968987, + "loss": 0.0269, + "step": 205650 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010089326629533292, + "loss": 0.0413, + "step": 205660 + }, + { + "epoch": 1.33, + "learning_rate": 0.000100883584940976, + "loss": 0.0273, + "step": 205670 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010087390358661907, + "loss": 0.0259, + "step": 205680 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010086422223226215, + "loss": 0.03, + "step": 205690 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001008545408779052, + "loss": 0.0275, + "step": 205700 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010084485952354827, + "loss": 0.0265, + "step": 205710 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010083517816919135, + "loss": 0.0348, + "step": 205720 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001008254968148344, + "loss": 0.0322, + "step": 205730 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010081581546047747, + "loss": 0.0322, + "step": 205740 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010080613410612055, + "loss": 0.0351, + "step": 205750 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010079645275176361, + "loss": 0.0277, + "step": 205760 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010078677139740668, + "loss": 0.0379, + "step": 205770 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010077709004304975, + "loss": 0.0286, + "step": 205780 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010076740868869283, + "loss": 0.0262, + "step": 205790 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010075772733433588, + "loss": 0.0266, + "step": 205800 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010074804597997894, + "loss": 0.0272, + "step": 205810 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010073836462562202, + "loss": 0.0286, + "step": 205820 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010072868327126509, + "loss": 0.0264, + "step": 205830 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010071900191690814, + "loss": 0.0272, + "step": 205840 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010070932056255122, + "loss": 0.0324, + "step": 205850 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010069963920819429, + "loss": 0.0284, + "step": 205860 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010068995785383735, + "loss": 0.0306, + "step": 205870 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010068027649948042, + "loss": 0.0314, + "step": 205880 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001006705951451235, + "loss": 0.033, + "step": 205890 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010066091379076657, + "loss": 0.0314, + "step": 205900 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010065123243640962, + "loss": 0.0277, + "step": 205910 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001006415510820527, + "loss": 0.0249, + "step": 205920 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010063186972769577, + "loss": 0.0271, + "step": 205930 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010062218837333882, + "loss": 0.028, + "step": 205940 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001006125070189819, + "loss": 0.026, + "step": 205950 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010060282566462496, + "loss": 0.0276, + "step": 205960 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010059314431026804, + "loss": 0.0292, + "step": 205970 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001005834629559111, + "loss": 0.0283, + "step": 205980 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010057378160155418, + "loss": 0.0244, + "step": 205990 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010056410024719724, + "loss": 0.0347, + "step": 206000 + }, + { + "epoch": 1.33, + "eval_cer": 0.9198969607953904, + "eval_loss": 0.021649910137057304, + "eval_runtime": 120.1272, + "eval_samples_per_second": 16.649, + "eval_steps_per_second": 4.162, + "step": 206000 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001005544188928403, + "loss": 0.0304, + "step": 206010 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010054473753848338, + "loss": 0.0347, + "step": 206020 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010053505618412644, + "loss": 0.0286, + "step": 206030 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010052537482976952, + "loss": 0.0311, + "step": 206040 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010051569347541257, + "loss": 0.0348, + "step": 206050 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010050601212105564, + "loss": 0.0289, + "step": 206060 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010049633076669872, + "loss": 0.0292, + "step": 206070 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010048664941234177, + "loss": 0.0307, + "step": 206080 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010047696805798485, + "loss": 0.0242, + "step": 206090 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010046728670362792, + "loss": 0.0299, + "step": 206100 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010045760534927099, + "loss": 0.0295, + "step": 206110 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010044792399491405, + "loss": 0.0302, + "step": 206120 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010043824264055712, + "loss": 0.031, + "step": 206130 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001004285612862002, + "loss": 0.0335, + "step": 206140 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010041887993184325, + "loss": 0.0297, + "step": 206150 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010040919857748632, + "loss": 0.0317, + "step": 206160 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001003995172231294, + "loss": 0.0268, + "step": 206170 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010038983586877246, + "loss": 0.0312, + "step": 206180 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010038015451441553, + "loss": 0.0346, + "step": 206190 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001003704731600586, + "loss": 0.0354, + "step": 206200 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010036079180570166, + "loss": 0.029, + "step": 206210 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010035111045134473, + "loss": 0.0299, + "step": 206220 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001003414290969878, + "loss": 0.027, + "step": 206230 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010033174774263087, + "loss": 0.028, + "step": 206240 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010032206638827394, + "loss": 0.0303, + "step": 206250 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010031238503391699, + "loss": 0.0284, + "step": 206260 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010030270367956007, + "loss": 0.0321, + "step": 206270 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010029302232520314, + "loss": 0.0339, + "step": 206280 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001002833409708462, + "loss": 0.0302, + "step": 206290 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010027365961648927, + "loss": 0.0268, + "step": 206300 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010026397826213234, + "loss": 0.032, + "step": 206310 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010025429690777542, + "loss": 0.0311, + "step": 206320 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010024461555341847, + "loss": 0.0269, + "step": 206330 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010023493419906155, + "loss": 0.0256, + "step": 206340 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010022525284470462, + "loss": 0.0269, + "step": 206350 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010021557149034767, + "loss": 0.0275, + "step": 206360 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010020589013599075, + "loss": 0.0314, + "step": 206370 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010019620878163381, + "loss": 0.0291, + "step": 206380 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001001865274272769, + "loss": 0.0337, + "step": 206390 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010017684607291995, + "loss": 0.0227, + "step": 206400 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010016716471856301, + "loss": 0.0275, + "step": 206410 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010015748336420609, + "loss": 0.0282, + "step": 206420 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010014780200984915, + "loss": 0.0288, + "step": 206430 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010013812065549223, + "loss": 0.0326, + "step": 206440 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010012843930113529, + "loss": 0.025, + "step": 206450 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010011875794677837, + "loss": 0.0293, + "step": 206460 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010010907659242142, + "loss": 0.0325, + "step": 206470 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010009939523806449, + "loss": 0.0315, + "step": 206480 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010008971388370757, + "loss": 0.0299, + "step": 206490 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010008003252935062, + "loss": 0.0272, + "step": 206500 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001000703511749937, + "loss": 0.0368, + "step": 206510 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010006066982063677, + "loss": 0.0309, + "step": 206520 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010005098846627984, + "loss": 0.0308, + "step": 206530 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001000413071119229, + "loss": 0.0284, + "step": 206540 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010003162575756597, + "loss": 0.027, + "step": 206550 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010002194440320905, + "loss": 0.0274, + "step": 206560 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001000122630488521, + "loss": 0.0301, + "step": 206570 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010000258169449517, + "loss": 0.0292, + "step": 206580 + }, + { + "epoch": 1.33, + "learning_rate": 9.999290034013825e-05, + "loss": 0.0307, + "step": 206590 + }, + { + "epoch": 1.33, + "learning_rate": 9.998321898578131e-05, + "loss": 0.0362, + "step": 206600 + }, + { + "epoch": 1.33, + "learning_rate": 9.997353763142438e-05, + "loss": 0.0376, + "step": 206610 + }, + { + "epoch": 1.33, + "learning_rate": 9.996385627706744e-05, + "loss": 0.0274, + "step": 206620 + }, + { + "epoch": 1.33, + "learning_rate": 9.995417492271051e-05, + "loss": 0.0349, + "step": 206630 + }, + { + "epoch": 1.33, + "learning_rate": 9.994449356835358e-05, + "loss": 0.032, + "step": 206640 + }, + { + "epoch": 1.33, + "learning_rate": 9.993481221399664e-05, + "loss": 0.0344, + "step": 206650 + }, + { + "epoch": 1.33, + "learning_rate": 9.992513085963972e-05, + "loss": 0.0297, + "step": 206660 + }, + { + "epoch": 1.33, + "learning_rate": 9.991544950528279e-05, + "loss": 0.0311, + "step": 206670 + }, + { + "epoch": 1.33, + "learning_rate": 9.990576815092584e-05, + "loss": 0.0253, + "step": 206680 + }, + { + "epoch": 1.33, + "learning_rate": 9.989608679656892e-05, + "loss": 0.03, + "step": 206690 + }, + { + "epoch": 1.33, + "learning_rate": 9.988640544221199e-05, + "loss": 0.0267, + "step": 206700 + }, + { + "epoch": 1.33, + "learning_rate": 9.987672408785505e-05, + "loss": 0.0266, + "step": 206710 + }, + { + "epoch": 1.33, + "learning_rate": 9.986704273349812e-05, + "loss": 0.0344, + "step": 206720 + }, + { + "epoch": 1.33, + "learning_rate": 9.985736137914119e-05, + "loss": 0.0292, + "step": 206730 + }, + { + "epoch": 1.33, + "learning_rate": 9.984768002478427e-05, + "loss": 0.0367, + "step": 206740 + }, + { + "epoch": 1.33, + "learning_rate": 9.983799867042732e-05, + "loss": 0.0299, + "step": 206750 + }, + { + "epoch": 1.33, + "learning_rate": 9.98283173160704e-05, + "loss": 0.0319, + "step": 206760 + }, + { + "epoch": 1.33, + "learning_rate": 9.981863596171347e-05, + "loss": 0.0321, + "step": 206770 + }, + { + "epoch": 1.33, + "learning_rate": 9.980895460735652e-05, + "loss": 0.0354, + "step": 206780 + }, + { + "epoch": 1.33, + "learning_rate": 9.97992732529996e-05, + "loss": 0.0303, + "step": 206790 + }, + { + "epoch": 1.33, + "learning_rate": 9.978959189864266e-05, + "loss": 0.0287, + "step": 206800 + }, + { + "epoch": 1.33, + "learning_rate": 9.977991054428574e-05, + "loss": 0.0304, + "step": 206810 + }, + { + "epoch": 1.33, + "learning_rate": 9.97702291899288e-05, + "loss": 0.0278, + "step": 206820 + }, + { + "epoch": 1.33, + "learning_rate": 9.976054783557186e-05, + "loss": 0.0291, + "step": 206830 + }, + { + "epoch": 1.33, + "learning_rate": 9.975086648121494e-05, + "loss": 0.0333, + "step": 206840 + }, + { + "epoch": 1.34, + "learning_rate": 9.9741185126858e-05, + "loss": 0.0327, + "step": 206850 + }, + { + "epoch": 1.34, + "learning_rate": 9.973150377250108e-05, + "loss": 0.0253, + "step": 206860 + }, + { + "epoch": 1.34, + "learning_rate": 9.972182241814414e-05, + "loss": 0.0288, + "step": 206870 + }, + { + "epoch": 1.34, + "learning_rate": 9.971214106378722e-05, + "loss": 0.0275, + "step": 206880 + }, + { + "epoch": 1.34, + "learning_rate": 9.970245970943027e-05, + "loss": 0.0321, + "step": 206890 + }, + { + "epoch": 1.34, + "learning_rate": 9.969277835507334e-05, + "loss": 0.032, + "step": 206900 + }, + { + "epoch": 1.34, + "learning_rate": 9.968309700071642e-05, + "loss": 0.0252, + "step": 206910 + }, + { + "epoch": 1.34, + "learning_rate": 9.967341564635947e-05, + "loss": 0.0317, + "step": 206920 + }, + { + "epoch": 1.34, + "learning_rate": 9.966373429200254e-05, + "loss": 0.0279, + "step": 206930 + }, + { + "epoch": 1.34, + "learning_rate": 9.965405293764562e-05, + "loss": 0.0284, + "step": 206940 + }, + { + "epoch": 1.34, + "learning_rate": 9.964437158328868e-05, + "loss": 0.0292, + "step": 206950 + }, + { + "epoch": 1.34, + "learning_rate": 9.963469022893175e-05, + "loss": 0.0317, + "step": 206960 + }, + { + "epoch": 1.34, + "learning_rate": 9.962500887457482e-05, + "loss": 0.0324, + "step": 206970 + }, + { + "epoch": 1.34, + "learning_rate": 9.96153275202179e-05, + "loss": 0.0344, + "step": 206980 + }, + { + "epoch": 1.34, + "learning_rate": 9.960564616586095e-05, + "loss": 0.0309, + "step": 206990 + }, + { + "epoch": 1.34, + "learning_rate": 9.959596481150402e-05, + "loss": 0.0288, + "step": 207000 + }, + { + "epoch": 1.34, + "eval_cer": 0.9198942492373743, + "eval_loss": 0.02147371508181095, + "eval_runtime": 120.1748, + "eval_samples_per_second": 16.642, + "eval_steps_per_second": 4.161, + "step": 207000 + }, + { + "epoch": 1.34, + "learning_rate": 9.95862834571471e-05, + "loss": 0.029, + "step": 207010 + }, + { + "epoch": 1.34, + "learning_rate": 9.957660210279016e-05, + "loss": 0.0309, + "step": 207020 + }, + { + "epoch": 1.34, + "learning_rate": 9.956692074843321e-05, + "loss": 0.0331, + "step": 207030 + }, + { + "epoch": 1.34, + "learning_rate": 9.95572393940763e-05, + "loss": 0.0278, + "step": 207040 + }, + { + "epoch": 1.34, + "learning_rate": 9.954755803971936e-05, + "loss": 0.026, + "step": 207050 + }, + { + "epoch": 1.34, + "learning_rate": 9.953787668536243e-05, + "loss": 0.0315, + "step": 207060 + }, + { + "epoch": 1.34, + "learning_rate": 9.95281953310055e-05, + "loss": 0.0337, + "step": 207070 + }, + { + "epoch": 1.34, + "learning_rate": 9.951851397664857e-05, + "loss": 0.0323, + "step": 207080 + }, + { + "epoch": 1.34, + "learning_rate": 9.950883262229164e-05, + "loss": 0.027, + "step": 207090 + }, + { + "epoch": 1.34, + "learning_rate": 9.949915126793469e-05, + "loss": 0.0277, + "step": 207100 + }, + { + "epoch": 1.34, + "learning_rate": 9.948946991357777e-05, + "loss": 0.0273, + "step": 207110 + }, + { + "epoch": 1.34, + "learning_rate": 9.947978855922084e-05, + "loss": 0.0259, + "step": 207120 + }, + { + "epoch": 1.34, + "learning_rate": 9.947010720486389e-05, + "loss": 0.0271, + "step": 207130 + }, + { + "epoch": 1.34, + "learning_rate": 9.946042585050697e-05, + "loss": 0.0295, + "step": 207140 + }, + { + "epoch": 1.34, + "learning_rate": 9.945074449615004e-05, + "loss": 0.0336, + "step": 207150 + }, + { + "epoch": 1.34, + "learning_rate": 9.944106314179312e-05, + "loss": 0.0341, + "step": 207160 + }, + { + "epoch": 1.34, + "learning_rate": 9.943138178743617e-05, + "loss": 0.0281, + "step": 207170 + }, + { + "epoch": 1.34, + "learning_rate": 9.942170043307925e-05, + "loss": 0.0332, + "step": 207180 + }, + { + "epoch": 1.34, + "learning_rate": 9.941201907872232e-05, + "loss": 0.0223, + "step": 207190 + }, + { + "epoch": 1.34, + "learning_rate": 9.940233772436537e-05, + "loss": 0.0299, + "step": 207200 + }, + { + "epoch": 1.34, + "learning_rate": 9.939265637000845e-05, + "loss": 0.0281, + "step": 207210 + }, + { + "epoch": 1.34, + "learning_rate": 9.938297501565151e-05, + "loss": 0.0284, + "step": 207220 + }, + { + "epoch": 1.34, + "learning_rate": 9.93732936612946e-05, + "loss": 0.0266, + "step": 207230 + }, + { + "epoch": 1.34, + "learning_rate": 9.936361230693765e-05, + "loss": 0.0319, + "step": 207240 + }, + { + "epoch": 1.34, + "learning_rate": 9.935393095258071e-05, + "loss": 0.028, + "step": 207250 + }, + { + "epoch": 1.34, + "learning_rate": 9.934424959822379e-05, + "loss": 0.0317, + "step": 207260 + }, + { + "epoch": 1.34, + "learning_rate": 9.933456824386685e-05, + "loss": 0.0277, + "step": 207270 + }, + { + "epoch": 1.34, + "learning_rate": 9.932488688950993e-05, + "loss": 0.032, + "step": 207280 + }, + { + "epoch": 1.34, + "learning_rate": 9.931520553515299e-05, + "loss": 0.0267, + "step": 207290 + }, + { + "epoch": 1.34, + "learning_rate": 9.930552418079607e-05, + "loss": 0.0301, + "step": 207300 + }, + { + "epoch": 1.34, + "learning_rate": 9.929584282643912e-05, + "loss": 0.0276, + "step": 207310 + }, + { + "epoch": 1.34, + "learning_rate": 9.928616147208219e-05, + "loss": 0.0289, + "step": 207320 + }, + { + "epoch": 1.34, + "learning_rate": 9.927648011772527e-05, + "loss": 0.0307, + "step": 207330 + }, + { + "epoch": 1.34, + "learning_rate": 9.926679876336832e-05, + "loss": 0.0293, + "step": 207340 + }, + { + "epoch": 1.34, + "learning_rate": 9.925711740901139e-05, + "loss": 0.0309, + "step": 207350 + }, + { + "epoch": 1.34, + "learning_rate": 9.924743605465447e-05, + "loss": 0.031, + "step": 207360 + }, + { + "epoch": 1.34, + "learning_rate": 9.923775470029753e-05, + "loss": 0.0369, + "step": 207370 + }, + { + "epoch": 1.34, + "learning_rate": 9.92280733459406e-05, + "loss": 0.0265, + "step": 207380 + }, + { + "epoch": 1.34, + "learning_rate": 9.921839199158367e-05, + "loss": 0.0294, + "step": 207390 + }, + { + "epoch": 1.34, + "learning_rate": 9.920871063722675e-05, + "loss": 0.0276, + "step": 207400 + }, + { + "epoch": 1.34, + "learning_rate": 9.91990292828698e-05, + "loss": 0.0341, + "step": 207410 + }, + { + "epoch": 1.34, + "learning_rate": 9.918934792851287e-05, + "loss": 0.0261, + "step": 207420 + }, + { + "epoch": 1.34, + "learning_rate": 9.917966657415595e-05, + "loss": 0.0315, + "step": 207430 + }, + { + "epoch": 1.34, + "learning_rate": 9.916998521979901e-05, + "loss": 0.0298, + "step": 207440 + }, + { + "epoch": 1.34, + "learning_rate": 9.916030386544206e-05, + "loss": 0.0258, + "step": 207450 + }, + { + "epoch": 1.34, + "learning_rate": 9.915062251108514e-05, + "loss": 0.0337, + "step": 207460 + }, + { + "epoch": 1.34, + "learning_rate": 9.914094115672821e-05, + "loss": 0.0357, + "step": 207470 + }, + { + "epoch": 1.34, + "learning_rate": 9.913125980237128e-05, + "loss": 0.0292, + "step": 207480 + }, + { + "epoch": 1.34, + "learning_rate": 9.912157844801434e-05, + "loss": 0.0333, + "step": 207490 + }, + { + "epoch": 1.34, + "learning_rate": 9.911189709365742e-05, + "loss": 0.0296, + "step": 207500 + }, + { + "epoch": 1.34, + "learning_rate": 9.910221573930049e-05, + "loss": 0.0293, + "step": 207510 + }, + { + "epoch": 1.34, + "learning_rate": 9.909253438494354e-05, + "loss": 0.0253, + "step": 207520 + }, + { + "epoch": 1.34, + "learning_rate": 9.908285303058662e-05, + "loss": 0.0327, + "step": 207530 + }, + { + "epoch": 1.34, + "learning_rate": 9.907317167622969e-05, + "loss": 0.0347, + "step": 207540 + }, + { + "epoch": 1.34, + "learning_rate": 9.906349032187274e-05, + "loss": 0.0348, + "step": 207550 + }, + { + "epoch": 1.34, + "learning_rate": 9.905380896751582e-05, + "loss": 0.0306, + "step": 207560 + }, + { + "epoch": 1.34, + "learning_rate": 9.904412761315889e-05, + "loss": 0.0316, + "step": 207570 + }, + { + "epoch": 1.34, + "learning_rate": 9.903444625880197e-05, + "loss": 0.0341, + "step": 207580 + }, + { + "epoch": 1.34, + "learning_rate": 9.902476490444502e-05, + "loss": 0.0392, + "step": 207590 + }, + { + "epoch": 1.34, + "learning_rate": 9.90150835500881e-05, + "loss": 0.0362, + "step": 207600 + }, + { + "epoch": 1.34, + "learning_rate": 9.900540219573117e-05, + "loss": 0.028, + "step": 207610 + }, + { + "epoch": 1.34, + "learning_rate": 9.899572084137422e-05, + "loss": 0.0309, + "step": 207620 + }, + { + "epoch": 1.34, + "learning_rate": 9.89860394870173e-05, + "loss": 0.0282, + "step": 207630 + }, + { + "epoch": 1.34, + "learning_rate": 9.897635813266036e-05, + "loss": 0.032, + "step": 207640 + }, + { + "epoch": 1.34, + "learning_rate": 9.896667677830344e-05, + "loss": 0.0362, + "step": 207650 + }, + { + "epoch": 1.34, + "learning_rate": 9.89569954239465e-05, + "loss": 0.0361, + "step": 207660 + }, + { + "epoch": 1.34, + "learning_rate": 9.894731406958956e-05, + "loss": 0.033, + "step": 207670 + }, + { + "epoch": 1.34, + "learning_rate": 9.893763271523264e-05, + "loss": 0.0313, + "step": 207680 + }, + { + "epoch": 1.34, + "learning_rate": 9.89279513608757e-05, + "loss": 0.0338, + "step": 207690 + }, + { + "epoch": 1.34, + "learning_rate": 9.891827000651877e-05, + "loss": 0.0296, + "step": 207700 + }, + { + "epoch": 1.34, + "learning_rate": 9.890858865216184e-05, + "loss": 0.026, + "step": 207710 + }, + { + "epoch": 1.34, + "learning_rate": 9.889890729780491e-05, + "loss": 0.0313, + "step": 207720 + }, + { + "epoch": 1.34, + "learning_rate": 9.888922594344797e-05, + "loss": 0.0295, + "step": 207730 + }, + { + "epoch": 1.34, + "learning_rate": 9.887954458909104e-05, + "loss": 0.0296, + "step": 207740 + }, + { + "epoch": 1.34, + "learning_rate": 9.886986323473412e-05, + "loss": 0.0316, + "step": 207750 + }, + { + "epoch": 1.34, + "learning_rate": 9.886018188037717e-05, + "loss": 0.0263, + "step": 207760 + }, + { + "epoch": 1.34, + "learning_rate": 9.885050052602024e-05, + "loss": 0.0336, + "step": 207770 + }, + { + "epoch": 1.34, + "learning_rate": 9.884081917166332e-05, + "loss": 0.0244, + "step": 207780 + }, + { + "epoch": 1.34, + "learning_rate": 9.883113781730638e-05, + "loss": 0.0278, + "step": 207790 + }, + { + "epoch": 1.34, + "learning_rate": 9.882145646294945e-05, + "loss": 0.0288, + "step": 207800 + }, + { + "epoch": 1.34, + "learning_rate": 9.881177510859252e-05, + "loss": 0.0286, + "step": 207810 + }, + { + "epoch": 1.34, + "learning_rate": 9.880209375423558e-05, + "loss": 0.0285, + "step": 207820 + }, + { + "epoch": 1.34, + "learning_rate": 9.879241239987865e-05, + "loss": 0.0281, + "step": 207830 + }, + { + "epoch": 1.34, + "learning_rate": 9.878273104552172e-05, + "loss": 0.0313, + "step": 207840 + }, + { + "epoch": 1.34, + "learning_rate": 9.87730496911648e-05, + "loss": 0.0306, + "step": 207850 + }, + { + "epoch": 1.34, + "learning_rate": 9.876336833680786e-05, + "loss": 0.0298, + "step": 207860 + }, + { + "epoch": 1.34, + "learning_rate": 9.875368698245091e-05, + "loss": 0.0303, + "step": 207870 + }, + { + "epoch": 1.34, + "learning_rate": 9.8744005628094e-05, + "loss": 0.0314, + "step": 207880 + }, + { + "epoch": 1.34, + "learning_rate": 9.873432427373706e-05, + "loss": 0.0264, + "step": 207890 + }, + { + "epoch": 1.34, + "learning_rate": 9.872464291938013e-05, + "loss": 0.0273, + "step": 207900 + }, + { + "epoch": 1.34, + "learning_rate": 9.871496156502319e-05, + "loss": 0.0271, + "step": 207910 + }, + { + "epoch": 1.34, + "learning_rate": 9.870528021066626e-05, + "loss": 0.0296, + "step": 207920 + }, + { + "epoch": 1.34, + "learning_rate": 9.869559885630934e-05, + "loss": 0.0263, + "step": 207930 + }, + { + "epoch": 1.34, + "learning_rate": 9.868591750195239e-05, + "loss": 0.0297, + "step": 207940 + }, + { + "epoch": 1.34, + "learning_rate": 9.867623614759547e-05, + "loss": 0.033, + "step": 207950 + }, + { + "epoch": 1.34, + "learning_rate": 9.866655479323854e-05, + "loss": 0.0331, + "step": 207960 + }, + { + "epoch": 1.34, + "learning_rate": 9.865687343888159e-05, + "loss": 0.0246, + "step": 207970 + }, + { + "epoch": 1.34, + "learning_rate": 9.864719208452467e-05, + "loss": 0.0303, + "step": 207980 + }, + { + "epoch": 1.34, + "learning_rate": 9.863751073016774e-05, + "loss": 0.0266, + "step": 207990 + }, + { + "epoch": 1.34, + "learning_rate": 9.862782937581082e-05, + "loss": 0.0264, + "step": 208000 + }, + { + "epoch": 1.34, + "eval_cer": 0.91987888374195, + "eval_loss": 0.02161572314798832, + "eval_runtime": 120.2015, + "eval_samples_per_second": 16.639, + "eval_steps_per_second": 4.16, + "step": 208000 + }, + { + "epoch": 1.34, + "learning_rate": 9.861814802145387e-05, + "loss": 0.0352, + "step": 208010 + }, + { + "epoch": 1.34, + "learning_rate": 9.860846666709694e-05, + "loss": 0.0295, + "step": 208020 + }, + { + "epoch": 1.34, + "learning_rate": 9.859878531274001e-05, + "loss": 0.0302, + "step": 208030 + }, + { + "epoch": 1.34, + "learning_rate": 9.858910395838307e-05, + "loss": 0.0315, + "step": 208040 + }, + { + "epoch": 1.34, + "learning_rate": 9.857942260402615e-05, + "loss": 0.0343, + "step": 208050 + }, + { + "epoch": 1.34, + "learning_rate": 9.856974124966921e-05, + "loss": 0.0287, + "step": 208060 + }, + { + "epoch": 1.34, + "learning_rate": 9.85600598953123e-05, + "loss": 0.0283, + "step": 208070 + }, + { + "epoch": 1.34, + "learning_rate": 9.855037854095535e-05, + "loss": 0.0243, + "step": 208080 + }, + { + "epoch": 1.34, + "learning_rate": 9.854069718659841e-05, + "loss": 0.0318, + "step": 208090 + }, + { + "epoch": 1.34, + "learning_rate": 9.853101583224149e-05, + "loss": 0.0308, + "step": 208100 + }, + { + "epoch": 1.34, + "learning_rate": 9.852133447788454e-05, + "loss": 0.0278, + "step": 208110 + }, + { + "epoch": 1.34, + "learning_rate": 9.851165312352761e-05, + "loss": 0.0353, + "step": 208120 + }, + { + "epoch": 1.34, + "learning_rate": 9.850197176917069e-05, + "loss": 0.0323, + "step": 208130 + }, + { + "epoch": 1.34, + "learning_rate": 9.849229041481376e-05, + "loss": 0.0281, + "step": 208140 + }, + { + "epoch": 1.34, + "learning_rate": 9.848260906045682e-05, + "loss": 0.0342, + "step": 208150 + }, + { + "epoch": 1.34, + "learning_rate": 9.847292770609989e-05, + "loss": 0.0262, + "step": 208160 + }, + { + "epoch": 1.34, + "learning_rate": 9.846324635174297e-05, + "loss": 0.0361, + "step": 208170 + }, + { + "epoch": 1.34, + "learning_rate": 9.845356499738602e-05, + "loss": 0.0272, + "step": 208180 + }, + { + "epoch": 1.34, + "learning_rate": 9.844388364302909e-05, + "loss": 0.0292, + "step": 208190 + }, + { + "epoch": 1.34, + "learning_rate": 9.843420228867217e-05, + "loss": 0.0287, + "step": 208200 + }, + { + "epoch": 1.34, + "learning_rate": 9.842452093431523e-05, + "loss": 0.0315, + "step": 208210 + }, + { + "epoch": 1.34, + "learning_rate": 9.841483957995829e-05, + "loss": 0.0259, + "step": 208220 + }, + { + "epoch": 1.34, + "learning_rate": 9.840515822560137e-05, + "loss": 0.0269, + "step": 208230 + }, + { + "epoch": 1.34, + "learning_rate": 9.839547687124443e-05, + "loss": 0.0322, + "step": 208240 + }, + { + "epoch": 1.34, + "learning_rate": 9.83857955168875e-05, + "loss": 0.03, + "step": 208250 + }, + { + "epoch": 1.34, + "learning_rate": 9.837611416253057e-05, + "loss": 0.0272, + "step": 208260 + }, + { + "epoch": 1.34, + "learning_rate": 9.836643280817365e-05, + "loss": 0.0283, + "step": 208270 + }, + { + "epoch": 1.34, + "learning_rate": 9.835675145381671e-05, + "loss": 0.0312, + "step": 208280 + }, + { + "epoch": 1.34, + "learning_rate": 9.834707009945976e-05, + "loss": 0.0278, + "step": 208290 + }, + { + "epoch": 1.34, + "learning_rate": 9.833738874510284e-05, + "loss": 0.0266, + "step": 208300 + }, + { + "epoch": 1.34, + "learning_rate": 9.832770739074591e-05, + "loss": 0.0331, + "step": 208310 + }, + { + "epoch": 1.34, + "learning_rate": 9.831802603638896e-05, + "loss": 0.0324, + "step": 208320 + }, + { + "epoch": 1.34, + "learning_rate": 9.830834468203204e-05, + "loss": 0.034, + "step": 208330 + }, + { + "epoch": 1.34, + "learning_rate": 9.829866332767511e-05, + "loss": 0.0275, + "step": 208340 + }, + { + "epoch": 1.34, + "learning_rate": 9.828898197331818e-05, + "loss": 0.0288, + "step": 208350 + }, + { + "epoch": 1.34, + "learning_rate": 9.827930061896124e-05, + "loss": 0.0321, + "step": 208360 + }, + { + "epoch": 1.34, + "learning_rate": 9.826961926460432e-05, + "loss": 0.0335, + "step": 208370 + }, + { + "epoch": 1.34, + "learning_rate": 9.825993791024739e-05, + "loss": 0.0358, + "step": 208380 + }, + { + "epoch": 1.34, + "learning_rate": 9.825025655589044e-05, + "loss": 0.036, + "step": 208390 + }, + { + "epoch": 1.35, + "learning_rate": 9.824057520153352e-05, + "loss": 0.0321, + "step": 208400 + }, + { + "epoch": 1.35, + "learning_rate": 9.823089384717659e-05, + "loss": 0.0302, + "step": 208410 + }, + { + "epoch": 1.35, + "learning_rate": 9.822121249281964e-05, + "loss": 0.0318, + "step": 208420 + }, + { + "epoch": 1.35, + "learning_rate": 9.821153113846272e-05, + "loss": 0.0323, + "step": 208430 + }, + { + "epoch": 1.35, + "learning_rate": 9.820184978410578e-05, + "loss": 0.0314, + "step": 208440 + }, + { + "epoch": 1.35, + "learning_rate": 9.819216842974886e-05, + "loss": 0.0253, + "step": 208450 + }, + { + "epoch": 1.35, + "learning_rate": 9.818248707539192e-05, + "loss": 0.0295, + "step": 208460 + }, + { + "epoch": 1.35, + "learning_rate": 9.8172805721035e-05, + "loss": 0.0294, + "step": 208470 + }, + { + "epoch": 1.35, + "learning_rate": 9.816312436667806e-05, + "loss": 0.0267, + "step": 208480 + }, + { + "epoch": 1.35, + "learning_rate": 9.815344301232112e-05, + "loss": 0.0254, + "step": 208490 + }, + { + "epoch": 1.35, + "learning_rate": 9.81437616579642e-05, + "loss": 0.0277, + "step": 208500 + }, + { + "epoch": 1.35, + "learning_rate": 9.813408030360726e-05, + "loss": 0.0337, + "step": 208510 + }, + { + "epoch": 1.35, + "learning_rate": 9.812439894925034e-05, + "loss": 0.0299, + "step": 208520 + }, + { + "epoch": 1.35, + "learning_rate": 9.81147175948934e-05, + "loss": 0.0306, + "step": 208530 + }, + { + "epoch": 1.35, + "learning_rate": 9.810503624053646e-05, + "loss": 0.0255, + "step": 208540 + }, + { + "epoch": 1.35, + "learning_rate": 9.809535488617954e-05, + "loss": 0.028, + "step": 208550 + }, + { + "epoch": 1.35, + "learning_rate": 9.80856735318226e-05, + "loss": 0.0291, + "step": 208560 + }, + { + "epoch": 1.35, + "learning_rate": 9.807599217746567e-05, + "loss": 0.028, + "step": 208570 + }, + { + "epoch": 1.35, + "learning_rate": 9.806631082310874e-05, + "loss": 0.0317, + "step": 208580 + }, + { + "epoch": 1.35, + "learning_rate": 9.805662946875182e-05, + "loss": 0.0279, + "step": 208590 + }, + { + "epoch": 1.35, + "learning_rate": 9.804694811439487e-05, + "loss": 0.0303, + "step": 208600 + }, + { + "epoch": 1.35, + "learning_rate": 9.803726676003794e-05, + "loss": 0.0261, + "step": 208610 + }, + { + "epoch": 1.35, + "learning_rate": 9.802758540568102e-05, + "loss": 0.0333, + "step": 208620 + }, + { + "epoch": 1.35, + "learning_rate": 9.801790405132407e-05, + "loss": 0.0331, + "step": 208630 + }, + { + "epoch": 1.35, + "learning_rate": 9.800822269696714e-05, + "loss": 0.0299, + "step": 208640 + }, + { + "epoch": 1.35, + "learning_rate": 9.799854134261022e-05, + "loss": 0.0335, + "step": 208650 + }, + { + "epoch": 1.35, + "learning_rate": 9.798885998825328e-05, + "loss": 0.0337, + "step": 208660 + }, + { + "epoch": 1.35, + "learning_rate": 9.797917863389635e-05, + "loss": 0.0257, + "step": 208670 + }, + { + "epoch": 1.35, + "learning_rate": 9.796949727953942e-05, + "loss": 0.0286, + "step": 208680 + }, + { + "epoch": 1.35, + "learning_rate": 9.79598159251825e-05, + "loss": 0.0272, + "step": 208690 + }, + { + "epoch": 1.35, + "learning_rate": 9.795013457082555e-05, + "loss": 0.0332, + "step": 208700 + }, + { + "epoch": 1.35, + "learning_rate": 9.794045321646861e-05, + "loss": 0.0285, + "step": 208710 + }, + { + "epoch": 1.35, + "learning_rate": 9.79307718621117e-05, + "loss": 0.0244, + "step": 208720 + }, + { + "epoch": 1.35, + "learning_rate": 9.792109050775476e-05, + "loss": 0.028, + "step": 208730 + }, + { + "epoch": 1.35, + "learning_rate": 9.791140915339781e-05, + "loss": 0.0278, + "step": 208740 + }, + { + "epoch": 1.35, + "learning_rate": 9.790172779904089e-05, + "loss": 0.0266, + "step": 208750 + }, + { + "epoch": 1.35, + "learning_rate": 9.789204644468396e-05, + "loss": 0.0282, + "step": 208760 + }, + { + "epoch": 1.35, + "learning_rate": 9.788236509032703e-05, + "loss": 0.0312, + "step": 208770 + }, + { + "epoch": 1.35, + "learning_rate": 9.787268373597009e-05, + "loss": 0.0272, + "step": 208780 + }, + { + "epoch": 1.35, + "learning_rate": 9.786300238161317e-05, + "loss": 0.0323, + "step": 208790 + }, + { + "epoch": 1.35, + "learning_rate": 9.785332102725624e-05, + "loss": 0.0277, + "step": 208800 + }, + { + "epoch": 1.35, + "learning_rate": 9.784363967289929e-05, + "loss": 0.0297, + "step": 208810 + }, + { + "epoch": 1.35, + "learning_rate": 9.783395831854237e-05, + "loss": 0.0275, + "step": 208820 + }, + { + "epoch": 1.35, + "learning_rate": 9.782427696418544e-05, + "loss": 0.028, + "step": 208830 + }, + { + "epoch": 1.35, + "learning_rate": 9.781459560982849e-05, + "loss": 0.026, + "step": 208840 + }, + { + "epoch": 1.35, + "learning_rate": 9.780491425547157e-05, + "loss": 0.0295, + "step": 208850 + }, + { + "epoch": 1.35, + "learning_rate": 9.779523290111463e-05, + "loss": 0.0239, + "step": 208860 + }, + { + "epoch": 1.35, + "learning_rate": 9.778555154675771e-05, + "loss": 0.0269, + "step": 208870 + }, + { + "epoch": 1.35, + "learning_rate": 9.777587019240077e-05, + "loss": 0.0334, + "step": 208880 + }, + { + "epoch": 1.35, + "learning_rate": 9.776618883804385e-05, + "loss": 0.0323, + "step": 208890 + }, + { + "epoch": 1.35, + "learning_rate": 9.775650748368691e-05, + "loss": 0.0267, + "step": 208900 + }, + { + "epoch": 1.35, + "learning_rate": 9.774682612932997e-05, + "loss": 0.0257, + "step": 208910 + }, + { + "epoch": 1.35, + "learning_rate": 9.773714477497305e-05, + "loss": 0.0325, + "step": 208920 + }, + { + "epoch": 1.35, + "learning_rate": 9.772746342061611e-05, + "loss": 0.0305, + "step": 208930 + }, + { + "epoch": 1.35, + "learning_rate": 9.771778206625919e-05, + "loss": 0.0303, + "step": 208940 + }, + { + "epoch": 1.35, + "learning_rate": 9.770810071190224e-05, + "loss": 0.0266, + "step": 208950 + }, + { + "epoch": 1.35, + "learning_rate": 9.769841935754531e-05, + "loss": 0.0333, + "step": 208960 + }, + { + "epoch": 1.35, + "learning_rate": 9.768873800318839e-05, + "loss": 0.0313, + "step": 208970 + }, + { + "epoch": 1.35, + "learning_rate": 9.767905664883144e-05, + "loss": 0.0286, + "step": 208980 + }, + { + "epoch": 1.35, + "learning_rate": 9.766937529447452e-05, + "loss": 0.0304, + "step": 208990 + }, + { + "epoch": 1.35, + "learning_rate": 9.765969394011759e-05, + "loss": 0.0341, + "step": 209000 + }, + { + "epoch": 1.35, + "eval_cer": 0.919940345723647, + "eval_loss": 0.021424537524580956, + "eval_runtime": 120.0847, + "eval_samples_per_second": 16.655, + "eval_steps_per_second": 4.164, + "step": 209000 + }, + { + "epoch": 1.35, + "learning_rate": 9.765001258576066e-05, + "loss": 0.0322, + "step": 209010 + }, + { + "epoch": 1.35, + "learning_rate": 9.764033123140372e-05, + "loss": 0.0329, + "step": 209020 + }, + { + "epoch": 1.35, + "learning_rate": 9.763064987704679e-05, + "loss": 0.033, + "step": 209030 + }, + { + "epoch": 1.35, + "learning_rate": 9.762096852268987e-05, + "loss": 0.0318, + "step": 209040 + }, + { + "epoch": 1.35, + "learning_rate": 9.761128716833292e-05, + "loss": 0.0308, + "step": 209050 + }, + { + "epoch": 1.35, + "learning_rate": 9.760160581397599e-05, + "loss": 0.027, + "step": 209060 + }, + { + "epoch": 1.35, + "learning_rate": 9.759192445961907e-05, + "loss": 0.0289, + "step": 209070 + }, + { + "epoch": 1.35, + "learning_rate": 9.758224310526213e-05, + "loss": 0.0294, + "step": 209080 + }, + { + "epoch": 1.35, + "learning_rate": 9.75725617509052e-05, + "loss": 0.0308, + "step": 209090 + }, + { + "epoch": 1.35, + "learning_rate": 9.756288039654827e-05, + "loss": 0.026, + "step": 209100 + }, + { + "epoch": 1.35, + "learning_rate": 9.755319904219133e-05, + "loss": 0.0319, + "step": 209110 + }, + { + "epoch": 1.35, + "learning_rate": 9.75435176878344e-05, + "loss": 0.0304, + "step": 209120 + }, + { + "epoch": 1.35, + "learning_rate": 9.753383633347746e-05, + "loss": 0.0266, + "step": 209130 + }, + { + "epoch": 1.35, + "learning_rate": 9.752415497912054e-05, + "loss": 0.0327, + "step": 209140 + }, + { + "epoch": 1.35, + "learning_rate": 9.751447362476361e-05, + "loss": 0.0238, + "step": 209150 + }, + { + "epoch": 1.35, + "learning_rate": 9.750479227040666e-05, + "loss": 0.033, + "step": 209160 + }, + { + "epoch": 1.35, + "learning_rate": 9.749511091604974e-05, + "loss": 0.0298, + "step": 209170 + }, + { + "epoch": 1.35, + "learning_rate": 9.748542956169281e-05, + "loss": 0.0324, + "step": 209180 + }, + { + "epoch": 1.35, + "learning_rate": 9.747574820733587e-05, + "loss": 0.0268, + "step": 209190 + }, + { + "epoch": 1.35, + "learning_rate": 9.746606685297894e-05, + "loss": 0.0278, + "step": 209200 + }, + { + "epoch": 1.35, + "learning_rate": 9.745638549862201e-05, + "loss": 0.03, + "step": 209210 + }, + { + "epoch": 1.35, + "learning_rate": 9.744670414426509e-05, + "loss": 0.0323, + "step": 209220 + }, + { + "epoch": 1.35, + "learning_rate": 9.743702278990814e-05, + "loss": 0.0285, + "step": 209230 + }, + { + "epoch": 1.35, + "learning_rate": 9.742734143555122e-05, + "loss": 0.0308, + "step": 209240 + }, + { + "epoch": 1.35, + "learning_rate": 9.741766008119429e-05, + "loss": 0.0297, + "step": 209250 + }, + { + "epoch": 1.35, + "learning_rate": 9.740797872683734e-05, + "loss": 0.035, + "step": 209260 + }, + { + "epoch": 1.35, + "learning_rate": 9.739829737248042e-05, + "loss": 0.0303, + "step": 209270 + }, + { + "epoch": 1.35, + "learning_rate": 9.738861601812348e-05, + "loss": 0.0303, + "step": 209280 + }, + { + "epoch": 1.35, + "learning_rate": 9.737893466376656e-05, + "loss": 0.0297, + "step": 209290 + }, + { + "epoch": 1.35, + "learning_rate": 9.736925330940962e-05, + "loss": 0.0295, + "step": 209300 + }, + { + "epoch": 1.35, + "learning_rate": 9.735957195505268e-05, + "loss": 0.0262, + "step": 209310 + }, + { + "epoch": 1.35, + "learning_rate": 9.734989060069576e-05, + "loss": 0.0346, + "step": 209320 + }, + { + "epoch": 1.35, + "learning_rate": 9.734020924633882e-05, + "loss": 0.0272, + "step": 209330 + }, + { + "epoch": 1.35, + "learning_rate": 9.73305278919819e-05, + "loss": 0.0289, + "step": 209340 + }, + { + "epoch": 1.35, + "learning_rate": 9.732084653762496e-05, + "loss": 0.0227, + "step": 209350 + }, + { + "epoch": 1.35, + "learning_rate": 9.731116518326804e-05, + "loss": 0.0285, + "step": 209360 + }, + { + "epoch": 1.35, + "learning_rate": 9.73014838289111e-05, + "loss": 0.0292, + "step": 209370 + }, + { + "epoch": 1.35, + "learning_rate": 9.729180247455416e-05, + "loss": 0.026, + "step": 209380 + }, + { + "epoch": 1.35, + "learning_rate": 9.728212112019724e-05, + "loss": 0.0269, + "step": 209390 + }, + { + "epoch": 1.35, + "learning_rate": 9.727243976584029e-05, + "loss": 0.0291, + "step": 209400 + }, + { + "epoch": 1.35, + "learning_rate": 9.726275841148336e-05, + "loss": 0.028, + "step": 209410 + }, + { + "epoch": 1.35, + "learning_rate": 9.725307705712644e-05, + "loss": 0.0292, + "step": 209420 + }, + { + "epoch": 1.35, + "learning_rate": 9.72433957027695e-05, + "loss": 0.03, + "step": 209430 + }, + { + "epoch": 1.35, + "learning_rate": 9.723371434841257e-05, + "loss": 0.0288, + "step": 209440 + }, + { + "epoch": 1.35, + "learning_rate": 9.722403299405564e-05, + "loss": 0.0306, + "step": 209450 + }, + { + "epoch": 1.35, + "learning_rate": 9.721435163969872e-05, + "loss": 0.0279, + "step": 209460 + }, + { + "epoch": 1.35, + "learning_rate": 9.720467028534177e-05, + "loss": 0.0315, + "step": 209470 + }, + { + "epoch": 1.35, + "learning_rate": 9.719498893098484e-05, + "loss": 0.0268, + "step": 209480 + }, + { + "epoch": 1.35, + "learning_rate": 9.718530757662792e-05, + "loss": 0.0324, + "step": 209490 + }, + { + "epoch": 1.35, + "learning_rate": 9.717562622227098e-05, + "loss": 0.0253, + "step": 209500 + }, + { + "epoch": 1.35, + "learning_rate": 9.716594486791404e-05, + "loss": 0.0345, + "step": 209510 + }, + { + "epoch": 1.35, + "learning_rate": 9.715626351355711e-05, + "loss": 0.028, + "step": 209520 + }, + { + "epoch": 1.35, + "learning_rate": 9.714658215920018e-05, + "loss": 0.0296, + "step": 209530 + }, + { + "epoch": 1.35, + "learning_rate": 9.713690080484325e-05, + "loss": 0.0348, + "step": 209540 + }, + { + "epoch": 1.35, + "learning_rate": 9.712721945048631e-05, + "loss": 0.0311, + "step": 209550 + }, + { + "epoch": 1.35, + "learning_rate": 9.71175380961294e-05, + "loss": 0.0243, + "step": 209560 + }, + { + "epoch": 1.35, + "learning_rate": 9.710785674177246e-05, + "loss": 0.0288, + "step": 209570 + }, + { + "epoch": 1.35, + "learning_rate": 9.709817538741551e-05, + "loss": 0.0306, + "step": 209580 + }, + { + "epoch": 1.35, + "learning_rate": 9.708849403305859e-05, + "loss": 0.0327, + "step": 209590 + }, + { + "epoch": 1.35, + "learning_rate": 9.707881267870166e-05, + "loss": 0.0321, + "step": 209600 + }, + { + "epoch": 1.35, + "learning_rate": 9.706913132434471e-05, + "loss": 0.026, + "step": 209610 + }, + { + "epoch": 1.35, + "learning_rate": 9.705944996998779e-05, + "loss": 0.0254, + "step": 209620 + }, + { + "epoch": 1.35, + "learning_rate": 9.704976861563086e-05, + "loss": 0.0326, + "step": 209630 + }, + { + "epoch": 1.35, + "learning_rate": 9.704008726127394e-05, + "loss": 0.0301, + "step": 209640 + }, + { + "epoch": 1.35, + "learning_rate": 9.703040590691699e-05, + "loss": 0.0292, + "step": 209650 + }, + { + "epoch": 1.35, + "learning_rate": 9.702072455256007e-05, + "loss": 0.0305, + "step": 209660 + }, + { + "epoch": 1.35, + "learning_rate": 9.701104319820314e-05, + "loss": 0.0292, + "step": 209670 + }, + { + "epoch": 1.35, + "learning_rate": 9.700136184384619e-05, + "loss": 0.0334, + "step": 209680 + }, + { + "epoch": 1.35, + "learning_rate": 9.699168048948927e-05, + "loss": 0.0314, + "step": 209690 + }, + { + "epoch": 1.35, + "learning_rate": 9.698199913513233e-05, + "loss": 0.028, + "step": 209700 + }, + { + "epoch": 1.35, + "learning_rate": 9.697231778077541e-05, + "loss": 0.0282, + "step": 209710 + }, + { + "epoch": 1.35, + "learning_rate": 9.696263642641847e-05, + "loss": 0.0296, + "step": 209720 + }, + { + "epoch": 1.35, + "learning_rate": 9.695295507206153e-05, + "loss": 0.0283, + "step": 209730 + }, + { + "epoch": 1.35, + "learning_rate": 9.694327371770461e-05, + "loss": 0.0367, + "step": 209740 + }, + { + "epoch": 1.35, + "learning_rate": 9.693359236334767e-05, + "loss": 0.0296, + "step": 209750 + }, + { + "epoch": 1.35, + "learning_rate": 9.692391100899075e-05, + "loss": 0.0251, + "step": 209760 + }, + { + "epoch": 1.35, + "learning_rate": 9.691422965463381e-05, + "loss": 0.0273, + "step": 209770 + }, + { + "epoch": 1.35, + "learning_rate": 9.690454830027689e-05, + "loss": 0.0304, + "step": 209780 + }, + { + "epoch": 1.35, + "learning_rate": 9.689486694591994e-05, + "loss": 0.0334, + "step": 209790 + }, + { + "epoch": 1.35, + "learning_rate": 9.688518559156301e-05, + "loss": 0.0327, + "step": 209800 + }, + { + "epoch": 1.35, + "learning_rate": 9.687550423720609e-05, + "loss": 0.0308, + "step": 209810 + }, + { + "epoch": 1.35, + "learning_rate": 9.686582288284914e-05, + "loss": 0.0267, + "step": 209820 + }, + { + "epoch": 1.35, + "learning_rate": 9.685614152849221e-05, + "loss": 0.0293, + "step": 209830 + }, + { + "epoch": 1.35, + "learning_rate": 9.684646017413529e-05, + "loss": 0.0328, + "step": 209840 + }, + { + "epoch": 1.35, + "learning_rate": 9.683677881977836e-05, + "loss": 0.0307, + "step": 209850 + }, + { + "epoch": 1.35, + "learning_rate": 9.682709746542142e-05, + "loss": 0.0323, + "step": 209860 + }, + { + "epoch": 1.35, + "learning_rate": 9.681741611106449e-05, + "loss": 0.0255, + "step": 209870 + }, + { + "epoch": 1.35, + "learning_rate": 9.680773475670757e-05, + "loss": 0.0291, + "step": 209880 + }, + { + "epoch": 1.35, + "learning_rate": 9.679805340235062e-05, + "loss": 0.0323, + "step": 209890 + }, + { + "epoch": 1.35, + "learning_rate": 9.678837204799369e-05, + "loss": 0.0256, + "step": 209900 + }, + { + "epoch": 1.35, + "learning_rate": 9.677869069363677e-05, + "loss": 0.0319, + "step": 209910 + }, + { + "epoch": 1.35, + "learning_rate": 9.676900933927983e-05, + "loss": 0.036, + "step": 209920 + }, + { + "epoch": 1.35, + "learning_rate": 9.675932798492289e-05, + "loss": 0.0298, + "step": 209930 + }, + { + "epoch": 1.35, + "learning_rate": 9.674964663056596e-05, + "loss": 0.0284, + "step": 209940 + }, + { + "epoch": 1.36, + "learning_rate": 9.673996527620903e-05, + "loss": 0.0312, + "step": 209950 + }, + { + "epoch": 1.36, + "learning_rate": 9.67302839218521e-05, + "loss": 0.0301, + "step": 209960 + }, + { + "epoch": 1.36, + "learning_rate": 9.672060256749516e-05, + "loss": 0.0285, + "step": 209970 + }, + { + "epoch": 1.36, + "learning_rate": 9.671092121313824e-05, + "loss": 0.0422, + "step": 209980 + }, + { + "epoch": 1.36, + "learning_rate": 9.670123985878131e-05, + "loss": 0.0268, + "step": 209990 + }, + { + "epoch": 1.36, + "learning_rate": 9.669155850442436e-05, + "loss": 0.029, + "step": 210000 + }, + { + "epoch": 1.36, + "eval_cer": 0.9199105185854706, + "eval_loss": 0.021298963576555252, + "eval_runtime": 120.106, + "eval_samples_per_second": 16.652, + "eval_steps_per_second": 4.163, + "step": 210000 + }, + { + "epoch": 1.36, + "learning_rate": 9.668187715006744e-05, + "loss": 0.0273, + "step": 210010 + }, + { + "epoch": 1.36, + "learning_rate": 9.667219579571051e-05, + "loss": 0.0299, + "step": 210020 + }, + { + "epoch": 1.36, + "learning_rate": 9.666251444135356e-05, + "loss": 0.0283, + "step": 210030 + }, + { + "epoch": 1.36, + "learning_rate": 9.665283308699664e-05, + "loss": 0.0274, + "step": 210040 + }, + { + "epoch": 1.36, + "learning_rate": 9.664315173263971e-05, + "loss": 0.0297, + "step": 210050 + }, + { + "epoch": 1.36, + "learning_rate": 9.663347037828279e-05, + "loss": 0.0345, + "step": 210060 + }, + { + "epoch": 1.36, + "learning_rate": 9.662378902392584e-05, + "loss": 0.0268, + "step": 210070 + }, + { + "epoch": 1.36, + "learning_rate": 9.661410766956892e-05, + "loss": 0.0269, + "step": 210080 + }, + { + "epoch": 1.36, + "learning_rate": 9.660442631521199e-05, + "loss": 0.0306, + "step": 210090 + }, + { + "epoch": 1.36, + "learning_rate": 9.659474496085504e-05, + "loss": 0.0261, + "step": 210100 + }, + { + "epoch": 1.36, + "learning_rate": 9.658506360649812e-05, + "loss": 0.0302, + "step": 210110 + }, + { + "epoch": 1.36, + "learning_rate": 9.657538225214118e-05, + "loss": 0.0309, + "step": 210120 + }, + { + "epoch": 1.36, + "learning_rate": 9.656570089778426e-05, + "loss": 0.034, + "step": 210130 + }, + { + "epoch": 1.36, + "learning_rate": 9.655601954342732e-05, + "loss": 0.0275, + "step": 210140 + }, + { + "epoch": 1.36, + "learning_rate": 9.654633818907038e-05, + "loss": 0.027, + "step": 210150 + }, + { + "epoch": 1.36, + "learning_rate": 9.653665683471346e-05, + "loss": 0.0365, + "step": 210160 + }, + { + "epoch": 1.36, + "learning_rate": 9.652697548035652e-05, + "loss": 0.0301, + "step": 210170 + }, + { + "epoch": 1.36, + "learning_rate": 9.65172941259996e-05, + "loss": 0.0259, + "step": 210180 + }, + { + "epoch": 1.36, + "learning_rate": 9.650761277164266e-05, + "loss": 0.0345, + "step": 210190 + }, + { + "epoch": 1.36, + "learning_rate": 9.649793141728573e-05, + "loss": 0.0331, + "step": 210200 + }, + { + "epoch": 1.36, + "learning_rate": 9.64882500629288e-05, + "loss": 0.0372, + "step": 210210 + }, + { + "epoch": 1.36, + "learning_rate": 9.647856870857186e-05, + "loss": 0.0323, + "step": 210220 + }, + { + "epoch": 1.36, + "learning_rate": 9.646888735421494e-05, + "loss": 0.0277, + "step": 210230 + }, + { + "epoch": 1.36, + "learning_rate": 9.645920599985799e-05, + "loss": 0.0301, + "step": 210240 + }, + { + "epoch": 1.36, + "learning_rate": 9.644952464550106e-05, + "loss": 0.0289, + "step": 210250 + }, + { + "epoch": 1.36, + "learning_rate": 9.643984329114414e-05, + "loss": 0.0238, + "step": 210260 + }, + { + "epoch": 1.36, + "learning_rate": 9.64301619367872e-05, + "loss": 0.0293, + "step": 210270 + }, + { + "epoch": 1.36, + "learning_rate": 9.642048058243027e-05, + "loss": 0.0241, + "step": 210280 + }, + { + "epoch": 1.36, + "learning_rate": 9.641079922807334e-05, + "loss": 0.0268, + "step": 210290 + }, + { + "epoch": 1.36, + "learning_rate": 9.64011178737164e-05, + "loss": 0.0286, + "step": 210300 + }, + { + "epoch": 1.36, + "learning_rate": 9.639143651935947e-05, + "loss": 0.0267, + "step": 210310 + }, + { + "epoch": 1.36, + "learning_rate": 9.638175516500254e-05, + "loss": 0.0277, + "step": 210320 + }, + { + "epoch": 1.36, + "learning_rate": 9.637207381064562e-05, + "loss": 0.03, + "step": 210330 + }, + { + "epoch": 1.36, + "learning_rate": 9.636239245628868e-05, + "loss": 0.0284, + "step": 210340 + }, + { + "epoch": 1.36, + "learning_rate": 9.635271110193173e-05, + "loss": 0.0316, + "step": 210350 + }, + { + "epoch": 1.36, + "learning_rate": 9.634302974757481e-05, + "loss": 0.0271, + "step": 210360 + }, + { + "epoch": 1.36, + "learning_rate": 9.633334839321788e-05, + "loss": 0.0259, + "step": 210370 + }, + { + "epoch": 1.36, + "learning_rate": 9.632366703886095e-05, + "loss": 0.0277, + "step": 210380 + }, + { + "epoch": 1.36, + "learning_rate": 9.631398568450401e-05, + "loss": 0.0325, + "step": 210390 + }, + { + "epoch": 1.36, + "learning_rate": 9.630430433014708e-05, + "loss": 0.0279, + "step": 210400 + }, + { + "epoch": 1.36, + "learning_rate": 9.629462297579016e-05, + "loss": 0.0301, + "step": 210410 + }, + { + "epoch": 1.36, + "learning_rate": 9.628494162143321e-05, + "loss": 0.0263, + "step": 210420 + }, + { + "epoch": 1.36, + "learning_rate": 9.627526026707629e-05, + "loss": 0.032, + "step": 210430 + }, + { + "epoch": 1.36, + "learning_rate": 9.626557891271936e-05, + "loss": 0.029, + "step": 210440 + }, + { + "epoch": 1.36, + "learning_rate": 9.625589755836241e-05, + "loss": 0.0287, + "step": 210450 + }, + { + "epoch": 1.36, + "learning_rate": 9.624621620400549e-05, + "loss": 0.0297, + "step": 210460 + }, + { + "epoch": 1.36, + "learning_rate": 9.623653484964856e-05, + "loss": 0.0325, + "step": 210470 + }, + { + "epoch": 1.36, + "learning_rate": 9.622685349529164e-05, + "loss": 0.0329, + "step": 210480 + }, + { + "epoch": 1.36, + "learning_rate": 9.621717214093469e-05, + "loss": 0.026, + "step": 210490 + }, + { + "epoch": 1.36, + "learning_rate": 9.620749078657776e-05, + "loss": 0.0288, + "step": 210500 + }, + { + "epoch": 1.36, + "learning_rate": 9.619780943222084e-05, + "loss": 0.0314, + "step": 210510 + }, + { + "epoch": 1.36, + "learning_rate": 9.618812807786389e-05, + "loss": 0.0305, + "step": 210520 + }, + { + "epoch": 1.36, + "learning_rate": 9.617844672350697e-05, + "loss": 0.0336, + "step": 210530 + }, + { + "epoch": 1.36, + "learning_rate": 9.616876536915003e-05, + "loss": 0.0336, + "step": 210540 + }, + { + "epoch": 1.36, + "learning_rate": 9.615908401479311e-05, + "loss": 0.0247, + "step": 210550 + }, + { + "epoch": 1.36, + "learning_rate": 9.614940266043617e-05, + "loss": 0.034, + "step": 210560 + }, + { + "epoch": 1.36, + "learning_rate": 9.613972130607923e-05, + "loss": 0.0268, + "step": 210570 + }, + { + "epoch": 1.36, + "learning_rate": 9.613003995172231e-05, + "loss": 0.0299, + "step": 210580 + }, + { + "epoch": 1.36, + "learning_rate": 9.612035859736537e-05, + "loss": 0.0296, + "step": 210590 + }, + { + "epoch": 1.36, + "learning_rate": 9.611067724300843e-05, + "loss": 0.0327, + "step": 210600 + }, + { + "epoch": 1.36, + "learning_rate": 9.610099588865151e-05, + "loss": 0.0295, + "step": 210610 + }, + { + "epoch": 1.36, + "learning_rate": 9.609131453429458e-05, + "loss": 0.0282, + "step": 210620 + }, + { + "epoch": 1.36, + "learning_rate": 9.608163317993764e-05, + "loss": 0.0303, + "step": 210630 + }, + { + "epoch": 1.36, + "learning_rate": 9.607195182558071e-05, + "loss": 0.0271, + "step": 210640 + }, + { + "epoch": 1.36, + "learning_rate": 9.606227047122379e-05, + "loss": 0.0281, + "step": 210650 + }, + { + "epoch": 1.36, + "learning_rate": 9.605258911686684e-05, + "loss": 0.0263, + "step": 210660 + }, + { + "epoch": 1.36, + "learning_rate": 9.604290776250991e-05, + "loss": 0.0342, + "step": 210670 + }, + { + "epoch": 1.36, + "learning_rate": 9.603322640815299e-05, + "loss": 0.029, + "step": 210680 + }, + { + "epoch": 1.36, + "learning_rate": 9.602354505379605e-05, + "loss": 0.0265, + "step": 210690 + }, + { + "epoch": 1.36, + "learning_rate": 9.601386369943911e-05, + "loss": 0.0308, + "step": 210700 + }, + { + "epoch": 1.36, + "learning_rate": 9.600418234508219e-05, + "loss": 0.032, + "step": 210710 + }, + { + "epoch": 1.36, + "learning_rate": 9.599450099072525e-05, + "loss": 0.0326, + "step": 210720 + }, + { + "epoch": 1.36, + "learning_rate": 9.598481963636832e-05, + "loss": 0.0345, + "step": 210730 + }, + { + "epoch": 1.36, + "learning_rate": 9.597513828201139e-05, + "loss": 0.0286, + "step": 210740 + }, + { + "epoch": 1.36, + "learning_rate": 9.596545692765447e-05, + "loss": 0.0351, + "step": 210750 + }, + { + "epoch": 1.36, + "learning_rate": 9.595577557329753e-05, + "loss": 0.0347, + "step": 210760 + }, + { + "epoch": 1.36, + "learning_rate": 9.594609421894058e-05, + "loss": 0.0311, + "step": 210770 + }, + { + "epoch": 1.36, + "learning_rate": 9.593641286458366e-05, + "loss": 0.032, + "step": 210780 + }, + { + "epoch": 1.36, + "learning_rate": 9.592673151022673e-05, + "loss": 0.0342, + "step": 210790 + }, + { + "epoch": 1.36, + "learning_rate": 9.59170501558698e-05, + "loss": 0.0299, + "step": 210800 + }, + { + "epoch": 1.36, + "learning_rate": 9.590736880151286e-05, + "loss": 0.0325, + "step": 210810 + }, + { + "epoch": 1.36, + "learning_rate": 9.589768744715593e-05, + "loss": 0.0276, + "step": 210820 + }, + { + "epoch": 1.36, + "learning_rate": 9.588800609279901e-05, + "loss": 0.0263, + "step": 210830 + }, + { + "epoch": 1.36, + "learning_rate": 9.587832473844206e-05, + "loss": 0.0302, + "step": 210840 + }, + { + "epoch": 1.36, + "learning_rate": 9.586864338408514e-05, + "loss": 0.0309, + "step": 210850 + }, + { + "epoch": 1.36, + "learning_rate": 9.585896202972821e-05, + "loss": 0.0341, + "step": 210860 + }, + { + "epoch": 1.36, + "learning_rate": 9.584928067537126e-05, + "loss": 0.0299, + "step": 210870 + }, + { + "epoch": 1.36, + "learning_rate": 9.583959932101434e-05, + "loss": 0.0334, + "step": 210880 + }, + { + "epoch": 1.36, + "learning_rate": 9.58299179666574e-05, + "loss": 0.0275, + "step": 210890 + }, + { + "epoch": 1.36, + "learning_rate": 9.582023661230049e-05, + "loss": 0.0332, + "step": 210900 + }, + { + "epoch": 1.36, + "learning_rate": 9.581055525794354e-05, + "loss": 0.0327, + "step": 210910 + }, + { + "epoch": 1.36, + "learning_rate": 9.58008739035866e-05, + "loss": 0.0275, + "step": 210920 + }, + { + "epoch": 1.36, + "learning_rate": 9.579119254922969e-05, + "loss": 0.0292, + "step": 210930 + }, + { + "epoch": 1.36, + "learning_rate": 9.578151119487274e-05, + "loss": 0.0264, + "step": 210940 + }, + { + "epoch": 1.36, + "learning_rate": 9.577182984051582e-05, + "loss": 0.028, + "step": 210950 + }, + { + "epoch": 1.36, + "learning_rate": 9.576214848615888e-05, + "loss": 0.031, + "step": 210960 + }, + { + "epoch": 1.36, + "learning_rate": 9.575246713180196e-05, + "loss": 0.0295, + "step": 210970 + }, + { + "epoch": 1.36, + "learning_rate": 9.574278577744502e-05, + "loss": 0.0311, + "step": 210980 + }, + { + "epoch": 1.36, + "learning_rate": 9.573310442308808e-05, + "loss": 0.0286, + "step": 210990 + }, + { + "epoch": 1.36, + "learning_rate": 9.572342306873116e-05, + "loss": 0.0281, + "step": 211000 + }, + { + "epoch": 1.36, + "eval_cer": 0.9198364026663653, + "eval_loss": 0.021836968138813972, + "eval_runtime": 120.1382, + "eval_samples_per_second": 16.647, + "eval_steps_per_second": 4.162, + "step": 211000 + }, + { + "epoch": 1.36, + "learning_rate": 9.571374171437422e-05, + "loss": 0.0298, + "step": 211010 + }, + { + "epoch": 1.36, + "learning_rate": 9.570406036001728e-05, + "loss": 0.0298, + "step": 211020 + }, + { + "epoch": 1.36, + "learning_rate": 9.569437900566036e-05, + "loss": 0.0268, + "step": 211030 + }, + { + "epoch": 1.36, + "learning_rate": 9.568469765130343e-05, + "loss": 0.0221, + "step": 211040 + }, + { + "epoch": 1.36, + "learning_rate": 9.56750162969465e-05, + "loss": 0.0275, + "step": 211050 + }, + { + "epoch": 1.36, + "learning_rate": 9.566533494258956e-05, + "loss": 0.0284, + "step": 211060 + }, + { + "epoch": 1.36, + "learning_rate": 9.565565358823264e-05, + "loss": 0.0303, + "step": 211070 + }, + { + "epoch": 1.36, + "learning_rate": 9.564597223387569e-05, + "loss": 0.0323, + "step": 211080 + }, + { + "epoch": 1.36, + "learning_rate": 9.563629087951876e-05, + "loss": 0.0308, + "step": 211090 + }, + { + "epoch": 1.36, + "learning_rate": 9.562660952516184e-05, + "loss": 0.033, + "step": 211100 + }, + { + "epoch": 1.36, + "learning_rate": 9.56169281708049e-05, + "loss": 0.0396, + "step": 211110 + }, + { + "epoch": 1.36, + "learning_rate": 9.560724681644796e-05, + "loss": 0.0297, + "step": 211120 + }, + { + "epoch": 1.36, + "learning_rate": 9.559756546209104e-05, + "loss": 0.0239, + "step": 211130 + }, + { + "epoch": 1.36, + "learning_rate": 9.55878841077341e-05, + "loss": 0.0275, + "step": 211140 + }, + { + "epoch": 1.36, + "learning_rate": 9.557820275337717e-05, + "loss": 0.0243, + "step": 211150 + }, + { + "epoch": 1.36, + "learning_rate": 9.556852139902024e-05, + "loss": 0.0292, + "step": 211160 + }, + { + "epoch": 1.36, + "learning_rate": 9.555884004466332e-05, + "loss": 0.0267, + "step": 211170 + }, + { + "epoch": 1.36, + "learning_rate": 9.554915869030638e-05, + "loss": 0.0296, + "step": 211180 + }, + { + "epoch": 1.36, + "learning_rate": 9.553947733594943e-05, + "loss": 0.0318, + "step": 211190 + }, + { + "epoch": 1.36, + "learning_rate": 9.552979598159251e-05, + "loss": 0.0307, + "step": 211200 + }, + { + "epoch": 1.36, + "learning_rate": 9.552011462723558e-05, + "loss": 0.0275, + "step": 211210 + }, + { + "epoch": 1.36, + "learning_rate": 9.551043327287863e-05, + "loss": 0.0328, + "step": 211220 + }, + { + "epoch": 1.36, + "learning_rate": 9.550075191852171e-05, + "loss": 0.0315, + "step": 211230 + }, + { + "epoch": 1.36, + "learning_rate": 9.549107056416478e-05, + "loss": 0.0325, + "step": 211240 + }, + { + "epoch": 1.36, + "learning_rate": 9.548138920980786e-05, + "loss": 0.0323, + "step": 211250 + }, + { + "epoch": 1.36, + "learning_rate": 9.547170785545091e-05, + "loss": 0.0299, + "step": 211260 + }, + { + "epoch": 1.36, + "learning_rate": 9.546202650109399e-05, + "loss": 0.0315, + "step": 211270 + }, + { + "epoch": 1.36, + "learning_rate": 9.545234514673706e-05, + "loss": 0.0291, + "step": 211280 + }, + { + "epoch": 1.36, + "learning_rate": 9.544266379238011e-05, + "loss": 0.0306, + "step": 211290 + }, + { + "epoch": 1.36, + "learning_rate": 9.543298243802319e-05, + "loss": 0.0265, + "step": 211300 + }, + { + "epoch": 1.36, + "learning_rate": 9.542330108366626e-05, + "loss": 0.0268, + "step": 211310 + }, + { + "epoch": 1.36, + "learning_rate": 9.541361972930934e-05, + "loss": 0.0309, + "step": 211320 + }, + { + "epoch": 1.36, + "learning_rate": 9.540393837495239e-05, + "loss": 0.0358, + "step": 211330 + }, + { + "epoch": 1.36, + "learning_rate": 9.539425702059546e-05, + "loss": 0.0314, + "step": 211340 + }, + { + "epoch": 1.36, + "learning_rate": 9.538457566623853e-05, + "loss": 0.0308, + "step": 211350 + }, + { + "epoch": 1.36, + "learning_rate": 9.537489431188159e-05, + "loss": 0.0346, + "step": 211360 + }, + { + "epoch": 1.36, + "learning_rate": 9.536521295752467e-05, + "loss": 0.031, + "step": 211370 + }, + { + "epoch": 1.36, + "learning_rate": 9.535553160316773e-05, + "loss": 0.0287, + "step": 211380 + }, + { + "epoch": 1.36, + "learning_rate": 9.534585024881081e-05, + "loss": 0.0329, + "step": 211390 + }, + { + "epoch": 1.36, + "learning_rate": 9.533616889445387e-05, + "loss": 0.0307, + "step": 211400 + }, + { + "epoch": 1.36, + "learning_rate": 9.532648754009693e-05, + "loss": 0.0239, + "step": 211410 + }, + { + "epoch": 1.36, + "learning_rate": 9.531680618574001e-05, + "loss": 0.0351, + "step": 211420 + }, + { + "epoch": 1.36, + "learning_rate": 9.530712483138306e-05, + "loss": 0.0351, + "step": 211430 + }, + { + "epoch": 1.36, + "learning_rate": 9.529744347702613e-05, + "loss": 0.0248, + "step": 211440 + }, + { + "epoch": 1.36, + "learning_rate": 9.528776212266921e-05, + "loss": 0.0309, + "step": 211450 + }, + { + "epoch": 1.36, + "learning_rate": 9.527808076831228e-05, + "loss": 0.0283, + "step": 211460 + }, + { + "epoch": 1.36, + "learning_rate": 9.526839941395534e-05, + "loss": 0.0319, + "step": 211470 + }, + { + "epoch": 1.36, + "learning_rate": 9.525871805959841e-05, + "loss": 0.0307, + "step": 211480 + }, + { + "epoch": 1.37, + "learning_rate": 9.524903670524149e-05, + "loss": 0.0277, + "step": 211490 + }, + { + "epoch": 1.37, + "learning_rate": 9.523935535088454e-05, + "loss": 0.0287, + "step": 211500 + }, + { + "epoch": 1.37, + "learning_rate": 9.522967399652761e-05, + "loss": 0.0272, + "step": 211510 + }, + { + "epoch": 1.37, + "learning_rate": 9.521999264217069e-05, + "loss": 0.0353, + "step": 211520 + }, + { + "epoch": 1.37, + "learning_rate": 9.521031128781375e-05, + "loss": 0.036, + "step": 211530 + }, + { + "epoch": 1.37, + "learning_rate": 9.520062993345681e-05, + "loss": 0.0358, + "step": 211540 + }, + { + "epoch": 1.37, + "learning_rate": 9.519094857909989e-05, + "loss": 0.029, + "step": 211550 + }, + { + "epoch": 1.37, + "learning_rate": 9.518126722474295e-05, + "loss": 0.0279, + "step": 211560 + }, + { + "epoch": 1.37, + "learning_rate": 9.517158587038602e-05, + "loss": 0.0261, + "step": 211570 + }, + { + "epoch": 1.37, + "learning_rate": 9.516190451602909e-05, + "loss": 0.0238, + "step": 211580 + }, + { + "epoch": 1.37, + "learning_rate": 9.515222316167217e-05, + "loss": 0.0356, + "step": 211590 + }, + { + "epoch": 1.37, + "learning_rate": 9.514254180731523e-05, + "loss": 0.0315, + "step": 211600 + }, + { + "epoch": 1.37, + "learning_rate": 9.513286045295828e-05, + "loss": 0.0274, + "step": 211610 + }, + { + "epoch": 1.37, + "learning_rate": 9.512317909860136e-05, + "loss": 0.0335, + "step": 211620 + }, + { + "epoch": 1.37, + "learning_rate": 9.511349774424443e-05, + "loss": 0.026, + "step": 211630 + }, + { + "epoch": 1.37, + "learning_rate": 9.510381638988748e-05, + "loss": 0.0333, + "step": 211640 + }, + { + "epoch": 1.37, + "learning_rate": 9.509413503553056e-05, + "loss": 0.032, + "step": 211650 + }, + { + "epoch": 1.37, + "learning_rate": 9.508445368117363e-05, + "loss": 0.0321, + "step": 211660 + }, + { + "epoch": 1.37, + "learning_rate": 9.507477232681671e-05, + "loss": 0.0289, + "step": 211670 + }, + { + "epoch": 1.37, + "learning_rate": 9.506509097245976e-05, + "loss": 0.0323, + "step": 211680 + }, + { + "epoch": 1.37, + "learning_rate": 9.505540961810284e-05, + "loss": 0.0254, + "step": 211690 + }, + { + "epoch": 1.37, + "learning_rate": 9.504572826374591e-05, + "loss": 0.026, + "step": 211700 + }, + { + "epoch": 1.37, + "learning_rate": 9.503604690938896e-05, + "loss": 0.0301, + "step": 211710 + }, + { + "epoch": 1.37, + "learning_rate": 9.502636555503204e-05, + "loss": 0.0263, + "step": 211720 + }, + { + "epoch": 1.37, + "learning_rate": 9.50166842006751e-05, + "loss": 0.0274, + "step": 211730 + }, + { + "epoch": 1.37, + "learning_rate": 9.500700284631819e-05, + "loss": 0.0265, + "step": 211740 + }, + { + "epoch": 1.37, + "learning_rate": 9.499732149196124e-05, + "loss": 0.0303, + "step": 211750 + }, + { + "epoch": 1.37, + "learning_rate": 9.49876401376043e-05, + "loss": 0.0291, + "step": 211760 + }, + { + "epoch": 1.37, + "learning_rate": 9.497795878324738e-05, + "loss": 0.028, + "step": 211770 + }, + { + "epoch": 1.37, + "learning_rate": 9.496827742889044e-05, + "loss": 0.0261, + "step": 211780 + }, + { + "epoch": 1.37, + "learning_rate": 9.495859607453352e-05, + "loss": 0.0254, + "step": 211790 + }, + { + "epoch": 1.37, + "learning_rate": 9.494891472017658e-05, + "loss": 0.0271, + "step": 211800 + }, + { + "epoch": 1.37, + "learning_rate": 9.493923336581964e-05, + "loss": 0.0257, + "step": 211810 + }, + { + "epoch": 1.37, + "learning_rate": 9.492955201146272e-05, + "loss": 0.0275, + "step": 211820 + }, + { + "epoch": 1.37, + "learning_rate": 9.491987065710578e-05, + "loss": 0.0356, + "step": 211830 + }, + { + "epoch": 1.37, + "learning_rate": 9.491018930274886e-05, + "loss": 0.0316, + "step": 211840 + }, + { + "epoch": 1.37, + "learning_rate": 9.490050794839191e-05, + "loss": 0.0253, + "step": 211850 + }, + { + "epoch": 1.37, + "learning_rate": 9.489082659403498e-05, + "loss": 0.0281, + "step": 211860 + }, + { + "epoch": 1.37, + "learning_rate": 9.488114523967806e-05, + "loss": 0.0296, + "step": 211870 + }, + { + "epoch": 1.37, + "learning_rate": 9.487146388532111e-05, + "loss": 0.0262, + "step": 211880 + }, + { + "epoch": 1.37, + "learning_rate": 9.486178253096419e-05, + "loss": 0.0335, + "step": 211890 + }, + { + "epoch": 1.37, + "learning_rate": 9.485210117660726e-05, + "loss": 0.0386, + "step": 211900 + }, + { + "epoch": 1.37, + "learning_rate": 9.484241982225033e-05, + "loss": 0.0279, + "step": 211910 + }, + { + "epoch": 1.37, + "learning_rate": 9.483273846789339e-05, + "loss": 0.0287, + "step": 211920 + }, + { + "epoch": 1.37, + "learning_rate": 9.482305711353646e-05, + "loss": 0.0318, + "step": 211930 + }, + { + "epoch": 1.37, + "learning_rate": 9.481337575917954e-05, + "loss": 0.0283, + "step": 211940 + }, + { + "epoch": 1.37, + "learning_rate": 9.480369440482259e-05, + "loss": 0.0253, + "step": 211950 + }, + { + "epoch": 1.37, + "learning_rate": 9.479401305046566e-05, + "loss": 0.0319, + "step": 211960 + }, + { + "epoch": 1.37, + "learning_rate": 9.478433169610874e-05, + "loss": 0.0348, + "step": 211970 + }, + { + "epoch": 1.37, + "learning_rate": 9.47746503417518e-05, + "loss": 0.0284, + "step": 211980 + }, + { + "epoch": 1.37, + "learning_rate": 9.476496898739487e-05, + "loss": 0.0302, + "step": 211990 + }, + { + "epoch": 1.37, + "learning_rate": 9.475528763303794e-05, + "loss": 0.033, + "step": 212000 + }, + { + "epoch": 1.37, + "eval_cer": 0.9199132301434866, + "eval_loss": 0.02124147117137909, + "eval_runtime": 120.2274, + "eval_samples_per_second": 16.635, + "eval_steps_per_second": 4.159, + "step": 212000 + }, + { + "epoch": 1.37, + "learning_rate": 9.4745606278681e-05, + "loss": 0.0337, + "step": 212010 + }, + { + "epoch": 1.37, + "learning_rate": 9.473592492432407e-05, + "loss": 0.0298, + "step": 212020 + }, + { + "epoch": 1.37, + "learning_rate": 9.472624356996713e-05, + "loss": 0.0331, + "step": 212030 + }, + { + "epoch": 1.37, + "learning_rate": 9.471656221561021e-05, + "loss": 0.0277, + "step": 212040 + }, + { + "epoch": 1.37, + "learning_rate": 9.470688086125328e-05, + "loss": 0.0339, + "step": 212050 + }, + { + "epoch": 1.37, + "learning_rate": 9.469719950689633e-05, + "loss": 0.0311, + "step": 212060 + }, + { + "epoch": 1.37, + "learning_rate": 9.468751815253941e-05, + "loss": 0.0252, + "step": 212070 + }, + { + "epoch": 1.37, + "learning_rate": 9.467783679818248e-05, + "loss": 0.0308, + "step": 212080 + }, + { + "epoch": 1.37, + "learning_rate": 9.466815544382555e-05, + "loss": 0.0276, + "step": 212090 + }, + { + "epoch": 1.37, + "learning_rate": 9.465847408946861e-05, + "loss": 0.0352, + "step": 212100 + }, + { + "epoch": 1.37, + "learning_rate": 9.464879273511168e-05, + "loss": 0.0293, + "step": 212110 + }, + { + "epoch": 1.37, + "learning_rate": 9.463911138075476e-05, + "loss": 0.0283, + "step": 212120 + }, + { + "epoch": 1.37, + "learning_rate": 9.462943002639781e-05, + "loss": 0.0284, + "step": 212130 + }, + { + "epoch": 1.37, + "learning_rate": 9.461974867204089e-05, + "loss": 0.0315, + "step": 212140 + }, + { + "epoch": 1.37, + "learning_rate": 9.461006731768396e-05, + "loss": 0.032, + "step": 212150 + }, + { + "epoch": 1.37, + "learning_rate": 9.460038596332701e-05, + "loss": 0.0269, + "step": 212160 + }, + { + "epoch": 1.37, + "learning_rate": 9.459070460897009e-05, + "loss": 0.0308, + "step": 212170 + }, + { + "epoch": 1.37, + "learning_rate": 9.458102325461315e-05, + "loss": 0.0266, + "step": 212180 + }, + { + "epoch": 1.37, + "learning_rate": 9.457134190025623e-05, + "loss": 0.0292, + "step": 212190 + }, + { + "epoch": 1.37, + "learning_rate": 9.456166054589929e-05, + "loss": 0.0278, + "step": 212200 + }, + { + "epoch": 1.37, + "learning_rate": 9.455197919154235e-05, + "loss": 0.0321, + "step": 212210 + }, + { + "epoch": 1.37, + "learning_rate": 9.454229783718543e-05, + "loss": 0.0336, + "step": 212220 + }, + { + "epoch": 1.37, + "learning_rate": 9.453261648282849e-05, + "loss": 0.0227, + "step": 212230 + }, + { + "epoch": 1.37, + "learning_rate": 9.452293512847157e-05, + "loss": 0.0256, + "step": 212240 + }, + { + "epoch": 1.37, + "learning_rate": 9.451325377411463e-05, + "loss": 0.0277, + "step": 212250 + }, + { + "epoch": 1.37, + "learning_rate": 9.450357241975771e-05, + "loss": 0.0296, + "step": 212260 + }, + { + "epoch": 1.37, + "learning_rate": 9.449389106540076e-05, + "loss": 0.026, + "step": 212270 + }, + { + "epoch": 1.37, + "learning_rate": 9.448420971104383e-05, + "loss": 0.0245, + "step": 212280 + }, + { + "epoch": 1.37, + "learning_rate": 9.447452835668691e-05, + "loss": 0.032, + "step": 212290 + }, + { + "epoch": 1.37, + "learning_rate": 9.446484700232996e-05, + "loss": 0.0286, + "step": 212300 + }, + { + "epoch": 1.37, + "learning_rate": 9.445516564797303e-05, + "loss": 0.0285, + "step": 212310 + }, + { + "epoch": 1.37, + "learning_rate": 9.444548429361611e-05, + "loss": 0.0286, + "step": 212320 + }, + { + "epoch": 1.37, + "learning_rate": 9.443580293925918e-05, + "loss": 0.0297, + "step": 212330 + }, + { + "epoch": 1.37, + "learning_rate": 9.442612158490224e-05, + "loss": 0.0333, + "step": 212340 + }, + { + "epoch": 1.37, + "learning_rate": 9.441644023054531e-05, + "loss": 0.0281, + "step": 212350 + }, + { + "epoch": 1.37, + "learning_rate": 9.440675887618839e-05, + "loss": 0.0299, + "step": 212360 + }, + { + "epoch": 1.37, + "learning_rate": 9.439707752183144e-05, + "loss": 0.0292, + "step": 212370 + }, + { + "epoch": 1.37, + "learning_rate": 9.43873961674745e-05, + "loss": 0.0278, + "step": 212380 + }, + { + "epoch": 1.37, + "learning_rate": 9.437771481311759e-05, + "loss": 0.0326, + "step": 212390 + }, + { + "epoch": 1.37, + "learning_rate": 9.436803345876065e-05, + "loss": 0.0276, + "step": 212400 + }, + { + "epoch": 1.37, + "learning_rate": 9.43583521044037e-05, + "loss": 0.0266, + "step": 212410 + }, + { + "epoch": 1.37, + "learning_rate": 9.434867075004679e-05, + "loss": 0.0271, + "step": 212420 + }, + { + "epoch": 1.37, + "learning_rate": 9.433898939568985e-05, + "loss": 0.0297, + "step": 212430 + }, + { + "epoch": 1.37, + "learning_rate": 9.432930804133292e-05, + "loss": 0.0261, + "step": 212440 + }, + { + "epoch": 1.37, + "learning_rate": 9.431962668697598e-05, + "loss": 0.0258, + "step": 212450 + }, + { + "epoch": 1.37, + "learning_rate": 9.430994533261906e-05, + "loss": 0.0304, + "step": 212460 + }, + { + "epoch": 1.37, + "learning_rate": 9.430026397826213e-05, + "loss": 0.0316, + "step": 212470 + }, + { + "epoch": 1.37, + "learning_rate": 9.429058262390518e-05, + "loss": 0.0241, + "step": 212480 + }, + { + "epoch": 1.37, + "learning_rate": 9.428090126954826e-05, + "loss": 0.027, + "step": 212490 + }, + { + "epoch": 1.37, + "learning_rate": 9.427121991519133e-05, + "loss": 0.0318, + "step": 212500 + }, + { + "epoch": 1.37, + "learning_rate": 9.426153856083438e-05, + "loss": 0.0272, + "step": 212510 + }, + { + "epoch": 1.37, + "learning_rate": 9.425185720647746e-05, + "loss": 0.0335, + "step": 212520 + }, + { + "epoch": 1.37, + "learning_rate": 9.424217585212053e-05, + "loss": 0.0275, + "step": 212530 + }, + { + "epoch": 1.37, + "learning_rate": 9.423249449776361e-05, + "loss": 0.0384, + "step": 212540 + }, + { + "epoch": 1.37, + "learning_rate": 9.422281314340666e-05, + "loss": 0.0268, + "step": 212550 + }, + { + "epoch": 1.37, + "learning_rate": 9.421313178904974e-05, + "loss": 0.0363, + "step": 212560 + }, + { + "epoch": 1.37, + "learning_rate": 9.42034504346928e-05, + "loss": 0.028, + "step": 212570 + }, + { + "epoch": 1.37, + "learning_rate": 9.419376908033586e-05, + "loss": 0.0293, + "step": 212580 + }, + { + "epoch": 1.37, + "learning_rate": 9.418408772597894e-05, + "loss": 0.0246, + "step": 212590 + }, + { + "epoch": 1.37, + "learning_rate": 9.4174406371622e-05, + "loss": 0.0316, + "step": 212600 + }, + { + "epoch": 1.37, + "learning_rate": 9.416472501726508e-05, + "loss": 0.0304, + "step": 212610 + }, + { + "epoch": 1.37, + "learning_rate": 9.415504366290814e-05, + "loss": 0.0318, + "step": 212620 + }, + { + "epoch": 1.37, + "learning_rate": 9.41453623085512e-05, + "loss": 0.0276, + "step": 212630 + }, + { + "epoch": 1.37, + "learning_rate": 9.413568095419428e-05, + "loss": 0.0295, + "step": 212640 + }, + { + "epoch": 1.37, + "learning_rate": 9.412599959983734e-05, + "loss": 0.029, + "step": 212650 + }, + { + "epoch": 1.37, + "learning_rate": 9.411631824548042e-05, + "loss": 0.024, + "step": 212660 + }, + { + "epoch": 1.37, + "learning_rate": 9.410663689112348e-05, + "loss": 0.0267, + "step": 212670 + }, + { + "epoch": 1.37, + "learning_rate": 9.409695553676656e-05, + "loss": 0.026, + "step": 212680 + }, + { + "epoch": 1.37, + "learning_rate": 9.408727418240961e-05, + "loss": 0.0278, + "step": 212690 + }, + { + "epoch": 1.37, + "learning_rate": 9.407759282805268e-05, + "loss": 0.0276, + "step": 212700 + }, + { + "epoch": 1.37, + "learning_rate": 9.406791147369576e-05, + "loss": 0.034, + "step": 212710 + }, + { + "epoch": 1.37, + "learning_rate": 9.405823011933881e-05, + "loss": 0.0282, + "step": 212720 + }, + { + "epoch": 1.37, + "learning_rate": 9.404854876498188e-05, + "loss": 0.0243, + "step": 212730 + }, + { + "epoch": 1.37, + "learning_rate": 9.403886741062496e-05, + "loss": 0.0282, + "step": 212740 + }, + { + "epoch": 1.37, + "learning_rate": 9.402918605626803e-05, + "loss": 0.0279, + "step": 212750 + }, + { + "epoch": 1.37, + "learning_rate": 9.401950470191109e-05, + "loss": 0.0332, + "step": 212760 + }, + { + "epoch": 1.37, + "learning_rate": 9.400982334755416e-05, + "loss": 0.0265, + "step": 212770 + }, + { + "epoch": 1.37, + "learning_rate": 9.400014199319724e-05, + "loss": 0.0267, + "step": 212780 + }, + { + "epoch": 1.37, + "learning_rate": 9.399046063884029e-05, + "loss": 0.0246, + "step": 212790 + }, + { + "epoch": 1.37, + "learning_rate": 9.398077928448336e-05, + "loss": 0.0364, + "step": 212800 + }, + { + "epoch": 1.37, + "learning_rate": 9.397109793012644e-05, + "loss": 0.0283, + "step": 212810 + }, + { + "epoch": 1.37, + "learning_rate": 9.39614165757695e-05, + "loss": 0.0267, + "step": 212820 + }, + { + "epoch": 1.37, + "learning_rate": 9.395173522141256e-05, + "loss": 0.0272, + "step": 212830 + }, + { + "epoch": 1.37, + "learning_rate": 9.394205386705563e-05, + "loss": 0.0332, + "step": 212840 + }, + { + "epoch": 1.37, + "learning_rate": 9.39323725126987e-05, + "loss": 0.0297, + "step": 212850 + }, + { + "epoch": 1.37, + "learning_rate": 9.392269115834177e-05, + "loss": 0.0298, + "step": 212860 + }, + { + "epoch": 1.37, + "learning_rate": 9.391300980398483e-05, + "loss": 0.0282, + "step": 212870 + }, + { + "epoch": 1.37, + "learning_rate": 9.390332844962791e-05, + "loss": 0.0291, + "step": 212880 + }, + { + "epoch": 1.37, + "learning_rate": 9.389364709527098e-05, + "loss": 0.0338, + "step": 212890 + }, + { + "epoch": 1.37, + "learning_rate": 9.388396574091403e-05, + "loss": 0.0303, + "step": 212900 + }, + { + "epoch": 1.37, + "learning_rate": 9.387428438655711e-05, + "loss": 0.0301, + "step": 212910 + }, + { + "epoch": 1.37, + "learning_rate": 9.386460303220018e-05, + "loss": 0.0275, + "step": 212920 + }, + { + "epoch": 1.37, + "learning_rate": 9.385492167784323e-05, + "loss": 0.0287, + "step": 212930 + }, + { + "epoch": 1.37, + "learning_rate": 9.384524032348631e-05, + "loss": 0.0274, + "step": 212940 + }, + { + "epoch": 1.37, + "learning_rate": 9.383555896912938e-05, + "loss": 0.0265, + "step": 212950 + }, + { + "epoch": 1.37, + "learning_rate": 9.382587761477246e-05, + "loss": 0.0297, + "step": 212960 + }, + { + "epoch": 1.37, + "learning_rate": 9.381619626041551e-05, + "loss": 0.0245, + "step": 212970 + }, + { + "epoch": 1.37, + "learning_rate": 9.380651490605859e-05, + "loss": 0.0262, + "step": 212980 + }, + { + "epoch": 1.37, + "learning_rate": 9.379683355170166e-05, + "loss": 0.0315, + "step": 212990 + }, + { + "epoch": 1.37, + "learning_rate": 9.378715219734471e-05, + "loss": 0.0348, + "step": 213000 + }, + { + "epoch": 1.37, + "eval_cer": 0.9199240763755507, + "eval_loss": 0.021109996363520622, + "eval_runtime": 120.0643, + "eval_samples_per_second": 16.658, + "eval_steps_per_second": 4.164, + "step": 213000 + }, + { + "epoch": 1.37, + "learning_rate": 9.377747084298779e-05, + "loss": 0.0329, + "step": 213010 + }, + { + "epoch": 1.37, + "learning_rate": 9.376778948863085e-05, + "loss": 0.028, + "step": 213020 + }, + { + "epoch": 1.37, + "learning_rate": 9.375810813427393e-05, + "loss": 0.0259, + "step": 213030 + }, + { + "epoch": 1.38, + "learning_rate": 9.374842677991699e-05, + "loss": 0.0295, + "step": 213040 + }, + { + "epoch": 1.38, + "learning_rate": 9.373874542556005e-05, + "loss": 0.0225, + "step": 213050 + }, + { + "epoch": 1.38, + "learning_rate": 9.372906407120313e-05, + "loss": 0.0313, + "step": 213060 + }, + { + "epoch": 1.38, + "learning_rate": 9.371938271684619e-05, + "loss": 0.0326, + "step": 213070 + }, + { + "epoch": 1.38, + "learning_rate": 9.370970136248927e-05, + "loss": 0.0246, + "step": 213080 + }, + { + "epoch": 1.38, + "learning_rate": 9.370002000813233e-05, + "loss": 0.0299, + "step": 213090 + }, + { + "epoch": 1.38, + "learning_rate": 9.36903386537754e-05, + "loss": 0.0282, + "step": 213100 + }, + { + "epoch": 1.38, + "learning_rate": 9.368065729941846e-05, + "loss": 0.0282, + "step": 213110 + }, + { + "epoch": 1.38, + "learning_rate": 9.367097594506153e-05, + "loss": 0.0279, + "step": 213120 + }, + { + "epoch": 1.38, + "learning_rate": 9.366129459070461e-05, + "loss": 0.0359, + "step": 213130 + }, + { + "epoch": 1.38, + "learning_rate": 9.365161323634766e-05, + "loss": 0.0349, + "step": 213140 + }, + { + "epoch": 1.38, + "learning_rate": 9.364193188199073e-05, + "loss": 0.0306, + "step": 213150 + }, + { + "epoch": 1.38, + "learning_rate": 9.363225052763381e-05, + "loss": 0.0315, + "step": 213160 + }, + { + "epoch": 1.38, + "learning_rate": 9.362256917327688e-05, + "loss": 0.0384, + "step": 213170 + }, + { + "epoch": 1.38, + "learning_rate": 9.361288781891994e-05, + "loss": 0.0275, + "step": 213180 + }, + { + "epoch": 1.38, + "learning_rate": 9.360320646456301e-05, + "loss": 0.0255, + "step": 213190 + }, + { + "epoch": 1.38, + "learning_rate": 9.359352511020607e-05, + "loss": 0.0335, + "step": 213200 + }, + { + "epoch": 1.38, + "learning_rate": 9.358384375584914e-05, + "loss": 0.0287, + "step": 213210 + }, + { + "epoch": 1.38, + "learning_rate": 9.35741624014922e-05, + "loss": 0.026, + "step": 213220 + }, + { + "epoch": 1.38, + "learning_rate": 9.356448104713529e-05, + "loss": 0.0272, + "step": 213230 + }, + { + "epoch": 1.38, + "learning_rate": 9.355479969277835e-05, + "loss": 0.0314, + "step": 213240 + }, + { + "epoch": 1.38, + "learning_rate": 9.35451183384214e-05, + "loss": 0.0376, + "step": 213250 + }, + { + "epoch": 1.38, + "learning_rate": 9.353543698406448e-05, + "loss": 0.0278, + "step": 213260 + }, + { + "epoch": 1.38, + "learning_rate": 9.352575562970755e-05, + "loss": 0.0261, + "step": 213270 + }, + { + "epoch": 1.38, + "learning_rate": 9.351607427535062e-05, + "loss": 0.025, + "step": 213280 + }, + { + "epoch": 1.38, + "learning_rate": 9.350639292099368e-05, + "loss": 0.0288, + "step": 213290 + }, + { + "epoch": 1.38, + "learning_rate": 9.349671156663675e-05, + "loss": 0.0359, + "step": 213300 + }, + { + "epoch": 1.38, + "learning_rate": 9.348703021227983e-05, + "loss": 0.0353, + "step": 213310 + }, + { + "epoch": 1.38, + "learning_rate": 9.347734885792288e-05, + "loss": 0.0315, + "step": 213320 + }, + { + "epoch": 1.38, + "learning_rate": 9.346766750356596e-05, + "loss": 0.0285, + "step": 213330 + }, + { + "epoch": 1.38, + "learning_rate": 9.345798614920903e-05, + "loss": 0.0306, + "step": 213340 + }, + { + "epoch": 1.38, + "learning_rate": 9.344830479485208e-05, + "loss": 0.0281, + "step": 213350 + }, + { + "epoch": 1.38, + "learning_rate": 9.343862344049516e-05, + "loss": 0.0307, + "step": 213360 + }, + { + "epoch": 1.38, + "learning_rate": 9.342894208613823e-05, + "loss": 0.0298, + "step": 213370 + }, + { + "epoch": 1.38, + "learning_rate": 9.34192607317813e-05, + "loss": 0.0276, + "step": 213380 + }, + { + "epoch": 1.38, + "learning_rate": 9.340957937742436e-05, + "loss": 0.031, + "step": 213390 + }, + { + "epoch": 1.38, + "learning_rate": 9.339989802306743e-05, + "loss": 0.0268, + "step": 213400 + }, + { + "epoch": 1.38, + "learning_rate": 9.33902166687105e-05, + "loss": 0.028, + "step": 213410 + }, + { + "epoch": 1.38, + "learning_rate": 9.338053531435356e-05, + "loss": 0.036, + "step": 213420 + }, + { + "epoch": 1.38, + "learning_rate": 9.337085395999664e-05, + "loss": 0.0267, + "step": 213430 + }, + { + "epoch": 1.38, + "learning_rate": 9.33611726056397e-05, + "loss": 0.0287, + "step": 213440 + }, + { + "epoch": 1.38, + "learning_rate": 9.335149125128278e-05, + "loss": 0.0336, + "step": 213450 + }, + { + "epoch": 1.38, + "learning_rate": 9.334180989692584e-05, + "loss": 0.0263, + "step": 213460 + }, + { + "epoch": 1.38, + "learning_rate": 9.33321285425689e-05, + "loss": 0.0345, + "step": 213470 + }, + { + "epoch": 1.38, + "learning_rate": 9.332244718821198e-05, + "loss": 0.0292, + "step": 213480 + }, + { + "epoch": 1.38, + "learning_rate": 9.331276583385504e-05, + "loss": 0.0264, + "step": 213490 + }, + { + "epoch": 1.38, + "learning_rate": 9.33030844794981e-05, + "loss": 0.0244, + "step": 213500 + }, + { + "epoch": 1.38, + "learning_rate": 9.329340312514118e-05, + "loss": 0.0274, + "step": 213510 + }, + { + "epoch": 1.38, + "learning_rate": 9.328372177078425e-05, + "loss": 0.0302, + "step": 213520 + }, + { + "epoch": 1.38, + "learning_rate": 9.327404041642731e-05, + "loss": 0.0326, + "step": 213530 + }, + { + "epoch": 1.38, + "learning_rate": 9.326435906207038e-05, + "loss": 0.0269, + "step": 213540 + }, + { + "epoch": 1.38, + "learning_rate": 9.325467770771346e-05, + "loss": 0.038, + "step": 213550 + }, + { + "epoch": 1.38, + "learning_rate": 9.324499635335651e-05, + "loss": 0.0319, + "step": 213560 + }, + { + "epoch": 1.38, + "learning_rate": 9.323531499899958e-05, + "loss": 0.0303, + "step": 213570 + }, + { + "epoch": 1.38, + "learning_rate": 9.322563364464266e-05, + "loss": 0.024, + "step": 213580 + }, + { + "epoch": 1.38, + "learning_rate": 9.321595229028572e-05, + "loss": 0.0336, + "step": 213590 + }, + { + "epoch": 1.38, + "learning_rate": 9.320627093592878e-05, + "loss": 0.0285, + "step": 213600 + }, + { + "epoch": 1.38, + "learning_rate": 9.319658958157186e-05, + "loss": 0.0308, + "step": 213610 + }, + { + "epoch": 1.38, + "learning_rate": 9.318690822721492e-05, + "loss": 0.0359, + "step": 213620 + }, + { + "epoch": 1.38, + "learning_rate": 9.317722687285799e-05, + "loss": 0.0289, + "step": 213630 + }, + { + "epoch": 1.38, + "learning_rate": 9.316754551850106e-05, + "loss": 0.0336, + "step": 213640 + }, + { + "epoch": 1.38, + "learning_rate": 9.315786416414414e-05, + "loss": 0.0254, + "step": 213650 + }, + { + "epoch": 1.38, + "learning_rate": 9.31481828097872e-05, + "loss": 0.0282, + "step": 213660 + }, + { + "epoch": 1.38, + "learning_rate": 9.313850145543025e-05, + "loss": 0.0316, + "step": 213670 + }, + { + "epoch": 1.38, + "learning_rate": 9.312882010107333e-05, + "loss": 0.026, + "step": 213680 + }, + { + "epoch": 1.38, + "learning_rate": 9.31191387467164e-05, + "loss": 0.0307, + "step": 213690 + }, + { + "epoch": 1.38, + "learning_rate": 9.310945739235945e-05, + "loss": 0.0284, + "step": 213700 + }, + { + "epoch": 1.38, + "learning_rate": 9.309977603800253e-05, + "loss": 0.0278, + "step": 213710 + }, + { + "epoch": 1.38, + "learning_rate": 9.30900946836456e-05, + "loss": 0.0266, + "step": 213720 + }, + { + "epoch": 1.38, + "learning_rate": 9.308041332928868e-05, + "loss": 0.0297, + "step": 213730 + }, + { + "epoch": 1.38, + "learning_rate": 9.307073197493173e-05, + "loss": 0.031, + "step": 213740 + }, + { + "epoch": 1.38, + "learning_rate": 9.306105062057481e-05, + "loss": 0.0261, + "step": 213750 + }, + { + "epoch": 1.38, + "learning_rate": 9.305136926621788e-05, + "loss": 0.0325, + "step": 213760 + }, + { + "epoch": 1.38, + "learning_rate": 9.304168791186093e-05, + "loss": 0.0278, + "step": 213770 + }, + { + "epoch": 1.38, + "learning_rate": 9.303200655750401e-05, + "loss": 0.0268, + "step": 213780 + }, + { + "epoch": 1.38, + "learning_rate": 9.302232520314708e-05, + "loss": 0.0282, + "step": 213790 + }, + { + "epoch": 1.38, + "learning_rate": 9.301264384879016e-05, + "loss": 0.0368, + "step": 213800 + }, + { + "epoch": 1.38, + "learning_rate": 9.300296249443321e-05, + "loss": 0.0294, + "step": 213810 + }, + { + "epoch": 1.38, + "learning_rate": 9.299328114007628e-05, + "loss": 0.0346, + "step": 213820 + }, + { + "epoch": 1.38, + "learning_rate": 9.298359978571936e-05, + "loss": 0.0267, + "step": 213830 + }, + { + "epoch": 1.38, + "learning_rate": 9.297391843136241e-05, + "loss": 0.0317, + "step": 213840 + }, + { + "epoch": 1.38, + "learning_rate": 9.296423707700549e-05, + "loss": 0.0267, + "step": 213850 + }, + { + "epoch": 1.38, + "learning_rate": 9.295455572264855e-05, + "loss": 0.03, + "step": 213860 + }, + { + "epoch": 1.38, + "learning_rate": 9.294487436829163e-05, + "loss": 0.0319, + "step": 213870 + }, + { + "epoch": 1.38, + "learning_rate": 9.293519301393469e-05, + "loss": 0.0273, + "step": 213880 + }, + { + "epoch": 1.38, + "learning_rate": 9.292551165957775e-05, + "loss": 0.0357, + "step": 213890 + }, + { + "epoch": 1.38, + "learning_rate": 9.291583030522083e-05, + "loss": 0.0261, + "step": 213900 + }, + { + "epoch": 1.38, + "learning_rate": 9.290614895086389e-05, + "loss": 0.0295, + "step": 213910 + }, + { + "epoch": 1.38, + "learning_rate": 9.289646759650695e-05, + "loss": 0.0285, + "step": 213920 + }, + { + "epoch": 1.38, + "learning_rate": 9.288678624215003e-05, + "loss": 0.0287, + "step": 213930 + }, + { + "epoch": 1.38, + "learning_rate": 9.28771048877931e-05, + "loss": 0.0306, + "step": 213940 + }, + { + "epoch": 1.38, + "learning_rate": 9.286742353343616e-05, + "loss": 0.0302, + "step": 213950 + }, + { + "epoch": 1.38, + "learning_rate": 9.285774217907923e-05, + "loss": 0.0328, + "step": 213960 + }, + { + "epoch": 1.38, + "learning_rate": 9.284806082472231e-05, + "loss": 0.0276, + "step": 213970 + }, + { + "epoch": 1.38, + "learning_rate": 9.283837947036536e-05, + "loss": 0.0287, + "step": 213980 + }, + { + "epoch": 1.38, + "learning_rate": 9.282869811600843e-05, + "loss": 0.0361, + "step": 213990 + }, + { + "epoch": 1.38, + "learning_rate": 9.281901676165151e-05, + "loss": 0.0291, + "step": 214000 + }, + { + "epoch": 1.38, + "eval_cer": 0.919937634165631, + "eval_loss": 0.02141990140080452, + "eval_runtime": 120.0948, + "eval_samples_per_second": 16.654, + "eval_steps_per_second": 4.163, + "step": 214000 + }, + { + "epoch": 1.38, + "learning_rate": 9.280933540729457e-05, + "loss": 0.0352, + "step": 214010 + }, + { + "epoch": 1.38, + "learning_rate": 9.279965405293763e-05, + "loss": 0.0293, + "step": 214020 + }, + { + "epoch": 1.38, + "learning_rate": 9.278997269858071e-05, + "loss": 0.0261, + "step": 214030 + }, + { + "epoch": 1.38, + "learning_rate": 9.278029134422377e-05, + "loss": 0.0275, + "step": 214040 + }, + { + "epoch": 1.38, + "learning_rate": 9.277060998986684e-05, + "loss": 0.0337, + "step": 214050 + }, + { + "epoch": 1.38, + "learning_rate": 9.27609286355099e-05, + "loss": 0.0306, + "step": 214060 + }, + { + "epoch": 1.38, + "learning_rate": 9.275124728115299e-05, + "loss": 0.0319, + "step": 214070 + }, + { + "epoch": 1.38, + "learning_rate": 9.274156592679605e-05, + "loss": 0.0284, + "step": 214080 + }, + { + "epoch": 1.38, + "learning_rate": 9.27318845724391e-05, + "loss": 0.0292, + "step": 214090 + }, + { + "epoch": 1.38, + "learning_rate": 9.272220321808218e-05, + "loss": 0.0311, + "step": 214100 + }, + { + "epoch": 1.38, + "learning_rate": 9.271252186372525e-05, + "loss": 0.029, + "step": 214110 + }, + { + "epoch": 1.38, + "learning_rate": 9.27028405093683e-05, + "loss": 0.0304, + "step": 214120 + }, + { + "epoch": 1.38, + "learning_rate": 9.269315915501138e-05, + "loss": 0.0256, + "step": 214130 + }, + { + "epoch": 1.38, + "learning_rate": 9.268347780065445e-05, + "loss": 0.0317, + "step": 214140 + }, + { + "epoch": 1.38, + "learning_rate": 9.267379644629753e-05, + "loss": 0.0291, + "step": 214150 + }, + { + "epoch": 1.38, + "learning_rate": 9.266411509194058e-05, + "loss": 0.0299, + "step": 214160 + }, + { + "epoch": 1.38, + "learning_rate": 9.265443373758366e-05, + "loss": 0.0297, + "step": 214170 + }, + { + "epoch": 1.38, + "learning_rate": 9.264475238322673e-05, + "loss": 0.0237, + "step": 214180 + }, + { + "epoch": 1.38, + "learning_rate": 9.263507102886978e-05, + "loss": 0.0249, + "step": 214190 + }, + { + "epoch": 1.38, + "learning_rate": 9.262538967451286e-05, + "loss": 0.0269, + "step": 214200 + }, + { + "epoch": 1.38, + "learning_rate": 9.261570832015593e-05, + "loss": 0.0285, + "step": 214210 + }, + { + "epoch": 1.38, + "learning_rate": 9.2606026965799e-05, + "loss": 0.0308, + "step": 214220 + }, + { + "epoch": 1.38, + "learning_rate": 9.259634561144206e-05, + "loss": 0.0335, + "step": 214230 + }, + { + "epoch": 1.38, + "learning_rate": 9.258666425708513e-05, + "loss": 0.0259, + "step": 214240 + }, + { + "epoch": 1.38, + "learning_rate": 9.25769829027282e-05, + "loss": 0.0318, + "step": 214250 + }, + { + "epoch": 1.38, + "learning_rate": 9.256730154837126e-05, + "loss": 0.0321, + "step": 214260 + }, + { + "epoch": 1.38, + "learning_rate": 9.255762019401434e-05, + "loss": 0.0296, + "step": 214270 + }, + { + "epoch": 1.38, + "learning_rate": 9.25479388396574e-05, + "loss": 0.0309, + "step": 214280 + }, + { + "epoch": 1.38, + "learning_rate": 9.253825748530047e-05, + "loss": 0.0309, + "step": 214290 + }, + { + "epoch": 1.38, + "learning_rate": 9.252857613094354e-05, + "loss": 0.0319, + "step": 214300 + }, + { + "epoch": 1.38, + "learning_rate": 9.25188947765866e-05, + "loss": 0.0276, + "step": 214310 + }, + { + "epoch": 1.38, + "learning_rate": 9.250921342222968e-05, + "loss": 0.0312, + "step": 214320 + }, + { + "epoch": 1.38, + "learning_rate": 9.249953206787273e-05, + "loss": 0.0301, + "step": 214330 + }, + { + "epoch": 1.38, + "learning_rate": 9.24898507135158e-05, + "loss": 0.0269, + "step": 214340 + }, + { + "epoch": 1.38, + "learning_rate": 9.248016935915888e-05, + "loss": 0.0278, + "step": 214350 + }, + { + "epoch": 1.38, + "learning_rate": 9.247048800480195e-05, + "loss": 0.0284, + "step": 214360 + }, + { + "epoch": 1.38, + "learning_rate": 9.246080665044501e-05, + "loss": 0.0297, + "step": 214370 + }, + { + "epoch": 1.38, + "learning_rate": 9.245112529608808e-05, + "loss": 0.0295, + "step": 214380 + }, + { + "epoch": 1.38, + "learning_rate": 9.244144394173115e-05, + "loss": 0.0262, + "step": 214390 + }, + { + "epoch": 1.38, + "learning_rate": 9.243176258737421e-05, + "loss": 0.0271, + "step": 214400 + }, + { + "epoch": 1.38, + "learning_rate": 9.242208123301728e-05, + "loss": 0.0308, + "step": 214410 + }, + { + "epoch": 1.38, + "learning_rate": 9.241239987866036e-05, + "loss": 0.0249, + "step": 214420 + }, + { + "epoch": 1.38, + "learning_rate": 9.240271852430342e-05, + "loss": 0.0306, + "step": 214430 + }, + { + "epoch": 1.38, + "learning_rate": 9.239303716994648e-05, + "loss": 0.0347, + "step": 214440 + }, + { + "epoch": 1.38, + "learning_rate": 9.238335581558956e-05, + "loss": 0.0278, + "step": 214450 + }, + { + "epoch": 1.38, + "learning_rate": 9.237367446123262e-05, + "loss": 0.0264, + "step": 214460 + }, + { + "epoch": 1.38, + "learning_rate": 9.236399310687569e-05, + "loss": 0.0255, + "step": 214470 + }, + { + "epoch": 1.38, + "learning_rate": 9.235431175251876e-05, + "loss": 0.0283, + "step": 214480 + }, + { + "epoch": 1.38, + "learning_rate": 9.234463039816182e-05, + "loss": 0.0282, + "step": 214490 + }, + { + "epoch": 1.38, + "learning_rate": 9.23349490438049e-05, + "loss": 0.0241, + "step": 214500 + }, + { + "epoch": 1.38, + "learning_rate": 9.232526768944795e-05, + "loss": 0.0268, + "step": 214510 + }, + { + "epoch": 1.38, + "learning_rate": 9.231558633509103e-05, + "loss": 0.0273, + "step": 214520 + }, + { + "epoch": 1.38, + "learning_rate": 9.23059049807341e-05, + "loss": 0.0254, + "step": 214530 + }, + { + "epoch": 1.38, + "learning_rate": 9.229622362637715e-05, + "loss": 0.027, + "step": 214540 + }, + { + "epoch": 1.38, + "learning_rate": 9.228654227202023e-05, + "loss": 0.0307, + "step": 214550 + }, + { + "epoch": 1.38, + "learning_rate": 9.22768609176633e-05, + "loss": 0.0361, + "step": 214560 + }, + { + "epoch": 1.38, + "learning_rate": 9.226717956330638e-05, + "loss": 0.0271, + "step": 214570 + }, + { + "epoch": 1.38, + "learning_rate": 9.225749820894943e-05, + "loss": 0.0304, + "step": 214580 + }, + { + "epoch": 1.39, + "learning_rate": 9.22478168545925e-05, + "loss": 0.0304, + "step": 214590 + }, + { + "epoch": 1.39, + "learning_rate": 9.223813550023558e-05, + "loss": 0.0262, + "step": 214600 + }, + { + "epoch": 1.39, + "learning_rate": 9.222845414587863e-05, + "loss": 0.0285, + "step": 214610 + }, + { + "epoch": 1.39, + "learning_rate": 9.221877279152171e-05, + "loss": 0.0285, + "step": 214620 + }, + { + "epoch": 1.39, + "learning_rate": 9.220909143716478e-05, + "loss": 0.0265, + "step": 214630 + }, + { + "epoch": 1.39, + "learning_rate": 9.219941008280786e-05, + "loss": 0.025, + "step": 214640 + }, + { + "epoch": 1.39, + "learning_rate": 9.218972872845091e-05, + "loss": 0.0256, + "step": 214650 + }, + { + "epoch": 1.39, + "learning_rate": 9.218004737409398e-05, + "loss": 0.0306, + "step": 214660 + }, + { + "epoch": 1.39, + "learning_rate": 9.217036601973705e-05, + "loss": 0.0346, + "step": 214670 + }, + { + "epoch": 1.39, + "learning_rate": 9.216068466538011e-05, + "loss": 0.0296, + "step": 214680 + }, + { + "epoch": 1.39, + "learning_rate": 9.215100331102317e-05, + "loss": 0.0324, + "step": 214690 + }, + { + "epoch": 1.39, + "learning_rate": 9.214132195666625e-05, + "loss": 0.0323, + "step": 214700 + }, + { + "epoch": 1.39, + "learning_rate": 9.213164060230932e-05, + "loss": 0.0281, + "step": 214710 + }, + { + "epoch": 1.39, + "learning_rate": 9.212195924795239e-05, + "loss": 0.0312, + "step": 214720 + }, + { + "epoch": 1.39, + "learning_rate": 9.211227789359545e-05, + "loss": 0.0276, + "step": 214730 + }, + { + "epoch": 1.39, + "learning_rate": 9.210259653923853e-05, + "loss": 0.0334, + "step": 214740 + }, + { + "epoch": 1.39, + "learning_rate": 9.209291518488158e-05, + "loss": 0.0267, + "step": 214750 + }, + { + "epoch": 1.39, + "learning_rate": 9.208323383052465e-05, + "loss": 0.0332, + "step": 214760 + }, + { + "epoch": 1.39, + "learning_rate": 9.207355247616773e-05, + "loss": 0.0301, + "step": 214770 + }, + { + "epoch": 1.39, + "learning_rate": 9.20638711218108e-05, + "loss": 0.029, + "step": 214780 + }, + { + "epoch": 1.39, + "learning_rate": 9.205418976745385e-05, + "loss": 0.03, + "step": 214790 + }, + { + "epoch": 1.39, + "learning_rate": 9.204450841309693e-05, + "loss": 0.0297, + "step": 214800 + }, + { + "epoch": 1.39, + "learning_rate": 9.203482705874e-05, + "loss": 0.0268, + "step": 214810 + }, + { + "epoch": 1.39, + "learning_rate": 9.202514570438306e-05, + "loss": 0.0272, + "step": 214820 + }, + { + "epoch": 1.39, + "learning_rate": 9.201546435002613e-05, + "loss": 0.0258, + "step": 214830 + }, + { + "epoch": 1.39, + "learning_rate": 9.200578299566921e-05, + "loss": 0.0299, + "step": 214840 + }, + { + "epoch": 1.39, + "learning_rate": 9.199610164131227e-05, + "loss": 0.0308, + "step": 214850 + }, + { + "epoch": 1.39, + "learning_rate": 9.198642028695533e-05, + "loss": 0.0316, + "step": 214860 + }, + { + "epoch": 1.39, + "learning_rate": 9.19767389325984e-05, + "loss": 0.0206, + "step": 214870 + }, + { + "epoch": 1.39, + "learning_rate": 9.196705757824147e-05, + "loss": 0.028, + "step": 214880 + }, + { + "epoch": 1.39, + "learning_rate": 9.195737622388453e-05, + "loss": 0.0256, + "step": 214890 + }, + { + "epoch": 1.39, + "learning_rate": 9.19476948695276e-05, + "loss": 0.0287, + "step": 214900 + }, + { + "epoch": 1.39, + "learning_rate": 9.193801351517067e-05, + "loss": 0.0258, + "step": 214910 + }, + { + "epoch": 1.39, + "learning_rate": 9.192833216081375e-05, + "loss": 0.0326, + "step": 214920 + }, + { + "epoch": 1.39, + "learning_rate": 9.19186508064568e-05, + "loss": 0.0279, + "step": 214930 + }, + { + "epoch": 1.39, + "learning_rate": 9.190896945209988e-05, + "loss": 0.0304, + "step": 214940 + }, + { + "epoch": 1.39, + "learning_rate": 9.189928809774295e-05, + "loss": 0.0262, + "step": 214950 + }, + { + "epoch": 1.39, + "learning_rate": 9.1889606743386e-05, + "loss": 0.0304, + "step": 214960 + }, + { + "epoch": 1.39, + "learning_rate": 9.187992538902908e-05, + "loss": 0.0274, + "step": 214970 + }, + { + "epoch": 1.39, + "learning_rate": 9.187024403467215e-05, + "loss": 0.0275, + "step": 214980 + }, + { + "epoch": 1.39, + "learning_rate": 9.186056268031523e-05, + "loss": 0.0253, + "step": 214990 + }, + { + "epoch": 1.39, + "learning_rate": 9.185088132595828e-05, + "loss": 0.0353, + "step": 215000 + }, + { + "epoch": 1.39, + "eval_cer": 0.9198843068579822, + "eval_loss": 0.021198125556111336, + "eval_runtime": 120.2091, + "eval_samples_per_second": 16.638, + "eval_steps_per_second": 4.159, + "step": 215000 + }, + { + "epoch": 1.39, + "learning_rate": 9.184119997160135e-05, + "loss": 0.0293, + "step": 215010 + }, + { + "epoch": 1.39, + "learning_rate": 9.183151861724443e-05, + "loss": 0.0336, + "step": 215020 + }, + { + "epoch": 1.39, + "learning_rate": 9.182183726288748e-05, + "loss": 0.0365, + "step": 215030 + }, + { + "epoch": 1.39, + "learning_rate": 9.181215590853056e-05, + "loss": 0.0335, + "step": 215040 + }, + { + "epoch": 1.39, + "learning_rate": 9.180247455417363e-05, + "loss": 0.0239, + "step": 215050 + }, + { + "epoch": 1.39, + "learning_rate": 9.17927931998167e-05, + "loss": 0.0283, + "step": 215060 + }, + { + "epoch": 1.39, + "learning_rate": 9.178311184545976e-05, + "loss": 0.0254, + "step": 215070 + }, + { + "epoch": 1.39, + "learning_rate": 9.177343049110282e-05, + "loss": 0.0271, + "step": 215080 + }, + { + "epoch": 1.39, + "learning_rate": 9.17637491367459e-05, + "loss": 0.0338, + "step": 215090 + }, + { + "epoch": 1.39, + "learning_rate": 9.175406778238896e-05, + "loss": 0.026, + "step": 215100 + }, + { + "epoch": 1.39, + "learning_rate": 9.174438642803202e-05, + "loss": 0.0311, + "step": 215110 + }, + { + "epoch": 1.39, + "learning_rate": 9.17347050736751e-05, + "loss": 0.0319, + "step": 215120 + }, + { + "epoch": 1.39, + "learning_rate": 9.172502371931817e-05, + "loss": 0.0232, + "step": 215130 + }, + { + "epoch": 1.39, + "learning_rate": 9.171534236496124e-05, + "loss": 0.037, + "step": 215140 + }, + { + "epoch": 1.39, + "learning_rate": 9.17056610106043e-05, + "loss": 0.0367, + "step": 215150 + }, + { + "epoch": 1.39, + "learning_rate": 9.169597965624738e-05, + "loss": 0.0299, + "step": 215160 + }, + { + "epoch": 1.39, + "learning_rate": 9.168629830189043e-05, + "loss": 0.027, + "step": 215170 + }, + { + "epoch": 1.39, + "learning_rate": 9.16766169475335e-05, + "loss": 0.0277, + "step": 215180 + }, + { + "epoch": 1.39, + "learning_rate": 9.166693559317658e-05, + "loss": 0.033, + "step": 215190 + }, + { + "epoch": 1.39, + "learning_rate": 9.165725423881963e-05, + "loss": 0.0306, + "step": 215200 + }, + { + "epoch": 1.39, + "learning_rate": 9.16475728844627e-05, + "loss": 0.0293, + "step": 215210 + }, + { + "epoch": 1.39, + "learning_rate": 9.163789153010578e-05, + "loss": 0.0362, + "step": 215220 + }, + { + "epoch": 1.39, + "learning_rate": 9.162821017574885e-05, + "loss": 0.0249, + "step": 215230 + }, + { + "epoch": 1.39, + "learning_rate": 9.161852882139191e-05, + "loss": 0.028, + "step": 215240 + }, + { + "epoch": 1.39, + "learning_rate": 9.160884746703498e-05, + "loss": 0.0201, + "step": 215250 + }, + { + "epoch": 1.39, + "learning_rate": 9.159916611267806e-05, + "loss": 0.0261, + "step": 215260 + }, + { + "epoch": 1.39, + "learning_rate": 9.158948475832111e-05, + "loss": 0.0316, + "step": 215270 + }, + { + "epoch": 1.39, + "learning_rate": 9.157980340396418e-05, + "loss": 0.0267, + "step": 215280 + }, + { + "epoch": 1.39, + "learning_rate": 9.157012204960726e-05, + "loss": 0.0281, + "step": 215290 + }, + { + "epoch": 1.39, + "learning_rate": 9.156044069525032e-05, + "loss": 0.0336, + "step": 215300 + }, + { + "epoch": 1.39, + "learning_rate": 9.155075934089338e-05, + "loss": 0.0287, + "step": 215310 + }, + { + "epoch": 1.39, + "learning_rate": 9.154107798653646e-05, + "loss": 0.0279, + "step": 215320 + }, + { + "epoch": 1.39, + "learning_rate": 9.153139663217952e-05, + "loss": 0.0335, + "step": 215330 + }, + { + "epoch": 1.39, + "learning_rate": 9.152171527782259e-05, + "loss": 0.0235, + "step": 215340 + }, + { + "epoch": 1.39, + "learning_rate": 9.151203392346565e-05, + "loss": 0.025, + "step": 215350 + }, + { + "epoch": 1.39, + "learning_rate": 9.150235256910873e-05, + "loss": 0.0275, + "step": 215360 + }, + { + "epoch": 1.39, + "learning_rate": 9.14926712147518e-05, + "loss": 0.0278, + "step": 215370 + }, + { + "epoch": 1.39, + "learning_rate": 9.148298986039485e-05, + "loss": 0.028, + "step": 215380 + }, + { + "epoch": 1.39, + "learning_rate": 9.147330850603793e-05, + "loss": 0.0298, + "step": 215390 + }, + { + "epoch": 1.39, + "learning_rate": 9.1463627151681e-05, + "loss": 0.027, + "step": 215400 + }, + { + "epoch": 1.39, + "learning_rate": 9.145394579732405e-05, + "loss": 0.0316, + "step": 215410 + }, + { + "epoch": 1.39, + "learning_rate": 9.144426444296713e-05, + "loss": 0.0331, + "step": 215420 + }, + { + "epoch": 1.39, + "learning_rate": 9.14345830886102e-05, + "loss": 0.0319, + "step": 215430 + }, + { + "epoch": 1.39, + "learning_rate": 9.142490173425328e-05, + "loss": 0.027, + "step": 215440 + }, + { + "epoch": 1.39, + "learning_rate": 9.141522037989633e-05, + "loss": 0.0264, + "step": 215450 + }, + { + "epoch": 1.39, + "learning_rate": 9.140553902553941e-05, + "loss": 0.0318, + "step": 215460 + }, + { + "epoch": 1.39, + "learning_rate": 9.139585767118248e-05, + "loss": 0.0296, + "step": 215470 + }, + { + "epoch": 1.39, + "learning_rate": 9.138617631682553e-05, + "loss": 0.0263, + "step": 215480 + }, + { + "epoch": 1.39, + "learning_rate": 9.137649496246861e-05, + "loss": 0.0271, + "step": 215490 + }, + { + "epoch": 1.39, + "learning_rate": 9.136681360811167e-05, + "loss": 0.0301, + "step": 215500 + }, + { + "epoch": 1.39, + "learning_rate": 9.135713225375475e-05, + "loss": 0.0358, + "step": 215510 + }, + { + "epoch": 1.39, + "learning_rate": 9.134745089939781e-05, + "loss": 0.0277, + "step": 215520 + }, + { + "epoch": 1.39, + "learning_rate": 9.133776954504087e-05, + "loss": 0.025, + "step": 215530 + }, + { + "epoch": 1.39, + "learning_rate": 9.132808819068395e-05, + "loss": 0.0259, + "step": 215540 + }, + { + "epoch": 1.39, + "learning_rate": 9.1318406836327e-05, + "loss": 0.028, + "step": 215550 + }, + { + "epoch": 1.39, + "learning_rate": 9.130872548197009e-05, + "loss": 0.0293, + "step": 215560 + }, + { + "epoch": 1.39, + "learning_rate": 9.129904412761315e-05, + "loss": 0.0243, + "step": 215570 + }, + { + "epoch": 1.39, + "learning_rate": 9.128936277325623e-05, + "loss": 0.0251, + "step": 215580 + }, + { + "epoch": 1.39, + "learning_rate": 9.127968141889928e-05, + "loss": 0.0269, + "step": 215590 + }, + { + "epoch": 1.39, + "learning_rate": 9.127000006454235e-05, + "loss": 0.0325, + "step": 215600 + }, + { + "epoch": 1.39, + "learning_rate": 9.126031871018543e-05, + "loss": 0.026, + "step": 215610 + }, + { + "epoch": 1.39, + "learning_rate": 9.125063735582848e-05, + "loss": 0.0258, + "step": 215620 + }, + { + "epoch": 1.39, + "learning_rate": 9.124095600147155e-05, + "loss": 0.0299, + "step": 215630 + }, + { + "epoch": 1.39, + "learning_rate": 9.123127464711463e-05, + "loss": 0.0284, + "step": 215640 + }, + { + "epoch": 1.39, + "learning_rate": 9.12215932927577e-05, + "loss": 0.0305, + "step": 215650 + }, + { + "epoch": 1.39, + "learning_rate": 9.121191193840076e-05, + "loss": 0.0292, + "step": 215660 + }, + { + "epoch": 1.39, + "learning_rate": 9.120223058404383e-05, + "loss": 0.0234, + "step": 215670 + }, + { + "epoch": 1.39, + "learning_rate": 9.119254922968691e-05, + "loss": 0.0338, + "step": 215680 + }, + { + "epoch": 1.39, + "learning_rate": 9.118286787532996e-05, + "loss": 0.034, + "step": 215690 + }, + { + "epoch": 1.39, + "learning_rate": 9.117318652097303e-05, + "loss": 0.0286, + "step": 215700 + }, + { + "epoch": 1.39, + "learning_rate": 9.11635051666161e-05, + "loss": 0.0272, + "step": 215710 + }, + { + "epoch": 1.39, + "learning_rate": 9.115382381225917e-05, + "loss": 0.0257, + "step": 215720 + }, + { + "epoch": 1.39, + "learning_rate": 9.114414245790223e-05, + "loss": 0.0296, + "step": 215730 + }, + { + "epoch": 1.39, + "learning_rate": 9.11344611035453e-05, + "loss": 0.0324, + "step": 215740 + }, + { + "epoch": 1.39, + "learning_rate": 9.112477974918837e-05, + "loss": 0.0326, + "step": 215750 + }, + { + "epoch": 1.39, + "learning_rate": 9.111509839483144e-05, + "loss": 0.0302, + "step": 215760 + }, + { + "epoch": 1.39, + "learning_rate": 9.11054170404745e-05, + "loss": 0.026, + "step": 215770 + }, + { + "epoch": 1.39, + "learning_rate": 9.109573568611758e-05, + "loss": 0.033, + "step": 215780 + }, + { + "epoch": 1.39, + "learning_rate": 9.108605433176065e-05, + "loss": 0.0281, + "step": 215790 + }, + { + "epoch": 1.39, + "learning_rate": 9.10763729774037e-05, + "loss": 0.0243, + "step": 215800 + }, + { + "epoch": 1.39, + "learning_rate": 9.106669162304678e-05, + "loss": 0.0266, + "step": 215810 + }, + { + "epoch": 1.39, + "learning_rate": 9.105701026868985e-05, + "loss": 0.0286, + "step": 215820 + }, + { + "epoch": 1.39, + "learning_rate": 9.10473289143329e-05, + "loss": 0.0302, + "step": 215830 + }, + { + "epoch": 1.39, + "learning_rate": 9.103764755997598e-05, + "loss": 0.0277, + "step": 215840 + }, + { + "epoch": 1.39, + "learning_rate": 9.102796620561905e-05, + "loss": 0.026, + "step": 215850 + }, + { + "epoch": 1.39, + "learning_rate": 9.101828485126213e-05, + "loss": 0.0261, + "step": 215860 + }, + { + "epoch": 1.39, + "learning_rate": 9.100860349690518e-05, + "loss": 0.029, + "step": 215870 + }, + { + "epoch": 1.39, + "learning_rate": 9.099892214254826e-05, + "loss": 0.028, + "step": 215880 + }, + { + "epoch": 1.39, + "learning_rate": 9.098924078819133e-05, + "loss": 0.0271, + "step": 215890 + }, + { + "epoch": 1.39, + "learning_rate": 9.097955943383438e-05, + "loss": 0.032, + "step": 215900 + }, + { + "epoch": 1.39, + "learning_rate": 9.096987807947746e-05, + "loss": 0.0312, + "step": 215910 + }, + { + "epoch": 1.39, + "learning_rate": 9.096019672512052e-05, + "loss": 0.0259, + "step": 215920 + }, + { + "epoch": 1.39, + "learning_rate": 9.09505153707636e-05, + "loss": 0.0275, + "step": 215930 + }, + { + "epoch": 1.39, + "learning_rate": 9.094083401640666e-05, + "loss": 0.0248, + "step": 215940 + }, + { + "epoch": 1.39, + "learning_rate": 9.093115266204972e-05, + "loss": 0.029, + "step": 215950 + }, + { + "epoch": 1.39, + "learning_rate": 9.09214713076928e-05, + "loss": 0.0321, + "step": 215960 + }, + { + "epoch": 1.39, + "learning_rate": 9.091178995333586e-05, + "loss": 0.0305, + "step": 215970 + }, + { + "epoch": 1.39, + "learning_rate": 9.090210859897894e-05, + "loss": 0.0296, + "step": 215980 + }, + { + "epoch": 1.39, + "learning_rate": 9.0892427244622e-05, + "loss": 0.0301, + "step": 215990 + }, + { + "epoch": 1.39, + "learning_rate": 9.088274589026507e-05, + "loss": 0.0324, + "step": 216000 + }, + { + "epoch": 1.39, + "eval_cer": 0.9199457688396792, + "eval_loss": 0.020877143368124962, + "eval_runtime": 120.2616, + "eval_samples_per_second": 16.63, + "eval_steps_per_second": 4.158, + "step": 216000 + }, + { + "epoch": 1.39, + "learning_rate": 9.087306453590813e-05, + "loss": 0.031, + "step": 216010 + }, + { + "epoch": 1.39, + "learning_rate": 9.08633831815512e-05, + "loss": 0.0263, + "step": 216020 + }, + { + "epoch": 1.39, + "learning_rate": 9.085370182719428e-05, + "loss": 0.0279, + "step": 216030 + }, + { + "epoch": 1.39, + "learning_rate": 9.084402047283733e-05, + "loss": 0.03, + "step": 216040 + }, + { + "epoch": 1.39, + "learning_rate": 9.08343391184804e-05, + "loss": 0.0259, + "step": 216050 + }, + { + "epoch": 1.39, + "learning_rate": 9.082465776412348e-05, + "loss": 0.0288, + "step": 216060 + }, + { + "epoch": 1.39, + "learning_rate": 9.081497640976655e-05, + "loss": 0.0304, + "step": 216070 + }, + { + "epoch": 1.39, + "learning_rate": 9.080529505540961e-05, + "loss": 0.0328, + "step": 216080 + }, + { + "epoch": 1.39, + "learning_rate": 9.079561370105268e-05, + "loss": 0.0269, + "step": 216090 + }, + { + "epoch": 1.39, + "learning_rate": 9.078593234669574e-05, + "loss": 0.0287, + "step": 216100 + }, + { + "epoch": 1.39, + "learning_rate": 9.077625099233881e-05, + "loss": 0.0318, + "step": 216110 + }, + { + "epoch": 1.39, + "learning_rate": 9.076656963798188e-05, + "loss": 0.0272, + "step": 216120 + }, + { + "epoch": 1.39, + "learning_rate": 9.075688828362496e-05, + "loss": 0.0272, + "step": 216130 + }, + { + "epoch": 1.4, + "learning_rate": 9.074720692926802e-05, + "loss": 0.0261, + "step": 216140 + }, + { + "epoch": 1.4, + "learning_rate": 9.073752557491108e-05, + "loss": 0.0278, + "step": 216150 + }, + { + "epoch": 1.4, + "learning_rate": 9.072784422055415e-05, + "loss": 0.0278, + "step": 216160 + }, + { + "epoch": 1.4, + "learning_rate": 9.071816286619722e-05, + "loss": 0.0286, + "step": 216170 + }, + { + "epoch": 1.4, + "learning_rate": 9.070848151184029e-05, + "loss": 0.0318, + "step": 216180 + }, + { + "epoch": 1.4, + "learning_rate": 9.069880015748335e-05, + "loss": 0.0308, + "step": 216190 + }, + { + "epoch": 1.4, + "learning_rate": 9.068911880312642e-05, + "loss": 0.0266, + "step": 216200 + }, + { + "epoch": 1.4, + "learning_rate": 9.06794374487695e-05, + "loss": 0.0285, + "step": 216210 + }, + { + "epoch": 1.4, + "learning_rate": 9.066975609441255e-05, + "loss": 0.0289, + "step": 216220 + }, + { + "epoch": 1.4, + "learning_rate": 9.066007474005563e-05, + "loss": 0.0309, + "step": 216230 + }, + { + "epoch": 1.4, + "learning_rate": 9.06503933856987e-05, + "loss": 0.0294, + "step": 216240 + }, + { + "epoch": 1.4, + "learning_rate": 9.064071203134175e-05, + "loss": 0.0259, + "step": 216250 + }, + { + "epoch": 1.4, + "learning_rate": 9.063103067698483e-05, + "loss": 0.0257, + "step": 216260 + }, + { + "epoch": 1.4, + "learning_rate": 9.06213493226279e-05, + "loss": 0.0367, + "step": 216270 + }, + { + "epoch": 1.4, + "learning_rate": 9.061166796827098e-05, + "loss": 0.0253, + "step": 216280 + }, + { + "epoch": 1.4, + "learning_rate": 9.060198661391403e-05, + "loss": 0.0266, + "step": 216290 + }, + { + "epoch": 1.4, + "learning_rate": 9.05923052595571e-05, + "loss": 0.0301, + "step": 216300 + }, + { + "epoch": 1.4, + "learning_rate": 9.058262390520018e-05, + "loss": 0.0238, + "step": 216310 + }, + { + "epoch": 1.4, + "learning_rate": 9.057294255084323e-05, + "loss": 0.0302, + "step": 216320 + }, + { + "epoch": 1.4, + "learning_rate": 9.056326119648631e-05, + "loss": 0.0305, + "step": 216330 + }, + { + "epoch": 1.4, + "learning_rate": 9.055357984212937e-05, + "loss": 0.0276, + "step": 216340 + }, + { + "epoch": 1.4, + "learning_rate": 9.054389848777245e-05, + "loss": 0.0332, + "step": 216350 + }, + { + "epoch": 1.4, + "learning_rate": 9.053421713341551e-05, + "loss": 0.0248, + "step": 216360 + }, + { + "epoch": 1.4, + "learning_rate": 9.052453577905857e-05, + "loss": 0.0307, + "step": 216370 + }, + { + "epoch": 1.4, + "learning_rate": 9.051485442470165e-05, + "loss": 0.0299, + "step": 216380 + }, + { + "epoch": 1.4, + "learning_rate": 9.05051730703447e-05, + "loss": 0.0345, + "step": 216390 + }, + { + "epoch": 1.4, + "learning_rate": 9.049549171598777e-05, + "loss": 0.0335, + "step": 216400 + }, + { + "epoch": 1.4, + "learning_rate": 9.048581036163085e-05, + "loss": 0.033, + "step": 216410 + }, + { + "epoch": 1.4, + "learning_rate": 9.047612900727392e-05, + "loss": 0.0302, + "step": 216420 + }, + { + "epoch": 1.4, + "learning_rate": 9.046644765291698e-05, + "loss": 0.0268, + "step": 216430 + }, + { + "epoch": 1.4, + "learning_rate": 9.045676629856005e-05, + "loss": 0.03, + "step": 216440 + }, + { + "epoch": 1.4, + "learning_rate": 9.044708494420313e-05, + "loss": 0.0234, + "step": 216450 + }, + { + "epoch": 1.4, + "learning_rate": 9.043740358984618e-05, + "loss": 0.0323, + "step": 216460 + }, + { + "epoch": 1.4, + "learning_rate": 9.042772223548925e-05, + "loss": 0.0254, + "step": 216470 + }, + { + "epoch": 1.4, + "learning_rate": 9.041804088113233e-05, + "loss": 0.0318, + "step": 216480 + }, + { + "epoch": 1.4, + "learning_rate": 9.04083595267754e-05, + "loss": 0.0264, + "step": 216490 + }, + { + "epoch": 1.4, + "learning_rate": 9.039867817241845e-05, + "loss": 0.0293, + "step": 216500 + }, + { + "epoch": 1.4, + "learning_rate": 9.038899681806153e-05, + "loss": 0.0267, + "step": 216510 + }, + { + "epoch": 1.4, + "learning_rate": 9.03793154637046e-05, + "loss": 0.0293, + "step": 216520 + }, + { + "epoch": 1.4, + "learning_rate": 9.036963410934766e-05, + "loss": 0.0281, + "step": 216530 + }, + { + "epoch": 1.4, + "learning_rate": 9.035995275499073e-05, + "loss": 0.0295, + "step": 216540 + }, + { + "epoch": 1.4, + "learning_rate": 9.03502714006338e-05, + "loss": 0.0275, + "step": 216550 + }, + { + "epoch": 1.4, + "learning_rate": 9.034059004627687e-05, + "loss": 0.0277, + "step": 216560 + }, + { + "epoch": 1.4, + "learning_rate": 9.033090869191992e-05, + "loss": 0.0339, + "step": 216570 + }, + { + "epoch": 1.4, + "learning_rate": 9.0321227337563e-05, + "loss": 0.0271, + "step": 216580 + }, + { + "epoch": 1.4, + "learning_rate": 9.031154598320607e-05, + "loss": 0.0289, + "step": 216590 + }, + { + "epoch": 1.4, + "learning_rate": 9.030186462884912e-05, + "loss": 0.0303, + "step": 216600 + }, + { + "epoch": 1.4, + "learning_rate": 9.02921832744922e-05, + "loss": 0.0257, + "step": 216610 + }, + { + "epoch": 1.4, + "learning_rate": 9.028250192013527e-05, + "loss": 0.0263, + "step": 216620 + }, + { + "epoch": 1.4, + "learning_rate": 9.027282056577835e-05, + "loss": 0.0313, + "step": 216630 + }, + { + "epoch": 1.4, + "learning_rate": 9.02631392114214e-05, + "loss": 0.0285, + "step": 216640 + }, + { + "epoch": 1.4, + "learning_rate": 9.025345785706448e-05, + "loss": 0.0376, + "step": 216650 + }, + { + "epoch": 1.4, + "learning_rate": 9.024377650270755e-05, + "loss": 0.0282, + "step": 216660 + }, + { + "epoch": 1.4, + "learning_rate": 9.02340951483506e-05, + "loss": 0.0352, + "step": 216670 + }, + { + "epoch": 1.4, + "learning_rate": 9.022441379399368e-05, + "loss": 0.0281, + "step": 216680 + }, + { + "epoch": 1.4, + "learning_rate": 9.021473243963675e-05, + "loss": 0.0276, + "step": 216690 + }, + { + "epoch": 1.4, + "learning_rate": 9.020505108527983e-05, + "loss": 0.0295, + "step": 216700 + }, + { + "epoch": 1.4, + "learning_rate": 9.019536973092288e-05, + "loss": 0.03, + "step": 216710 + }, + { + "epoch": 1.4, + "learning_rate": 9.018568837656595e-05, + "loss": 0.0317, + "step": 216720 + }, + { + "epoch": 1.4, + "learning_rate": 9.017600702220903e-05, + "loss": 0.0227, + "step": 216730 + }, + { + "epoch": 1.4, + "learning_rate": 9.016632566785208e-05, + "loss": 0.0332, + "step": 216740 + }, + { + "epoch": 1.4, + "learning_rate": 9.015664431349516e-05, + "loss": 0.0276, + "step": 216750 + }, + { + "epoch": 1.4, + "learning_rate": 9.014696295913822e-05, + "loss": 0.0309, + "step": 216760 + }, + { + "epoch": 1.4, + "learning_rate": 9.01372816047813e-05, + "loss": 0.0262, + "step": 216770 + }, + { + "epoch": 1.4, + "learning_rate": 9.012760025042436e-05, + "loss": 0.0338, + "step": 216780 + }, + { + "epoch": 1.4, + "learning_rate": 9.011791889606742e-05, + "loss": 0.0234, + "step": 216790 + }, + { + "epoch": 1.4, + "learning_rate": 9.01082375417105e-05, + "loss": 0.0263, + "step": 216800 + }, + { + "epoch": 1.4, + "learning_rate": 9.009855618735356e-05, + "loss": 0.0284, + "step": 216810 + }, + { + "epoch": 1.4, + "learning_rate": 9.008887483299662e-05, + "loss": 0.0285, + "step": 216820 + }, + { + "epoch": 1.4, + "learning_rate": 9.00791934786397e-05, + "loss": 0.0299, + "step": 216830 + }, + { + "epoch": 1.4, + "learning_rate": 9.006951212428277e-05, + "loss": 0.0287, + "step": 216840 + }, + { + "epoch": 1.4, + "learning_rate": 9.005983076992583e-05, + "loss": 0.0258, + "step": 216850 + }, + { + "epoch": 1.4, + "learning_rate": 9.00501494155689e-05, + "loss": 0.0371, + "step": 216860 + }, + { + "epoch": 1.4, + "learning_rate": 9.004046806121198e-05, + "loss": 0.0293, + "step": 216870 + }, + { + "epoch": 1.4, + "learning_rate": 9.003078670685503e-05, + "loss": 0.0258, + "step": 216880 + }, + { + "epoch": 1.4, + "learning_rate": 9.00211053524981e-05, + "loss": 0.0239, + "step": 216890 + }, + { + "epoch": 1.4, + "learning_rate": 9.001142399814118e-05, + "loss": 0.0303, + "step": 216900 + }, + { + "epoch": 1.4, + "learning_rate": 9.000174264378424e-05, + "loss": 0.0259, + "step": 216910 + }, + { + "epoch": 1.4, + "learning_rate": 8.99920612894273e-05, + "loss": 0.0233, + "step": 216920 + }, + { + "epoch": 1.4, + "learning_rate": 8.998237993507038e-05, + "loss": 0.0266, + "step": 216930 + }, + { + "epoch": 1.4, + "learning_rate": 8.997269858071344e-05, + "loss": 0.0258, + "step": 216940 + }, + { + "epoch": 1.4, + "learning_rate": 8.996301722635651e-05, + "loss": 0.0301, + "step": 216950 + }, + { + "epoch": 1.4, + "learning_rate": 8.995333587199958e-05, + "loss": 0.0306, + "step": 216960 + }, + { + "epoch": 1.4, + "learning_rate": 8.994365451764266e-05, + "loss": 0.0301, + "step": 216970 + }, + { + "epoch": 1.4, + "learning_rate": 8.993397316328572e-05, + "loss": 0.0357, + "step": 216980 + }, + { + "epoch": 1.4, + "learning_rate": 8.992429180892877e-05, + "loss": 0.0262, + "step": 216990 + }, + { + "epoch": 1.4, + "learning_rate": 8.991461045457185e-05, + "loss": 0.0342, + "step": 217000 + }, + { + "epoch": 1.4, + "eval_cer": 0.9198969607953904, + "eval_loss": 0.020930752158164978, + "eval_runtime": 120.4671, + "eval_samples_per_second": 16.602, + "eval_steps_per_second": 4.151, + "step": 217000 + }, + { + "epoch": 1.4, + "learning_rate": 8.990492910021492e-05, + "loss": 0.025, + "step": 217010 + }, + { + "epoch": 1.4, + "learning_rate": 8.989524774585797e-05, + "loss": 0.0321, + "step": 217020 + }, + { + "epoch": 1.4, + "learning_rate": 8.988556639150105e-05, + "loss": 0.0283, + "step": 217030 + }, + { + "epoch": 1.4, + "learning_rate": 8.987588503714412e-05, + "loss": 0.0282, + "step": 217040 + }, + { + "epoch": 1.4, + "learning_rate": 8.98662036827872e-05, + "loss": 0.0263, + "step": 217050 + }, + { + "epoch": 1.4, + "learning_rate": 8.985652232843025e-05, + "loss": 0.0265, + "step": 217060 + }, + { + "epoch": 1.4, + "learning_rate": 8.984684097407333e-05, + "loss": 0.0281, + "step": 217070 + }, + { + "epoch": 1.4, + "learning_rate": 8.98371596197164e-05, + "loss": 0.0311, + "step": 217080 + }, + { + "epoch": 1.4, + "learning_rate": 8.982747826535945e-05, + "loss": 0.0271, + "step": 217090 + }, + { + "epoch": 1.4, + "learning_rate": 8.981779691100253e-05, + "loss": 0.027, + "step": 217100 + }, + { + "epoch": 1.4, + "learning_rate": 8.98081155566456e-05, + "loss": 0.0322, + "step": 217110 + }, + { + "epoch": 1.4, + "learning_rate": 8.979843420228868e-05, + "loss": 0.0309, + "step": 217120 + }, + { + "epoch": 1.4, + "learning_rate": 8.978875284793173e-05, + "loss": 0.0281, + "step": 217130 + }, + { + "epoch": 1.4, + "learning_rate": 8.97790714935748e-05, + "loss": 0.0271, + "step": 217140 + }, + { + "epoch": 1.4, + "learning_rate": 8.976939013921788e-05, + "loss": 0.0261, + "step": 217150 + }, + { + "epoch": 1.4, + "learning_rate": 8.975970878486093e-05, + "loss": 0.0285, + "step": 217160 + }, + { + "epoch": 1.4, + "learning_rate": 8.975002743050401e-05, + "loss": 0.031, + "step": 217170 + }, + { + "epoch": 1.4, + "learning_rate": 8.974034607614707e-05, + "loss": 0.0345, + "step": 217180 + }, + { + "epoch": 1.4, + "learning_rate": 8.973066472179014e-05, + "loss": 0.0312, + "step": 217190 + }, + { + "epoch": 1.4, + "learning_rate": 8.97209833674332e-05, + "loss": 0.028, + "step": 217200 + }, + { + "epoch": 1.4, + "learning_rate": 8.971130201307627e-05, + "loss": 0.0291, + "step": 217210 + }, + { + "epoch": 1.4, + "learning_rate": 8.970162065871935e-05, + "loss": 0.0251, + "step": 217220 + }, + { + "epoch": 1.4, + "learning_rate": 8.96919393043624e-05, + "loss": 0.0332, + "step": 217230 + }, + { + "epoch": 1.4, + "learning_rate": 8.968225795000547e-05, + "loss": 0.0289, + "step": 217240 + }, + { + "epoch": 1.4, + "learning_rate": 8.967257659564855e-05, + "loss": 0.0239, + "step": 217250 + }, + { + "epoch": 1.4, + "learning_rate": 8.966289524129162e-05, + "loss": 0.0285, + "step": 217260 + }, + { + "epoch": 1.4, + "learning_rate": 8.965321388693468e-05, + "loss": 0.0338, + "step": 217270 + }, + { + "epoch": 1.4, + "learning_rate": 8.964353253257775e-05, + "loss": 0.0359, + "step": 217280 + }, + { + "epoch": 1.4, + "learning_rate": 8.963385117822082e-05, + "loss": 0.0325, + "step": 217290 + }, + { + "epoch": 1.4, + "learning_rate": 8.962416982386388e-05, + "loss": 0.0333, + "step": 217300 + }, + { + "epoch": 1.4, + "learning_rate": 8.961448846950695e-05, + "loss": 0.0273, + "step": 217310 + }, + { + "epoch": 1.4, + "learning_rate": 8.960480711515003e-05, + "loss": 0.03, + "step": 217320 + }, + { + "epoch": 1.4, + "learning_rate": 8.95951257607931e-05, + "loss": 0.0313, + "step": 217330 + }, + { + "epoch": 1.4, + "learning_rate": 8.958544440643615e-05, + "loss": 0.0247, + "step": 217340 + }, + { + "epoch": 1.4, + "learning_rate": 8.957576305207923e-05, + "loss": 0.0281, + "step": 217350 + }, + { + "epoch": 1.4, + "learning_rate": 8.95660816977223e-05, + "loss": 0.0277, + "step": 217360 + }, + { + "epoch": 1.4, + "learning_rate": 8.955640034336536e-05, + "loss": 0.0271, + "step": 217370 + }, + { + "epoch": 1.4, + "learning_rate": 8.954671898900843e-05, + "loss": 0.0261, + "step": 217380 + }, + { + "epoch": 1.4, + "learning_rate": 8.953703763465149e-05, + "loss": 0.0286, + "step": 217390 + }, + { + "epoch": 1.4, + "learning_rate": 8.952735628029457e-05, + "loss": 0.0376, + "step": 217400 + }, + { + "epoch": 1.4, + "learning_rate": 8.951767492593762e-05, + "loss": 0.0303, + "step": 217410 + }, + { + "epoch": 1.4, + "learning_rate": 8.95079935715807e-05, + "loss": 0.0286, + "step": 217420 + }, + { + "epoch": 1.4, + "learning_rate": 8.949831221722377e-05, + "loss": 0.0289, + "step": 217430 + }, + { + "epoch": 1.4, + "learning_rate": 8.948863086286682e-05, + "loss": 0.0311, + "step": 217440 + }, + { + "epoch": 1.4, + "learning_rate": 8.94789495085099e-05, + "loss": 0.0264, + "step": 217450 + }, + { + "epoch": 1.4, + "learning_rate": 8.946926815415297e-05, + "loss": 0.027, + "step": 217460 + }, + { + "epoch": 1.4, + "learning_rate": 8.945958679979605e-05, + "loss": 0.0306, + "step": 217470 + }, + { + "epoch": 1.4, + "learning_rate": 8.94499054454391e-05, + "loss": 0.0307, + "step": 217480 + }, + { + "epoch": 1.4, + "learning_rate": 8.944022409108217e-05, + "loss": 0.0229, + "step": 217490 + }, + { + "epoch": 1.4, + "learning_rate": 8.943054273672525e-05, + "loss": 0.028, + "step": 217500 + }, + { + "epoch": 1.4, + "learning_rate": 8.94208613823683e-05, + "loss": 0.0284, + "step": 217510 + }, + { + "epoch": 1.4, + "learning_rate": 8.941118002801138e-05, + "loss": 0.0233, + "step": 217520 + }, + { + "epoch": 1.4, + "learning_rate": 8.940149867365445e-05, + "loss": 0.0267, + "step": 217530 + }, + { + "epoch": 1.4, + "learning_rate": 8.939181731929753e-05, + "loss": 0.0236, + "step": 217540 + }, + { + "epoch": 1.4, + "learning_rate": 8.938213596494058e-05, + "loss": 0.0306, + "step": 217550 + }, + { + "epoch": 1.4, + "learning_rate": 8.937245461058365e-05, + "loss": 0.0318, + "step": 217560 + }, + { + "epoch": 1.4, + "learning_rate": 8.936277325622673e-05, + "loss": 0.0244, + "step": 217570 + }, + { + "epoch": 1.4, + "learning_rate": 8.935309190186978e-05, + "loss": 0.0258, + "step": 217580 + }, + { + "epoch": 1.4, + "learning_rate": 8.934341054751284e-05, + "loss": 0.0249, + "step": 217590 + }, + { + "epoch": 1.4, + "learning_rate": 8.933372919315592e-05, + "loss": 0.0237, + "step": 217600 + }, + { + "epoch": 1.4, + "learning_rate": 8.932404783879899e-05, + "loss": 0.0251, + "step": 217610 + }, + { + "epoch": 1.4, + "learning_rate": 8.931436648444206e-05, + "loss": 0.0302, + "step": 217620 + }, + { + "epoch": 1.4, + "learning_rate": 8.930468513008512e-05, + "loss": 0.0259, + "step": 217630 + }, + { + "epoch": 1.4, + "learning_rate": 8.92950037757282e-05, + "loss": 0.0279, + "step": 217640 + }, + { + "epoch": 1.4, + "learning_rate": 8.928532242137125e-05, + "loss": 0.0291, + "step": 217650 + }, + { + "epoch": 1.4, + "learning_rate": 8.927564106701432e-05, + "loss": 0.029, + "step": 217660 + }, + { + "epoch": 1.4, + "learning_rate": 8.92659597126574e-05, + "loss": 0.0274, + "step": 217670 + }, + { + "epoch": 1.4, + "learning_rate": 8.925627835830047e-05, + "loss": 0.0367, + "step": 217680 + }, + { + "epoch": 1.41, + "learning_rate": 8.924659700394352e-05, + "loss": 0.029, + "step": 217690 + }, + { + "epoch": 1.41, + "learning_rate": 8.92369156495866e-05, + "loss": 0.0306, + "step": 217700 + }, + { + "epoch": 1.41, + "learning_rate": 8.922723429522967e-05, + "loss": 0.0361, + "step": 217710 + }, + { + "epoch": 1.41, + "learning_rate": 8.921755294087273e-05, + "loss": 0.0288, + "step": 217720 + }, + { + "epoch": 1.41, + "learning_rate": 8.92078715865158e-05, + "loss": 0.0333, + "step": 217730 + }, + { + "epoch": 1.41, + "learning_rate": 8.919819023215888e-05, + "loss": 0.0334, + "step": 217740 + }, + { + "epoch": 1.41, + "learning_rate": 8.918850887780194e-05, + "loss": 0.0276, + "step": 217750 + }, + { + "epoch": 1.41, + "learning_rate": 8.9178827523445e-05, + "loss": 0.0289, + "step": 217760 + }, + { + "epoch": 1.41, + "learning_rate": 8.916914616908808e-05, + "loss": 0.0244, + "step": 217770 + }, + { + "epoch": 1.41, + "learning_rate": 8.915946481473114e-05, + "loss": 0.0327, + "step": 217780 + }, + { + "epoch": 1.41, + "learning_rate": 8.91497834603742e-05, + "loss": 0.0319, + "step": 217790 + }, + { + "epoch": 1.41, + "learning_rate": 8.914010210601728e-05, + "loss": 0.0233, + "step": 217800 + }, + { + "epoch": 1.41, + "learning_rate": 8.913042075166034e-05, + "loss": 0.0261, + "step": 217810 + }, + { + "epoch": 1.41, + "learning_rate": 8.912073939730342e-05, + "loss": 0.031, + "step": 217820 + }, + { + "epoch": 1.41, + "learning_rate": 8.911105804294647e-05, + "loss": 0.0249, + "step": 217830 + }, + { + "epoch": 1.41, + "learning_rate": 8.910137668858955e-05, + "loss": 0.0309, + "step": 217840 + }, + { + "epoch": 1.41, + "learning_rate": 8.909169533423262e-05, + "loss": 0.0349, + "step": 217850 + }, + { + "epoch": 1.41, + "learning_rate": 8.908201397987567e-05, + "loss": 0.0269, + "step": 217860 + }, + { + "epoch": 1.41, + "learning_rate": 8.907233262551875e-05, + "loss": 0.033, + "step": 217870 + }, + { + "epoch": 1.41, + "learning_rate": 8.906265127116182e-05, + "loss": 0.027, + "step": 217880 + }, + { + "epoch": 1.41, + "learning_rate": 8.90529699168049e-05, + "loss": 0.0244, + "step": 217890 + }, + { + "epoch": 1.41, + "learning_rate": 8.904328856244795e-05, + "loss": 0.0264, + "step": 217900 + }, + { + "epoch": 1.41, + "learning_rate": 8.903360720809102e-05, + "loss": 0.0324, + "step": 217910 + }, + { + "epoch": 1.41, + "learning_rate": 8.90239258537341e-05, + "loss": 0.027, + "step": 217920 + }, + { + "epoch": 1.41, + "learning_rate": 8.901424449937715e-05, + "loss": 0.0232, + "step": 217930 + }, + { + "epoch": 1.41, + "learning_rate": 8.900456314502023e-05, + "loss": 0.031, + "step": 217940 + }, + { + "epoch": 1.41, + "learning_rate": 8.89948817906633e-05, + "loss": 0.0304, + "step": 217950 + }, + { + "epoch": 1.41, + "learning_rate": 8.898520043630638e-05, + "loss": 0.0341, + "step": 217960 + }, + { + "epoch": 1.41, + "learning_rate": 8.897551908194943e-05, + "loss": 0.0309, + "step": 217970 + }, + { + "epoch": 1.41, + "learning_rate": 8.89658377275925e-05, + "loss": 0.0257, + "step": 217980 + }, + { + "epoch": 1.41, + "learning_rate": 8.895615637323557e-05, + "loss": 0.03, + "step": 217990 + }, + { + "epoch": 1.41, + "learning_rate": 8.894647501887863e-05, + "loss": 0.0293, + "step": 218000 + }, + { + "epoch": 1.41, + "eval_cer": 0.9199186532595187, + "eval_loss": 0.02118774503469467, + "eval_runtime": 120.0083, + "eval_samples_per_second": 16.666, + "eval_steps_per_second": 4.166, + "step": 218000 + }, + { + "epoch": 1.41, + "learning_rate": 8.89367936645217e-05, + "loss": 0.0284, + "step": 218010 + }, + { + "epoch": 1.41, + "learning_rate": 8.892711231016477e-05, + "loss": 0.0282, + "step": 218020 + }, + { + "epoch": 1.41, + "learning_rate": 8.891743095580784e-05, + "loss": 0.0264, + "step": 218030 + }, + { + "epoch": 1.41, + "learning_rate": 8.89077496014509e-05, + "loss": 0.0312, + "step": 218040 + }, + { + "epoch": 1.41, + "learning_rate": 8.889806824709397e-05, + "loss": 0.0278, + "step": 218050 + }, + { + "epoch": 1.41, + "learning_rate": 8.888838689273705e-05, + "loss": 0.0239, + "step": 218060 + }, + { + "epoch": 1.41, + "learning_rate": 8.88787055383801e-05, + "loss": 0.0258, + "step": 218070 + }, + { + "epoch": 1.41, + "learning_rate": 8.886902418402317e-05, + "loss": 0.0275, + "step": 218080 + }, + { + "epoch": 1.41, + "learning_rate": 8.885934282966625e-05, + "loss": 0.0327, + "step": 218090 + }, + { + "epoch": 1.41, + "learning_rate": 8.884966147530932e-05, + "loss": 0.0341, + "step": 218100 + }, + { + "epoch": 1.41, + "learning_rate": 8.883998012095237e-05, + "loss": 0.0226, + "step": 218110 + }, + { + "epoch": 1.41, + "learning_rate": 8.883029876659545e-05, + "loss": 0.0254, + "step": 218120 + }, + { + "epoch": 1.41, + "learning_rate": 8.882061741223852e-05, + "loss": 0.0259, + "step": 218130 + }, + { + "epoch": 1.41, + "learning_rate": 8.881093605788158e-05, + "loss": 0.0278, + "step": 218140 + }, + { + "epoch": 1.41, + "learning_rate": 8.880125470352465e-05, + "loss": 0.0291, + "step": 218150 + }, + { + "epoch": 1.41, + "learning_rate": 8.879157334916773e-05, + "loss": 0.0315, + "step": 218160 + }, + { + "epoch": 1.41, + "learning_rate": 8.87818919948108e-05, + "loss": 0.0262, + "step": 218170 + }, + { + "epoch": 1.41, + "learning_rate": 8.877221064045385e-05, + "loss": 0.0274, + "step": 218180 + }, + { + "epoch": 1.41, + "learning_rate": 8.876252928609693e-05, + "loss": 0.0235, + "step": 218190 + }, + { + "epoch": 1.41, + "learning_rate": 8.875284793173999e-05, + "loss": 0.0271, + "step": 218200 + }, + { + "epoch": 1.41, + "learning_rate": 8.874316657738305e-05, + "loss": 0.0254, + "step": 218210 + }, + { + "epoch": 1.41, + "learning_rate": 8.873348522302613e-05, + "loss": 0.0242, + "step": 218220 + }, + { + "epoch": 1.41, + "learning_rate": 8.872380386866919e-05, + "loss": 0.0346, + "step": 218230 + }, + { + "epoch": 1.41, + "learning_rate": 8.871412251431227e-05, + "loss": 0.028, + "step": 218240 + }, + { + "epoch": 1.41, + "learning_rate": 8.870444115995532e-05, + "loss": 0.0299, + "step": 218250 + }, + { + "epoch": 1.41, + "learning_rate": 8.86947598055984e-05, + "loss": 0.0308, + "step": 218260 + }, + { + "epoch": 1.41, + "learning_rate": 8.868507845124147e-05, + "loss": 0.0267, + "step": 218270 + }, + { + "epoch": 1.41, + "learning_rate": 8.867539709688452e-05, + "loss": 0.0339, + "step": 218280 + }, + { + "epoch": 1.41, + "learning_rate": 8.86657157425276e-05, + "loss": 0.0254, + "step": 218290 + }, + { + "epoch": 1.41, + "learning_rate": 8.865603438817067e-05, + "loss": 0.0298, + "step": 218300 + }, + { + "epoch": 1.41, + "learning_rate": 8.864635303381375e-05, + "loss": 0.0306, + "step": 218310 + }, + { + "epoch": 1.41, + "learning_rate": 8.86366716794568e-05, + "loss": 0.0278, + "step": 218320 + }, + { + "epoch": 1.41, + "learning_rate": 8.862699032509987e-05, + "loss": 0.0302, + "step": 218330 + }, + { + "epoch": 1.41, + "learning_rate": 8.861730897074295e-05, + "loss": 0.0282, + "step": 218340 + }, + { + "epoch": 1.41, + "learning_rate": 8.8607627616386e-05, + "loss": 0.0263, + "step": 218350 + }, + { + "epoch": 1.41, + "learning_rate": 8.859794626202908e-05, + "loss": 0.0336, + "step": 218360 + }, + { + "epoch": 1.41, + "learning_rate": 8.858826490767215e-05, + "loss": 0.0354, + "step": 218370 + }, + { + "epoch": 1.41, + "learning_rate": 8.857858355331521e-05, + "loss": 0.031, + "step": 218380 + }, + { + "epoch": 1.41, + "learning_rate": 8.856890219895828e-05, + "loss": 0.0304, + "step": 218390 + }, + { + "epoch": 1.41, + "learning_rate": 8.855922084460134e-05, + "loss": 0.0321, + "step": 218400 + }, + { + "epoch": 1.41, + "learning_rate": 8.854953949024442e-05, + "loss": 0.0271, + "step": 218410 + }, + { + "epoch": 1.41, + "learning_rate": 8.853985813588748e-05, + "loss": 0.032, + "step": 218420 + }, + { + "epoch": 1.41, + "learning_rate": 8.853017678153054e-05, + "loss": 0.0285, + "step": 218430 + }, + { + "epoch": 1.41, + "learning_rate": 8.852049542717362e-05, + "loss": 0.0292, + "step": 218440 + }, + { + "epoch": 1.41, + "learning_rate": 8.851081407281669e-05, + "loss": 0.0314, + "step": 218450 + }, + { + "epoch": 1.41, + "learning_rate": 8.850113271845976e-05, + "loss": 0.0363, + "step": 218460 + }, + { + "epoch": 1.41, + "learning_rate": 8.849145136410282e-05, + "loss": 0.036, + "step": 218470 + }, + { + "epoch": 1.41, + "learning_rate": 8.848177000974589e-05, + "loss": 0.0387, + "step": 218480 + }, + { + "epoch": 1.41, + "learning_rate": 8.847208865538895e-05, + "loss": 0.0275, + "step": 218490 + }, + { + "epoch": 1.41, + "learning_rate": 8.846240730103202e-05, + "loss": 0.0292, + "step": 218500 + }, + { + "epoch": 1.41, + "learning_rate": 8.84527259466751e-05, + "loss": 0.0303, + "step": 218510 + }, + { + "epoch": 1.41, + "learning_rate": 8.844304459231817e-05, + "loss": 0.0312, + "step": 218520 + }, + { + "epoch": 1.41, + "learning_rate": 8.843336323796122e-05, + "loss": 0.0296, + "step": 218530 + }, + { + "epoch": 1.41, + "learning_rate": 8.84236818836043e-05, + "loss": 0.0299, + "step": 218540 + }, + { + "epoch": 1.41, + "learning_rate": 8.841400052924737e-05, + "loss": 0.0275, + "step": 218550 + }, + { + "epoch": 1.41, + "learning_rate": 8.840431917489043e-05, + "loss": 0.0314, + "step": 218560 + }, + { + "epoch": 1.41, + "learning_rate": 8.83946378205335e-05, + "loss": 0.0256, + "step": 218570 + }, + { + "epoch": 1.41, + "learning_rate": 8.838495646617656e-05, + "loss": 0.0317, + "step": 218580 + }, + { + "epoch": 1.41, + "learning_rate": 8.837527511181964e-05, + "loss": 0.0315, + "step": 218590 + }, + { + "epoch": 1.41, + "learning_rate": 8.83655937574627e-05, + "loss": 0.0279, + "step": 218600 + }, + { + "epoch": 1.41, + "learning_rate": 8.835591240310578e-05, + "loss": 0.0278, + "step": 218610 + }, + { + "epoch": 1.41, + "learning_rate": 8.834623104874884e-05, + "loss": 0.023, + "step": 218620 + }, + { + "epoch": 1.41, + "learning_rate": 8.83365496943919e-05, + "loss": 0.0297, + "step": 218630 + }, + { + "epoch": 1.41, + "learning_rate": 8.832686834003498e-05, + "loss": 0.0247, + "step": 218640 + }, + { + "epoch": 1.41, + "learning_rate": 8.831718698567804e-05, + "loss": 0.0304, + "step": 218650 + }, + { + "epoch": 1.41, + "learning_rate": 8.830750563132111e-05, + "loss": 0.0257, + "step": 218660 + }, + { + "epoch": 1.41, + "learning_rate": 8.829782427696417e-05, + "loss": 0.0281, + "step": 218670 + }, + { + "epoch": 1.41, + "learning_rate": 8.828814292260724e-05, + "loss": 0.0276, + "step": 218680 + }, + { + "epoch": 1.41, + "learning_rate": 8.827846156825032e-05, + "loss": 0.0221, + "step": 218690 + }, + { + "epoch": 1.41, + "learning_rate": 8.826878021389337e-05, + "loss": 0.0332, + "step": 218700 + }, + { + "epoch": 1.41, + "learning_rate": 8.825909885953645e-05, + "loss": 0.0288, + "step": 218710 + }, + { + "epoch": 1.41, + "learning_rate": 8.824941750517952e-05, + "loss": 0.0291, + "step": 218720 + }, + { + "epoch": 1.41, + "learning_rate": 8.823973615082257e-05, + "loss": 0.0246, + "step": 218730 + }, + { + "epoch": 1.41, + "learning_rate": 8.823005479646565e-05, + "loss": 0.0267, + "step": 218740 + }, + { + "epoch": 1.41, + "learning_rate": 8.822037344210872e-05, + "loss": 0.0271, + "step": 218750 + }, + { + "epoch": 1.41, + "learning_rate": 8.82106920877518e-05, + "loss": 0.0287, + "step": 218760 + }, + { + "epoch": 1.41, + "learning_rate": 8.820101073339485e-05, + "loss": 0.0342, + "step": 218770 + }, + { + "epoch": 1.41, + "learning_rate": 8.819132937903792e-05, + "loss": 0.0306, + "step": 218780 + }, + { + "epoch": 1.41, + "learning_rate": 8.8181648024681e-05, + "loss": 0.0314, + "step": 218790 + }, + { + "epoch": 1.41, + "learning_rate": 8.817196667032405e-05, + "loss": 0.0359, + "step": 218800 + }, + { + "epoch": 1.41, + "learning_rate": 8.816228531596713e-05, + "loss": 0.0238, + "step": 218810 + }, + { + "epoch": 1.41, + "learning_rate": 8.81526039616102e-05, + "loss": 0.0297, + "step": 218820 + }, + { + "epoch": 1.41, + "learning_rate": 8.814292260725327e-05, + "loss": 0.0336, + "step": 218830 + }, + { + "epoch": 1.41, + "learning_rate": 8.813324125289633e-05, + "loss": 0.0258, + "step": 218840 + }, + { + "epoch": 1.41, + "learning_rate": 8.81235598985394e-05, + "loss": 0.0244, + "step": 218850 + }, + { + "epoch": 1.41, + "learning_rate": 8.811387854418247e-05, + "loss": 0.0287, + "step": 218860 + }, + { + "epoch": 1.41, + "learning_rate": 8.810419718982553e-05, + "loss": 0.0253, + "step": 218870 + }, + { + "epoch": 1.41, + "learning_rate": 8.809451583546859e-05, + "loss": 0.035, + "step": 218880 + }, + { + "epoch": 1.41, + "learning_rate": 8.808483448111167e-05, + "loss": 0.0318, + "step": 218890 + }, + { + "epoch": 1.41, + "learning_rate": 8.807515312675474e-05, + "loss": 0.0294, + "step": 218900 + }, + { + "epoch": 1.41, + "learning_rate": 8.80654717723978e-05, + "loss": 0.0262, + "step": 218910 + }, + { + "epoch": 1.41, + "learning_rate": 8.805579041804087e-05, + "loss": 0.028, + "step": 218920 + }, + { + "epoch": 1.41, + "learning_rate": 8.804610906368395e-05, + "loss": 0.0291, + "step": 218930 + }, + { + "epoch": 1.41, + "learning_rate": 8.8036427709327e-05, + "loss": 0.0342, + "step": 218940 + }, + { + "epoch": 1.41, + "learning_rate": 8.802674635497007e-05, + "loss": 0.0271, + "step": 218950 + }, + { + "epoch": 1.41, + "learning_rate": 8.801706500061315e-05, + "loss": 0.0273, + "step": 218960 + }, + { + "epoch": 1.41, + "learning_rate": 8.800738364625622e-05, + "loss": 0.0305, + "step": 218970 + }, + { + "epoch": 1.41, + "learning_rate": 8.799770229189927e-05, + "loss": 0.0309, + "step": 218980 + }, + { + "epoch": 1.41, + "learning_rate": 8.798802093754235e-05, + "loss": 0.0292, + "step": 218990 + }, + { + "epoch": 1.41, + "learning_rate": 8.797833958318541e-05, + "loss": 0.0281, + "step": 219000 + }, + { + "epoch": 1.41, + "eval_cer": 0.9199114224381426, + "eval_loss": 0.020875846967101097, + "eval_runtime": 120.3649, + "eval_samples_per_second": 16.616, + "eval_steps_per_second": 4.154, + "step": 219000 + }, + { + "epoch": 1.41, + "learning_rate": 8.796865822882848e-05, + "loss": 0.029, + "step": 219010 + }, + { + "epoch": 1.41, + "learning_rate": 8.795897687447155e-05, + "loss": 0.0278, + "step": 219020 + }, + { + "epoch": 1.41, + "learning_rate": 8.794929552011463e-05, + "loss": 0.0298, + "step": 219030 + }, + { + "epoch": 1.41, + "learning_rate": 8.793961416575769e-05, + "loss": 0.0317, + "step": 219040 + }, + { + "epoch": 1.41, + "learning_rate": 8.792993281140075e-05, + "loss": 0.0408, + "step": 219050 + }, + { + "epoch": 1.41, + "learning_rate": 8.792025145704383e-05, + "loss": 0.0263, + "step": 219060 + }, + { + "epoch": 1.41, + "learning_rate": 8.791057010268689e-05, + "loss": 0.0247, + "step": 219070 + }, + { + "epoch": 1.41, + "learning_rate": 8.790088874832994e-05, + "loss": 0.0266, + "step": 219080 + }, + { + "epoch": 1.41, + "learning_rate": 8.789120739397302e-05, + "loss": 0.026, + "step": 219090 + }, + { + "epoch": 1.41, + "learning_rate": 8.788152603961609e-05, + "loss": 0.0251, + "step": 219100 + }, + { + "epoch": 1.41, + "learning_rate": 8.787184468525917e-05, + "loss": 0.023, + "step": 219110 + }, + { + "epoch": 1.41, + "learning_rate": 8.786216333090222e-05, + "loss": 0.0243, + "step": 219120 + }, + { + "epoch": 1.41, + "learning_rate": 8.78524819765453e-05, + "loss": 0.0238, + "step": 219130 + }, + { + "epoch": 1.41, + "learning_rate": 8.784280062218837e-05, + "loss": 0.0268, + "step": 219140 + }, + { + "epoch": 1.41, + "learning_rate": 8.783311926783142e-05, + "loss": 0.0304, + "step": 219150 + }, + { + "epoch": 1.41, + "learning_rate": 8.78234379134745e-05, + "loss": 0.0228, + "step": 219160 + }, + { + "epoch": 1.41, + "learning_rate": 8.781375655911757e-05, + "loss": 0.0381, + "step": 219170 + }, + { + "epoch": 1.41, + "learning_rate": 8.780407520476065e-05, + "loss": 0.0305, + "step": 219180 + }, + { + "epoch": 1.41, + "learning_rate": 8.77943938504037e-05, + "loss": 0.0282, + "step": 219190 + }, + { + "epoch": 1.41, + "learning_rate": 8.778471249604677e-05, + "loss": 0.0325, + "step": 219200 + }, + { + "epoch": 1.41, + "learning_rate": 8.777503114168985e-05, + "loss": 0.0234, + "step": 219210 + }, + { + "epoch": 1.41, + "learning_rate": 8.77653497873329e-05, + "loss": 0.0273, + "step": 219220 + }, + { + "epoch": 1.41, + "learning_rate": 8.775566843297598e-05, + "loss": 0.0305, + "step": 219230 + }, + { + "epoch": 1.42, + "learning_rate": 8.774598707861904e-05, + "loss": 0.0287, + "step": 219240 + }, + { + "epoch": 1.42, + "learning_rate": 8.773630572426212e-05, + "loss": 0.0304, + "step": 219250 + }, + { + "epoch": 1.42, + "learning_rate": 8.772662436990518e-05, + "loss": 0.0311, + "step": 219260 + }, + { + "epoch": 1.42, + "learning_rate": 8.771694301554824e-05, + "loss": 0.0281, + "step": 219270 + }, + { + "epoch": 1.42, + "learning_rate": 8.770726166119132e-05, + "loss": 0.0264, + "step": 219280 + }, + { + "epoch": 1.42, + "learning_rate": 8.769758030683438e-05, + "loss": 0.0296, + "step": 219290 + }, + { + "epoch": 1.42, + "learning_rate": 8.768789895247744e-05, + "loss": 0.0289, + "step": 219300 + }, + { + "epoch": 1.42, + "learning_rate": 8.767821759812052e-05, + "loss": 0.0292, + "step": 219310 + }, + { + "epoch": 1.42, + "learning_rate": 8.766853624376359e-05, + "loss": 0.0341, + "step": 219320 + }, + { + "epoch": 1.42, + "learning_rate": 8.765885488940665e-05, + "loss": 0.0286, + "step": 219330 + }, + { + "epoch": 1.42, + "learning_rate": 8.764917353504972e-05, + "loss": 0.0296, + "step": 219340 + }, + { + "epoch": 1.42, + "learning_rate": 8.76394921806928e-05, + "loss": 0.029, + "step": 219350 + }, + { + "epoch": 1.42, + "learning_rate": 8.762981082633585e-05, + "loss": 0.0238, + "step": 219360 + }, + { + "epoch": 1.42, + "learning_rate": 8.762012947197892e-05, + "loss": 0.0288, + "step": 219370 + }, + { + "epoch": 1.42, + "learning_rate": 8.7610448117622e-05, + "loss": 0.0307, + "step": 219380 + }, + { + "epoch": 1.42, + "learning_rate": 8.760076676326507e-05, + "loss": 0.0308, + "step": 219390 + }, + { + "epoch": 1.42, + "learning_rate": 8.759108540890812e-05, + "loss": 0.0278, + "step": 219400 + }, + { + "epoch": 1.42, + "learning_rate": 8.75814040545512e-05, + "loss": 0.0296, + "step": 219410 + }, + { + "epoch": 1.42, + "learning_rate": 8.757172270019426e-05, + "loss": 0.0271, + "step": 219420 + }, + { + "epoch": 1.42, + "learning_rate": 8.756204134583733e-05, + "loss": 0.0321, + "step": 219430 + }, + { + "epoch": 1.42, + "learning_rate": 8.75523599914804e-05, + "loss": 0.0341, + "step": 219440 + }, + { + "epoch": 1.42, + "learning_rate": 8.754267863712348e-05, + "loss": 0.0277, + "step": 219450 + }, + { + "epoch": 1.42, + "learning_rate": 8.753299728276654e-05, + "loss": 0.0312, + "step": 219460 + }, + { + "epoch": 1.42, + "learning_rate": 8.75233159284096e-05, + "loss": 0.0291, + "step": 219470 + }, + { + "epoch": 1.42, + "learning_rate": 8.751363457405267e-05, + "loss": 0.0258, + "step": 219480 + }, + { + "epoch": 1.42, + "learning_rate": 8.750395321969574e-05, + "loss": 0.0255, + "step": 219490 + }, + { + "epoch": 1.42, + "learning_rate": 8.74942718653388e-05, + "loss": 0.0285, + "step": 219500 + }, + { + "epoch": 1.42, + "learning_rate": 8.748459051098187e-05, + "loss": 0.0323, + "step": 219510 + }, + { + "epoch": 1.42, + "learning_rate": 8.747490915662494e-05, + "loss": 0.0268, + "step": 219520 + }, + { + "epoch": 1.42, + "learning_rate": 8.746522780226802e-05, + "loss": 0.0269, + "step": 219530 + }, + { + "epoch": 1.42, + "learning_rate": 8.745554644791107e-05, + "loss": 0.0297, + "step": 219540 + }, + { + "epoch": 1.42, + "learning_rate": 8.744586509355415e-05, + "loss": 0.0264, + "step": 219550 + }, + { + "epoch": 1.42, + "learning_rate": 8.743618373919722e-05, + "loss": 0.0258, + "step": 219560 + }, + { + "epoch": 1.42, + "learning_rate": 8.742650238484027e-05, + "loss": 0.0284, + "step": 219570 + }, + { + "epoch": 1.42, + "learning_rate": 8.741682103048335e-05, + "loss": 0.0278, + "step": 219580 + }, + { + "epoch": 1.42, + "learning_rate": 8.740713967612642e-05, + "loss": 0.0288, + "step": 219590 + }, + { + "epoch": 1.42, + "learning_rate": 8.73974583217695e-05, + "loss": 0.0278, + "step": 219600 + }, + { + "epoch": 1.42, + "learning_rate": 8.738777696741255e-05, + "loss": 0.0242, + "step": 219610 + }, + { + "epoch": 1.42, + "learning_rate": 8.737809561305562e-05, + "loss": 0.0237, + "step": 219620 + }, + { + "epoch": 1.42, + "learning_rate": 8.73684142586987e-05, + "loss": 0.0294, + "step": 219630 + }, + { + "epoch": 1.42, + "learning_rate": 8.735873290434175e-05, + "loss": 0.0303, + "step": 219640 + }, + { + "epoch": 1.42, + "learning_rate": 8.734905154998483e-05, + "loss": 0.0303, + "step": 219650 + }, + { + "epoch": 1.42, + "learning_rate": 8.73393701956279e-05, + "loss": 0.0282, + "step": 219660 + }, + { + "epoch": 1.42, + "learning_rate": 8.732968884127096e-05, + "loss": 0.0257, + "step": 219670 + }, + { + "epoch": 1.42, + "learning_rate": 8.732000748691403e-05, + "loss": 0.0281, + "step": 219680 + }, + { + "epoch": 1.42, + "learning_rate": 8.731032613255709e-05, + "loss": 0.0271, + "step": 219690 + }, + { + "epoch": 1.42, + "learning_rate": 8.730064477820017e-05, + "loss": 0.0223, + "step": 219700 + }, + { + "epoch": 1.42, + "learning_rate": 8.729096342384323e-05, + "loss": 0.0207, + "step": 219710 + }, + { + "epoch": 1.42, + "learning_rate": 8.728128206948629e-05, + "loss": 0.0319, + "step": 219720 + }, + { + "epoch": 1.42, + "learning_rate": 8.727160071512937e-05, + "loss": 0.0304, + "step": 219730 + }, + { + "epoch": 1.42, + "learning_rate": 8.726191936077244e-05, + "loss": 0.0289, + "step": 219740 + }, + { + "epoch": 1.42, + "learning_rate": 8.72522380064155e-05, + "loss": 0.0326, + "step": 219750 + }, + { + "epoch": 1.42, + "learning_rate": 8.724255665205857e-05, + "loss": 0.0238, + "step": 219760 + }, + { + "epoch": 1.42, + "learning_rate": 8.723287529770164e-05, + "loss": 0.0278, + "step": 219770 + }, + { + "epoch": 1.42, + "learning_rate": 8.72231939433447e-05, + "loss": 0.0321, + "step": 219780 + }, + { + "epoch": 1.42, + "learning_rate": 8.721351258898777e-05, + "loss": 0.0248, + "step": 219790 + }, + { + "epoch": 1.42, + "learning_rate": 8.720383123463085e-05, + "loss": 0.0269, + "step": 219800 + }, + { + "epoch": 1.42, + "learning_rate": 8.719414988027391e-05, + "loss": 0.032, + "step": 219810 + }, + { + "epoch": 1.42, + "learning_rate": 8.718446852591697e-05, + "loss": 0.027, + "step": 219820 + }, + { + "epoch": 1.42, + "learning_rate": 8.717478717156005e-05, + "loss": 0.0287, + "step": 219830 + }, + { + "epoch": 1.42, + "learning_rate": 8.716510581720311e-05, + "loss": 0.027, + "step": 219840 + }, + { + "epoch": 1.42, + "learning_rate": 8.715542446284618e-05, + "loss": 0.027, + "step": 219850 + }, + { + "epoch": 1.42, + "learning_rate": 8.714574310848925e-05, + "loss": 0.0276, + "step": 219860 + }, + { + "epoch": 1.42, + "learning_rate": 8.713606175413233e-05, + "loss": 0.0305, + "step": 219870 + }, + { + "epoch": 1.42, + "learning_rate": 8.712638039977539e-05, + "loss": 0.028, + "step": 219880 + }, + { + "epoch": 1.42, + "learning_rate": 8.711669904541844e-05, + "loss": 0.0272, + "step": 219890 + }, + { + "epoch": 1.42, + "learning_rate": 8.710701769106152e-05, + "loss": 0.0259, + "step": 219900 + }, + { + "epoch": 1.42, + "learning_rate": 8.709733633670459e-05, + "loss": 0.0329, + "step": 219910 + }, + { + "epoch": 1.42, + "learning_rate": 8.708765498234764e-05, + "loss": 0.0285, + "step": 219920 + }, + { + "epoch": 1.42, + "learning_rate": 8.707797362799072e-05, + "loss": 0.0296, + "step": 219930 + }, + { + "epoch": 1.42, + "learning_rate": 8.706829227363379e-05, + "loss": 0.0243, + "step": 219940 + }, + { + "epoch": 1.42, + "learning_rate": 8.705861091927687e-05, + "loss": 0.0274, + "step": 219950 + }, + { + "epoch": 1.42, + "learning_rate": 8.704892956491992e-05, + "loss": 0.0319, + "step": 219960 + }, + { + "epoch": 1.42, + "learning_rate": 8.7039248210563e-05, + "loss": 0.0299, + "step": 219970 + }, + { + "epoch": 1.42, + "learning_rate": 8.702956685620607e-05, + "loss": 0.029, + "step": 219980 + }, + { + "epoch": 1.42, + "learning_rate": 8.701988550184912e-05, + "loss": 0.0277, + "step": 219990 + }, + { + "epoch": 1.42, + "learning_rate": 8.70102041474922e-05, + "loss": 0.0286, + "step": 220000 + }, + { + "epoch": 1.42, + "eval_cer": 0.9197812676533725, + "eval_loss": 0.02094407007098198, + "eval_runtime": 120.2687, + "eval_samples_per_second": 16.629, + "eval_steps_per_second": 4.157, + "step": 220000 + }, + { + "epoch": 1.42, + "learning_rate": 8.700052279313527e-05, + "loss": 0.0248, + "step": 220010 + }, + { + "epoch": 1.42, + "learning_rate": 8.699084143877835e-05, + "loss": 0.0287, + "step": 220020 + }, + { + "epoch": 1.42, + "learning_rate": 8.69811600844214e-05, + "loss": 0.0262, + "step": 220030 + }, + { + "epoch": 1.42, + "learning_rate": 8.697147873006447e-05, + "loss": 0.0293, + "step": 220040 + }, + { + "epoch": 1.42, + "learning_rate": 8.696179737570755e-05, + "loss": 0.0248, + "step": 220050 + }, + { + "epoch": 1.42, + "learning_rate": 8.69521160213506e-05, + "loss": 0.026, + "step": 220060 + }, + { + "epoch": 1.42, + "learning_rate": 8.694243466699368e-05, + "loss": 0.0303, + "step": 220070 + }, + { + "epoch": 1.42, + "learning_rate": 8.693275331263674e-05, + "loss": 0.0323, + "step": 220080 + }, + { + "epoch": 1.42, + "learning_rate": 8.692307195827981e-05, + "loss": 0.0306, + "step": 220090 + }, + { + "epoch": 1.42, + "learning_rate": 8.691339060392288e-05, + "loss": 0.0322, + "step": 220100 + }, + { + "epoch": 1.42, + "learning_rate": 8.690370924956594e-05, + "loss": 0.0276, + "step": 220110 + }, + { + "epoch": 1.42, + "learning_rate": 8.689402789520902e-05, + "loss": 0.0282, + "step": 220120 + }, + { + "epoch": 1.42, + "learning_rate": 8.688434654085208e-05, + "loss": 0.0335, + "step": 220130 + }, + { + "epoch": 1.42, + "learning_rate": 8.687466518649514e-05, + "loss": 0.0301, + "step": 220140 + }, + { + "epoch": 1.42, + "learning_rate": 8.686498383213822e-05, + "loss": 0.0294, + "step": 220150 + }, + { + "epoch": 1.42, + "learning_rate": 8.685530247778129e-05, + "loss": 0.0268, + "step": 220160 + }, + { + "epoch": 1.42, + "learning_rate": 8.684562112342435e-05, + "loss": 0.0302, + "step": 220170 + }, + { + "epoch": 1.42, + "learning_rate": 8.683593976906742e-05, + "loss": 0.0297, + "step": 220180 + }, + { + "epoch": 1.42, + "learning_rate": 8.682625841471049e-05, + "loss": 0.0249, + "step": 220190 + }, + { + "epoch": 1.42, + "learning_rate": 8.681657706035355e-05, + "loss": 0.0291, + "step": 220200 + }, + { + "epoch": 1.42, + "learning_rate": 8.680689570599662e-05, + "loss": 0.0248, + "step": 220210 + }, + { + "epoch": 1.42, + "learning_rate": 8.67972143516397e-05, + "loss": 0.0288, + "step": 220220 + }, + { + "epoch": 1.42, + "learning_rate": 8.678753299728276e-05, + "loss": 0.0235, + "step": 220230 + }, + { + "epoch": 1.42, + "learning_rate": 8.677785164292582e-05, + "loss": 0.0308, + "step": 220240 + }, + { + "epoch": 1.42, + "learning_rate": 8.67681702885689e-05, + "loss": 0.0312, + "step": 220250 + }, + { + "epoch": 1.42, + "learning_rate": 8.675848893421196e-05, + "loss": 0.0293, + "step": 220260 + }, + { + "epoch": 1.42, + "learning_rate": 8.674880757985503e-05, + "loss": 0.0302, + "step": 220270 + }, + { + "epoch": 1.42, + "learning_rate": 8.67391262254981e-05, + "loss": 0.0265, + "step": 220280 + }, + { + "epoch": 1.42, + "learning_rate": 8.672944487114116e-05, + "loss": 0.0347, + "step": 220290 + }, + { + "epoch": 1.42, + "learning_rate": 8.671976351678424e-05, + "loss": 0.0382, + "step": 220300 + }, + { + "epoch": 1.42, + "learning_rate": 8.67100821624273e-05, + "loss": 0.0296, + "step": 220310 + }, + { + "epoch": 1.42, + "learning_rate": 8.670040080807037e-05, + "loss": 0.0283, + "step": 220320 + }, + { + "epoch": 1.42, + "learning_rate": 8.669071945371344e-05, + "loss": 0.0231, + "step": 220330 + }, + { + "epoch": 1.42, + "learning_rate": 8.66810380993565e-05, + "loss": 0.0287, + "step": 220340 + }, + { + "epoch": 1.42, + "learning_rate": 8.667135674499957e-05, + "loss": 0.0318, + "step": 220350 + }, + { + "epoch": 1.42, + "learning_rate": 8.666167539064264e-05, + "loss": 0.0261, + "step": 220360 + }, + { + "epoch": 1.42, + "learning_rate": 8.665199403628572e-05, + "loss": 0.0241, + "step": 220370 + }, + { + "epoch": 1.42, + "learning_rate": 8.664231268192877e-05, + "loss": 0.0328, + "step": 220380 + }, + { + "epoch": 1.42, + "learning_rate": 8.663263132757184e-05, + "loss": 0.0272, + "step": 220390 + }, + { + "epoch": 1.42, + "learning_rate": 8.662294997321492e-05, + "loss": 0.0301, + "step": 220400 + }, + { + "epoch": 1.42, + "learning_rate": 8.661326861885797e-05, + "loss": 0.0244, + "step": 220410 + }, + { + "epoch": 1.42, + "learning_rate": 8.660358726450105e-05, + "loss": 0.0281, + "step": 220420 + }, + { + "epoch": 1.42, + "learning_rate": 8.659390591014412e-05, + "loss": 0.024, + "step": 220430 + }, + { + "epoch": 1.42, + "learning_rate": 8.65842245557872e-05, + "loss": 0.0313, + "step": 220440 + }, + { + "epoch": 1.42, + "learning_rate": 8.657454320143025e-05, + "loss": 0.0303, + "step": 220450 + }, + { + "epoch": 1.42, + "learning_rate": 8.656486184707332e-05, + "loss": 0.0257, + "step": 220460 + }, + { + "epoch": 1.42, + "learning_rate": 8.65551804927164e-05, + "loss": 0.0259, + "step": 220470 + }, + { + "epoch": 1.42, + "learning_rate": 8.654549913835945e-05, + "loss": 0.0268, + "step": 220480 + }, + { + "epoch": 1.42, + "learning_rate": 8.653581778400251e-05, + "loss": 0.0283, + "step": 220490 + }, + { + "epoch": 1.42, + "learning_rate": 8.65261364296456e-05, + "loss": 0.0251, + "step": 220500 + }, + { + "epoch": 1.42, + "learning_rate": 8.651645507528866e-05, + "loss": 0.026, + "step": 220510 + }, + { + "epoch": 1.42, + "learning_rate": 8.650677372093173e-05, + "loss": 0.0233, + "step": 220520 + }, + { + "epoch": 1.42, + "learning_rate": 8.649709236657479e-05, + "loss": 0.0329, + "step": 220530 + }, + { + "epoch": 1.42, + "learning_rate": 8.648741101221787e-05, + "loss": 0.0331, + "step": 220540 + }, + { + "epoch": 1.42, + "learning_rate": 8.647772965786093e-05, + "loss": 0.0301, + "step": 220550 + }, + { + "epoch": 1.42, + "learning_rate": 8.646804830350399e-05, + "loss": 0.0248, + "step": 220560 + }, + { + "epoch": 1.42, + "learning_rate": 8.645836694914707e-05, + "loss": 0.026, + "step": 220570 + }, + { + "epoch": 1.42, + "learning_rate": 8.644868559479014e-05, + "loss": 0.0295, + "step": 220580 + }, + { + "epoch": 1.42, + "learning_rate": 8.643900424043319e-05, + "loss": 0.0251, + "step": 220590 + }, + { + "epoch": 1.42, + "learning_rate": 8.642932288607627e-05, + "loss": 0.0271, + "step": 220600 + }, + { + "epoch": 1.42, + "learning_rate": 8.641964153171934e-05, + "loss": 0.0224, + "step": 220610 + }, + { + "epoch": 1.42, + "learning_rate": 8.64099601773624e-05, + "loss": 0.0286, + "step": 220620 + }, + { + "epoch": 1.42, + "learning_rate": 8.640027882300547e-05, + "loss": 0.0257, + "step": 220630 + }, + { + "epoch": 1.42, + "learning_rate": 8.639059746864855e-05, + "loss": 0.0267, + "step": 220640 + }, + { + "epoch": 1.42, + "learning_rate": 8.638091611429161e-05, + "loss": 0.0315, + "step": 220650 + }, + { + "epoch": 1.42, + "learning_rate": 8.637123475993467e-05, + "loss": 0.0293, + "step": 220660 + }, + { + "epoch": 1.42, + "learning_rate": 8.636155340557775e-05, + "loss": 0.0255, + "step": 220670 + }, + { + "epoch": 1.42, + "learning_rate": 8.635187205122081e-05, + "loss": 0.0312, + "step": 220680 + }, + { + "epoch": 1.42, + "learning_rate": 8.634219069686387e-05, + "loss": 0.0282, + "step": 220690 + }, + { + "epoch": 1.42, + "learning_rate": 8.633250934250695e-05, + "loss": 0.0241, + "step": 220700 + }, + { + "epoch": 1.42, + "learning_rate": 8.632282798815001e-05, + "loss": 0.0289, + "step": 220710 + }, + { + "epoch": 1.42, + "learning_rate": 8.631314663379309e-05, + "loss": 0.0269, + "step": 220720 + }, + { + "epoch": 1.42, + "learning_rate": 8.630346527943614e-05, + "loss": 0.0327, + "step": 220730 + }, + { + "epoch": 1.42, + "learning_rate": 8.629378392507922e-05, + "loss": 0.0265, + "step": 220740 + }, + { + "epoch": 1.42, + "learning_rate": 8.628410257072229e-05, + "loss": 0.0323, + "step": 220750 + }, + { + "epoch": 1.42, + "learning_rate": 8.627442121636534e-05, + "loss": 0.0311, + "step": 220760 + }, + { + "epoch": 1.42, + "learning_rate": 8.626473986200842e-05, + "loss": 0.0339, + "step": 220770 + }, + { + "epoch": 1.42, + "learning_rate": 8.625505850765149e-05, + "loss": 0.028, + "step": 220780 + }, + { + "epoch": 1.43, + "learning_rate": 8.624537715329457e-05, + "loss": 0.03, + "step": 220790 + }, + { + "epoch": 1.43, + "learning_rate": 8.623569579893762e-05, + "loss": 0.0232, + "step": 220800 + }, + { + "epoch": 1.43, + "learning_rate": 8.622601444458069e-05, + "loss": 0.0298, + "step": 220810 + }, + { + "epoch": 1.43, + "learning_rate": 8.621633309022377e-05, + "loss": 0.0379, + "step": 220820 + }, + { + "epoch": 1.43, + "learning_rate": 8.620665173586682e-05, + "loss": 0.0273, + "step": 220830 + }, + { + "epoch": 1.43, + "learning_rate": 8.61969703815099e-05, + "loss": 0.0266, + "step": 220840 + }, + { + "epoch": 1.43, + "learning_rate": 8.618728902715297e-05, + "loss": 0.0302, + "step": 220850 + }, + { + "epoch": 1.43, + "learning_rate": 8.617760767279605e-05, + "loss": 0.0271, + "step": 220860 + }, + { + "epoch": 1.43, + "learning_rate": 8.61679263184391e-05, + "loss": 0.0289, + "step": 220870 + }, + { + "epoch": 1.43, + "learning_rate": 8.615824496408217e-05, + "loss": 0.0208, + "step": 220880 + }, + { + "epoch": 1.43, + "learning_rate": 8.614856360972524e-05, + "loss": 0.0278, + "step": 220890 + }, + { + "epoch": 1.43, + "learning_rate": 8.61388822553683e-05, + "loss": 0.0297, + "step": 220900 + }, + { + "epoch": 1.43, + "learning_rate": 8.612920090101136e-05, + "loss": 0.0309, + "step": 220910 + }, + { + "epoch": 1.43, + "learning_rate": 8.611951954665444e-05, + "loss": 0.0256, + "step": 220920 + }, + { + "epoch": 1.43, + "learning_rate": 8.610983819229751e-05, + "loss": 0.0314, + "step": 220930 + }, + { + "epoch": 1.43, + "learning_rate": 8.610015683794058e-05, + "loss": 0.0218, + "step": 220940 + }, + { + "epoch": 1.43, + "learning_rate": 8.609047548358364e-05, + "loss": 0.032, + "step": 220950 + }, + { + "epoch": 1.43, + "learning_rate": 8.608079412922672e-05, + "loss": 0.0306, + "step": 220960 + }, + { + "epoch": 1.43, + "learning_rate": 8.607111277486977e-05, + "loss": 0.0331, + "step": 220970 + }, + { + "epoch": 1.43, + "learning_rate": 8.606143142051284e-05, + "loss": 0.0312, + "step": 220980 + }, + { + "epoch": 1.43, + "learning_rate": 8.605175006615592e-05, + "loss": 0.0303, + "step": 220990 + }, + { + "epoch": 1.43, + "learning_rate": 8.604206871179899e-05, + "loss": 0.0297, + "step": 221000 + }, + { + "epoch": 1.43, + "eval_cer": 0.9199529996610553, + "eval_loss": 0.02053585834801197, + "eval_runtime": 120.2097, + "eval_samples_per_second": 16.638, + "eval_steps_per_second": 4.159, + "step": 221000 + }, + { + "epoch": 1.43, + "learning_rate": 8.603238735744204e-05, + "loss": 0.0319, + "step": 221010 + }, + { + "epoch": 1.43, + "learning_rate": 8.602270600308512e-05, + "loss": 0.0258, + "step": 221020 + }, + { + "epoch": 1.43, + "learning_rate": 8.601302464872819e-05, + "loss": 0.0343, + "step": 221030 + }, + { + "epoch": 1.43, + "learning_rate": 8.600334329437125e-05, + "loss": 0.0301, + "step": 221040 + }, + { + "epoch": 1.43, + "learning_rate": 8.599366194001432e-05, + "loss": 0.0243, + "step": 221050 + }, + { + "epoch": 1.43, + "learning_rate": 8.59839805856574e-05, + "loss": 0.0247, + "step": 221060 + }, + { + "epoch": 1.43, + "learning_rate": 8.597429923130046e-05, + "loss": 0.0256, + "step": 221070 + }, + { + "epoch": 1.43, + "learning_rate": 8.596461787694352e-05, + "loss": 0.0336, + "step": 221080 + }, + { + "epoch": 1.43, + "learning_rate": 8.59549365225866e-05, + "loss": 0.0282, + "step": 221090 + }, + { + "epoch": 1.43, + "learning_rate": 8.594525516822966e-05, + "loss": 0.0302, + "step": 221100 + }, + { + "epoch": 1.43, + "learning_rate": 8.593557381387272e-05, + "loss": 0.0264, + "step": 221110 + }, + { + "epoch": 1.43, + "learning_rate": 8.59258924595158e-05, + "loss": 0.03, + "step": 221120 + }, + { + "epoch": 1.43, + "learning_rate": 8.591621110515886e-05, + "loss": 0.0272, + "step": 221130 + }, + { + "epoch": 1.43, + "learning_rate": 8.590652975080194e-05, + "loss": 0.0258, + "step": 221140 + }, + { + "epoch": 1.43, + "learning_rate": 8.5896848396445e-05, + "loss": 0.0244, + "step": 221150 + }, + { + "epoch": 1.43, + "learning_rate": 8.588716704208807e-05, + "loss": 0.0269, + "step": 221160 + }, + { + "epoch": 1.43, + "learning_rate": 8.587748568773114e-05, + "loss": 0.0216, + "step": 221170 + }, + { + "epoch": 1.43, + "learning_rate": 8.586780433337419e-05, + "loss": 0.03, + "step": 221180 + }, + { + "epoch": 1.43, + "learning_rate": 8.585812297901727e-05, + "loss": 0.0256, + "step": 221190 + }, + { + "epoch": 1.43, + "learning_rate": 8.584844162466034e-05, + "loss": 0.0251, + "step": 221200 + }, + { + "epoch": 1.43, + "learning_rate": 8.583876027030342e-05, + "loss": 0.0274, + "step": 221210 + }, + { + "epoch": 1.43, + "learning_rate": 8.582907891594647e-05, + "loss": 0.0372, + "step": 221220 + }, + { + "epoch": 1.43, + "learning_rate": 8.581939756158954e-05, + "loss": 0.0321, + "step": 221230 + }, + { + "epoch": 1.43, + "learning_rate": 8.580971620723262e-05, + "loss": 0.0288, + "step": 221240 + }, + { + "epoch": 1.43, + "learning_rate": 8.580003485287567e-05, + "loss": 0.025, + "step": 221250 + }, + { + "epoch": 1.43, + "learning_rate": 8.579035349851875e-05, + "loss": 0.0291, + "step": 221260 + }, + { + "epoch": 1.43, + "learning_rate": 8.578067214416182e-05, + "loss": 0.0281, + "step": 221270 + }, + { + "epoch": 1.43, + "learning_rate": 8.577099078980488e-05, + "loss": 0.0332, + "step": 221280 + }, + { + "epoch": 1.43, + "learning_rate": 8.576130943544795e-05, + "loss": 0.0284, + "step": 221290 + }, + { + "epoch": 1.43, + "learning_rate": 8.575162808109101e-05, + "loss": 0.0274, + "step": 221300 + }, + { + "epoch": 1.43, + "learning_rate": 8.57419467267341e-05, + "loss": 0.031, + "step": 221310 + }, + { + "epoch": 1.43, + "learning_rate": 8.573226537237715e-05, + "loss": 0.032, + "step": 221320 + }, + { + "epoch": 1.43, + "learning_rate": 8.572258401802021e-05, + "loss": 0.0329, + "step": 221330 + }, + { + "epoch": 1.43, + "learning_rate": 8.57129026636633e-05, + "loss": 0.0244, + "step": 221340 + }, + { + "epoch": 1.43, + "learning_rate": 8.570322130930636e-05, + "loss": 0.0301, + "step": 221350 + }, + { + "epoch": 1.43, + "learning_rate": 8.569353995494943e-05, + "loss": 0.0271, + "step": 221360 + }, + { + "epoch": 1.43, + "learning_rate": 8.568385860059249e-05, + "loss": 0.0299, + "step": 221370 + }, + { + "epoch": 1.43, + "learning_rate": 8.567417724623556e-05, + "loss": 0.0286, + "step": 221380 + }, + { + "epoch": 1.43, + "learning_rate": 8.566449589187862e-05, + "loss": 0.0312, + "step": 221390 + }, + { + "epoch": 1.43, + "learning_rate": 8.565481453752169e-05, + "loss": 0.0243, + "step": 221400 + }, + { + "epoch": 1.43, + "learning_rate": 8.564513318316477e-05, + "loss": 0.0298, + "step": 221410 + }, + { + "epoch": 1.43, + "learning_rate": 8.563545182880784e-05, + "loss": 0.0315, + "step": 221420 + }, + { + "epoch": 1.43, + "learning_rate": 8.562577047445089e-05, + "loss": 0.0316, + "step": 221430 + }, + { + "epoch": 1.43, + "learning_rate": 8.561608912009397e-05, + "loss": 0.0292, + "step": 221440 + }, + { + "epoch": 1.43, + "learning_rate": 8.560640776573704e-05, + "loss": 0.0314, + "step": 221450 + }, + { + "epoch": 1.43, + "learning_rate": 8.55967264113801e-05, + "loss": 0.0252, + "step": 221460 + }, + { + "epoch": 1.43, + "learning_rate": 8.558704505702317e-05, + "loss": 0.0325, + "step": 221470 + }, + { + "epoch": 1.43, + "learning_rate": 8.557736370266623e-05, + "loss": 0.0289, + "step": 221480 + }, + { + "epoch": 1.43, + "learning_rate": 8.556768234830931e-05, + "loss": 0.0294, + "step": 221490 + }, + { + "epoch": 1.43, + "learning_rate": 8.555800099395237e-05, + "loss": 0.0267, + "step": 221500 + }, + { + "epoch": 1.43, + "learning_rate": 8.554831963959545e-05, + "loss": 0.0305, + "step": 221510 + }, + { + "epoch": 1.43, + "learning_rate": 8.553863828523851e-05, + "loss": 0.0302, + "step": 221520 + }, + { + "epoch": 1.43, + "learning_rate": 8.552895693088157e-05, + "loss": 0.0243, + "step": 221530 + }, + { + "epoch": 1.43, + "learning_rate": 8.551927557652465e-05, + "loss": 0.0225, + "step": 221540 + }, + { + "epoch": 1.43, + "learning_rate": 8.550959422216771e-05, + "loss": 0.0257, + "step": 221550 + }, + { + "epoch": 1.43, + "learning_rate": 8.549991286781079e-05, + "loss": 0.0282, + "step": 221560 + }, + { + "epoch": 1.43, + "learning_rate": 8.549023151345384e-05, + "loss": 0.0229, + "step": 221570 + }, + { + "epoch": 1.43, + "learning_rate": 8.548055015909691e-05, + "loss": 0.027, + "step": 221580 + }, + { + "epoch": 1.43, + "learning_rate": 8.547086880473999e-05, + "loss": 0.0316, + "step": 221590 + }, + { + "epoch": 1.43, + "learning_rate": 8.546118745038304e-05, + "loss": 0.0277, + "step": 221600 + }, + { + "epoch": 1.43, + "learning_rate": 8.545150609602612e-05, + "loss": 0.0358, + "step": 221610 + }, + { + "epoch": 1.43, + "learning_rate": 8.544182474166919e-05, + "loss": 0.0269, + "step": 221620 + }, + { + "epoch": 1.43, + "learning_rate": 8.543214338731227e-05, + "loss": 0.0277, + "step": 221630 + }, + { + "epoch": 1.43, + "learning_rate": 8.542246203295532e-05, + "loss": 0.0309, + "step": 221640 + }, + { + "epoch": 1.43, + "learning_rate": 8.541278067859839e-05, + "loss": 0.0247, + "step": 221650 + }, + { + "epoch": 1.43, + "learning_rate": 8.540309932424147e-05, + "loss": 0.0319, + "step": 221660 + }, + { + "epoch": 1.43, + "learning_rate": 8.539341796988452e-05, + "loss": 0.0274, + "step": 221670 + }, + { + "epoch": 1.43, + "learning_rate": 8.538373661552759e-05, + "loss": 0.0271, + "step": 221680 + }, + { + "epoch": 1.43, + "learning_rate": 8.537405526117067e-05, + "loss": 0.0299, + "step": 221690 + }, + { + "epoch": 1.43, + "learning_rate": 8.536437390681373e-05, + "loss": 0.0329, + "step": 221700 + }, + { + "epoch": 1.43, + "learning_rate": 8.53546925524568e-05, + "loss": 0.0309, + "step": 221710 + }, + { + "epoch": 1.43, + "learning_rate": 8.534501119809986e-05, + "loss": 0.0326, + "step": 221720 + }, + { + "epoch": 1.43, + "learning_rate": 8.533532984374294e-05, + "loss": 0.0269, + "step": 221730 + }, + { + "epoch": 1.43, + "learning_rate": 8.5325648489386e-05, + "loss": 0.0328, + "step": 221740 + }, + { + "epoch": 1.43, + "learning_rate": 8.531596713502906e-05, + "loss": 0.0289, + "step": 221750 + }, + { + "epoch": 1.43, + "learning_rate": 8.530628578067214e-05, + "loss": 0.0298, + "step": 221760 + }, + { + "epoch": 1.43, + "learning_rate": 8.529660442631521e-05, + "loss": 0.0333, + "step": 221770 + }, + { + "epoch": 1.43, + "learning_rate": 8.528692307195826e-05, + "loss": 0.031, + "step": 221780 + }, + { + "epoch": 1.43, + "learning_rate": 8.527724171760134e-05, + "loss": 0.0295, + "step": 221790 + }, + { + "epoch": 1.43, + "learning_rate": 8.526756036324441e-05, + "loss": 0.0273, + "step": 221800 + }, + { + "epoch": 1.43, + "learning_rate": 8.525787900888747e-05, + "loss": 0.0291, + "step": 221810 + }, + { + "epoch": 1.43, + "learning_rate": 8.524819765453054e-05, + "loss": 0.0256, + "step": 221820 + }, + { + "epoch": 1.43, + "learning_rate": 8.523851630017362e-05, + "loss": 0.029, + "step": 221830 + }, + { + "epoch": 1.43, + "learning_rate": 8.522883494581669e-05, + "loss": 0.0276, + "step": 221840 + }, + { + "epoch": 1.43, + "learning_rate": 8.521915359145974e-05, + "loss": 0.0285, + "step": 221850 + }, + { + "epoch": 1.43, + "learning_rate": 8.520947223710282e-05, + "loss": 0.0271, + "step": 221860 + }, + { + "epoch": 1.43, + "learning_rate": 8.519979088274589e-05, + "loss": 0.0306, + "step": 221870 + }, + { + "epoch": 1.43, + "learning_rate": 8.519010952838894e-05, + "loss": 0.0391, + "step": 221880 + }, + { + "epoch": 1.43, + "learning_rate": 8.518042817403202e-05, + "loss": 0.0293, + "step": 221890 + }, + { + "epoch": 1.43, + "learning_rate": 8.517074681967508e-05, + "loss": 0.0323, + "step": 221900 + }, + { + "epoch": 1.43, + "learning_rate": 8.516106546531816e-05, + "loss": 0.0249, + "step": 221910 + }, + { + "epoch": 1.43, + "learning_rate": 8.515138411096122e-05, + "loss": 0.0333, + "step": 221920 + }, + { + "epoch": 1.43, + "learning_rate": 8.51417027566043e-05, + "loss": 0.0261, + "step": 221930 + }, + { + "epoch": 1.43, + "learning_rate": 8.513202140224736e-05, + "loss": 0.0259, + "step": 221940 + }, + { + "epoch": 1.43, + "learning_rate": 8.512234004789042e-05, + "loss": 0.026, + "step": 221950 + }, + { + "epoch": 1.43, + "learning_rate": 8.51126586935335e-05, + "loss": 0.0304, + "step": 221960 + }, + { + "epoch": 1.43, + "learning_rate": 8.510297733917656e-05, + "loss": 0.0265, + "step": 221970 + }, + { + "epoch": 1.43, + "learning_rate": 8.509329598481964e-05, + "loss": 0.027, + "step": 221980 + }, + { + "epoch": 1.43, + "learning_rate": 8.50836146304627e-05, + "loss": 0.0273, + "step": 221990 + }, + { + "epoch": 1.43, + "learning_rate": 8.507393327610576e-05, + "loss": 0.0256, + "step": 222000 + }, + { + "epoch": 1.43, + "eval_cer": 0.9199059993221105, + "eval_loss": 0.02071262337267399, + "eval_runtime": 120.0993, + "eval_samples_per_second": 16.653, + "eval_steps_per_second": 4.163, + "step": 222000 + }, + { + "epoch": 1.43, + "learning_rate": 8.506425192174884e-05, + "loss": 0.027, + "step": 222010 + }, + { + "epoch": 1.43, + "learning_rate": 8.505457056739189e-05, + "loss": 0.0239, + "step": 222020 + }, + { + "epoch": 1.43, + "learning_rate": 8.504488921303497e-05, + "loss": 0.0306, + "step": 222030 + }, + { + "epoch": 1.43, + "learning_rate": 8.503520785867804e-05, + "loss": 0.0346, + "step": 222040 + }, + { + "epoch": 1.43, + "learning_rate": 8.502552650432112e-05, + "loss": 0.0284, + "step": 222050 + }, + { + "epoch": 1.43, + "learning_rate": 8.501584514996417e-05, + "loss": 0.0311, + "step": 222060 + }, + { + "epoch": 1.43, + "learning_rate": 8.500616379560724e-05, + "loss": 0.0287, + "step": 222070 + }, + { + "epoch": 1.43, + "learning_rate": 8.499648244125032e-05, + "loss": 0.0241, + "step": 222080 + }, + { + "epoch": 1.43, + "learning_rate": 8.498680108689337e-05, + "loss": 0.0282, + "step": 222090 + }, + { + "epoch": 1.43, + "learning_rate": 8.497711973253644e-05, + "loss": 0.0251, + "step": 222100 + }, + { + "epoch": 1.43, + "learning_rate": 8.496743837817952e-05, + "loss": 0.0273, + "step": 222110 + }, + { + "epoch": 1.43, + "learning_rate": 8.495775702382257e-05, + "loss": 0.0244, + "step": 222120 + }, + { + "epoch": 1.43, + "learning_rate": 8.494807566946565e-05, + "loss": 0.0295, + "step": 222130 + }, + { + "epoch": 1.43, + "learning_rate": 8.493839431510871e-05, + "loss": 0.0261, + "step": 222140 + }, + { + "epoch": 1.43, + "learning_rate": 8.49287129607518e-05, + "loss": 0.0255, + "step": 222150 + }, + { + "epoch": 1.43, + "learning_rate": 8.491903160639485e-05, + "loss": 0.0257, + "step": 222160 + }, + { + "epoch": 1.43, + "learning_rate": 8.490935025203791e-05, + "loss": 0.0263, + "step": 222170 + }, + { + "epoch": 1.43, + "learning_rate": 8.489966889768099e-05, + "loss": 0.0345, + "step": 222180 + }, + { + "epoch": 1.43, + "learning_rate": 8.488998754332405e-05, + "loss": 0.0259, + "step": 222190 + }, + { + "epoch": 1.43, + "learning_rate": 8.488030618896711e-05, + "loss": 0.0312, + "step": 222200 + }, + { + "epoch": 1.43, + "learning_rate": 8.487062483461019e-05, + "loss": 0.0296, + "step": 222210 + }, + { + "epoch": 1.43, + "learning_rate": 8.486094348025326e-05, + "loss": 0.0262, + "step": 222220 + }, + { + "epoch": 1.43, + "learning_rate": 8.485126212589632e-05, + "loss": 0.0282, + "step": 222230 + }, + { + "epoch": 1.43, + "learning_rate": 8.484158077153939e-05, + "loss": 0.0267, + "step": 222240 + }, + { + "epoch": 1.43, + "learning_rate": 8.483189941718247e-05, + "loss": 0.0321, + "step": 222250 + }, + { + "epoch": 1.43, + "learning_rate": 8.482221806282552e-05, + "loss": 0.0277, + "step": 222260 + }, + { + "epoch": 1.43, + "learning_rate": 8.481253670846859e-05, + "loss": 0.0289, + "step": 222270 + }, + { + "epoch": 1.43, + "learning_rate": 8.480285535411167e-05, + "loss": 0.0261, + "step": 222280 + }, + { + "epoch": 1.43, + "learning_rate": 8.479317399975474e-05, + "loss": 0.0261, + "step": 222290 + }, + { + "epoch": 1.43, + "learning_rate": 8.478349264539779e-05, + "loss": 0.0267, + "step": 222300 + }, + { + "epoch": 1.43, + "learning_rate": 8.477381129104087e-05, + "loss": 0.0232, + "step": 222310 + }, + { + "epoch": 1.43, + "learning_rate": 8.476412993668393e-05, + "loss": 0.031, + "step": 222320 + }, + { + "epoch": 1.43, + "learning_rate": 8.4754448582327e-05, + "loss": 0.0301, + "step": 222330 + }, + { + "epoch": 1.44, + "learning_rate": 8.474476722797007e-05, + "loss": 0.0322, + "step": 222340 + }, + { + "epoch": 1.44, + "learning_rate": 8.473508587361315e-05, + "loss": 0.0278, + "step": 222350 + }, + { + "epoch": 1.44, + "learning_rate": 8.472540451925621e-05, + "loss": 0.029, + "step": 222360 + }, + { + "epoch": 1.44, + "learning_rate": 8.471572316489927e-05, + "loss": 0.033, + "step": 222370 + }, + { + "epoch": 1.44, + "learning_rate": 8.470604181054234e-05, + "loss": 0.029, + "step": 222380 + }, + { + "epoch": 1.44, + "learning_rate": 8.469636045618541e-05, + "loss": 0.0243, + "step": 222390 + }, + { + "epoch": 1.44, + "learning_rate": 8.468667910182846e-05, + "loss": 0.0286, + "step": 222400 + }, + { + "epoch": 1.44, + "learning_rate": 8.467699774747154e-05, + "loss": 0.0304, + "step": 222410 + }, + { + "epoch": 1.44, + "learning_rate": 8.466731639311461e-05, + "loss": 0.0306, + "step": 222420 + }, + { + "epoch": 1.44, + "learning_rate": 8.465763503875769e-05, + "loss": 0.0258, + "step": 222430 + }, + { + "epoch": 1.44, + "learning_rate": 8.464795368440074e-05, + "loss": 0.0311, + "step": 222440 + }, + { + "epoch": 1.44, + "learning_rate": 8.463827233004382e-05, + "loss": 0.0306, + "step": 222450 + }, + { + "epoch": 1.44, + "learning_rate": 8.462859097568689e-05, + "loss": 0.0274, + "step": 222460 + }, + { + "epoch": 1.44, + "learning_rate": 8.461890962132994e-05, + "loss": 0.0246, + "step": 222470 + }, + { + "epoch": 1.44, + "learning_rate": 8.460922826697302e-05, + "loss": 0.0259, + "step": 222480 + }, + { + "epoch": 1.44, + "learning_rate": 8.459954691261609e-05, + "loss": 0.0249, + "step": 222490 + }, + { + "epoch": 1.44, + "learning_rate": 8.458986555825917e-05, + "loss": 0.0304, + "step": 222500 + }, + { + "epoch": 1.44, + "learning_rate": 8.458018420390222e-05, + "loss": 0.0329, + "step": 222510 + }, + { + "epoch": 1.44, + "learning_rate": 8.457050284954529e-05, + "loss": 0.0248, + "step": 222520 + }, + { + "epoch": 1.44, + "learning_rate": 8.456082149518837e-05, + "loss": 0.0283, + "step": 222530 + }, + { + "epoch": 1.44, + "learning_rate": 8.455114014083142e-05, + "loss": 0.0249, + "step": 222540 + }, + { + "epoch": 1.44, + "learning_rate": 8.45414587864745e-05, + "loss": 0.0232, + "step": 222550 + }, + { + "epoch": 1.44, + "learning_rate": 8.453177743211756e-05, + "loss": 0.0234, + "step": 222560 + }, + { + "epoch": 1.44, + "learning_rate": 8.452209607776063e-05, + "loss": 0.0257, + "step": 222570 + }, + { + "epoch": 1.44, + "learning_rate": 8.45124147234037e-05, + "loss": 0.027, + "step": 222580 + }, + { + "epoch": 1.44, + "learning_rate": 8.450273336904676e-05, + "loss": 0.0291, + "step": 222590 + }, + { + "epoch": 1.44, + "learning_rate": 8.449305201468984e-05, + "loss": 0.0267, + "step": 222600 + }, + { + "epoch": 1.44, + "learning_rate": 8.44833706603329e-05, + "loss": 0.0307, + "step": 222610 + }, + { + "epoch": 1.44, + "learning_rate": 8.447368930597596e-05, + "loss": 0.0288, + "step": 222620 + }, + { + "epoch": 1.44, + "learning_rate": 8.446400795161904e-05, + "loss": 0.035, + "step": 222630 + }, + { + "epoch": 1.44, + "learning_rate": 8.445432659726211e-05, + "loss": 0.0283, + "step": 222640 + }, + { + "epoch": 1.44, + "learning_rate": 8.444464524290517e-05, + "loss": 0.0237, + "step": 222650 + }, + { + "epoch": 1.44, + "learning_rate": 8.443496388854824e-05, + "loss": 0.0294, + "step": 222660 + }, + { + "epoch": 1.44, + "learning_rate": 8.44252825341913e-05, + "loss": 0.0244, + "step": 222670 + }, + { + "epoch": 1.44, + "learning_rate": 8.441560117983437e-05, + "loss": 0.026, + "step": 222680 + }, + { + "epoch": 1.44, + "learning_rate": 8.440591982547744e-05, + "loss": 0.0363, + "step": 222690 + }, + { + "epoch": 1.44, + "learning_rate": 8.439623847112052e-05, + "loss": 0.026, + "step": 222700 + }, + { + "epoch": 1.44, + "learning_rate": 8.438655711676359e-05, + "loss": 0.0284, + "step": 222710 + }, + { + "epoch": 1.44, + "learning_rate": 8.437687576240664e-05, + "loss": 0.0302, + "step": 222720 + }, + { + "epoch": 1.44, + "learning_rate": 8.436719440804972e-05, + "loss": 0.0256, + "step": 222730 + }, + { + "epoch": 1.44, + "learning_rate": 8.435751305369278e-05, + "loss": 0.0285, + "step": 222740 + }, + { + "epoch": 1.44, + "learning_rate": 8.434783169933585e-05, + "loss": 0.0267, + "step": 222750 + }, + { + "epoch": 1.44, + "learning_rate": 8.433815034497892e-05, + "loss": 0.0249, + "step": 222760 + }, + { + "epoch": 1.44, + "learning_rate": 8.432846899062198e-05, + "loss": 0.0355, + "step": 222770 + }, + { + "epoch": 1.44, + "learning_rate": 8.431878763626506e-05, + "loss": 0.025, + "step": 222780 + }, + { + "epoch": 1.44, + "learning_rate": 8.430910628190811e-05, + "loss": 0.0285, + "step": 222790 + }, + { + "epoch": 1.44, + "learning_rate": 8.42994249275512e-05, + "loss": 0.0286, + "step": 222800 + }, + { + "epoch": 1.44, + "learning_rate": 8.428974357319426e-05, + "loss": 0.0267, + "step": 222810 + }, + { + "epoch": 1.44, + "learning_rate": 8.428006221883731e-05, + "loss": 0.0304, + "step": 222820 + }, + { + "epoch": 1.44, + "learning_rate": 8.42703808644804e-05, + "loss": 0.0365, + "step": 222830 + }, + { + "epoch": 1.44, + "learning_rate": 8.426069951012346e-05, + "loss": 0.0288, + "step": 222840 + }, + { + "epoch": 1.44, + "learning_rate": 8.425101815576654e-05, + "loss": 0.0323, + "step": 222850 + }, + { + "epoch": 1.44, + "learning_rate": 8.424133680140959e-05, + "loss": 0.0293, + "step": 222860 + }, + { + "epoch": 1.44, + "learning_rate": 8.423165544705266e-05, + "loss": 0.029, + "step": 222870 + }, + { + "epoch": 1.44, + "learning_rate": 8.422197409269574e-05, + "loss": 0.0291, + "step": 222880 + }, + { + "epoch": 1.44, + "learning_rate": 8.421229273833879e-05, + "loss": 0.0274, + "step": 222890 + }, + { + "epoch": 1.44, + "learning_rate": 8.420261138398187e-05, + "loss": 0.0288, + "step": 222900 + }, + { + "epoch": 1.44, + "learning_rate": 8.419293002962494e-05, + "loss": 0.0266, + "step": 222910 + }, + { + "epoch": 1.44, + "learning_rate": 8.418324867526802e-05, + "loss": 0.0237, + "step": 222920 + }, + { + "epoch": 1.44, + "learning_rate": 8.417356732091107e-05, + "loss": 0.0252, + "step": 222930 + }, + { + "epoch": 1.44, + "learning_rate": 8.416388596655414e-05, + "loss": 0.0311, + "step": 222940 + }, + { + "epoch": 1.44, + "learning_rate": 8.415420461219722e-05, + "loss": 0.0317, + "step": 222950 + }, + { + "epoch": 1.44, + "learning_rate": 8.414452325784027e-05, + "loss": 0.0255, + "step": 222960 + }, + { + "epoch": 1.44, + "learning_rate": 8.413484190348333e-05, + "loss": 0.0257, + "step": 222970 + }, + { + "epoch": 1.44, + "learning_rate": 8.412516054912641e-05, + "loss": 0.0279, + "step": 222980 + }, + { + "epoch": 1.44, + "learning_rate": 8.411547919476948e-05, + "loss": 0.0249, + "step": 222990 + }, + { + "epoch": 1.44, + "learning_rate": 8.410579784041255e-05, + "loss": 0.0261, + "step": 223000 + }, + { + "epoch": 1.44, + "eval_cer": 0.9198445373404135, + "eval_loss": 0.02085886336863041, + "eval_runtime": 120.1768, + "eval_samples_per_second": 16.642, + "eval_steps_per_second": 4.161, + "step": 223000 + }, + { + "epoch": 1.44, + "learning_rate": 8.409611648605561e-05, + "loss": 0.0336, + "step": 223010 + }, + { + "epoch": 1.44, + "learning_rate": 8.408643513169869e-05, + "loss": 0.0425, + "step": 223020 + }, + { + "epoch": 1.44, + "learning_rate": 8.407675377734175e-05, + "loss": 0.0325, + "step": 223030 + }, + { + "epoch": 1.44, + "learning_rate": 8.406707242298481e-05, + "loss": 0.0303, + "step": 223040 + }, + { + "epoch": 1.44, + "learning_rate": 8.405739106862789e-05, + "loss": 0.0317, + "step": 223050 + }, + { + "epoch": 1.44, + "learning_rate": 8.404770971427096e-05, + "loss": 0.0246, + "step": 223060 + }, + { + "epoch": 1.44, + "learning_rate": 8.403802835991401e-05, + "loss": 0.0294, + "step": 223070 + }, + { + "epoch": 1.44, + "learning_rate": 8.402834700555709e-05, + "loss": 0.0238, + "step": 223080 + }, + { + "epoch": 1.44, + "learning_rate": 8.401866565120016e-05, + "loss": 0.0277, + "step": 223090 + }, + { + "epoch": 1.44, + "learning_rate": 8.400898429684322e-05, + "loss": 0.0318, + "step": 223100 + }, + { + "epoch": 1.44, + "learning_rate": 8.399930294248629e-05, + "loss": 0.0278, + "step": 223110 + }, + { + "epoch": 1.44, + "learning_rate": 8.398962158812937e-05, + "loss": 0.0319, + "step": 223120 + }, + { + "epoch": 1.44, + "learning_rate": 8.397994023377243e-05, + "loss": 0.0304, + "step": 223130 + }, + { + "epoch": 1.44, + "learning_rate": 8.397025887941549e-05, + "loss": 0.0342, + "step": 223140 + }, + { + "epoch": 1.44, + "learning_rate": 8.396057752505857e-05, + "loss": 0.0323, + "step": 223150 + }, + { + "epoch": 1.44, + "learning_rate": 8.395089617070163e-05, + "loss": 0.0353, + "step": 223160 + }, + { + "epoch": 1.44, + "learning_rate": 8.394121481634469e-05, + "loss": 0.0292, + "step": 223170 + }, + { + "epoch": 1.44, + "learning_rate": 8.393153346198777e-05, + "loss": 0.0292, + "step": 223180 + }, + { + "epoch": 1.44, + "learning_rate": 8.392185210763083e-05, + "loss": 0.0274, + "step": 223190 + }, + { + "epoch": 1.44, + "learning_rate": 8.391217075327391e-05, + "loss": 0.0222, + "step": 223200 + }, + { + "epoch": 1.44, + "learning_rate": 8.390248939891696e-05, + "loss": 0.0286, + "step": 223210 + }, + { + "epoch": 1.44, + "learning_rate": 8.389280804456004e-05, + "loss": 0.0288, + "step": 223220 + }, + { + "epoch": 1.44, + "learning_rate": 8.388312669020311e-05, + "loss": 0.0258, + "step": 223230 + }, + { + "epoch": 1.44, + "learning_rate": 8.387344533584616e-05, + "loss": 0.03, + "step": 223240 + }, + { + "epoch": 1.44, + "learning_rate": 8.386376398148924e-05, + "loss": 0.0321, + "step": 223250 + }, + { + "epoch": 1.44, + "learning_rate": 8.385408262713231e-05, + "loss": 0.0287, + "step": 223260 + }, + { + "epoch": 1.44, + "learning_rate": 8.384440127277539e-05, + "loss": 0.0269, + "step": 223270 + }, + { + "epoch": 1.44, + "learning_rate": 8.383471991841844e-05, + "loss": 0.0256, + "step": 223280 + }, + { + "epoch": 1.44, + "learning_rate": 8.382503856406151e-05, + "loss": 0.027, + "step": 223290 + }, + { + "epoch": 1.44, + "learning_rate": 8.381535720970459e-05, + "loss": 0.0301, + "step": 223300 + }, + { + "epoch": 1.44, + "learning_rate": 8.380567585534764e-05, + "loss": 0.0328, + "step": 223310 + }, + { + "epoch": 1.44, + "learning_rate": 8.379599450099072e-05, + "loss": 0.0314, + "step": 223320 + }, + { + "epoch": 1.44, + "learning_rate": 8.378631314663379e-05, + "loss": 0.0294, + "step": 223330 + }, + { + "epoch": 1.44, + "learning_rate": 8.377663179227687e-05, + "loss": 0.0324, + "step": 223340 + }, + { + "epoch": 1.44, + "learning_rate": 8.376695043791992e-05, + "loss": 0.0297, + "step": 223350 + }, + { + "epoch": 1.44, + "learning_rate": 8.375726908356299e-05, + "loss": 0.0356, + "step": 223360 + }, + { + "epoch": 1.44, + "learning_rate": 8.374758772920607e-05, + "loss": 0.0267, + "step": 223370 + }, + { + "epoch": 1.44, + "learning_rate": 8.373790637484912e-05, + "loss": 0.0261, + "step": 223380 + }, + { + "epoch": 1.44, + "learning_rate": 8.372822502049218e-05, + "loss": 0.028, + "step": 223390 + }, + { + "epoch": 1.44, + "learning_rate": 8.371854366613526e-05, + "loss": 0.0281, + "step": 223400 + }, + { + "epoch": 1.44, + "learning_rate": 8.370886231177833e-05, + "loss": 0.0249, + "step": 223410 + }, + { + "epoch": 1.44, + "learning_rate": 8.36991809574214e-05, + "loss": 0.0242, + "step": 223420 + }, + { + "epoch": 1.44, + "learning_rate": 8.368949960306446e-05, + "loss": 0.025, + "step": 223430 + }, + { + "epoch": 1.44, + "learning_rate": 8.367981824870754e-05, + "loss": 0.0308, + "step": 223440 + }, + { + "epoch": 1.44, + "learning_rate": 8.36701368943506e-05, + "loss": 0.0286, + "step": 223450 + }, + { + "epoch": 1.44, + "learning_rate": 8.366045553999366e-05, + "loss": 0.0286, + "step": 223460 + }, + { + "epoch": 1.44, + "learning_rate": 8.365077418563674e-05, + "loss": 0.0295, + "step": 223470 + }, + { + "epoch": 1.44, + "learning_rate": 8.364109283127981e-05, + "loss": 0.0247, + "step": 223480 + }, + { + "epoch": 1.44, + "learning_rate": 8.363141147692286e-05, + "loss": 0.0277, + "step": 223490 + }, + { + "epoch": 1.44, + "learning_rate": 8.362173012256594e-05, + "loss": 0.0304, + "step": 223500 + }, + { + "epoch": 1.44, + "learning_rate": 8.3612048768209e-05, + "loss": 0.0274, + "step": 223510 + }, + { + "epoch": 1.44, + "learning_rate": 8.360236741385207e-05, + "loss": 0.034, + "step": 223520 + }, + { + "epoch": 1.44, + "learning_rate": 8.359268605949514e-05, + "loss": 0.0327, + "step": 223530 + }, + { + "epoch": 1.44, + "learning_rate": 8.358300470513822e-05, + "loss": 0.025, + "step": 223540 + }, + { + "epoch": 1.44, + "learning_rate": 8.357332335078128e-05, + "loss": 0.0289, + "step": 223550 + }, + { + "epoch": 1.44, + "learning_rate": 8.356364199642434e-05, + "loss": 0.0269, + "step": 223560 + }, + { + "epoch": 1.44, + "learning_rate": 8.355396064206742e-05, + "loss": 0.03, + "step": 223570 + }, + { + "epoch": 1.44, + "learning_rate": 8.354427928771048e-05, + "loss": 0.0283, + "step": 223580 + }, + { + "epoch": 1.44, + "learning_rate": 8.353459793335354e-05, + "loss": 0.0247, + "step": 223590 + }, + { + "epoch": 1.44, + "learning_rate": 8.352491657899662e-05, + "loss": 0.0277, + "step": 223600 + }, + { + "epoch": 1.44, + "learning_rate": 8.351523522463968e-05, + "loss": 0.0301, + "step": 223610 + }, + { + "epoch": 1.44, + "learning_rate": 8.350555387028276e-05, + "loss": 0.0265, + "step": 223620 + }, + { + "epoch": 1.44, + "learning_rate": 8.349587251592581e-05, + "loss": 0.0269, + "step": 223630 + }, + { + "epoch": 1.44, + "learning_rate": 8.34861911615689e-05, + "loss": 0.0293, + "step": 223640 + }, + { + "epoch": 1.44, + "learning_rate": 8.347650980721196e-05, + "loss": 0.0273, + "step": 223650 + }, + { + "epoch": 1.44, + "learning_rate": 8.346682845285501e-05, + "loss": 0.0258, + "step": 223660 + }, + { + "epoch": 1.44, + "learning_rate": 8.345714709849809e-05, + "loss": 0.0305, + "step": 223670 + }, + { + "epoch": 1.44, + "learning_rate": 8.344746574414116e-05, + "loss": 0.0326, + "step": 223680 + }, + { + "epoch": 1.44, + "learning_rate": 8.343778438978424e-05, + "loss": 0.0307, + "step": 223690 + }, + { + "epoch": 1.44, + "learning_rate": 8.342810303542729e-05, + "loss": 0.0311, + "step": 223700 + }, + { + "epoch": 1.44, + "learning_rate": 8.341842168107036e-05, + "loss": 0.0311, + "step": 223710 + }, + { + "epoch": 1.44, + "learning_rate": 8.340874032671344e-05, + "loss": 0.0349, + "step": 223720 + }, + { + "epoch": 1.44, + "learning_rate": 8.339905897235649e-05, + "loss": 0.037, + "step": 223730 + }, + { + "epoch": 1.44, + "learning_rate": 8.338937761799957e-05, + "loss": 0.0314, + "step": 223740 + }, + { + "epoch": 1.44, + "learning_rate": 8.337969626364264e-05, + "loss": 0.0294, + "step": 223750 + }, + { + "epoch": 1.44, + "learning_rate": 8.33700149092857e-05, + "loss": 0.0258, + "step": 223760 + }, + { + "epoch": 1.44, + "learning_rate": 8.336033355492877e-05, + "loss": 0.0266, + "step": 223770 + }, + { + "epoch": 1.44, + "learning_rate": 8.335065220057184e-05, + "loss": 0.0298, + "step": 223780 + }, + { + "epoch": 1.44, + "learning_rate": 8.334097084621492e-05, + "loss": 0.0278, + "step": 223790 + }, + { + "epoch": 1.44, + "learning_rate": 8.333128949185797e-05, + "loss": 0.0256, + "step": 223800 + }, + { + "epoch": 1.44, + "learning_rate": 8.332160813750103e-05, + "loss": 0.0259, + "step": 223810 + }, + { + "epoch": 1.44, + "learning_rate": 8.331192678314411e-05, + "loss": 0.0219, + "step": 223820 + }, + { + "epoch": 1.44, + "learning_rate": 8.330224542878718e-05, + "loss": 0.0293, + "step": 223830 + }, + { + "epoch": 1.44, + "learning_rate": 8.329256407443025e-05, + "loss": 0.0303, + "step": 223840 + }, + { + "epoch": 1.44, + "learning_rate": 8.328288272007331e-05, + "loss": 0.023, + "step": 223850 + }, + { + "epoch": 1.44, + "learning_rate": 8.327320136571638e-05, + "loss": 0.0293, + "step": 223860 + }, + { + "epoch": 1.44, + "learning_rate": 8.326352001135945e-05, + "loss": 0.0324, + "step": 223870 + }, + { + "epoch": 1.44, + "learning_rate": 8.325383865700251e-05, + "loss": 0.0255, + "step": 223880 + }, + { + "epoch": 1.45, + "learning_rate": 8.324415730264559e-05, + "loss": 0.0313, + "step": 223890 + }, + { + "epoch": 1.45, + "learning_rate": 8.323447594828866e-05, + "loss": 0.0269, + "step": 223900 + }, + { + "epoch": 1.45, + "learning_rate": 8.322479459393171e-05, + "loss": 0.0277, + "step": 223910 + }, + { + "epoch": 1.45, + "learning_rate": 8.321511323957479e-05, + "loss": 0.0267, + "step": 223920 + }, + { + "epoch": 1.45, + "learning_rate": 8.320543188521786e-05, + "loss": 0.0264, + "step": 223930 + }, + { + "epoch": 1.45, + "learning_rate": 8.319575053086092e-05, + "loss": 0.032, + "step": 223940 + }, + { + "epoch": 1.45, + "learning_rate": 8.318606917650399e-05, + "loss": 0.0338, + "step": 223950 + }, + { + "epoch": 1.45, + "learning_rate": 8.317638782214705e-05, + "loss": 0.0267, + "step": 223960 + }, + { + "epoch": 1.45, + "learning_rate": 8.316670646779013e-05, + "loss": 0.0253, + "step": 223970 + }, + { + "epoch": 1.45, + "learning_rate": 8.315702511343319e-05, + "loss": 0.0233, + "step": 223980 + }, + { + "epoch": 1.45, + "learning_rate": 8.314734375907627e-05, + "loss": 0.0293, + "step": 223990 + }, + { + "epoch": 1.45, + "learning_rate": 8.313766240471933e-05, + "loss": 0.0274, + "step": 224000 + }, + { + "epoch": 1.45, + "eval_cer": 0.9198824991526381, + "eval_loss": 0.020434506237506866, + "eval_runtime": 120.0541, + "eval_samples_per_second": 16.659, + "eval_steps_per_second": 4.165, + "step": 224000 + }, + { + "epoch": 1.45, + "learning_rate": 8.312798105036239e-05, + "loss": 0.0298, + "step": 224010 + }, + { + "epoch": 1.45, + "learning_rate": 8.311829969600547e-05, + "loss": 0.0326, + "step": 224020 + }, + { + "epoch": 1.45, + "learning_rate": 8.310861834164853e-05, + "loss": 0.0247, + "step": 224030 + }, + { + "epoch": 1.45, + "learning_rate": 8.309893698729161e-05, + "loss": 0.0236, + "step": 224040 + }, + { + "epoch": 1.45, + "learning_rate": 8.308925563293466e-05, + "loss": 0.0275, + "step": 224050 + }, + { + "epoch": 1.45, + "learning_rate": 8.307957427857773e-05, + "loss": 0.0272, + "step": 224060 + }, + { + "epoch": 1.45, + "learning_rate": 8.306989292422081e-05, + "loss": 0.0317, + "step": 224070 + }, + { + "epoch": 1.45, + "learning_rate": 8.306021156986386e-05, + "loss": 0.0269, + "step": 224080 + }, + { + "epoch": 1.45, + "learning_rate": 8.305053021550694e-05, + "loss": 0.0259, + "step": 224090 + }, + { + "epoch": 1.45, + "learning_rate": 8.304084886115001e-05, + "loss": 0.0292, + "step": 224100 + }, + { + "epoch": 1.45, + "learning_rate": 8.303116750679309e-05, + "loss": 0.0287, + "step": 224110 + }, + { + "epoch": 1.45, + "learning_rate": 8.302148615243614e-05, + "loss": 0.0272, + "step": 224120 + }, + { + "epoch": 1.45, + "learning_rate": 8.301180479807921e-05, + "loss": 0.0265, + "step": 224130 + }, + { + "epoch": 1.45, + "learning_rate": 8.300212344372229e-05, + "loss": 0.0259, + "step": 224140 + }, + { + "epoch": 1.45, + "learning_rate": 8.299244208936534e-05, + "loss": 0.0261, + "step": 224150 + }, + { + "epoch": 1.45, + "learning_rate": 8.298276073500842e-05, + "loss": 0.0303, + "step": 224160 + }, + { + "epoch": 1.45, + "learning_rate": 8.297307938065149e-05, + "loss": 0.0248, + "step": 224170 + }, + { + "epoch": 1.45, + "learning_rate": 8.296339802629455e-05, + "loss": 0.0288, + "step": 224180 + }, + { + "epoch": 1.45, + "learning_rate": 8.295371667193762e-05, + "loss": 0.0311, + "step": 224190 + }, + { + "epoch": 1.45, + "learning_rate": 8.294403531758069e-05, + "loss": 0.0362, + "step": 224200 + }, + { + "epoch": 1.45, + "learning_rate": 8.293435396322376e-05, + "loss": 0.0229, + "step": 224210 + }, + { + "epoch": 1.45, + "learning_rate": 8.292467260886682e-05, + "loss": 0.0284, + "step": 224220 + }, + { + "epoch": 1.45, + "learning_rate": 8.291499125450988e-05, + "loss": 0.0306, + "step": 224230 + }, + { + "epoch": 1.45, + "learning_rate": 8.290530990015296e-05, + "loss": 0.0308, + "step": 224240 + }, + { + "epoch": 1.45, + "learning_rate": 8.289562854579603e-05, + "loss": 0.0279, + "step": 224250 + }, + { + "epoch": 1.45, + "learning_rate": 8.28859471914391e-05, + "loss": 0.0259, + "step": 224260 + }, + { + "epoch": 1.45, + "learning_rate": 8.287626583708216e-05, + "loss": 0.0275, + "step": 224270 + }, + { + "epoch": 1.45, + "learning_rate": 8.286658448272523e-05, + "loss": 0.0255, + "step": 224280 + }, + { + "epoch": 1.45, + "learning_rate": 8.28569031283683e-05, + "loss": 0.0299, + "step": 224290 + }, + { + "epoch": 1.45, + "learning_rate": 8.284722177401136e-05, + "loss": 0.027, + "step": 224300 + }, + { + "epoch": 1.45, + "learning_rate": 8.283754041965444e-05, + "loss": 0.0232, + "step": 224310 + }, + { + "epoch": 1.45, + "learning_rate": 8.282785906529751e-05, + "loss": 0.0271, + "step": 224320 + }, + { + "epoch": 1.45, + "learning_rate": 8.281817771094056e-05, + "loss": 0.0258, + "step": 224330 + }, + { + "epoch": 1.45, + "learning_rate": 8.280849635658364e-05, + "loss": 0.0253, + "step": 224340 + }, + { + "epoch": 1.45, + "learning_rate": 8.27988150022267e-05, + "loss": 0.0235, + "step": 224350 + }, + { + "epoch": 1.45, + "learning_rate": 8.278913364786977e-05, + "loss": 0.0303, + "step": 224360 + }, + { + "epoch": 1.45, + "learning_rate": 8.277945229351284e-05, + "loss": 0.0285, + "step": 224370 + }, + { + "epoch": 1.45, + "learning_rate": 8.27697709391559e-05, + "loss": 0.0259, + "step": 224380 + }, + { + "epoch": 1.45, + "learning_rate": 8.276008958479898e-05, + "loss": 0.0265, + "step": 224390 + }, + { + "epoch": 1.45, + "learning_rate": 8.275040823044204e-05, + "loss": 0.0336, + "step": 224400 + }, + { + "epoch": 1.45, + "learning_rate": 8.274072687608512e-05, + "loss": 0.0244, + "step": 224410 + }, + { + "epoch": 1.45, + "learning_rate": 8.273104552172818e-05, + "loss": 0.025, + "step": 224420 + }, + { + "epoch": 1.45, + "learning_rate": 8.272136416737124e-05, + "loss": 0.0289, + "step": 224430 + }, + { + "epoch": 1.45, + "learning_rate": 8.271168281301432e-05, + "loss": 0.0275, + "step": 224440 + }, + { + "epoch": 1.45, + "learning_rate": 8.270200145865738e-05, + "loss": 0.034, + "step": 224450 + }, + { + "epoch": 1.45, + "learning_rate": 8.269232010430046e-05, + "loss": 0.0256, + "step": 224460 + }, + { + "epoch": 1.45, + "learning_rate": 8.268263874994351e-05, + "loss": 0.0304, + "step": 224470 + }, + { + "epoch": 1.45, + "learning_rate": 8.267295739558658e-05, + "loss": 0.0261, + "step": 224480 + }, + { + "epoch": 1.45, + "learning_rate": 8.266327604122966e-05, + "loss": 0.0293, + "step": 224490 + }, + { + "epoch": 1.45, + "learning_rate": 8.265359468687271e-05, + "loss": 0.0239, + "step": 224500 + }, + { + "epoch": 1.45, + "learning_rate": 8.264391333251579e-05, + "loss": 0.0282, + "step": 224510 + }, + { + "epoch": 1.45, + "learning_rate": 8.263423197815886e-05, + "loss": 0.0266, + "step": 224520 + }, + { + "epoch": 1.45, + "learning_rate": 8.262455062380194e-05, + "loss": 0.0244, + "step": 224530 + }, + { + "epoch": 1.45, + "learning_rate": 8.261486926944499e-05, + "loss": 0.0278, + "step": 224540 + }, + { + "epoch": 1.45, + "learning_rate": 8.260518791508806e-05, + "loss": 0.0288, + "step": 224550 + }, + { + "epoch": 1.45, + "learning_rate": 8.259550656073114e-05, + "loss": 0.0279, + "step": 224560 + }, + { + "epoch": 1.45, + "learning_rate": 8.258582520637419e-05, + "loss": 0.0262, + "step": 224570 + }, + { + "epoch": 1.45, + "learning_rate": 8.257614385201726e-05, + "loss": 0.0282, + "step": 224580 + }, + { + "epoch": 1.45, + "learning_rate": 8.256646249766034e-05, + "loss": 0.0235, + "step": 224590 + }, + { + "epoch": 1.45, + "learning_rate": 8.25567811433034e-05, + "loss": 0.0311, + "step": 224600 + }, + { + "epoch": 1.45, + "learning_rate": 8.254709978894647e-05, + "loss": 0.0302, + "step": 224610 + }, + { + "epoch": 1.45, + "learning_rate": 8.253741843458953e-05, + "loss": 0.0315, + "step": 224620 + }, + { + "epoch": 1.45, + "learning_rate": 8.252773708023261e-05, + "loss": 0.0292, + "step": 224630 + }, + { + "epoch": 1.45, + "learning_rate": 8.251805572587567e-05, + "loss": 0.0262, + "step": 224640 + }, + { + "epoch": 1.45, + "learning_rate": 8.250837437151873e-05, + "loss": 0.024, + "step": 224650 + }, + { + "epoch": 1.45, + "learning_rate": 8.249869301716181e-05, + "loss": 0.0242, + "step": 224660 + }, + { + "epoch": 1.45, + "learning_rate": 8.248901166280488e-05, + "loss": 0.0278, + "step": 224670 + }, + { + "epoch": 1.45, + "learning_rate": 8.247933030844793e-05, + "loss": 0.0242, + "step": 224680 + }, + { + "epoch": 1.45, + "learning_rate": 8.246964895409101e-05, + "loss": 0.0288, + "step": 224690 + }, + { + "epoch": 1.45, + "learning_rate": 8.245996759973408e-05, + "loss": 0.0318, + "step": 224700 + }, + { + "epoch": 1.45, + "learning_rate": 8.245028624537714e-05, + "loss": 0.0299, + "step": 224710 + }, + { + "epoch": 1.45, + "learning_rate": 8.244060489102021e-05, + "loss": 0.0253, + "step": 224720 + }, + { + "epoch": 1.45, + "learning_rate": 8.243092353666329e-05, + "loss": 0.025, + "step": 224730 + }, + { + "epoch": 1.45, + "learning_rate": 8.242124218230636e-05, + "loss": 0.0244, + "step": 224740 + }, + { + "epoch": 1.45, + "learning_rate": 8.241156082794941e-05, + "loss": 0.0337, + "step": 224750 + }, + { + "epoch": 1.45, + "learning_rate": 8.240187947359249e-05, + "loss": 0.0249, + "step": 224760 + }, + { + "epoch": 1.45, + "learning_rate": 8.239219811923556e-05, + "loss": 0.0259, + "step": 224770 + }, + { + "epoch": 1.45, + "learning_rate": 8.238251676487861e-05, + "loss": 0.0242, + "step": 224780 + }, + { + "epoch": 1.45, + "learning_rate": 8.237283541052169e-05, + "loss": 0.0329, + "step": 224790 + }, + { + "epoch": 1.45, + "learning_rate": 8.236315405616475e-05, + "loss": 0.0277, + "step": 224800 + }, + { + "epoch": 1.45, + "learning_rate": 8.235347270180783e-05, + "loss": 0.0291, + "step": 224810 + }, + { + "epoch": 1.45, + "learning_rate": 8.234379134745089e-05, + "loss": 0.0257, + "step": 224820 + }, + { + "epoch": 1.45, + "learning_rate": 8.233410999309397e-05, + "loss": 0.0265, + "step": 224830 + }, + { + "epoch": 1.45, + "learning_rate": 8.232442863873703e-05, + "loss": 0.0272, + "step": 224840 + }, + { + "epoch": 1.45, + "learning_rate": 8.231474728438009e-05, + "loss": 0.0256, + "step": 224850 + }, + { + "epoch": 1.45, + "learning_rate": 8.230506593002317e-05, + "loss": 0.0223, + "step": 224860 + }, + { + "epoch": 1.45, + "learning_rate": 8.229538457566623e-05, + "loss": 0.0301, + "step": 224870 + }, + { + "epoch": 1.45, + "learning_rate": 8.228570322130931e-05, + "loss": 0.028, + "step": 224880 + }, + { + "epoch": 1.45, + "learning_rate": 8.227602186695236e-05, + "loss": 0.025, + "step": 224890 + }, + { + "epoch": 1.45, + "learning_rate": 8.226634051259543e-05, + "loss": 0.0291, + "step": 224900 + }, + { + "epoch": 1.45, + "learning_rate": 8.225665915823851e-05, + "loss": 0.0304, + "step": 224910 + }, + { + "epoch": 1.45, + "learning_rate": 8.224697780388156e-05, + "loss": 0.0267, + "step": 224920 + }, + { + "epoch": 1.45, + "learning_rate": 8.223729644952464e-05, + "loss": 0.028, + "step": 224930 + }, + { + "epoch": 1.45, + "learning_rate": 8.222761509516771e-05, + "loss": 0.0282, + "step": 224940 + }, + { + "epoch": 1.45, + "learning_rate": 8.221793374081079e-05, + "loss": 0.0244, + "step": 224950 + }, + { + "epoch": 1.45, + "learning_rate": 8.220825238645384e-05, + "loss": 0.0295, + "step": 224960 + }, + { + "epoch": 1.45, + "learning_rate": 8.219857103209691e-05, + "loss": 0.0241, + "step": 224970 + }, + { + "epoch": 1.45, + "learning_rate": 8.218888967773999e-05, + "loss": 0.0317, + "step": 224980 + }, + { + "epoch": 1.45, + "learning_rate": 8.217920832338304e-05, + "loss": 0.0324, + "step": 224990 + }, + { + "epoch": 1.45, + "learning_rate": 8.21695269690261e-05, + "loss": 0.0343, + "step": 225000 + }, + { + "epoch": 1.45, + "eval_cer": 0.9198978646480623, + "eval_loss": 0.020093819126486778, + "eval_runtime": 120.1806, + "eval_samples_per_second": 16.642, + "eval_steps_per_second": 4.16, + "step": 225000 + }, + { + "epoch": 1.45, + "learning_rate": 8.215984561466919e-05, + "loss": 0.0234, + "step": 225010 + }, + { + "epoch": 1.45, + "learning_rate": 8.215016426031225e-05, + "loss": 0.0293, + "step": 225020 + }, + { + "epoch": 1.45, + "learning_rate": 8.214048290595532e-05, + "loss": 0.0252, + "step": 225030 + }, + { + "epoch": 1.45, + "learning_rate": 8.213080155159838e-05, + "loss": 0.0238, + "step": 225040 + }, + { + "epoch": 1.45, + "learning_rate": 8.212112019724146e-05, + "loss": 0.0307, + "step": 225050 + }, + { + "epoch": 1.45, + "learning_rate": 8.211143884288452e-05, + "loss": 0.0236, + "step": 225060 + }, + { + "epoch": 1.45, + "learning_rate": 8.210175748852758e-05, + "loss": 0.0292, + "step": 225070 + }, + { + "epoch": 1.45, + "learning_rate": 8.209207613417066e-05, + "loss": 0.0343, + "step": 225080 + }, + { + "epoch": 1.45, + "learning_rate": 8.208239477981373e-05, + "loss": 0.0258, + "step": 225090 + }, + { + "epoch": 1.45, + "learning_rate": 8.207271342545678e-05, + "loss": 0.0315, + "step": 225100 + }, + { + "epoch": 1.45, + "learning_rate": 8.206303207109986e-05, + "loss": 0.0237, + "step": 225110 + }, + { + "epoch": 1.45, + "learning_rate": 8.205335071674293e-05, + "loss": 0.0277, + "step": 225120 + }, + { + "epoch": 1.45, + "learning_rate": 8.2043669362386e-05, + "loss": 0.0307, + "step": 225130 + }, + { + "epoch": 1.45, + "learning_rate": 8.203398800802906e-05, + "loss": 0.0369, + "step": 225140 + }, + { + "epoch": 1.45, + "learning_rate": 8.202430665367214e-05, + "loss": 0.0296, + "step": 225150 + }, + { + "epoch": 1.45, + "learning_rate": 8.20146252993152e-05, + "loss": 0.0264, + "step": 225160 + }, + { + "epoch": 1.45, + "learning_rate": 8.200494394495826e-05, + "loss": 0.0335, + "step": 225170 + }, + { + "epoch": 1.45, + "learning_rate": 8.199526259060134e-05, + "loss": 0.0266, + "step": 225180 + }, + { + "epoch": 1.45, + "learning_rate": 8.19855812362444e-05, + "loss": 0.0244, + "step": 225190 + }, + { + "epoch": 1.45, + "learning_rate": 8.197589988188746e-05, + "loss": 0.0269, + "step": 225200 + }, + { + "epoch": 1.45, + "learning_rate": 8.196621852753054e-05, + "loss": 0.0286, + "step": 225210 + }, + { + "epoch": 1.45, + "learning_rate": 8.19565371731736e-05, + "loss": 0.0302, + "step": 225220 + }, + { + "epoch": 1.45, + "learning_rate": 8.194685581881668e-05, + "loss": 0.025, + "step": 225230 + }, + { + "epoch": 1.45, + "learning_rate": 8.193717446445974e-05, + "loss": 0.0285, + "step": 225240 + }, + { + "epoch": 1.45, + "learning_rate": 8.192749311010282e-05, + "loss": 0.0256, + "step": 225250 + }, + { + "epoch": 1.45, + "learning_rate": 8.191781175574588e-05, + "loss": 0.0251, + "step": 225260 + }, + { + "epoch": 1.45, + "learning_rate": 8.190813040138894e-05, + "loss": 0.0306, + "step": 225270 + }, + { + "epoch": 1.45, + "learning_rate": 8.189844904703202e-05, + "loss": 0.0247, + "step": 225280 + }, + { + "epoch": 1.45, + "learning_rate": 8.188876769267508e-05, + "loss": 0.0276, + "step": 225290 + }, + { + "epoch": 1.45, + "learning_rate": 8.187908633831816e-05, + "loss": 0.0275, + "step": 225300 + }, + { + "epoch": 1.45, + "learning_rate": 8.186940498396121e-05, + "loss": 0.0234, + "step": 225310 + }, + { + "epoch": 1.45, + "learning_rate": 8.185972362960428e-05, + "loss": 0.0266, + "step": 225320 + }, + { + "epoch": 1.45, + "learning_rate": 8.185004227524736e-05, + "loss": 0.0324, + "step": 225330 + }, + { + "epoch": 1.45, + "learning_rate": 8.184036092089041e-05, + "loss": 0.0304, + "step": 225340 + }, + { + "epoch": 1.45, + "learning_rate": 8.183067956653349e-05, + "loss": 0.0304, + "step": 225350 + }, + { + "epoch": 1.45, + "learning_rate": 8.182099821217656e-05, + "loss": 0.0256, + "step": 225360 + }, + { + "epoch": 1.45, + "learning_rate": 8.181131685781962e-05, + "loss": 0.0346, + "step": 225370 + }, + { + "epoch": 1.45, + "learning_rate": 8.180163550346269e-05, + "loss": 0.0284, + "step": 225380 + }, + { + "epoch": 1.45, + "learning_rate": 8.179195414910576e-05, + "loss": 0.0318, + "step": 225390 + }, + { + "epoch": 1.45, + "learning_rate": 8.178227279474884e-05, + "loss": 0.0256, + "step": 225400 + }, + { + "epoch": 1.45, + "learning_rate": 8.177259144039189e-05, + "loss": 0.0279, + "step": 225410 + }, + { + "epoch": 1.45, + "learning_rate": 8.176291008603496e-05, + "loss": 0.0291, + "step": 225420 + }, + { + "epoch": 1.45, + "learning_rate": 8.175322873167804e-05, + "loss": 0.0315, + "step": 225430 + }, + { + "epoch": 1.46, + "learning_rate": 8.17435473773211e-05, + "loss": 0.0243, + "step": 225440 + }, + { + "epoch": 1.46, + "learning_rate": 8.173386602296417e-05, + "loss": 0.0256, + "step": 225450 + }, + { + "epoch": 1.46, + "learning_rate": 8.172418466860723e-05, + "loss": 0.0258, + "step": 225460 + }, + { + "epoch": 1.46, + "learning_rate": 8.17145033142503e-05, + "loss": 0.0311, + "step": 225470 + }, + { + "epoch": 1.46, + "learning_rate": 8.170482195989337e-05, + "loss": 0.025, + "step": 225480 + }, + { + "epoch": 1.46, + "learning_rate": 8.169514060553643e-05, + "loss": 0.0292, + "step": 225490 + }, + { + "epoch": 1.46, + "learning_rate": 8.168545925117951e-05, + "loss": 0.0296, + "step": 225500 + }, + { + "epoch": 1.46, + "learning_rate": 8.167577789682258e-05, + "loss": 0.0285, + "step": 225510 + }, + { + "epoch": 1.46, + "learning_rate": 8.166609654246563e-05, + "loss": 0.0277, + "step": 225520 + }, + { + "epoch": 1.46, + "learning_rate": 8.165641518810871e-05, + "loss": 0.0273, + "step": 225530 + }, + { + "epoch": 1.46, + "learning_rate": 8.164673383375178e-05, + "loss": 0.027, + "step": 225540 + }, + { + "epoch": 1.46, + "learning_rate": 8.163705247939484e-05, + "loss": 0.0311, + "step": 225550 + }, + { + "epoch": 1.46, + "learning_rate": 8.162737112503791e-05, + "loss": 0.0294, + "step": 225560 + }, + { + "epoch": 1.46, + "learning_rate": 8.161768977068098e-05, + "loss": 0.0271, + "step": 225570 + }, + { + "epoch": 1.46, + "learning_rate": 8.160800841632404e-05, + "loss": 0.0262, + "step": 225580 + }, + { + "epoch": 1.46, + "learning_rate": 8.159832706196711e-05, + "loss": 0.0302, + "step": 225590 + }, + { + "epoch": 1.46, + "learning_rate": 8.158864570761019e-05, + "loss": 0.0408, + "step": 225600 + }, + { + "epoch": 1.46, + "learning_rate": 8.157896435325326e-05, + "loss": 0.0296, + "step": 225610 + }, + { + "epoch": 1.46, + "learning_rate": 8.156928299889631e-05, + "loss": 0.0333, + "step": 225620 + }, + { + "epoch": 1.46, + "learning_rate": 8.155960164453939e-05, + "loss": 0.0235, + "step": 225630 + }, + { + "epoch": 1.46, + "learning_rate": 8.154992029018245e-05, + "loss": 0.0306, + "step": 225640 + }, + { + "epoch": 1.46, + "learning_rate": 8.154023893582552e-05, + "loss": 0.0304, + "step": 225650 + }, + { + "epoch": 1.46, + "learning_rate": 8.153055758146859e-05, + "loss": 0.0308, + "step": 225660 + }, + { + "epoch": 1.46, + "learning_rate": 8.152087622711165e-05, + "loss": 0.0248, + "step": 225670 + }, + { + "epoch": 1.46, + "learning_rate": 8.151119487275473e-05, + "loss": 0.026, + "step": 225680 + }, + { + "epoch": 1.46, + "learning_rate": 8.150151351839779e-05, + "loss": 0.0294, + "step": 225690 + }, + { + "epoch": 1.46, + "learning_rate": 8.149183216404086e-05, + "loss": 0.0287, + "step": 225700 + }, + { + "epoch": 1.46, + "learning_rate": 8.148215080968393e-05, + "loss": 0.0296, + "step": 225710 + }, + { + "epoch": 1.46, + "learning_rate": 8.147246945532698e-05, + "loss": 0.0244, + "step": 225720 + }, + { + "epoch": 1.46, + "learning_rate": 8.146278810097006e-05, + "loss": 0.0317, + "step": 225730 + }, + { + "epoch": 1.46, + "learning_rate": 8.145310674661313e-05, + "loss": 0.0283, + "step": 225740 + }, + { + "epoch": 1.46, + "learning_rate": 8.144342539225621e-05, + "loss": 0.0267, + "step": 225750 + }, + { + "epoch": 1.46, + "learning_rate": 8.143374403789926e-05, + "loss": 0.0297, + "step": 225760 + }, + { + "epoch": 1.46, + "learning_rate": 8.142406268354233e-05, + "loss": 0.0211, + "step": 225770 + }, + { + "epoch": 1.46, + "learning_rate": 8.141438132918541e-05, + "loss": 0.0262, + "step": 225780 + }, + { + "epoch": 1.46, + "learning_rate": 8.140469997482846e-05, + "loss": 0.0318, + "step": 225790 + }, + { + "epoch": 1.46, + "learning_rate": 8.139501862047154e-05, + "loss": 0.0278, + "step": 225800 + }, + { + "epoch": 1.46, + "learning_rate": 8.138533726611461e-05, + "loss": 0.032, + "step": 225810 + }, + { + "epoch": 1.46, + "learning_rate": 8.137565591175769e-05, + "loss": 0.027, + "step": 225820 + }, + { + "epoch": 1.46, + "learning_rate": 8.136597455740074e-05, + "loss": 0.0248, + "step": 225830 + }, + { + "epoch": 1.46, + "learning_rate": 8.13562932030438e-05, + "loss": 0.0275, + "step": 225840 + }, + { + "epoch": 1.46, + "learning_rate": 8.134661184868689e-05, + "loss": 0.0276, + "step": 225850 + }, + { + "epoch": 1.46, + "learning_rate": 8.133693049432994e-05, + "loss": 0.0294, + "step": 225860 + }, + { + "epoch": 1.46, + "learning_rate": 8.1327249139973e-05, + "loss": 0.0326, + "step": 225870 + }, + { + "epoch": 1.46, + "learning_rate": 8.131756778561608e-05, + "loss": 0.028, + "step": 225880 + }, + { + "epoch": 1.46, + "learning_rate": 8.130788643125915e-05, + "loss": 0.0254, + "step": 225890 + }, + { + "epoch": 1.46, + "learning_rate": 8.129820507690222e-05, + "loss": 0.0322, + "step": 225900 + }, + { + "epoch": 1.46, + "learning_rate": 8.128852372254528e-05, + "loss": 0.031, + "step": 225910 + }, + { + "epoch": 1.46, + "learning_rate": 8.127884236818836e-05, + "loss": 0.0284, + "step": 225920 + }, + { + "epoch": 1.46, + "learning_rate": 8.126916101383142e-05, + "loss": 0.028, + "step": 225930 + }, + { + "epoch": 1.46, + "learning_rate": 8.125947965947448e-05, + "loss": 0.0273, + "step": 225940 + }, + { + "epoch": 1.46, + "learning_rate": 8.124979830511756e-05, + "loss": 0.0267, + "step": 225950 + }, + { + "epoch": 1.46, + "learning_rate": 8.124011695076063e-05, + "loss": 0.0236, + "step": 225960 + }, + { + "epoch": 1.46, + "learning_rate": 8.123043559640368e-05, + "loss": 0.0285, + "step": 225970 + }, + { + "epoch": 1.46, + "learning_rate": 8.122075424204676e-05, + "loss": 0.0295, + "step": 225980 + }, + { + "epoch": 1.46, + "learning_rate": 8.121107288768983e-05, + "loss": 0.0289, + "step": 225990 + }, + { + "epoch": 1.46, + "learning_rate": 8.120139153333289e-05, + "loss": 0.0249, + "step": 226000 + }, + { + "epoch": 1.46, + "eval_cer": 0.9199150378488307, + "eval_loss": 0.020439114421606064, + "eval_runtime": 120.1357, + "eval_samples_per_second": 16.648, + "eval_steps_per_second": 4.162, + "step": 226000 + }, + { + "epoch": 1.46, + "learning_rate": 8.119171017897596e-05, + "loss": 0.0261, + "step": 226010 + }, + { + "epoch": 1.46, + "learning_rate": 8.118202882461904e-05, + "loss": 0.0253, + "step": 226020 + }, + { + "epoch": 1.46, + "learning_rate": 8.11723474702621e-05, + "loss": 0.0216, + "step": 226030 + }, + { + "epoch": 1.46, + "learning_rate": 8.116266611590516e-05, + "loss": 0.0257, + "step": 226040 + }, + { + "epoch": 1.46, + "learning_rate": 8.115298476154824e-05, + "loss": 0.0288, + "step": 226050 + }, + { + "epoch": 1.46, + "learning_rate": 8.11433034071913e-05, + "loss": 0.0269, + "step": 226060 + }, + { + "epoch": 1.46, + "learning_rate": 8.113362205283436e-05, + "loss": 0.0255, + "step": 226070 + }, + { + "epoch": 1.46, + "learning_rate": 8.112394069847744e-05, + "loss": 0.0238, + "step": 226080 + }, + { + "epoch": 1.46, + "learning_rate": 8.11142593441205e-05, + "loss": 0.0347, + "step": 226090 + }, + { + "epoch": 1.46, + "learning_rate": 8.110457798976358e-05, + "loss": 0.0283, + "step": 226100 + }, + { + "epoch": 1.46, + "learning_rate": 8.109489663540663e-05, + "loss": 0.0235, + "step": 226110 + }, + { + "epoch": 1.46, + "learning_rate": 8.108521528104971e-05, + "loss": 0.0273, + "step": 226120 + }, + { + "epoch": 1.46, + "learning_rate": 8.107553392669278e-05, + "loss": 0.0323, + "step": 226130 + }, + { + "epoch": 1.46, + "learning_rate": 8.106585257233583e-05, + "loss": 0.0275, + "step": 226140 + }, + { + "epoch": 1.46, + "learning_rate": 8.105617121797891e-05, + "loss": 0.0293, + "step": 226150 + }, + { + "epoch": 1.46, + "learning_rate": 8.104648986362198e-05, + "loss": 0.0281, + "step": 226160 + }, + { + "epoch": 1.46, + "learning_rate": 8.103680850926506e-05, + "loss": 0.0252, + "step": 226170 + }, + { + "epoch": 1.46, + "learning_rate": 8.102712715490811e-05, + "loss": 0.0259, + "step": 226180 + }, + { + "epoch": 1.46, + "learning_rate": 8.101744580055118e-05, + "loss": 0.0294, + "step": 226190 + }, + { + "epoch": 1.46, + "learning_rate": 8.100776444619426e-05, + "loss": 0.0241, + "step": 226200 + }, + { + "epoch": 1.46, + "learning_rate": 8.099808309183731e-05, + "loss": 0.0253, + "step": 226210 + }, + { + "epoch": 1.46, + "learning_rate": 8.098840173748039e-05, + "loss": 0.0252, + "step": 226220 + }, + { + "epoch": 1.46, + "learning_rate": 8.097872038312346e-05, + "loss": 0.0292, + "step": 226230 + }, + { + "epoch": 1.46, + "learning_rate": 8.096903902876654e-05, + "loss": 0.0359, + "step": 226240 + }, + { + "epoch": 1.46, + "learning_rate": 8.095935767440959e-05, + "loss": 0.027, + "step": 226250 + }, + { + "epoch": 1.46, + "learning_rate": 8.094967632005266e-05, + "loss": 0.0284, + "step": 226260 + }, + { + "epoch": 1.46, + "learning_rate": 8.093999496569574e-05, + "loss": 0.0295, + "step": 226270 + }, + { + "epoch": 1.46, + "learning_rate": 8.093031361133879e-05, + "loss": 0.0221, + "step": 226280 + }, + { + "epoch": 1.46, + "learning_rate": 8.092063225698185e-05, + "loss": 0.0277, + "step": 226290 + }, + { + "epoch": 1.46, + "learning_rate": 8.091095090262493e-05, + "loss": 0.0269, + "step": 226300 + }, + { + "epoch": 1.46, + "learning_rate": 8.0901269548268e-05, + "loss": 0.0286, + "step": 226310 + }, + { + "epoch": 1.46, + "learning_rate": 8.089158819391107e-05, + "loss": 0.0327, + "step": 226320 + }, + { + "epoch": 1.46, + "learning_rate": 8.088190683955413e-05, + "loss": 0.0259, + "step": 226330 + }, + { + "epoch": 1.46, + "learning_rate": 8.087222548519721e-05, + "loss": 0.029, + "step": 226340 + }, + { + "epoch": 1.46, + "learning_rate": 8.086254413084027e-05, + "loss": 0.0301, + "step": 226350 + }, + { + "epoch": 1.46, + "learning_rate": 8.085286277648333e-05, + "loss": 0.0274, + "step": 226360 + }, + { + "epoch": 1.46, + "learning_rate": 8.084318142212641e-05, + "loss": 0.027, + "step": 226370 + }, + { + "epoch": 1.46, + "learning_rate": 8.083350006776948e-05, + "loss": 0.0303, + "step": 226380 + }, + { + "epoch": 1.46, + "learning_rate": 8.082381871341253e-05, + "loss": 0.0228, + "step": 226390 + }, + { + "epoch": 1.46, + "learning_rate": 8.081413735905561e-05, + "loss": 0.0247, + "step": 226400 + }, + { + "epoch": 1.46, + "learning_rate": 8.080445600469868e-05, + "loss": 0.0252, + "step": 226410 + }, + { + "epoch": 1.46, + "learning_rate": 8.079477465034174e-05, + "loss": 0.0307, + "step": 226420 + }, + { + "epoch": 1.46, + "learning_rate": 8.078509329598481e-05, + "loss": 0.0252, + "step": 226430 + }, + { + "epoch": 1.46, + "learning_rate": 8.077541194162789e-05, + "loss": 0.0299, + "step": 226440 + }, + { + "epoch": 1.46, + "learning_rate": 8.076573058727095e-05, + "loss": 0.0289, + "step": 226450 + }, + { + "epoch": 1.46, + "learning_rate": 8.075604923291401e-05, + "loss": 0.0325, + "step": 226460 + }, + { + "epoch": 1.46, + "learning_rate": 8.074636787855709e-05, + "loss": 0.0278, + "step": 226470 + }, + { + "epoch": 1.46, + "learning_rate": 8.073668652420015e-05, + "loss": 0.0277, + "step": 226480 + }, + { + "epoch": 1.46, + "learning_rate": 8.07270051698432e-05, + "loss": 0.0291, + "step": 226490 + }, + { + "epoch": 1.46, + "learning_rate": 8.071732381548629e-05, + "loss": 0.0248, + "step": 226500 + }, + { + "epoch": 1.46, + "learning_rate": 8.070764246112935e-05, + "loss": 0.0246, + "step": 226510 + }, + { + "epoch": 1.46, + "learning_rate": 8.069796110677243e-05, + "loss": 0.025, + "step": 226520 + }, + { + "epoch": 1.46, + "learning_rate": 8.068827975241548e-05, + "loss": 0.0271, + "step": 226530 + }, + { + "epoch": 1.46, + "learning_rate": 8.067859839805856e-05, + "loss": 0.0249, + "step": 226540 + }, + { + "epoch": 1.46, + "learning_rate": 8.066891704370163e-05, + "loss": 0.0291, + "step": 226550 + }, + { + "epoch": 1.46, + "learning_rate": 8.065923568934468e-05, + "loss": 0.0335, + "step": 226560 + }, + { + "epoch": 1.46, + "learning_rate": 8.064955433498776e-05, + "loss": 0.0346, + "step": 226570 + }, + { + "epoch": 1.46, + "learning_rate": 8.063987298063083e-05, + "loss": 0.0291, + "step": 226580 + }, + { + "epoch": 1.46, + "learning_rate": 8.063019162627391e-05, + "loss": 0.0283, + "step": 226590 + }, + { + "epoch": 1.46, + "learning_rate": 8.062051027191696e-05, + "loss": 0.0274, + "step": 226600 + }, + { + "epoch": 1.46, + "learning_rate": 8.061082891756003e-05, + "loss": 0.0314, + "step": 226610 + }, + { + "epoch": 1.46, + "learning_rate": 8.060114756320311e-05, + "loss": 0.0264, + "step": 226620 + }, + { + "epoch": 1.46, + "learning_rate": 8.059146620884616e-05, + "loss": 0.0256, + "step": 226630 + }, + { + "epoch": 1.46, + "learning_rate": 8.058178485448924e-05, + "loss": 0.0286, + "step": 226640 + }, + { + "epoch": 1.46, + "learning_rate": 8.05721035001323e-05, + "loss": 0.0332, + "step": 226650 + }, + { + "epoch": 1.46, + "learning_rate": 8.056242214577537e-05, + "loss": 0.0248, + "step": 226660 + }, + { + "epoch": 1.46, + "learning_rate": 8.055274079141844e-05, + "loss": 0.0268, + "step": 226670 + }, + { + "epoch": 1.46, + "learning_rate": 8.05430594370615e-05, + "loss": 0.0302, + "step": 226680 + }, + { + "epoch": 1.46, + "learning_rate": 8.053337808270459e-05, + "loss": 0.0301, + "step": 226690 + }, + { + "epoch": 1.46, + "learning_rate": 8.052369672834764e-05, + "loss": 0.0272, + "step": 226700 + }, + { + "epoch": 1.46, + "learning_rate": 8.05140153739907e-05, + "loss": 0.0287, + "step": 226710 + }, + { + "epoch": 1.46, + "learning_rate": 8.050433401963378e-05, + "loss": 0.0286, + "step": 226720 + }, + { + "epoch": 1.46, + "learning_rate": 8.049465266527685e-05, + "loss": 0.0269, + "step": 226730 + }, + { + "epoch": 1.46, + "learning_rate": 8.048497131091992e-05, + "loss": 0.0301, + "step": 226740 + }, + { + "epoch": 1.46, + "learning_rate": 8.047528995656298e-05, + "loss": 0.0264, + "step": 226750 + }, + { + "epoch": 1.46, + "learning_rate": 8.046560860220605e-05, + "loss": 0.0268, + "step": 226760 + }, + { + "epoch": 1.46, + "learning_rate": 8.045592724784912e-05, + "loss": 0.0305, + "step": 226770 + }, + { + "epoch": 1.46, + "learning_rate": 8.044624589349218e-05, + "loss": 0.0272, + "step": 226780 + }, + { + "epoch": 1.46, + "learning_rate": 8.043656453913526e-05, + "loss": 0.0342, + "step": 226790 + }, + { + "epoch": 1.46, + "learning_rate": 8.042688318477833e-05, + "loss": 0.0348, + "step": 226800 + }, + { + "epoch": 1.46, + "learning_rate": 8.041720183042138e-05, + "loss": 0.0329, + "step": 226810 + }, + { + "epoch": 1.46, + "learning_rate": 8.040752047606446e-05, + "loss": 0.0268, + "step": 226820 + }, + { + "epoch": 1.46, + "learning_rate": 8.039783912170753e-05, + "loss": 0.0353, + "step": 226830 + }, + { + "epoch": 1.46, + "learning_rate": 8.038815776735059e-05, + "loss": 0.0332, + "step": 226840 + }, + { + "epoch": 1.46, + "learning_rate": 8.037847641299366e-05, + "loss": 0.0321, + "step": 226850 + }, + { + "epoch": 1.46, + "learning_rate": 8.036879505863672e-05, + "loss": 0.0322, + "step": 226860 + }, + { + "epoch": 1.46, + "learning_rate": 8.03591137042798e-05, + "loss": 0.0318, + "step": 226870 + }, + { + "epoch": 1.46, + "learning_rate": 8.034943234992286e-05, + "loss": 0.0269, + "step": 226880 + }, + { + "epoch": 1.46, + "learning_rate": 8.033975099556594e-05, + "loss": 0.0285, + "step": 226890 + }, + { + "epoch": 1.46, + "learning_rate": 8.0330069641209e-05, + "loss": 0.0348, + "step": 226900 + }, + { + "epoch": 1.46, + "learning_rate": 8.032038828685206e-05, + "loss": 0.0239, + "step": 226910 + }, + { + "epoch": 1.46, + "learning_rate": 8.031070693249514e-05, + "loss": 0.0294, + "step": 226920 + }, + { + "epoch": 1.46, + "learning_rate": 8.03010255781382e-05, + "loss": 0.0244, + "step": 226930 + }, + { + "epoch": 1.46, + "learning_rate": 8.029134422378128e-05, + "loss": 0.0299, + "step": 226940 + }, + { + "epoch": 1.46, + "learning_rate": 8.028166286942433e-05, + "loss": 0.0252, + "step": 226950 + }, + { + "epoch": 1.46, + "learning_rate": 8.02719815150674e-05, + "loss": 0.0246, + "step": 226960 + }, + { + "epoch": 1.46, + "learning_rate": 8.026230016071048e-05, + "loss": 0.0277, + "step": 226970 + }, + { + "epoch": 1.46, + "learning_rate": 8.025261880635353e-05, + "loss": 0.0298, + "step": 226980 + }, + { + "epoch": 1.47, + "learning_rate": 8.024293745199661e-05, + "loss": 0.0316, + "step": 226990 + }, + { + "epoch": 1.47, + "learning_rate": 8.023325609763968e-05, + "loss": 0.0267, + "step": 227000 + }, + { + "epoch": 1.47, + "eval_cer": 0.9199240763755507, + "eval_loss": 0.020223721861839294, + "eval_runtime": 120.1186, + "eval_samples_per_second": 16.65, + "eval_steps_per_second": 4.163, + "step": 227000 + }, + { + "epoch": 1.47, + "learning_rate": 8.022357474328276e-05, + "loss": 0.0293, + "step": 227010 + }, + { + "epoch": 1.47, + "learning_rate": 8.021389338892581e-05, + "loss": 0.0351, + "step": 227020 + }, + { + "epoch": 1.47, + "learning_rate": 8.020421203456888e-05, + "loss": 0.0342, + "step": 227030 + }, + { + "epoch": 1.47, + "learning_rate": 8.019453068021196e-05, + "loss": 0.0375, + "step": 227040 + }, + { + "epoch": 1.47, + "learning_rate": 8.018484932585501e-05, + "loss": 0.0237, + "step": 227050 + }, + { + "epoch": 1.47, + "learning_rate": 8.017516797149808e-05, + "loss": 0.0317, + "step": 227060 + }, + { + "epoch": 1.47, + "learning_rate": 8.016548661714116e-05, + "loss": 0.0276, + "step": 227070 + }, + { + "epoch": 1.47, + "learning_rate": 8.015580526278422e-05, + "loss": 0.0258, + "step": 227080 + }, + { + "epoch": 1.47, + "learning_rate": 8.014612390842729e-05, + "loss": 0.0287, + "step": 227090 + }, + { + "epoch": 1.47, + "learning_rate": 8.013644255407036e-05, + "loss": 0.0214, + "step": 227100 + }, + { + "epoch": 1.47, + "learning_rate": 8.012676119971344e-05, + "loss": 0.0253, + "step": 227110 + }, + { + "epoch": 1.47, + "learning_rate": 8.011707984535649e-05, + "loss": 0.0298, + "step": 227120 + }, + { + "epoch": 1.47, + "learning_rate": 8.010739849099955e-05, + "loss": 0.0258, + "step": 227130 + }, + { + "epoch": 1.47, + "learning_rate": 8.009771713664263e-05, + "loss": 0.0337, + "step": 227140 + }, + { + "epoch": 1.47, + "learning_rate": 8.00880357822857e-05, + "loss": 0.0277, + "step": 227150 + }, + { + "epoch": 1.47, + "learning_rate": 8.007835442792875e-05, + "loss": 0.0291, + "step": 227160 + }, + { + "epoch": 1.47, + "learning_rate": 8.006867307357183e-05, + "loss": 0.0274, + "step": 227170 + }, + { + "epoch": 1.47, + "learning_rate": 8.00589917192149e-05, + "loss": 0.0289, + "step": 227180 + }, + { + "epoch": 1.47, + "learning_rate": 8.004931036485796e-05, + "loss": 0.0271, + "step": 227190 + }, + { + "epoch": 1.47, + "learning_rate": 8.003962901050103e-05, + "loss": 0.0287, + "step": 227200 + }, + { + "epoch": 1.47, + "learning_rate": 8.002994765614411e-05, + "loss": 0.0262, + "step": 227210 + }, + { + "epoch": 1.47, + "learning_rate": 8.002026630178718e-05, + "loss": 0.0281, + "step": 227220 + }, + { + "epoch": 1.47, + "learning_rate": 8.001058494743023e-05, + "loss": 0.0254, + "step": 227230 + }, + { + "epoch": 1.47, + "learning_rate": 8.000090359307331e-05, + "loss": 0.0267, + "step": 227240 + }, + { + "epoch": 1.47, + "learning_rate": 7.999122223871638e-05, + "loss": 0.0283, + "step": 227250 + }, + { + "epoch": 1.47, + "learning_rate": 7.998154088435943e-05, + "loss": 0.026, + "step": 227260 + }, + { + "epoch": 1.47, + "learning_rate": 7.997185953000251e-05, + "loss": 0.0289, + "step": 227270 + }, + { + "epoch": 1.47, + "learning_rate": 7.996217817564557e-05, + "loss": 0.0308, + "step": 227280 + }, + { + "epoch": 1.47, + "learning_rate": 7.995249682128865e-05, + "loss": 0.0327, + "step": 227290 + }, + { + "epoch": 1.47, + "learning_rate": 7.994281546693171e-05, + "loss": 0.0269, + "step": 227300 + }, + { + "epoch": 1.47, + "learning_rate": 7.993313411257479e-05, + "loss": 0.0282, + "step": 227310 + }, + { + "epoch": 1.47, + "learning_rate": 7.992345275821785e-05, + "loss": 0.0253, + "step": 227320 + }, + { + "epoch": 1.47, + "learning_rate": 7.99137714038609e-05, + "loss": 0.0364, + "step": 227330 + }, + { + "epoch": 1.47, + "learning_rate": 7.990409004950399e-05, + "loss": 0.0239, + "step": 227340 + }, + { + "epoch": 1.47, + "learning_rate": 7.989440869514705e-05, + "loss": 0.0235, + "step": 227350 + }, + { + "epoch": 1.47, + "learning_rate": 7.988472734079013e-05, + "loss": 0.0241, + "step": 227360 + }, + { + "epoch": 1.47, + "learning_rate": 7.987504598643318e-05, + "loss": 0.0228, + "step": 227370 + }, + { + "epoch": 1.47, + "learning_rate": 7.986536463207625e-05, + "loss": 0.0338, + "step": 227380 + }, + { + "epoch": 1.47, + "learning_rate": 7.985568327771933e-05, + "loss": 0.0249, + "step": 227390 + }, + { + "epoch": 1.47, + "learning_rate": 7.984600192336238e-05, + "loss": 0.0321, + "step": 227400 + }, + { + "epoch": 1.47, + "learning_rate": 7.983632056900546e-05, + "loss": 0.0292, + "step": 227410 + }, + { + "epoch": 1.47, + "learning_rate": 7.982663921464853e-05, + "loss": 0.0323, + "step": 227420 + }, + { + "epoch": 1.47, + "learning_rate": 7.981695786029161e-05, + "loss": 0.0295, + "step": 227430 + }, + { + "epoch": 1.47, + "learning_rate": 7.980727650593466e-05, + "loss": 0.0289, + "step": 227440 + }, + { + "epoch": 1.47, + "learning_rate": 7.979759515157773e-05, + "loss": 0.0276, + "step": 227450 + }, + { + "epoch": 1.47, + "learning_rate": 7.978791379722081e-05, + "loss": 0.0268, + "step": 227460 + }, + { + "epoch": 1.47, + "learning_rate": 7.977823244286386e-05, + "loss": 0.0235, + "step": 227470 + }, + { + "epoch": 1.47, + "learning_rate": 7.976855108850693e-05, + "loss": 0.0294, + "step": 227480 + }, + { + "epoch": 1.47, + "learning_rate": 7.975886973415e-05, + "loss": 0.0268, + "step": 227490 + }, + { + "epoch": 1.47, + "learning_rate": 7.974918837979307e-05, + "loss": 0.0261, + "step": 227500 + }, + { + "epoch": 1.47, + "learning_rate": 7.973950702543614e-05, + "loss": 0.0298, + "step": 227510 + }, + { + "epoch": 1.47, + "learning_rate": 7.97298256710792e-05, + "loss": 0.0226, + "step": 227520 + }, + { + "epoch": 1.47, + "learning_rate": 7.972014431672228e-05, + "loss": 0.0301, + "step": 227530 + }, + { + "epoch": 1.47, + "learning_rate": 7.971046296236534e-05, + "loss": 0.0259, + "step": 227540 + }, + { + "epoch": 1.47, + "learning_rate": 7.97007816080084e-05, + "loss": 0.0275, + "step": 227550 + }, + { + "epoch": 1.47, + "learning_rate": 7.969110025365148e-05, + "loss": 0.0292, + "step": 227560 + }, + { + "epoch": 1.47, + "learning_rate": 7.968141889929455e-05, + "loss": 0.0312, + "step": 227570 + }, + { + "epoch": 1.47, + "learning_rate": 7.96717375449376e-05, + "loss": 0.0362, + "step": 227580 + }, + { + "epoch": 1.47, + "learning_rate": 7.966205619058068e-05, + "loss": 0.0274, + "step": 227590 + }, + { + "epoch": 1.47, + "learning_rate": 7.965237483622375e-05, + "loss": 0.0301, + "step": 227600 + }, + { + "epoch": 1.47, + "learning_rate": 7.964269348186681e-05, + "loss": 0.0242, + "step": 227610 + }, + { + "epoch": 1.47, + "learning_rate": 7.963301212750988e-05, + "loss": 0.0264, + "step": 227620 + }, + { + "epoch": 1.47, + "learning_rate": 7.962333077315296e-05, + "loss": 0.0286, + "step": 227630 + }, + { + "epoch": 1.47, + "learning_rate": 7.961364941879603e-05, + "loss": 0.0256, + "step": 227640 + }, + { + "epoch": 1.47, + "learning_rate": 7.960396806443908e-05, + "loss": 0.0244, + "step": 227650 + }, + { + "epoch": 1.47, + "learning_rate": 7.959428671008216e-05, + "loss": 0.0268, + "step": 227660 + }, + { + "epoch": 1.47, + "learning_rate": 7.958460535572523e-05, + "loss": 0.0325, + "step": 227670 + }, + { + "epoch": 1.47, + "learning_rate": 7.957492400136828e-05, + "loss": 0.0296, + "step": 227680 + }, + { + "epoch": 1.47, + "learning_rate": 7.956524264701136e-05, + "loss": 0.0314, + "step": 227690 + }, + { + "epoch": 1.47, + "learning_rate": 7.955556129265442e-05, + "loss": 0.0275, + "step": 227700 + }, + { + "epoch": 1.47, + "learning_rate": 7.95458799382975e-05, + "loss": 0.0312, + "step": 227710 + }, + { + "epoch": 1.47, + "learning_rate": 7.953619858394056e-05, + "loss": 0.0255, + "step": 227720 + }, + { + "epoch": 1.47, + "learning_rate": 7.952651722958364e-05, + "loss": 0.0299, + "step": 227730 + }, + { + "epoch": 1.47, + "learning_rate": 7.95168358752267e-05, + "loss": 0.0269, + "step": 227740 + }, + { + "epoch": 1.47, + "learning_rate": 7.950715452086976e-05, + "loss": 0.0331, + "step": 227750 + }, + { + "epoch": 1.47, + "learning_rate": 7.949747316651284e-05, + "loss": 0.0236, + "step": 227760 + }, + { + "epoch": 1.47, + "learning_rate": 7.94877918121559e-05, + "loss": 0.0301, + "step": 227770 + }, + { + "epoch": 1.47, + "learning_rate": 7.947811045779898e-05, + "loss": 0.0287, + "step": 227780 + }, + { + "epoch": 1.47, + "learning_rate": 7.946842910344203e-05, + "loss": 0.0252, + "step": 227790 + }, + { + "epoch": 1.47, + "learning_rate": 7.94587477490851e-05, + "loss": 0.0287, + "step": 227800 + }, + { + "epoch": 1.47, + "learning_rate": 7.944906639472818e-05, + "loss": 0.0269, + "step": 227810 + }, + { + "epoch": 1.47, + "learning_rate": 7.943938504037123e-05, + "loss": 0.0227, + "step": 227820 + }, + { + "epoch": 1.47, + "learning_rate": 7.942970368601431e-05, + "loss": 0.0306, + "step": 227830 + }, + { + "epoch": 1.47, + "learning_rate": 7.942002233165738e-05, + "loss": 0.0285, + "step": 227840 + }, + { + "epoch": 1.47, + "learning_rate": 7.941034097730045e-05, + "loss": 0.0285, + "step": 227850 + }, + { + "epoch": 1.47, + "learning_rate": 7.940065962294351e-05, + "loss": 0.0283, + "step": 227860 + }, + { + "epoch": 1.47, + "learning_rate": 7.939097826858658e-05, + "loss": 0.0283, + "step": 227870 + }, + { + "epoch": 1.47, + "learning_rate": 7.938129691422966e-05, + "loss": 0.0255, + "step": 227880 + }, + { + "epoch": 1.47, + "learning_rate": 7.937161555987271e-05, + "loss": 0.0319, + "step": 227890 + }, + { + "epoch": 1.47, + "learning_rate": 7.936193420551578e-05, + "loss": 0.0266, + "step": 227900 + }, + { + "epoch": 1.47, + "learning_rate": 7.935225285115886e-05, + "loss": 0.0279, + "step": 227910 + }, + { + "epoch": 1.47, + "learning_rate": 7.934257149680192e-05, + "loss": 0.0227, + "step": 227920 + }, + { + "epoch": 1.47, + "learning_rate": 7.933289014244499e-05, + "loss": 0.0304, + "step": 227930 + }, + { + "epoch": 1.47, + "learning_rate": 7.932320878808805e-05, + "loss": 0.0335, + "step": 227940 + }, + { + "epoch": 1.47, + "learning_rate": 7.931352743373112e-05, + "loss": 0.0252, + "step": 227950 + }, + { + "epoch": 1.47, + "learning_rate": 7.930384607937419e-05, + "loss": 0.0292, + "step": 227960 + }, + { + "epoch": 1.47, + "learning_rate": 7.929416472501725e-05, + "loss": 0.0236, + "step": 227970 + }, + { + "epoch": 1.47, + "learning_rate": 7.928448337066033e-05, + "loss": 0.0271, + "step": 227980 + }, + { + "epoch": 1.47, + "learning_rate": 7.92748020163034e-05, + "loss": 0.0315, + "step": 227990 + }, + { + "epoch": 1.47, + "learning_rate": 7.926512066194645e-05, + "loss": 0.0264, + "step": 228000 + }, + { + "epoch": 1.47, + "eval_cer": 0.9198535758671337, + "eval_loss": 0.020223427563905716, + "eval_runtime": 119.9893, + "eval_samples_per_second": 16.668, + "eval_steps_per_second": 4.167, + "step": 228000 + }, + { + "epoch": 1.47, + "learning_rate": 7.925543930758953e-05, + "loss": 0.0268, + "step": 228010 + }, + { + "epoch": 1.47, + "learning_rate": 7.92457579532326e-05, + "loss": 0.0279, + "step": 228020 + }, + { + "epoch": 1.47, + "learning_rate": 7.923607659887566e-05, + "loss": 0.031, + "step": 228030 + }, + { + "epoch": 1.47, + "learning_rate": 7.922639524451873e-05, + "loss": 0.0301, + "step": 228040 + }, + { + "epoch": 1.47, + "learning_rate": 7.92167138901618e-05, + "loss": 0.0332, + "step": 228050 + }, + { + "epoch": 1.47, + "learning_rate": 7.920703253580488e-05, + "loss": 0.029, + "step": 228060 + }, + { + "epoch": 1.47, + "learning_rate": 7.919735118144793e-05, + "loss": 0.0369, + "step": 228070 + }, + { + "epoch": 1.47, + "learning_rate": 7.918766982709101e-05, + "loss": 0.0235, + "step": 228080 + }, + { + "epoch": 1.47, + "learning_rate": 7.917798847273408e-05, + "loss": 0.0306, + "step": 228090 + }, + { + "epoch": 1.47, + "learning_rate": 7.916830711837713e-05, + "loss": 0.0289, + "step": 228100 + }, + { + "epoch": 1.47, + "learning_rate": 7.915862576402021e-05, + "loss": 0.0275, + "step": 228110 + }, + { + "epoch": 1.47, + "learning_rate": 7.914894440966327e-05, + "loss": 0.0258, + "step": 228120 + }, + { + "epoch": 1.47, + "learning_rate": 7.913926305530635e-05, + "loss": 0.0264, + "step": 228130 + }, + { + "epoch": 1.47, + "learning_rate": 7.91295817009494e-05, + "loss": 0.0282, + "step": 228140 + }, + { + "epoch": 1.47, + "learning_rate": 7.911990034659247e-05, + "loss": 0.0304, + "step": 228150 + }, + { + "epoch": 1.47, + "learning_rate": 7.911021899223555e-05, + "loss": 0.0267, + "step": 228160 + }, + { + "epoch": 1.47, + "learning_rate": 7.91005376378786e-05, + "loss": 0.0287, + "step": 228170 + }, + { + "epoch": 1.47, + "learning_rate": 7.909085628352169e-05, + "loss": 0.03, + "step": 228180 + }, + { + "epoch": 1.47, + "learning_rate": 7.908117492916475e-05, + "loss": 0.0293, + "step": 228190 + }, + { + "epoch": 1.47, + "learning_rate": 7.907149357480783e-05, + "loss": 0.0274, + "step": 228200 + }, + { + "epoch": 1.47, + "learning_rate": 7.906181222045088e-05, + "loss": 0.0325, + "step": 228210 + }, + { + "epoch": 1.47, + "learning_rate": 7.905213086609395e-05, + "loss": 0.0246, + "step": 228220 + }, + { + "epoch": 1.47, + "learning_rate": 7.904244951173703e-05, + "loss": 0.0284, + "step": 228230 + }, + { + "epoch": 1.47, + "learning_rate": 7.903276815738008e-05, + "loss": 0.0245, + "step": 228240 + }, + { + "epoch": 1.47, + "learning_rate": 7.902308680302315e-05, + "loss": 0.0264, + "step": 228250 + }, + { + "epoch": 1.47, + "learning_rate": 7.901340544866623e-05, + "loss": 0.0239, + "step": 228260 + }, + { + "epoch": 1.47, + "learning_rate": 7.90037240943093e-05, + "loss": 0.0295, + "step": 228270 + }, + { + "epoch": 1.47, + "learning_rate": 7.899404273995236e-05, + "loss": 0.0242, + "step": 228280 + }, + { + "epoch": 1.47, + "learning_rate": 7.898436138559543e-05, + "loss": 0.0231, + "step": 228290 + }, + { + "epoch": 1.47, + "learning_rate": 7.897468003123851e-05, + "loss": 0.0276, + "step": 228300 + }, + { + "epoch": 1.47, + "learning_rate": 7.896499867688156e-05, + "loss": 0.0281, + "step": 228310 + }, + { + "epoch": 1.47, + "learning_rate": 7.895531732252463e-05, + "loss": 0.0217, + "step": 228320 + }, + { + "epoch": 1.47, + "learning_rate": 7.89456359681677e-05, + "loss": 0.0292, + "step": 228330 + }, + { + "epoch": 1.47, + "learning_rate": 7.893595461381077e-05, + "loss": 0.0242, + "step": 228340 + }, + { + "epoch": 1.47, + "learning_rate": 7.892627325945382e-05, + "loss": 0.0275, + "step": 228350 + }, + { + "epoch": 1.47, + "learning_rate": 7.89165919050969e-05, + "loss": 0.022, + "step": 228360 + }, + { + "epoch": 1.47, + "learning_rate": 7.890691055073997e-05, + "loss": 0.0265, + "step": 228370 + }, + { + "epoch": 1.47, + "learning_rate": 7.889722919638304e-05, + "loss": 0.0317, + "step": 228380 + }, + { + "epoch": 1.47, + "learning_rate": 7.88875478420261e-05, + "loss": 0.0251, + "step": 228390 + }, + { + "epoch": 1.47, + "learning_rate": 7.887786648766918e-05, + "loss": 0.0275, + "step": 228400 + }, + { + "epoch": 1.47, + "learning_rate": 7.886818513331225e-05, + "loss": 0.0285, + "step": 228410 + }, + { + "epoch": 1.47, + "learning_rate": 7.88585037789553e-05, + "loss": 0.0232, + "step": 228420 + }, + { + "epoch": 1.47, + "learning_rate": 7.884882242459838e-05, + "loss": 0.029, + "step": 228430 + }, + { + "epoch": 1.47, + "learning_rate": 7.883914107024145e-05, + "loss": 0.026, + "step": 228440 + }, + { + "epoch": 1.47, + "learning_rate": 7.882945971588451e-05, + "loss": 0.0251, + "step": 228450 + }, + { + "epoch": 1.47, + "learning_rate": 7.881977836152758e-05, + "loss": 0.0265, + "step": 228460 + }, + { + "epoch": 1.47, + "learning_rate": 7.881009700717065e-05, + "loss": 0.0258, + "step": 228470 + }, + { + "epoch": 1.47, + "learning_rate": 7.880041565281373e-05, + "loss": 0.0289, + "step": 228480 + }, + { + "epoch": 1.47, + "learning_rate": 7.879073429845678e-05, + "loss": 0.0329, + "step": 228490 + }, + { + "epoch": 1.47, + "learning_rate": 7.878105294409986e-05, + "loss": 0.0273, + "step": 228500 + }, + { + "epoch": 1.47, + "learning_rate": 7.877137158974293e-05, + "loss": 0.0301, + "step": 228510 + }, + { + "epoch": 1.47, + "learning_rate": 7.876169023538598e-05, + "loss": 0.0261, + "step": 228520 + }, + { + "epoch": 1.47, + "learning_rate": 7.875200888102906e-05, + "loss": 0.0264, + "step": 228530 + }, + { + "epoch": 1.48, + "learning_rate": 7.874232752667212e-05, + "loss": 0.026, + "step": 228540 + }, + { + "epoch": 1.48, + "learning_rate": 7.87326461723152e-05, + "loss": 0.0275, + "step": 228550 + }, + { + "epoch": 1.48, + "learning_rate": 7.872296481795826e-05, + "loss": 0.0295, + "step": 228560 + }, + { + "epoch": 1.48, + "learning_rate": 7.871328346360132e-05, + "loss": 0.0258, + "step": 228570 + }, + { + "epoch": 1.48, + "learning_rate": 7.87036021092444e-05, + "loss": 0.0284, + "step": 228580 + }, + { + "epoch": 1.48, + "learning_rate": 7.869392075488746e-05, + "loss": 0.024, + "step": 228590 + }, + { + "epoch": 1.48, + "learning_rate": 7.868423940053054e-05, + "loss": 0.0252, + "step": 228600 + }, + { + "epoch": 1.48, + "learning_rate": 7.86745580461736e-05, + "loss": 0.0299, + "step": 228610 + }, + { + "epoch": 1.48, + "learning_rate": 7.866487669181668e-05, + "loss": 0.0239, + "step": 228620 + }, + { + "epoch": 1.48, + "learning_rate": 7.865519533745973e-05, + "loss": 0.0266, + "step": 228630 + }, + { + "epoch": 1.48, + "learning_rate": 7.86455139831028e-05, + "loss": 0.0247, + "step": 228640 + }, + { + "epoch": 1.48, + "learning_rate": 7.863583262874588e-05, + "loss": 0.0285, + "step": 228650 + }, + { + "epoch": 1.48, + "learning_rate": 7.862615127438893e-05, + "loss": 0.0311, + "step": 228660 + }, + { + "epoch": 1.48, + "learning_rate": 7.8616469920032e-05, + "loss": 0.029, + "step": 228670 + }, + { + "epoch": 1.48, + "learning_rate": 7.860678856567508e-05, + "loss": 0.0292, + "step": 228680 + }, + { + "epoch": 1.48, + "learning_rate": 7.859710721131814e-05, + "loss": 0.0311, + "step": 228690 + }, + { + "epoch": 1.48, + "learning_rate": 7.858742585696121e-05, + "loss": 0.026, + "step": 228700 + }, + { + "epoch": 1.48, + "learning_rate": 7.857774450260428e-05, + "loss": 0.0304, + "step": 228710 + }, + { + "epoch": 1.48, + "learning_rate": 7.856806314824736e-05, + "loss": 0.0296, + "step": 228720 + }, + { + "epoch": 1.48, + "learning_rate": 7.855838179389041e-05, + "loss": 0.029, + "step": 228730 + }, + { + "epoch": 1.48, + "learning_rate": 7.854870043953348e-05, + "loss": 0.0288, + "step": 228740 + }, + { + "epoch": 1.48, + "learning_rate": 7.853901908517656e-05, + "loss": 0.0265, + "step": 228750 + }, + { + "epoch": 1.48, + "learning_rate": 7.852933773081962e-05, + "loss": 0.0255, + "step": 228760 + }, + { + "epoch": 1.48, + "learning_rate": 7.851965637646267e-05, + "loss": 0.0279, + "step": 228770 + }, + { + "epoch": 1.48, + "learning_rate": 7.850997502210575e-05, + "loss": 0.0314, + "step": 228780 + }, + { + "epoch": 1.48, + "learning_rate": 7.850029366774882e-05, + "loss": 0.0369, + "step": 228790 + }, + { + "epoch": 1.48, + "learning_rate": 7.849061231339189e-05, + "loss": 0.0284, + "step": 228800 + }, + { + "epoch": 1.48, + "learning_rate": 7.848093095903495e-05, + "loss": 0.0323, + "step": 228810 + }, + { + "epoch": 1.48, + "learning_rate": 7.847124960467803e-05, + "loss": 0.0302, + "step": 228820 + }, + { + "epoch": 1.48, + "learning_rate": 7.84615682503211e-05, + "loss": 0.0244, + "step": 228830 + }, + { + "epoch": 1.48, + "learning_rate": 7.845188689596415e-05, + "loss": 0.026, + "step": 228840 + }, + { + "epoch": 1.48, + "learning_rate": 7.844220554160723e-05, + "loss": 0.0281, + "step": 228850 + }, + { + "epoch": 1.48, + "learning_rate": 7.84325241872503e-05, + "loss": 0.0354, + "step": 228860 + }, + { + "epoch": 1.48, + "learning_rate": 7.842284283289335e-05, + "loss": 0.0344, + "step": 228870 + }, + { + "epoch": 1.48, + "learning_rate": 7.841316147853643e-05, + "loss": 0.0257, + "step": 228880 + }, + { + "epoch": 1.48, + "learning_rate": 7.84034801241795e-05, + "loss": 0.0365, + "step": 228890 + }, + { + "epoch": 1.48, + "learning_rate": 7.839379876982258e-05, + "loss": 0.0289, + "step": 228900 + }, + { + "epoch": 1.48, + "learning_rate": 7.838411741546563e-05, + "loss": 0.0287, + "step": 228910 + }, + { + "epoch": 1.48, + "learning_rate": 7.837443606110871e-05, + "loss": 0.0269, + "step": 228920 + }, + { + "epoch": 1.48, + "learning_rate": 7.836475470675178e-05, + "loss": 0.0244, + "step": 228930 + }, + { + "epoch": 1.48, + "learning_rate": 7.835507335239483e-05, + "loss": 0.027, + "step": 228940 + }, + { + "epoch": 1.48, + "learning_rate": 7.834539199803791e-05, + "loss": 0.0255, + "step": 228950 + }, + { + "epoch": 1.48, + "learning_rate": 7.833571064368097e-05, + "loss": 0.0246, + "step": 228960 + }, + { + "epoch": 1.48, + "learning_rate": 7.832602928932403e-05, + "loss": 0.0282, + "step": 228970 + }, + { + "epoch": 1.48, + "learning_rate": 7.83163479349671e-05, + "loss": 0.0264, + "step": 228980 + }, + { + "epoch": 1.48, + "learning_rate": 7.830666658061017e-05, + "loss": 0.0275, + "step": 228990 + }, + { + "epoch": 1.48, + "learning_rate": 7.829698522625325e-05, + "loss": 0.031, + "step": 229000 + }, + { + "epoch": 1.48, + "eval_cer": 0.9198644220991978, + "eval_loss": 0.020123105496168137, + "eval_runtime": 120.4002, + "eval_samples_per_second": 16.611, + "eval_steps_per_second": 4.153, + "step": 229000 + }, + { + "epoch": 1.48, + "learning_rate": 7.82873038718963e-05, + "loss": 0.0289, + "step": 229010 + }, + { + "epoch": 1.48, + "learning_rate": 7.827762251753938e-05, + "loss": 0.0215, + "step": 229020 + }, + { + "epoch": 1.48, + "learning_rate": 7.826794116318245e-05, + "loss": 0.0274, + "step": 229030 + }, + { + "epoch": 1.48, + "learning_rate": 7.82582598088255e-05, + "loss": 0.0282, + "step": 229040 + }, + { + "epoch": 1.48, + "learning_rate": 7.824857845446858e-05, + "loss": 0.0269, + "step": 229050 + }, + { + "epoch": 1.48, + "learning_rate": 7.823889710011165e-05, + "loss": 0.0321, + "step": 229060 + }, + { + "epoch": 1.48, + "learning_rate": 7.822921574575473e-05, + "loss": 0.0245, + "step": 229070 + }, + { + "epoch": 1.48, + "learning_rate": 7.821953439139778e-05, + "loss": 0.0239, + "step": 229080 + }, + { + "epoch": 1.48, + "learning_rate": 7.820985303704085e-05, + "loss": 0.0281, + "step": 229090 + }, + { + "epoch": 1.48, + "learning_rate": 7.820017168268393e-05, + "loss": 0.0311, + "step": 229100 + }, + { + "epoch": 1.48, + "learning_rate": 7.819049032832698e-05, + "loss": 0.0245, + "step": 229110 + }, + { + "epoch": 1.48, + "learning_rate": 7.818080897397006e-05, + "loss": 0.0256, + "step": 229120 + }, + { + "epoch": 1.48, + "learning_rate": 7.817112761961313e-05, + "loss": 0.0281, + "step": 229130 + }, + { + "epoch": 1.48, + "learning_rate": 7.816144626525621e-05, + "loss": 0.0271, + "step": 229140 + }, + { + "epoch": 1.48, + "learning_rate": 7.815176491089926e-05, + "loss": 0.0332, + "step": 229150 + }, + { + "epoch": 1.48, + "learning_rate": 7.814208355654233e-05, + "loss": 0.0288, + "step": 229160 + }, + { + "epoch": 1.48, + "learning_rate": 7.81324022021854e-05, + "loss": 0.027, + "step": 229170 + }, + { + "epoch": 1.48, + "learning_rate": 7.812272084782846e-05, + "loss": 0.0263, + "step": 229180 + }, + { + "epoch": 1.48, + "learning_rate": 7.811303949347152e-05, + "loss": 0.0256, + "step": 229190 + }, + { + "epoch": 1.48, + "learning_rate": 7.81033581391146e-05, + "loss": 0.028, + "step": 229200 + }, + { + "epoch": 1.48, + "learning_rate": 7.809367678475767e-05, + "loss": 0.0336, + "step": 229210 + }, + { + "epoch": 1.48, + "learning_rate": 7.808399543040074e-05, + "loss": 0.0305, + "step": 229220 + }, + { + "epoch": 1.48, + "learning_rate": 7.80743140760438e-05, + "loss": 0.0285, + "step": 229230 + }, + { + "epoch": 1.48, + "learning_rate": 7.806463272168688e-05, + "loss": 0.0266, + "step": 229240 + }, + { + "epoch": 1.48, + "learning_rate": 7.805495136732994e-05, + "loss": 0.0282, + "step": 229250 + }, + { + "epoch": 1.48, + "learning_rate": 7.8045270012973e-05, + "loss": 0.0267, + "step": 229260 + }, + { + "epoch": 1.48, + "learning_rate": 7.803558865861608e-05, + "loss": 0.0287, + "step": 229270 + }, + { + "epoch": 1.48, + "learning_rate": 7.802590730425915e-05, + "loss": 0.0274, + "step": 229280 + }, + { + "epoch": 1.48, + "learning_rate": 7.80162259499022e-05, + "loss": 0.0259, + "step": 229290 + }, + { + "epoch": 1.48, + "learning_rate": 7.800654459554528e-05, + "loss": 0.0252, + "step": 229300 + }, + { + "epoch": 1.48, + "learning_rate": 7.799686324118835e-05, + "loss": 0.0227, + "step": 229310 + }, + { + "epoch": 1.48, + "learning_rate": 7.798718188683141e-05, + "loss": 0.0248, + "step": 229320 + }, + { + "epoch": 1.48, + "learning_rate": 7.797750053247448e-05, + "loss": 0.026, + "step": 229330 + }, + { + "epoch": 1.48, + "learning_rate": 7.796781917811756e-05, + "loss": 0.0253, + "step": 229340 + }, + { + "epoch": 1.48, + "learning_rate": 7.795813782376062e-05, + "loss": 0.0269, + "step": 229350 + }, + { + "epoch": 1.48, + "learning_rate": 7.794845646940368e-05, + "loss": 0.0241, + "step": 229360 + }, + { + "epoch": 1.48, + "learning_rate": 7.793877511504676e-05, + "loss": 0.0294, + "step": 229370 + }, + { + "epoch": 1.48, + "learning_rate": 7.792909376068982e-05, + "loss": 0.022, + "step": 229380 + }, + { + "epoch": 1.48, + "learning_rate": 7.791941240633288e-05, + "loss": 0.0276, + "step": 229390 + }, + { + "epoch": 1.48, + "learning_rate": 7.790973105197596e-05, + "loss": 0.0244, + "step": 229400 + }, + { + "epoch": 1.48, + "learning_rate": 7.790004969761902e-05, + "loss": 0.0258, + "step": 229410 + }, + { + "epoch": 1.48, + "learning_rate": 7.78903683432621e-05, + "loss": 0.0258, + "step": 229420 + }, + { + "epoch": 1.48, + "learning_rate": 7.788068698890515e-05, + "loss": 0.0285, + "step": 229430 + }, + { + "epoch": 1.48, + "learning_rate": 7.787100563454823e-05, + "loss": 0.0239, + "step": 229440 + }, + { + "epoch": 1.48, + "learning_rate": 7.78613242801913e-05, + "loss": 0.0297, + "step": 229450 + }, + { + "epoch": 1.48, + "learning_rate": 7.785164292583435e-05, + "loss": 0.0265, + "step": 229460 + }, + { + "epoch": 1.48, + "learning_rate": 7.784196157147743e-05, + "loss": 0.0235, + "step": 229470 + }, + { + "epoch": 1.48, + "learning_rate": 7.78322802171205e-05, + "loss": 0.0285, + "step": 229480 + }, + { + "epoch": 1.48, + "learning_rate": 7.782259886276358e-05, + "loss": 0.0273, + "step": 229490 + }, + { + "epoch": 1.48, + "learning_rate": 7.781291750840663e-05, + "loss": 0.0288, + "step": 229500 + }, + { + "epoch": 1.48, + "learning_rate": 7.78032361540497e-05, + "loss": 0.0247, + "step": 229510 + }, + { + "epoch": 1.48, + "learning_rate": 7.779355479969278e-05, + "loss": 0.0266, + "step": 229520 + }, + { + "epoch": 1.48, + "learning_rate": 7.778387344533583e-05, + "loss": 0.0239, + "step": 229530 + }, + { + "epoch": 1.48, + "learning_rate": 7.777419209097891e-05, + "loss": 0.0279, + "step": 229540 + }, + { + "epoch": 1.48, + "learning_rate": 7.776451073662198e-05, + "loss": 0.0285, + "step": 229550 + }, + { + "epoch": 1.48, + "learning_rate": 7.775482938226504e-05, + "loss": 0.0244, + "step": 229560 + }, + { + "epoch": 1.48, + "learning_rate": 7.774514802790811e-05, + "loss": 0.0278, + "step": 229570 + }, + { + "epoch": 1.48, + "learning_rate": 7.773546667355118e-05, + "loss": 0.0291, + "step": 229580 + }, + { + "epoch": 1.48, + "learning_rate": 7.772578531919426e-05, + "loss": 0.0254, + "step": 229590 + }, + { + "epoch": 1.48, + "learning_rate": 7.771610396483731e-05, + "loss": 0.0331, + "step": 229600 + }, + { + "epoch": 1.48, + "learning_rate": 7.770642261048037e-05, + "loss": 0.0272, + "step": 229610 + }, + { + "epoch": 1.48, + "learning_rate": 7.769674125612345e-05, + "loss": 0.0273, + "step": 229620 + }, + { + "epoch": 1.48, + "learning_rate": 7.768705990176652e-05, + "loss": 0.0264, + "step": 229630 + }, + { + "epoch": 1.48, + "learning_rate": 7.767737854740959e-05, + "loss": 0.0261, + "step": 229640 + }, + { + "epoch": 1.48, + "learning_rate": 7.766769719305265e-05, + "loss": 0.0248, + "step": 229650 + }, + { + "epoch": 1.48, + "learning_rate": 7.765801583869572e-05, + "loss": 0.0282, + "step": 229660 + }, + { + "epoch": 1.48, + "learning_rate": 7.764833448433879e-05, + "loss": 0.0252, + "step": 229670 + }, + { + "epoch": 1.48, + "learning_rate": 7.763865312998185e-05, + "loss": 0.0277, + "step": 229680 + }, + { + "epoch": 1.48, + "learning_rate": 7.762897177562493e-05, + "loss": 0.0307, + "step": 229690 + }, + { + "epoch": 1.48, + "learning_rate": 7.7619290421268e-05, + "loss": 0.026, + "step": 229700 + }, + { + "epoch": 1.48, + "learning_rate": 7.760960906691105e-05, + "loss": 0.0263, + "step": 229710 + }, + { + "epoch": 1.48, + "learning_rate": 7.759992771255413e-05, + "loss": 0.0278, + "step": 229720 + }, + { + "epoch": 1.48, + "learning_rate": 7.75902463581972e-05, + "loss": 0.0274, + "step": 229730 + }, + { + "epoch": 1.48, + "learning_rate": 7.758056500384026e-05, + "loss": 0.0256, + "step": 229740 + }, + { + "epoch": 1.48, + "learning_rate": 7.757088364948333e-05, + "loss": 0.0288, + "step": 229750 + }, + { + "epoch": 1.48, + "learning_rate": 7.75612022951264e-05, + "loss": 0.0252, + "step": 229760 + }, + { + "epoch": 1.48, + "learning_rate": 7.755152094076947e-05, + "loss": 0.0283, + "step": 229770 + }, + { + "epoch": 1.48, + "learning_rate": 7.754183958641253e-05, + "loss": 0.0241, + "step": 229780 + }, + { + "epoch": 1.48, + "learning_rate": 7.753215823205561e-05, + "loss": 0.0246, + "step": 229790 + }, + { + "epoch": 1.48, + "learning_rate": 7.752247687769867e-05, + "loss": 0.0262, + "step": 229800 + }, + { + "epoch": 1.48, + "learning_rate": 7.751279552334173e-05, + "loss": 0.0298, + "step": 229810 + }, + { + "epoch": 1.48, + "learning_rate": 7.75031141689848e-05, + "loss": 0.0279, + "step": 229820 + }, + { + "epoch": 1.48, + "learning_rate": 7.749343281462787e-05, + "loss": 0.0263, + "step": 229830 + }, + { + "epoch": 1.48, + "learning_rate": 7.748375146027095e-05, + "loss": 0.0296, + "step": 229840 + }, + { + "epoch": 1.48, + "learning_rate": 7.7474070105914e-05, + "loss": 0.0243, + "step": 229850 + }, + { + "epoch": 1.48, + "learning_rate": 7.746438875155707e-05, + "loss": 0.0302, + "step": 229860 + }, + { + "epoch": 1.48, + "learning_rate": 7.745470739720015e-05, + "loss": 0.0303, + "step": 229870 + }, + { + "epoch": 1.48, + "learning_rate": 7.74450260428432e-05, + "loss": 0.0286, + "step": 229880 + }, + { + "epoch": 1.48, + "learning_rate": 7.743534468848628e-05, + "loss": 0.0314, + "step": 229890 + }, + { + "epoch": 1.48, + "learning_rate": 7.742566333412935e-05, + "loss": 0.0299, + "step": 229900 + }, + { + "epoch": 1.48, + "learning_rate": 7.741598197977243e-05, + "loss": 0.0286, + "step": 229910 + }, + { + "epoch": 1.48, + "learning_rate": 7.740630062541548e-05, + "loss": 0.0274, + "step": 229920 + }, + { + "epoch": 1.48, + "learning_rate": 7.739661927105855e-05, + "loss": 0.0314, + "step": 229930 + }, + { + "epoch": 1.48, + "learning_rate": 7.738693791670163e-05, + "loss": 0.0245, + "step": 229940 + }, + { + "epoch": 1.48, + "learning_rate": 7.737725656234468e-05, + "loss": 0.0269, + "step": 229950 + }, + { + "epoch": 1.48, + "learning_rate": 7.736757520798775e-05, + "loss": 0.0443, + "step": 229960 + }, + { + "epoch": 1.48, + "learning_rate": 7.735789385363083e-05, + "loss": 0.0279, + "step": 229970 + }, + { + "epoch": 1.48, + "learning_rate": 7.734821249927389e-05, + "loss": 0.0248, + "step": 229980 + }, + { + "epoch": 1.48, + "learning_rate": 7.733853114491696e-05, + "loss": 0.0229, + "step": 229990 + }, + { + "epoch": 1.48, + "learning_rate": 7.732884979056003e-05, + "loss": 0.0273, + "step": 230000 + }, + { + "epoch": 1.48, + "eval_cer": 0.919877979889278, + "eval_loss": 0.019865069538354874, + "eval_runtime": 119.8796, + "eval_samples_per_second": 16.683, + "eval_steps_per_second": 4.171, + "step": 230000 + }, + { + "epoch": 1.48, + "learning_rate": 7.73191684362031e-05, + "loss": 0.0266, + "step": 230010 + }, + { + "epoch": 1.48, + "learning_rate": 7.730948708184616e-05, + "loss": 0.0322, + "step": 230020 + }, + { + "epoch": 1.48, + "learning_rate": 7.729980572748922e-05, + "loss": 0.022, + "step": 230030 + }, + { + "epoch": 1.48, + "learning_rate": 7.72901243731323e-05, + "loss": 0.0286, + "step": 230040 + }, + { + "epoch": 1.48, + "learning_rate": 7.728044301877537e-05, + "loss": 0.0245, + "step": 230050 + }, + { + "epoch": 1.48, + "learning_rate": 7.727076166441842e-05, + "loss": 0.0246, + "step": 230060 + }, + { + "epoch": 1.48, + "learning_rate": 7.72610803100615e-05, + "loss": 0.0279, + "step": 230070 + }, + { + "epoch": 1.48, + "learning_rate": 7.725139895570457e-05, + "loss": 0.0257, + "step": 230080 + }, + { + "epoch": 1.49, + "learning_rate": 7.724171760134764e-05, + "loss": 0.0219, + "step": 230090 + }, + { + "epoch": 1.49, + "learning_rate": 7.72320362469907e-05, + "loss": 0.0322, + "step": 230100 + }, + { + "epoch": 1.49, + "learning_rate": 7.722235489263378e-05, + "loss": 0.0363, + "step": 230110 + }, + { + "epoch": 1.49, + "learning_rate": 7.721267353827685e-05, + "loss": 0.0275, + "step": 230120 + }, + { + "epoch": 1.49, + "learning_rate": 7.72029921839199e-05, + "loss": 0.0309, + "step": 230130 + }, + { + "epoch": 1.49, + "learning_rate": 7.719331082956298e-05, + "loss": 0.0301, + "step": 230140 + }, + { + "epoch": 1.49, + "learning_rate": 7.718362947520605e-05, + "loss": 0.0275, + "step": 230150 + }, + { + "epoch": 1.49, + "learning_rate": 7.71739481208491e-05, + "loss": 0.0232, + "step": 230160 + }, + { + "epoch": 1.49, + "learning_rate": 7.716426676649218e-05, + "loss": 0.0222, + "step": 230170 + }, + { + "epoch": 1.49, + "learning_rate": 7.715458541213524e-05, + "loss": 0.0367, + "step": 230180 + }, + { + "epoch": 1.49, + "learning_rate": 7.714490405777832e-05, + "loss": 0.0309, + "step": 230190 + }, + { + "epoch": 1.49, + "learning_rate": 7.713522270342138e-05, + "loss": 0.0256, + "step": 230200 + }, + { + "epoch": 1.49, + "learning_rate": 7.712554134906446e-05, + "loss": 0.0282, + "step": 230210 + }, + { + "epoch": 1.49, + "learning_rate": 7.711585999470752e-05, + "loss": 0.0278, + "step": 230220 + }, + { + "epoch": 1.49, + "learning_rate": 7.710617864035058e-05, + "loss": 0.0283, + "step": 230230 + }, + { + "epoch": 1.49, + "learning_rate": 7.709649728599366e-05, + "loss": 0.0286, + "step": 230240 + }, + { + "epoch": 1.49, + "learning_rate": 7.708681593163672e-05, + "loss": 0.0311, + "step": 230250 + }, + { + "epoch": 1.49, + "learning_rate": 7.70771345772798e-05, + "loss": 0.0292, + "step": 230260 + }, + { + "epoch": 1.49, + "learning_rate": 7.706745322292285e-05, + "loss": 0.0299, + "step": 230270 + }, + { + "epoch": 1.49, + "learning_rate": 7.705777186856592e-05, + "loss": 0.0255, + "step": 230280 + }, + { + "epoch": 1.49, + "learning_rate": 7.7048090514209e-05, + "loss": 0.0267, + "step": 230290 + }, + { + "epoch": 1.49, + "learning_rate": 7.703840915985205e-05, + "loss": 0.027, + "step": 230300 + }, + { + "epoch": 1.49, + "learning_rate": 7.702872780549513e-05, + "loss": 0.0234, + "step": 230310 + }, + { + "epoch": 1.49, + "learning_rate": 7.70190464511382e-05, + "loss": 0.031, + "step": 230320 + }, + { + "epoch": 1.49, + "learning_rate": 7.700936509678128e-05, + "loss": 0.0334, + "step": 230330 + }, + { + "epoch": 1.49, + "learning_rate": 7.699968374242433e-05, + "loss": 0.0383, + "step": 230340 + }, + { + "epoch": 1.49, + "learning_rate": 7.69900023880674e-05, + "loss": 0.0265, + "step": 230350 + }, + { + "epoch": 1.49, + "learning_rate": 7.698032103371048e-05, + "loss": 0.023, + "step": 230360 + }, + { + "epoch": 1.49, + "learning_rate": 7.697063967935353e-05, + "loss": 0.0293, + "step": 230370 + }, + { + "epoch": 1.49, + "learning_rate": 7.69609583249966e-05, + "loss": 0.0271, + "step": 230380 + }, + { + "epoch": 1.49, + "learning_rate": 7.695127697063968e-05, + "loss": 0.0273, + "step": 230390 + }, + { + "epoch": 1.49, + "learning_rate": 7.694159561628274e-05, + "loss": 0.0228, + "step": 230400 + }, + { + "epoch": 1.49, + "learning_rate": 7.693191426192581e-05, + "loss": 0.0278, + "step": 230410 + }, + { + "epoch": 1.49, + "learning_rate": 7.692223290756888e-05, + "loss": 0.0222, + "step": 230420 + }, + { + "epoch": 1.49, + "learning_rate": 7.691255155321195e-05, + "loss": 0.0261, + "step": 230430 + }, + { + "epoch": 1.49, + "learning_rate": 7.690287019885501e-05, + "loss": 0.0317, + "step": 230440 + }, + { + "epoch": 1.49, + "learning_rate": 7.689318884449807e-05, + "loss": 0.0254, + "step": 230450 + }, + { + "epoch": 1.49, + "learning_rate": 7.688350749014115e-05, + "loss": 0.0298, + "step": 230460 + }, + { + "epoch": 1.49, + "learning_rate": 7.687382613578422e-05, + "loss": 0.0261, + "step": 230470 + }, + { + "epoch": 1.49, + "learning_rate": 7.686414478142727e-05, + "loss": 0.0304, + "step": 230480 + }, + { + "epoch": 1.49, + "learning_rate": 7.685446342707035e-05, + "loss": 0.0351, + "step": 230490 + }, + { + "epoch": 1.49, + "learning_rate": 7.684478207271342e-05, + "loss": 0.0263, + "step": 230500 + }, + { + "epoch": 1.49, + "learning_rate": 7.683510071835648e-05, + "loss": 0.0272, + "step": 230510 + }, + { + "epoch": 1.49, + "learning_rate": 7.682541936399955e-05, + "loss": 0.0253, + "step": 230520 + }, + { + "epoch": 1.49, + "learning_rate": 7.681573800964263e-05, + "loss": 0.0235, + "step": 230530 + }, + { + "epoch": 1.49, + "learning_rate": 7.68060566552857e-05, + "loss": 0.0285, + "step": 230540 + }, + { + "epoch": 1.49, + "learning_rate": 7.679637530092875e-05, + "loss": 0.0253, + "step": 230550 + }, + { + "epoch": 1.49, + "learning_rate": 7.678669394657183e-05, + "loss": 0.0278, + "step": 230560 + }, + { + "epoch": 1.49, + "learning_rate": 7.67770125922149e-05, + "loss": 0.031, + "step": 230570 + }, + { + "epoch": 1.49, + "learning_rate": 7.676733123785795e-05, + "loss": 0.0276, + "step": 230580 + }, + { + "epoch": 1.49, + "learning_rate": 7.675764988350103e-05, + "loss": 0.0322, + "step": 230590 + }, + { + "epoch": 1.49, + "learning_rate": 7.67479685291441e-05, + "loss": 0.0277, + "step": 230600 + }, + { + "epoch": 1.49, + "learning_rate": 7.673828717478717e-05, + "loss": 0.0278, + "step": 230610 + }, + { + "epoch": 1.49, + "learning_rate": 7.672860582043023e-05, + "loss": 0.0331, + "step": 230620 + }, + { + "epoch": 1.49, + "learning_rate": 7.671892446607331e-05, + "loss": 0.0253, + "step": 230630 + }, + { + "epoch": 1.49, + "learning_rate": 7.670924311171637e-05, + "loss": 0.0291, + "step": 230640 + }, + { + "epoch": 1.49, + "learning_rate": 7.669956175735943e-05, + "loss": 0.0273, + "step": 230650 + }, + { + "epoch": 1.49, + "learning_rate": 7.66898804030025e-05, + "loss": 0.0331, + "step": 230660 + }, + { + "epoch": 1.49, + "learning_rate": 7.668019904864557e-05, + "loss": 0.0287, + "step": 230670 + }, + { + "epoch": 1.49, + "learning_rate": 7.667051769428865e-05, + "loss": 0.0264, + "step": 230680 + }, + { + "epoch": 1.49, + "learning_rate": 7.66608363399317e-05, + "loss": 0.0263, + "step": 230690 + }, + { + "epoch": 1.49, + "learning_rate": 7.665115498557477e-05, + "loss": 0.0363, + "step": 230700 + }, + { + "epoch": 1.49, + "learning_rate": 7.664147363121785e-05, + "loss": 0.0286, + "step": 230710 + }, + { + "epoch": 1.49, + "learning_rate": 7.66317922768609e-05, + "loss": 0.026, + "step": 230720 + }, + { + "epoch": 1.49, + "learning_rate": 7.662211092250398e-05, + "loss": 0.0281, + "step": 230730 + }, + { + "epoch": 1.49, + "learning_rate": 7.661242956814705e-05, + "loss": 0.0232, + "step": 230740 + }, + { + "epoch": 1.49, + "learning_rate": 7.660274821379012e-05, + "loss": 0.025, + "step": 230750 + }, + { + "epoch": 1.49, + "learning_rate": 7.659306685943318e-05, + "loss": 0.0214, + "step": 230760 + }, + { + "epoch": 1.49, + "learning_rate": 7.658338550507625e-05, + "loss": 0.0283, + "step": 230770 + }, + { + "epoch": 1.49, + "learning_rate": 7.657370415071933e-05, + "loss": 0.03, + "step": 230780 + }, + { + "epoch": 1.49, + "learning_rate": 7.656402279636238e-05, + "loss": 0.0277, + "step": 230790 + }, + { + "epoch": 1.49, + "learning_rate": 7.655434144200545e-05, + "loss": 0.0272, + "step": 230800 + }, + { + "epoch": 1.49, + "learning_rate": 7.654466008764853e-05, + "loss": 0.0267, + "step": 230810 + }, + { + "epoch": 1.49, + "learning_rate": 7.653497873329159e-05, + "loss": 0.0273, + "step": 230820 + }, + { + "epoch": 1.49, + "learning_rate": 7.652529737893466e-05, + "loss": 0.0255, + "step": 230830 + }, + { + "epoch": 1.49, + "learning_rate": 7.651561602457773e-05, + "loss": 0.0284, + "step": 230840 + }, + { + "epoch": 1.49, + "learning_rate": 7.650593467022079e-05, + "loss": 0.0284, + "step": 230850 + }, + { + "epoch": 1.49, + "learning_rate": 7.649625331586386e-05, + "loss": 0.0319, + "step": 230860 + }, + { + "epoch": 1.49, + "learning_rate": 7.648657196150692e-05, + "loss": 0.0259, + "step": 230870 + }, + { + "epoch": 1.49, + "learning_rate": 7.647689060715e-05, + "loss": 0.033, + "step": 230880 + }, + { + "epoch": 1.49, + "learning_rate": 7.646720925279307e-05, + "loss": 0.0333, + "step": 230890 + }, + { + "epoch": 1.49, + "learning_rate": 7.645752789843612e-05, + "loss": 0.0257, + "step": 230900 + }, + { + "epoch": 1.49, + "learning_rate": 7.64478465440792e-05, + "loss": 0.0247, + "step": 230910 + }, + { + "epoch": 1.49, + "learning_rate": 7.643816518972227e-05, + "loss": 0.0234, + "step": 230920 + }, + { + "epoch": 1.49, + "learning_rate": 7.642848383536533e-05, + "loss": 0.0275, + "step": 230930 + }, + { + "epoch": 1.49, + "learning_rate": 7.64188024810084e-05, + "loss": 0.0282, + "step": 230940 + }, + { + "epoch": 1.49, + "learning_rate": 7.640912112665147e-05, + "loss": 0.0289, + "step": 230950 + }, + { + "epoch": 1.49, + "learning_rate": 7.639943977229455e-05, + "loss": 0.0305, + "step": 230960 + }, + { + "epoch": 1.49, + "learning_rate": 7.63897584179376e-05, + "loss": 0.0221, + "step": 230970 + }, + { + "epoch": 1.49, + "learning_rate": 7.638007706358068e-05, + "loss": 0.0292, + "step": 230980 + }, + { + "epoch": 1.49, + "learning_rate": 7.637039570922375e-05, + "loss": 0.0276, + "step": 230990 + }, + { + "epoch": 1.49, + "learning_rate": 7.63607143548668e-05, + "loss": 0.024, + "step": 231000 + }, + { + "epoch": 1.49, + "eval_cer": 0.9199014800587504, + "eval_loss": 0.019931979477405548, + "eval_runtime": 120.0906, + "eval_samples_per_second": 16.654, + "eval_steps_per_second": 4.164, + "step": 231000 + }, + { + "epoch": 1.49, + "learning_rate": 7.635103300050988e-05, + "loss": 0.0329, + "step": 231010 + }, + { + "epoch": 1.49, + "learning_rate": 7.634135164615294e-05, + "loss": 0.0307, + "step": 231020 + }, + { + "epoch": 1.49, + "learning_rate": 7.633167029179602e-05, + "loss": 0.025, + "step": 231030 + }, + { + "epoch": 1.49, + "learning_rate": 7.632198893743908e-05, + "loss": 0.027, + "step": 231040 + }, + { + "epoch": 1.49, + "learning_rate": 7.631230758308214e-05, + "loss": 0.0297, + "step": 231050 + }, + { + "epoch": 1.49, + "learning_rate": 7.630262622872522e-05, + "loss": 0.0305, + "step": 231060 + }, + { + "epoch": 1.49, + "learning_rate": 7.629294487436828e-05, + "loss": 0.0267, + "step": 231070 + }, + { + "epoch": 1.49, + "learning_rate": 7.628326352001136e-05, + "loss": 0.0316, + "step": 231080 + }, + { + "epoch": 1.49, + "learning_rate": 7.627358216565442e-05, + "loss": 0.0312, + "step": 231090 + }, + { + "epoch": 1.49, + "learning_rate": 7.62639008112975e-05, + "loss": 0.0283, + "step": 231100 + }, + { + "epoch": 1.49, + "learning_rate": 7.625421945694055e-05, + "loss": 0.0277, + "step": 231110 + }, + { + "epoch": 1.49, + "learning_rate": 7.624453810258362e-05, + "loss": 0.0337, + "step": 231120 + }, + { + "epoch": 1.49, + "learning_rate": 7.62348567482267e-05, + "loss": 0.028, + "step": 231130 + }, + { + "epoch": 1.49, + "learning_rate": 7.622517539386975e-05, + "loss": 0.0307, + "step": 231140 + }, + { + "epoch": 1.49, + "learning_rate": 7.621549403951282e-05, + "loss": 0.0311, + "step": 231150 + }, + { + "epoch": 1.49, + "learning_rate": 7.62058126851559e-05, + "loss": 0.028, + "step": 231160 + }, + { + "epoch": 1.49, + "learning_rate": 7.619613133079897e-05, + "loss": 0.0255, + "step": 231170 + }, + { + "epoch": 1.49, + "learning_rate": 7.618644997644203e-05, + "loss": 0.0285, + "step": 231180 + }, + { + "epoch": 1.49, + "learning_rate": 7.61767686220851e-05, + "loss": 0.0265, + "step": 231190 + }, + { + "epoch": 1.49, + "learning_rate": 7.616708726772818e-05, + "loss": 0.0276, + "step": 231200 + }, + { + "epoch": 1.49, + "learning_rate": 7.615740591337123e-05, + "loss": 0.0271, + "step": 231210 + }, + { + "epoch": 1.49, + "learning_rate": 7.61477245590143e-05, + "loss": 0.0256, + "step": 231220 + }, + { + "epoch": 1.49, + "learning_rate": 7.613804320465738e-05, + "loss": 0.0281, + "step": 231230 + }, + { + "epoch": 1.49, + "learning_rate": 7.612836185030044e-05, + "loss": 0.0283, + "step": 231240 + }, + { + "epoch": 1.49, + "learning_rate": 7.61186804959435e-05, + "loss": 0.0249, + "step": 231250 + }, + { + "epoch": 1.49, + "learning_rate": 7.610899914158657e-05, + "loss": 0.029, + "step": 231260 + }, + { + "epoch": 1.49, + "learning_rate": 7.609931778722964e-05, + "loss": 0.0305, + "step": 231270 + }, + { + "epoch": 1.49, + "learning_rate": 7.608963643287271e-05, + "loss": 0.0261, + "step": 231280 + }, + { + "epoch": 1.49, + "learning_rate": 7.607995507851577e-05, + "loss": 0.0286, + "step": 231290 + }, + { + "epoch": 1.49, + "learning_rate": 7.607027372415885e-05, + "loss": 0.029, + "step": 231300 + }, + { + "epoch": 1.49, + "learning_rate": 7.606059236980192e-05, + "loss": 0.0258, + "step": 231310 + }, + { + "epoch": 1.49, + "learning_rate": 7.605091101544497e-05, + "loss": 0.0247, + "step": 231320 + }, + { + "epoch": 1.49, + "learning_rate": 7.604122966108805e-05, + "loss": 0.0236, + "step": 231330 + }, + { + "epoch": 1.49, + "learning_rate": 7.603154830673112e-05, + "loss": 0.0313, + "step": 231340 + }, + { + "epoch": 1.49, + "learning_rate": 7.602186695237417e-05, + "loss": 0.0331, + "step": 231350 + }, + { + "epoch": 1.49, + "learning_rate": 7.601218559801725e-05, + "loss": 0.0251, + "step": 231360 + }, + { + "epoch": 1.49, + "learning_rate": 7.600250424366032e-05, + "loss": 0.0272, + "step": 231370 + }, + { + "epoch": 1.49, + "learning_rate": 7.59928228893034e-05, + "loss": 0.0267, + "step": 231380 + }, + { + "epoch": 1.49, + "learning_rate": 7.598314153494645e-05, + "loss": 0.0245, + "step": 231390 + }, + { + "epoch": 1.49, + "learning_rate": 7.597346018058953e-05, + "loss": 0.0307, + "step": 231400 + }, + { + "epoch": 1.49, + "learning_rate": 7.59637788262326e-05, + "loss": 0.0312, + "step": 231410 + }, + { + "epoch": 1.49, + "learning_rate": 7.595409747187565e-05, + "loss": 0.0335, + "step": 231420 + }, + { + "epoch": 1.49, + "learning_rate": 7.594441611751873e-05, + "loss": 0.0287, + "step": 231430 + }, + { + "epoch": 1.49, + "learning_rate": 7.59347347631618e-05, + "loss": 0.0257, + "step": 231440 + }, + { + "epoch": 1.49, + "learning_rate": 7.592505340880487e-05, + "loss": 0.0264, + "step": 231450 + }, + { + "epoch": 1.49, + "learning_rate": 7.591537205444793e-05, + "loss": 0.0269, + "step": 231460 + }, + { + "epoch": 1.49, + "learning_rate": 7.590569070009099e-05, + "loss": 0.027, + "step": 231470 + }, + { + "epoch": 1.49, + "learning_rate": 7.589600934573407e-05, + "loss": 0.0309, + "step": 231480 + }, + { + "epoch": 1.49, + "learning_rate": 7.588632799137713e-05, + "loss": 0.0261, + "step": 231490 + }, + { + "epoch": 1.49, + "learning_rate": 7.58766466370202e-05, + "loss": 0.0263, + "step": 231500 + }, + { + "epoch": 1.49, + "learning_rate": 7.586696528266327e-05, + "loss": 0.0239, + "step": 231510 + }, + { + "epoch": 1.49, + "learning_rate": 7.585728392830635e-05, + "loss": 0.0265, + "step": 231520 + }, + { + "epoch": 1.49, + "learning_rate": 7.58476025739494e-05, + "loss": 0.0275, + "step": 231530 + }, + { + "epoch": 1.49, + "learning_rate": 7.583792121959247e-05, + "loss": 0.0262, + "step": 231540 + }, + { + "epoch": 1.49, + "learning_rate": 7.582823986523555e-05, + "loss": 0.0302, + "step": 231550 + }, + { + "epoch": 1.49, + "learning_rate": 7.58185585108786e-05, + "loss": 0.0258, + "step": 231560 + }, + { + "epoch": 1.49, + "learning_rate": 7.580887715652167e-05, + "loss": 0.0261, + "step": 231570 + }, + { + "epoch": 1.49, + "learning_rate": 7.579919580216475e-05, + "loss": 0.0289, + "step": 231580 + }, + { + "epoch": 1.49, + "learning_rate": 7.578951444780781e-05, + "loss": 0.0229, + "step": 231590 + }, + { + "epoch": 1.49, + "learning_rate": 7.577983309345088e-05, + "loss": 0.0323, + "step": 231600 + }, + { + "epoch": 1.49, + "learning_rate": 7.577015173909395e-05, + "loss": 0.0258, + "step": 231610 + }, + { + "epoch": 1.49, + "learning_rate": 7.576047038473703e-05, + "loss": 0.0294, + "step": 231620 + }, + { + "epoch": 1.49, + "learning_rate": 7.575078903038008e-05, + "loss": 0.0308, + "step": 231630 + }, + { + "epoch": 1.5, + "learning_rate": 7.574110767602315e-05, + "loss": 0.0281, + "step": 231640 + }, + { + "epoch": 1.5, + "learning_rate": 7.573142632166623e-05, + "loss": 0.0294, + "step": 231650 + }, + { + "epoch": 1.5, + "learning_rate": 7.572174496730929e-05, + "loss": 0.0259, + "step": 231660 + }, + { + "epoch": 1.5, + "learning_rate": 7.571206361295234e-05, + "loss": 0.0226, + "step": 231670 + }, + { + "epoch": 1.5, + "learning_rate": 7.570238225859542e-05, + "loss": 0.0301, + "step": 231680 + }, + { + "epoch": 1.5, + "learning_rate": 7.569270090423849e-05, + "loss": 0.0271, + "step": 231690 + }, + { + "epoch": 1.5, + "learning_rate": 7.568301954988156e-05, + "loss": 0.0245, + "step": 231700 + }, + { + "epoch": 1.5, + "learning_rate": 7.567333819552462e-05, + "loss": 0.0254, + "step": 231710 + }, + { + "epoch": 1.5, + "learning_rate": 7.56636568411677e-05, + "loss": 0.0316, + "step": 231720 + }, + { + "epoch": 1.5, + "learning_rate": 7.565397548681077e-05, + "loss": 0.0332, + "step": 231730 + }, + { + "epoch": 1.5, + "learning_rate": 7.564429413245382e-05, + "loss": 0.0234, + "step": 231740 + }, + { + "epoch": 1.5, + "learning_rate": 7.56346127780969e-05, + "loss": 0.0307, + "step": 231750 + }, + { + "epoch": 1.5, + "learning_rate": 7.562493142373997e-05, + "loss": 0.0262, + "step": 231760 + }, + { + "epoch": 1.5, + "learning_rate": 7.561525006938302e-05, + "loss": 0.0278, + "step": 231770 + }, + { + "epoch": 1.5, + "learning_rate": 7.56055687150261e-05, + "loss": 0.0284, + "step": 231780 + }, + { + "epoch": 1.5, + "learning_rate": 7.559588736066917e-05, + "loss": 0.0246, + "step": 231790 + }, + { + "epoch": 1.5, + "learning_rate": 7.558620600631225e-05, + "loss": 0.0262, + "step": 231800 + }, + { + "epoch": 1.5, + "learning_rate": 7.55765246519553e-05, + "loss": 0.031, + "step": 231810 + }, + { + "epoch": 1.5, + "learning_rate": 7.556684329759838e-05, + "loss": 0.0265, + "step": 231820 + }, + { + "epoch": 1.5, + "learning_rate": 7.555716194324145e-05, + "loss": 0.0267, + "step": 231830 + }, + { + "epoch": 1.5, + "learning_rate": 7.55474805888845e-05, + "loss": 0.032, + "step": 231840 + }, + { + "epoch": 1.5, + "learning_rate": 7.553779923452758e-05, + "loss": 0.0311, + "step": 231850 + }, + { + "epoch": 1.5, + "learning_rate": 7.552811788017064e-05, + "loss": 0.0285, + "step": 231860 + }, + { + "epoch": 1.5, + "learning_rate": 7.551843652581372e-05, + "loss": 0.0233, + "step": 231870 + }, + { + "epoch": 1.5, + "learning_rate": 7.550875517145678e-05, + "loss": 0.0232, + "step": 231880 + }, + { + "epoch": 1.5, + "learning_rate": 7.549907381709984e-05, + "loss": 0.026, + "step": 231890 + }, + { + "epoch": 1.5, + "learning_rate": 7.548939246274292e-05, + "loss": 0.0286, + "step": 231900 + }, + { + "epoch": 1.5, + "learning_rate": 7.547971110838598e-05, + "loss": 0.029, + "step": 231910 + }, + { + "epoch": 1.5, + "learning_rate": 7.547002975402906e-05, + "loss": 0.0233, + "step": 231920 + }, + { + "epoch": 1.5, + "learning_rate": 7.546034839967212e-05, + "loss": 0.0283, + "step": 231930 + }, + { + "epoch": 1.5, + "learning_rate": 7.545066704531519e-05, + "loss": 0.0281, + "step": 231940 + }, + { + "epoch": 1.5, + "learning_rate": 7.544098569095825e-05, + "loss": 0.0267, + "step": 231950 + }, + { + "epoch": 1.5, + "learning_rate": 7.543130433660132e-05, + "loss": 0.0283, + "step": 231960 + }, + { + "epoch": 1.5, + "learning_rate": 7.54216229822444e-05, + "loss": 0.0324, + "step": 231970 + }, + { + "epoch": 1.5, + "learning_rate": 7.541194162788745e-05, + "loss": 0.0267, + "step": 231980 + }, + { + "epoch": 1.5, + "learning_rate": 7.540226027353052e-05, + "loss": 0.0284, + "step": 231990 + }, + { + "epoch": 1.5, + "learning_rate": 7.53925789191736e-05, + "loss": 0.0295, + "step": 232000 + }, + { + "epoch": 1.5, + "eval_cer": 0.9198915376793583, + "eval_loss": 0.019776683300733566, + "eval_runtime": 120.0, + "eval_samples_per_second": 16.667, + "eval_steps_per_second": 4.167, + "step": 232000 + }, + { + "epoch": 1.5, + "learning_rate": 7.538289756481666e-05, + "loss": 0.0288, + "step": 232010 + }, + { + "epoch": 1.5, + "learning_rate": 7.537321621045973e-05, + "loss": 0.0322, + "step": 232020 + }, + { + "epoch": 1.5, + "learning_rate": 7.53635348561028e-05, + "loss": 0.0271, + "step": 232030 + }, + { + "epoch": 1.5, + "learning_rate": 7.535385350174586e-05, + "loss": 0.0292, + "step": 232040 + }, + { + "epoch": 1.5, + "learning_rate": 7.534417214738893e-05, + "loss": 0.0282, + "step": 232050 + }, + { + "epoch": 1.5, + "learning_rate": 7.5334490793032e-05, + "loss": 0.027, + "step": 232060 + }, + { + "epoch": 1.5, + "learning_rate": 7.532480943867508e-05, + "loss": 0.0252, + "step": 232070 + }, + { + "epoch": 1.5, + "learning_rate": 7.531512808431814e-05, + "loss": 0.0251, + "step": 232080 + }, + { + "epoch": 1.5, + "learning_rate": 7.53054467299612e-05, + "loss": 0.0283, + "step": 232090 + }, + { + "epoch": 1.5, + "learning_rate": 7.529576537560427e-05, + "loss": 0.0244, + "step": 232100 + }, + { + "epoch": 1.5, + "learning_rate": 7.528608402124734e-05, + "loss": 0.0264, + "step": 232110 + }, + { + "epoch": 1.5, + "learning_rate": 7.527640266689041e-05, + "loss": 0.0311, + "step": 232120 + }, + { + "epoch": 1.5, + "learning_rate": 7.526672131253347e-05, + "loss": 0.0276, + "step": 232130 + }, + { + "epoch": 1.5, + "learning_rate": 7.525703995817654e-05, + "loss": 0.0267, + "step": 232140 + }, + { + "epoch": 1.5, + "learning_rate": 7.524735860381962e-05, + "loss": 0.0274, + "step": 232150 + }, + { + "epoch": 1.5, + "learning_rate": 7.523767724946267e-05, + "loss": 0.024, + "step": 232160 + }, + { + "epoch": 1.5, + "learning_rate": 7.522799589510575e-05, + "loss": 0.0312, + "step": 232170 + }, + { + "epoch": 1.5, + "learning_rate": 7.521831454074882e-05, + "loss": 0.0323, + "step": 232180 + }, + { + "epoch": 1.5, + "learning_rate": 7.520863318639187e-05, + "loss": 0.0295, + "step": 232190 + }, + { + "epoch": 1.5, + "learning_rate": 7.519895183203495e-05, + "loss": 0.0269, + "step": 232200 + }, + { + "epoch": 1.5, + "learning_rate": 7.518927047767802e-05, + "loss": 0.0249, + "step": 232210 + }, + { + "epoch": 1.5, + "learning_rate": 7.51795891233211e-05, + "loss": 0.0339, + "step": 232220 + }, + { + "epoch": 1.5, + "learning_rate": 7.516990776896415e-05, + "loss": 0.0288, + "step": 232230 + }, + { + "epoch": 1.5, + "learning_rate": 7.516022641460722e-05, + "loss": 0.0283, + "step": 232240 + }, + { + "epoch": 1.5, + "learning_rate": 7.51505450602503e-05, + "loss": 0.0265, + "step": 232250 + }, + { + "epoch": 1.5, + "learning_rate": 7.514086370589335e-05, + "loss": 0.0268, + "step": 232260 + }, + { + "epoch": 1.5, + "learning_rate": 7.513118235153643e-05, + "loss": 0.0227, + "step": 232270 + }, + { + "epoch": 1.5, + "learning_rate": 7.51215009971795e-05, + "loss": 0.0299, + "step": 232280 + }, + { + "epoch": 1.5, + "learning_rate": 7.511181964282257e-05, + "loss": 0.0269, + "step": 232290 + }, + { + "epoch": 1.5, + "learning_rate": 7.510213828846563e-05, + "loss": 0.0297, + "step": 232300 + }, + { + "epoch": 1.5, + "learning_rate": 7.509245693410869e-05, + "loss": 0.0264, + "step": 232310 + }, + { + "epoch": 1.5, + "learning_rate": 7.508277557975177e-05, + "loss": 0.0255, + "step": 232320 + }, + { + "epoch": 1.5, + "learning_rate": 7.507309422539483e-05, + "loss": 0.0276, + "step": 232330 + }, + { + "epoch": 1.5, + "learning_rate": 7.506341287103789e-05, + "loss": 0.0286, + "step": 232340 + }, + { + "epoch": 1.5, + "learning_rate": 7.505373151668097e-05, + "loss": 0.0236, + "step": 232350 + }, + { + "epoch": 1.5, + "learning_rate": 7.504405016232404e-05, + "loss": 0.0268, + "step": 232360 + }, + { + "epoch": 1.5, + "learning_rate": 7.50343688079671e-05, + "loss": 0.0303, + "step": 232370 + }, + { + "epoch": 1.5, + "learning_rate": 7.502468745361017e-05, + "loss": 0.0275, + "step": 232380 + }, + { + "epoch": 1.5, + "learning_rate": 7.501500609925325e-05, + "loss": 0.0243, + "step": 232390 + }, + { + "epoch": 1.5, + "learning_rate": 7.50053247448963e-05, + "loss": 0.0254, + "step": 232400 + }, + { + "epoch": 1.5, + "learning_rate": 7.499564339053937e-05, + "loss": 0.0307, + "step": 232410 + }, + { + "epoch": 1.5, + "learning_rate": 7.498596203618245e-05, + "loss": 0.0328, + "step": 232420 + }, + { + "epoch": 1.5, + "learning_rate": 7.497628068182551e-05, + "loss": 0.024, + "step": 232430 + }, + { + "epoch": 1.5, + "learning_rate": 7.496659932746857e-05, + "loss": 0.0243, + "step": 232440 + }, + { + "epoch": 1.5, + "learning_rate": 7.495691797311165e-05, + "loss": 0.0249, + "step": 232450 + }, + { + "epoch": 1.5, + "learning_rate": 7.494723661875471e-05, + "loss": 0.0213, + "step": 232460 + }, + { + "epoch": 1.5, + "learning_rate": 7.493755526439778e-05, + "loss": 0.0272, + "step": 232470 + }, + { + "epoch": 1.5, + "learning_rate": 7.492787391004085e-05, + "loss": 0.0273, + "step": 232480 + }, + { + "epoch": 1.5, + "learning_rate": 7.491819255568393e-05, + "loss": 0.0245, + "step": 232490 + }, + { + "epoch": 1.5, + "learning_rate": 7.490851120132698e-05, + "loss": 0.0256, + "step": 232500 + }, + { + "epoch": 1.5, + "learning_rate": 7.489882984697004e-05, + "loss": 0.0287, + "step": 232510 + }, + { + "epoch": 1.5, + "learning_rate": 7.488914849261312e-05, + "loss": 0.0259, + "step": 232520 + }, + { + "epoch": 1.5, + "learning_rate": 7.487946713825619e-05, + "loss": 0.0341, + "step": 232530 + }, + { + "epoch": 1.5, + "learning_rate": 7.486978578389926e-05, + "loss": 0.0245, + "step": 232540 + }, + { + "epoch": 1.5, + "learning_rate": 7.486010442954232e-05, + "loss": 0.0257, + "step": 232550 + }, + { + "epoch": 1.5, + "learning_rate": 7.485042307518539e-05, + "loss": 0.0217, + "step": 232560 + }, + { + "epoch": 1.5, + "learning_rate": 7.484074172082846e-05, + "loss": 0.0227, + "step": 232570 + }, + { + "epoch": 1.5, + "learning_rate": 7.483106036647152e-05, + "loss": 0.0265, + "step": 232580 + }, + { + "epoch": 1.5, + "learning_rate": 7.48213790121146e-05, + "loss": 0.0234, + "step": 232590 + }, + { + "epoch": 1.5, + "learning_rate": 7.481169765775765e-05, + "loss": 0.0287, + "step": 232600 + }, + { + "epoch": 1.5, + "learning_rate": 7.480201630340073e-05, + "loss": 0.0306, + "step": 232610 + }, + { + "epoch": 1.5, + "learning_rate": 7.47923349490438e-05, + "loss": 0.0284, + "step": 232620 + }, + { + "epoch": 1.5, + "learning_rate": 7.478265359468687e-05, + "loss": 0.0332, + "step": 232630 + }, + { + "epoch": 1.5, + "learning_rate": 7.477297224032993e-05, + "loss": 0.0247, + "step": 232640 + }, + { + "epoch": 1.5, + "learning_rate": 7.4763290885973e-05, + "loss": 0.0312, + "step": 232650 + }, + { + "epoch": 1.5, + "learning_rate": 7.475360953161607e-05, + "loss": 0.0276, + "step": 232660 + }, + { + "epoch": 1.5, + "learning_rate": 7.474392817725913e-05, + "loss": 0.0317, + "step": 232670 + }, + { + "epoch": 1.5, + "learning_rate": 7.473424682290221e-05, + "loss": 0.0245, + "step": 232680 + }, + { + "epoch": 1.5, + "learning_rate": 7.472456546854528e-05, + "loss": 0.026, + "step": 232690 + }, + { + "epoch": 1.5, + "learning_rate": 7.471488411418834e-05, + "loss": 0.0262, + "step": 232700 + }, + { + "epoch": 1.5, + "learning_rate": 7.470520275983141e-05, + "loss": 0.0264, + "step": 232710 + }, + { + "epoch": 1.5, + "learning_rate": 7.469552140547448e-05, + "loss": 0.0261, + "step": 232720 + }, + { + "epoch": 1.5, + "learning_rate": 7.468584005111754e-05, + "loss": 0.0281, + "step": 232730 + }, + { + "epoch": 1.5, + "learning_rate": 7.467615869676061e-05, + "loss": 0.0268, + "step": 232740 + }, + { + "epoch": 1.5, + "learning_rate": 7.466647734240369e-05, + "loss": 0.027, + "step": 232750 + }, + { + "epoch": 1.5, + "learning_rate": 7.465679598804674e-05, + "loss": 0.0318, + "step": 232760 + }, + { + "epoch": 1.5, + "learning_rate": 7.464711463368982e-05, + "loss": 0.0204, + "step": 232770 + }, + { + "epoch": 1.5, + "learning_rate": 7.463743327933289e-05, + "loss": 0.0282, + "step": 232780 + }, + { + "epoch": 1.5, + "learning_rate": 7.462775192497595e-05, + "loss": 0.0263, + "step": 232790 + }, + { + "epoch": 1.5, + "learning_rate": 7.461807057061902e-05, + "loss": 0.0259, + "step": 232800 + }, + { + "epoch": 1.5, + "learning_rate": 7.460838921626209e-05, + "loss": 0.0315, + "step": 232810 + }, + { + "epoch": 1.5, + "learning_rate": 7.459870786190515e-05, + "loss": 0.0279, + "step": 232820 + }, + { + "epoch": 1.5, + "learning_rate": 7.458902650754822e-05, + "loss": 0.0235, + "step": 232830 + }, + { + "epoch": 1.5, + "learning_rate": 7.45793451531913e-05, + "loss": 0.0269, + "step": 232840 + }, + { + "epoch": 1.5, + "learning_rate": 7.456966379883436e-05, + "loss": 0.0316, + "step": 232850 + }, + { + "epoch": 1.5, + "learning_rate": 7.455998244447742e-05, + "loss": 0.0241, + "step": 232860 + }, + { + "epoch": 1.5, + "learning_rate": 7.45503010901205e-05, + "loss": 0.029, + "step": 232870 + }, + { + "epoch": 1.5, + "learning_rate": 7.454061973576356e-05, + "loss": 0.0328, + "step": 232880 + }, + { + "epoch": 1.5, + "learning_rate": 7.453093838140663e-05, + "loss": 0.0299, + "step": 232890 + }, + { + "epoch": 1.5, + "learning_rate": 7.45212570270497e-05, + "loss": 0.0323, + "step": 232900 + }, + { + "epoch": 1.5, + "learning_rate": 7.451157567269278e-05, + "loss": 0.0293, + "step": 232910 + }, + { + "epoch": 1.5, + "learning_rate": 7.450189431833583e-05, + "loss": 0.0273, + "step": 232920 + }, + { + "epoch": 1.5, + "learning_rate": 7.44922129639789e-05, + "loss": 0.0317, + "step": 232930 + }, + { + "epoch": 1.5, + "learning_rate": 7.448253160962197e-05, + "loss": 0.0273, + "step": 232940 + }, + { + "epoch": 1.5, + "learning_rate": 7.447285025526504e-05, + "loss": 0.0256, + "step": 232950 + }, + { + "epoch": 1.5, + "learning_rate": 7.44631689009081e-05, + "loss": 0.0313, + "step": 232960 + }, + { + "epoch": 1.5, + "learning_rate": 7.445348754655117e-05, + "loss": 0.0326, + "step": 232970 + }, + { + "epoch": 1.5, + "learning_rate": 7.444380619219424e-05, + "loss": 0.0244, + "step": 232980 + }, + { + "epoch": 1.5, + "learning_rate": 7.44341248378373e-05, + "loss": 0.0271, + "step": 232990 + }, + { + "epoch": 1.5, + "learning_rate": 7.442444348348037e-05, + "loss": 0.0281, + "step": 233000 + }, + { + "epoch": 1.5, + "eval_cer": 0.9199141339961586, + "eval_loss": 0.019634824246168137, + "eval_runtime": 120.2752, + "eval_samples_per_second": 16.629, + "eval_steps_per_second": 4.157, + "step": 233000 + }, + { + "epoch": 1.5, + "learning_rate": 7.441476212912345e-05, + "loss": 0.0279, + "step": 233010 + }, + { + "epoch": 1.5, + "learning_rate": 7.44050807747665e-05, + "loss": 0.0254, + "step": 233020 + }, + { + "epoch": 1.5, + "learning_rate": 7.439539942040958e-05, + "loss": 0.0229, + "step": 233030 + }, + { + "epoch": 1.5, + "learning_rate": 7.438571806605265e-05, + "loss": 0.0317, + "step": 233040 + }, + { + "epoch": 1.5, + "learning_rate": 7.437603671169572e-05, + "loss": 0.0253, + "step": 233050 + }, + { + "epoch": 1.5, + "learning_rate": 7.436635535733878e-05, + "loss": 0.0285, + "step": 233060 + }, + { + "epoch": 1.5, + "learning_rate": 7.435667400298185e-05, + "loss": 0.0252, + "step": 233070 + }, + { + "epoch": 1.5, + "learning_rate": 7.434699264862491e-05, + "loss": 0.0276, + "step": 233080 + }, + { + "epoch": 1.5, + "learning_rate": 7.433731129426798e-05, + "loss": 0.0208, + "step": 233090 + }, + { + "epoch": 1.5, + "learning_rate": 7.432762993991106e-05, + "loss": 0.0236, + "step": 233100 + }, + { + "epoch": 1.5, + "learning_rate": 7.431794858555413e-05, + "loss": 0.0276, + "step": 233110 + }, + { + "epoch": 1.5, + "learning_rate": 7.43082672311972e-05, + "loss": 0.0268, + "step": 233120 + }, + { + "epoch": 1.5, + "learning_rate": 7.429858587684026e-05, + "loss": 0.0252, + "step": 233130 + }, + { + "epoch": 1.5, + "learning_rate": 7.428890452248333e-05, + "loss": 0.0265, + "step": 233140 + }, + { + "epoch": 1.5, + "learning_rate": 7.427922316812639e-05, + "loss": 0.0285, + "step": 233150 + }, + { + "epoch": 1.5, + "learning_rate": 7.426954181376946e-05, + "loss": 0.0288, + "step": 233160 + }, + { + "epoch": 1.5, + "learning_rate": 7.425986045941254e-05, + "loss": 0.028, + "step": 233170 + }, + { + "epoch": 1.5, + "learning_rate": 7.425017910505559e-05, + "loss": 0.0265, + "step": 233180 + }, + { + "epoch": 1.51, + "learning_rate": 7.424049775069867e-05, + "loss": 0.0279, + "step": 233190 + }, + { + "epoch": 1.51, + "learning_rate": 7.423081639634174e-05, + "loss": 0.0275, + "step": 233200 + }, + { + "epoch": 1.51, + "learning_rate": 7.42211350419848e-05, + "loss": 0.0276, + "step": 233210 + }, + { + "epoch": 1.51, + "learning_rate": 7.421145368762787e-05, + "loss": 0.0242, + "step": 233220 + }, + { + "epoch": 1.51, + "learning_rate": 7.420177233327094e-05, + "loss": 0.0235, + "step": 233230 + }, + { + "epoch": 1.51, + "learning_rate": 7.4192090978914e-05, + "loss": 0.0296, + "step": 233240 + }, + { + "epoch": 1.51, + "learning_rate": 7.418240962455707e-05, + "loss": 0.0263, + "step": 233250 + }, + { + "epoch": 1.51, + "learning_rate": 7.417272827020015e-05, + "loss": 0.0299, + "step": 233260 + }, + { + "epoch": 1.51, + "learning_rate": 7.416304691584321e-05, + "loss": 0.0307, + "step": 233270 + }, + { + "epoch": 1.51, + "learning_rate": 7.415336556148627e-05, + "loss": 0.0259, + "step": 233280 + }, + { + "epoch": 1.51, + "learning_rate": 7.414368420712935e-05, + "loss": 0.0261, + "step": 233290 + }, + { + "epoch": 1.51, + "learning_rate": 7.413400285277241e-05, + "loss": 0.0267, + "step": 233300 + }, + { + "epoch": 1.51, + "learning_rate": 7.412432149841548e-05, + "loss": 0.0287, + "step": 233310 + }, + { + "epoch": 1.51, + "learning_rate": 7.411464014405855e-05, + "loss": 0.0249, + "step": 233320 + }, + { + "epoch": 1.51, + "learning_rate": 7.410495878970161e-05, + "loss": 0.0251, + "step": 233330 + }, + { + "epoch": 1.51, + "learning_rate": 7.409527743534468e-05, + "loss": 0.027, + "step": 233340 + }, + { + "epoch": 1.51, + "learning_rate": 7.408559608098774e-05, + "loss": 0.0311, + "step": 233350 + }, + { + "epoch": 1.51, + "learning_rate": 7.407591472663082e-05, + "loss": 0.0307, + "step": 233360 + }, + { + "epoch": 1.51, + "learning_rate": 7.406623337227389e-05, + "loss": 0.0212, + "step": 233370 + }, + { + "epoch": 1.51, + "learning_rate": 7.405655201791696e-05, + "loss": 0.0281, + "step": 233380 + }, + { + "epoch": 1.51, + "learning_rate": 7.404687066356002e-05, + "loss": 0.0262, + "step": 233390 + }, + { + "epoch": 1.51, + "learning_rate": 7.403718930920309e-05, + "loss": 0.0215, + "step": 233400 + }, + { + "epoch": 1.51, + "learning_rate": 7.402750795484616e-05, + "loss": 0.0282, + "step": 233410 + }, + { + "epoch": 1.51, + "learning_rate": 7.401782660048922e-05, + "loss": 0.0247, + "step": 233420 + }, + { + "epoch": 1.51, + "learning_rate": 7.40081452461323e-05, + "loss": 0.0259, + "step": 233430 + }, + { + "epoch": 1.51, + "learning_rate": 7.399846389177535e-05, + "loss": 0.0283, + "step": 233440 + }, + { + "epoch": 1.51, + "learning_rate": 7.398878253741843e-05, + "loss": 0.0319, + "step": 233450 + }, + { + "epoch": 1.51, + "learning_rate": 7.39791011830615e-05, + "loss": 0.0246, + "step": 233460 + }, + { + "epoch": 1.51, + "learning_rate": 7.396941982870457e-05, + "loss": 0.0279, + "step": 233470 + }, + { + "epoch": 1.51, + "learning_rate": 7.395973847434763e-05, + "loss": 0.0272, + "step": 233480 + }, + { + "epoch": 1.51, + "learning_rate": 7.39500571199907e-05, + "loss": 0.0227, + "step": 233490 + }, + { + "epoch": 1.51, + "learning_rate": 7.394037576563376e-05, + "loss": 0.0228, + "step": 233500 + }, + { + "epoch": 1.51, + "learning_rate": 7.393069441127683e-05, + "loss": 0.0259, + "step": 233510 + }, + { + "epoch": 1.51, + "learning_rate": 7.392101305691991e-05, + "loss": 0.0285, + "step": 233520 + }, + { + "epoch": 1.51, + "learning_rate": 7.391133170256298e-05, + "loss": 0.0288, + "step": 233530 + }, + { + "epoch": 1.51, + "learning_rate": 7.390165034820603e-05, + "loss": 0.0311, + "step": 233540 + }, + { + "epoch": 1.51, + "learning_rate": 7.389196899384911e-05, + "loss": 0.0282, + "step": 233550 + }, + { + "epoch": 1.51, + "learning_rate": 7.388228763949218e-05, + "loss": 0.0241, + "step": 233560 + }, + { + "epoch": 1.51, + "learning_rate": 7.387260628513524e-05, + "loss": 0.0284, + "step": 233570 + }, + { + "epoch": 1.51, + "learning_rate": 7.386292493077831e-05, + "loss": 0.0242, + "step": 233580 + }, + { + "epoch": 1.51, + "learning_rate": 7.385324357642137e-05, + "loss": 0.0311, + "step": 233590 + }, + { + "epoch": 1.51, + "learning_rate": 7.384356222206444e-05, + "loss": 0.0278, + "step": 233600 + }, + { + "epoch": 1.51, + "learning_rate": 7.383388086770751e-05, + "loss": 0.0288, + "step": 233610 + }, + { + "epoch": 1.51, + "learning_rate": 7.382419951335059e-05, + "loss": 0.025, + "step": 233620 + }, + { + "epoch": 1.51, + "learning_rate": 7.381451815899365e-05, + "loss": 0.0271, + "step": 233630 + }, + { + "epoch": 1.51, + "learning_rate": 7.380483680463672e-05, + "loss": 0.0305, + "step": 233640 + }, + { + "epoch": 1.51, + "learning_rate": 7.379515545027979e-05, + "loss": 0.0273, + "step": 233650 + }, + { + "epoch": 1.51, + "learning_rate": 7.378547409592285e-05, + "loss": 0.0204, + "step": 233660 + }, + { + "epoch": 1.51, + "learning_rate": 7.377579274156592e-05, + "loss": 0.0277, + "step": 233670 + }, + { + "epoch": 1.51, + "learning_rate": 7.376611138720898e-05, + "loss": 0.0278, + "step": 233680 + }, + { + "epoch": 1.51, + "learning_rate": 7.375643003285205e-05, + "loss": 0.0253, + "step": 233690 + }, + { + "epoch": 1.51, + "learning_rate": 7.374674867849512e-05, + "loss": 0.0254, + "step": 233700 + }, + { + "epoch": 1.51, + "learning_rate": 7.37370673241382e-05, + "loss": 0.0314, + "step": 233710 + }, + { + "epoch": 1.51, + "learning_rate": 7.372738596978126e-05, + "loss": 0.0282, + "step": 233720 + }, + { + "epoch": 1.51, + "learning_rate": 7.371770461542433e-05, + "loss": 0.0271, + "step": 233730 + }, + { + "epoch": 1.51, + "learning_rate": 7.37080232610674e-05, + "loss": 0.0281, + "step": 233740 + }, + { + "epoch": 1.51, + "learning_rate": 7.369834190671046e-05, + "loss": 0.026, + "step": 233750 + }, + { + "epoch": 1.51, + "learning_rate": 7.368866055235353e-05, + "loss": 0.0295, + "step": 233760 + }, + { + "epoch": 1.51, + "learning_rate": 7.36789791979966e-05, + "loss": 0.0273, + "step": 233770 + }, + { + "epoch": 1.51, + "learning_rate": 7.366929784363967e-05, + "loss": 0.029, + "step": 233780 + }, + { + "epoch": 1.51, + "learning_rate": 7.365961648928273e-05, + "loss": 0.0298, + "step": 233790 + }, + { + "epoch": 1.51, + "learning_rate": 7.36499351349258e-05, + "loss": 0.0287, + "step": 233800 + }, + { + "epoch": 1.51, + "learning_rate": 7.364025378056887e-05, + "loss": 0.0271, + "step": 233810 + }, + { + "epoch": 1.51, + "learning_rate": 7.363057242621194e-05, + "loss": 0.0301, + "step": 233820 + }, + { + "epoch": 1.51, + "learning_rate": 7.3620891071855e-05, + "loss": 0.0281, + "step": 233830 + }, + { + "epoch": 1.51, + "learning_rate": 7.361120971749807e-05, + "loss": 0.026, + "step": 233840 + }, + { + "epoch": 1.51, + "learning_rate": 7.360152836314114e-05, + "loss": 0.0263, + "step": 233850 + }, + { + "epoch": 1.51, + "learning_rate": 7.35918470087842e-05, + "loss": 0.0247, + "step": 233860 + }, + { + "epoch": 1.51, + "learning_rate": 7.358216565442728e-05, + "loss": 0.0302, + "step": 233870 + }, + { + "epoch": 1.51, + "learning_rate": 7.357248430007035e-05, + "loss": 0.0248, + "step": 233880 + }, + { + "epoch": 1.51, + "learning_rate": 7.35628029457134e-05, + "loss": 0.0264, + "step": 233890 + }, + { + "epoch": 1.51, + "learning_rate": 7.355312159135648e-05, + "loss": 0.0238, + "step": 233900 + }, + { + "epoch": 1.51, + "learning_rate": 7.354344023699955e-05, + "loss": 0.0278, + "step": 233910 + }, + { + "epoch": 1.51, + "learning_rate": 7.353375888264261e-05, + "loss": 0.0247, + "step": 233920 + }, + { + "epoch": 1.51, + "learning_rate": 7.352407752828568e-05, + "loss": 0.0282, + "step": 233930 + }, + { + "epoch": 1.51, + "learning_rate": 7.351439617392876e-05, + "loss": 0.026, + "step": 233940 + }, + { + "epoch": 1.51, + "learning_rate": 7.350471481957181e-05, + "loss": 0.0245, + "step": 233950 + }, + { + "epoch": 1.51, + "learning_rate": 7.349503346521488e-05, + "loss": 0.0324, + "step": 233960 + }, + { + "epoch": 1.51, + "learning_rate": 7.348535211085796e-05, + "loss": 0.0257, + "step": 233970 + }, + { + "epoch": 1.51, + "learning_rate": 7.347567075650103e-05, + "loss": 0.0251, + "step": 233980 + }, + { + "epoch": 1.51, + "learning_rate": 7.346598940214409e-05, + "loss": 0.0285, + "step": 233990 + }, + { + "epoch": 1.51, + "learning_rate": 7.345630804778716e-05, + "loss": 0.0243, + "step": 234000 + }, + { + "epoch": 1.51, + "eval_cer": 0.9198472488984295, + "eval_loss": 0.019518280401825905, + "eval_runtime": 120.3803, + "eval_samples_per_second": 16.614, + "eval_steps_per_second": 4.154, + "step": 234000 + }, + { + "epoch": 1.51, + "learning_rate": 7.344662669343022e-05, + "loss": 0.0231, + "step": 234010 + }, + { + "epoch": 1.51, + "learning_rate": 7.343694533907329e-05, + "loss": 0.0305, + "step": 234020 + }, + { + "epoch": 1.51, + "learning_rate": 7.342726398471636e-05, + "loss": 0.031, + "step": 234030 + }, + { + "epoch": 1.51, + "learning_rate": 7.341758263035944e-05, + "loss": 0.0231, + "step": 234040 + }, + { + "epoch": 1.51, + "learning_rate": 7.340790127600249e-05, + "loss": 0.024, + "step": 234050 + }, + { + "epoch": 1.51, + "learning_rate": 7.339821992164557e-05, + "loss": 0.0274, + "step": 234060 + }, + { + "epoch": 1.51, + "learning_rate": 7.338853856728864e-05, + "loss": 0.0263, + "step": 234070 + }, + { + "epoch": 1.51, + "learning_rate": 7.33788572129317e-05, + "loss": 0.0282, + "step": 234080 + }, + { + "epoch": 1.51, + "learning_rate": 7.336917585857477e-05, + "loss": 0.0237, + "step": 234090 + }, + { + "epoch": 1.51, + "learning_rate": 7.335949450421783e-05, + "loss": 0.023, + "step": 234100 + }, + { + "epoch": 1.51, + "learning_rate": 7.33498131498609e-05, + "loss": 0.0256, + "step": 234110 + }, + { + "epoch": 1.51, + "learning_rate": 7.334013179550397e-05, + "loss": 0.0262, + "step": 234120 + }, + { + "epoch": 1.51, + "learning_rate": 7.333045044114705e-05, + "loss": 0.0228, + "step": 234130 + }, + { + "epoch": 1.51, + "learning_rate": 7.332076908679011e-05, + "loss": 0.0256, + "step": 234140 + }, + { + "epoch": 1.51, + "learning_rate": 7.331108773243318e-05, + "loss": 0.0274, + "step": 234150 + }, + { + "epoch": 1.51, + "learning_rate": 7.330140637807624e-05, + "loss": 0.0313, + "step": 234160 + }, + { + "epoch": 1.51, + "learning_rate": 7.329172502371931e-05, + "loss": 0.0263, + "step": 234170 + }, + { + "epoch": 1.51, + "learning_rate": 7.328204366936238e-05, + "loss": 0.0238, + "step": 234180 + }, + { + "epoch": 1.51, + "learning_rate": 7.327236231500544e-05, + "loss": 0.0254, + "step": 234190 + }, + { + "epoch": 1.51, + "learning_rate": 7.326268096064852e-05, + "loss": 0.0262, + "step": 234200 + }, + { + "epoch": 1.51, + "learning_rate": 7.325299960629158e-05, + "loss": 0.0293, + "step": 234210 + }, + { + "epoch": 1.51, + "learning_rate": 7.324331825193466e-05, + "loss": 0.0261, + "step": 234220 + }, + { + "epoch": 1.51, + "learning_rate": 7.323363689757772e-05, + "loss": 0.027, + "step": 234230 + }, + { + "epoch": 1.51, + "learning_rate": 7.322395554322079e-05, + "loss": 0.0289, + "step": 234240 + }, + { + "epoch": 1.51, + "learning_rate": 7.321427418886385e-05, + "loss": 0.0278, + "step": 234250 + }, + { + "epoch": 1.51, + "learning_rate": 7.320459283450692e-05, + "loss": 0.0263, + "step": 234260 + }, + { + "epoch": 1.51, + "learning_rate": 7.319491148014999e-05, + "loss": 0.0334, + "step": 234270 + }, + { + "epoch": 1.51, + "learning_rate": 7.318523012579305e-05, + "loss": 0.0224, + "step": 234280 + }, + { + "epoch": 1.51, + "learning_rate": 7.317554877143613e-05, + "loss": 0.0301, + "step": 234290 + }, + { + "epoch": 1.51, + "learning_rate": 7.31658674170792e-05, + "loss": 0.0272, + "step": 234300 + }, + { + "epoch": 1.51, + "learning_rate": 7.315618606272225e-05, + "loss": 0.0282, + "step": 234310 + }, + { + "epoch": 1.51, + "learning_rate": 7.314650470836533e-05, + "loss": 0.0288, + "step": 234320 + }, + { + "epoch": 1.51, + "learning_rate": 7.31368233540084e-05, + "loss": 0.0285, + "step": 234330 + }, + { + "epoch": 1.51, + "learning_rate": 7.312714199965146e-05, + "loss": 0.0233, + "step": 234340 + }, + { + "epoch": 1.51, + "learning_rate": 7.311746064529453e-05, + "loss": 0.0318, + "step": 234350 + }, + { + "epoch": 1.51, + "learning_rate": 7.310777929093761e-05, + "loss": 0.0288, + "step": 234360 + }, + { + "epoch": 1.51, + "learning_rate": 7.309809793658066e-05, + "loss": 0.0269, + "step": 234370 + }, + { + "epoch": 1.51, + "learning_rate": 7.308841658222373e-05, + "loss": 0.0254, + "step": 234380 + }, + { + "epoch": 1.51, + "learning_rate": 7.307873522786681e-05, + "loss": 0.0284, + "step": 234390 + }, + { + "epoch": 1.51, + "learning_rate": 7.306905387350988e-05, + "loss": 0.0273, + "step": 234400 + }, + { + "epoch": 1.51, + "learning_rate": 7.305937251915294e-05, + "loss": 0.0297, + "step": 234410 + }, + { + "epoch": 1.51, + "learning_rate": 7.304969116479601e-05, + "loss": 0.0322, + "step": 234420 + }, + { + "epoch": 1.51, + "learning_rate": 7.304000981043907e-05, + "loss": 0.0254, + "step": 234430 + }, + { + "epoch": 1.51, + "learning_rate": 7.303032845608214e-05, + "loss": 0.025, + "step": 234440 + }, + { + "epoch": 1.51, + "learning_rate": 7.30206471017252e-05, + "loss": 0.0326, + "step": 234450 + }, + { + "epoch": 1.51, + "learning_rate": 7.301096574736829e-05, + "loss": 0.0276, + "step": 234460 + }, + { + "epoch": 1.51, + "learning_rate": 7.300128439301134e-05, + "loss": 0.0235, + "step": 234470 + }, + { + "epoch": 1.51, + "learning_rate": 7.299160303865442e-05, + "loss": 0.0257, + "step": 234480 + }, + { + "epoch": 1.51, + "learning_rate": 7.298192168429749e-05, + "loss": 0.0293, + "step": 234490 + }, + { + "epoch": 1.51, + "learning_rate": 7.297224032994055e-05, + "loss": 0.0306, + "step": 234500 + }, + { + "epoch": 1.51, + "learning_rate": 7.296255897558362e-05, + "loss": 0.0227, + "step": 234510 + }, + { + "epoch": 1.51, + "learning_rate": 7.295287762122668e-05, + "loss": 0.025, + "step": 234520 + }, + { + "epoch": 1.51, + "learning_rate": 7.294319626686975e-05, + "loss": 0.0229, + "step": 234530 + }, + { + "epoch": 1.51, + "learning_rate": 7.293351491251282e-05, + "loss": 0.0255, + "step": 234540 + }, + { + "epoch": 1.51, + "learning_rate": 7.29238335581559e-05, + "loss": 0.0234, + "step": 234550 + }, + { + "epoch": 1.51, + "learning_rate": 7.291415220379896e-05, + "loss": 0.035, + "step": 234560 + }, + { + "epoch": 1.51, + "learning_rate": 7.290447084944203e-05, + "loss": 0.0341, + "step": 234570 + }, + { + "epoch": 1.51, + "learning_rate": 7.28947894950851e-05, + "loss": 0.0209, + "step": 234580 + }, + { + "epoch": 1.51, + "learning_rate": 7.288510814072816e-05, + "loss": 0.0297, + "step": 234590 + }, + { + "epoch": 1.51, + "learning_rate": 7.287542678637123e-05, + "loss": 0.0273, + "step": 234600 + }, + { + "epoch": 1.51, + "learning_rate": 7.28657454320143e-05, + "loss": 0.0264, + "step": 234610 + }, + { + "epoch": 1.51, + "learning_rate": 7.285606407765737e-05, + "loss": 0.0264, + "step": 234620 + }, + { + "epoch": 1.51, + "learning_rate": 7.284638272330043e-05, + "loss": 0.0288, + "step": 234630 + }, + { + "epoch": 1.51, + "learning_rate": 7.28367013689435e-05, + "loss": 0.0266, + "step": 234640 + }, + { + "epoch": 1.51, + "learning_rate": 7.282702001458657e-05, + "loss": 0.0263, + "step": 234650 + }, + { + "epoch": 1.51, + "learning_rate": 7.281733866022964e-05, + "loss": 0.0242, + "step": 234660 + }, + { + "epoch": 1.51, + "learning_rate": 7.28076573058727e-05, + "loss": 0.023, + "step": 234670 + }, + { + "epoch": 1.51, + "learning_rate": 7.279797595151577e-05, + "loss": 0.0285, + "step": 234680 + }, + { + "epoch": 1.51, + "learning_rate": 7.278829459715884e-05, + "loss": 0.0298, + "step": 234690 + }, + { + "epoch": 1.51, + "learning_rate": 7.27786132428019e-05, + "loss": 0.0267, + "step": 234700 + }, + { + "epoch": 1.51, + "learning_rate": 7.276893188844498e-05, + "loss": 0.0248, + "step": 234710 + }, + { + "epoch": 1.51, + "learning_rate": 7.275925053408805e-05, + "loss": 0.0252, + "step": 234720 + }, + { + "epoch": 1.51, + "learning_rate": 7.27495691797311e-05, + "loss": 0.0276, + "step": 234730 + }, + { + "epoch": 1.52, + "learning_rate": 7.273988782537418e-05, + "loss": 0.026, + "step": 234740 + }, + { + "epoch": 1.52, + "learning_rate": 7.273020647101725e-05, + "loss": 0.0291, + "step": 234750 + }, + { + "epoch": 1.52, + "learning_rate": 7.272052511666031e-05, + "loss": 0.0305, + "step": 234760 + }, + { + "epoch": 1.52, + "learning_rate": 7.271084376230338e-05, + "loss": 0.0225, + "step": 234770 + }, + { + "epoch": 1.52, + "learning_rate": 7.270116240794645e-05, + "loss": 0.0292, + "step": 234780 + }, + { + "epoch": 1.52, + "learning_rate": 7.269148105358951e-05, + "loss": 0.0249, + "step": 234790 + }, + { + "epoch": 1.52, + "learning_rate": 7.268179969923258e-05, + "loss": 0.0229, + "step": 234800 + }, + { + "epoch": 1.52, + "learning_rate": 7.267211834487566e-05, + "loss": 0.0233, + "step": 234810 + }, + { + "epoch": 1.52, + "learning_rate": 7.266243699051873e-05, + "loss": 0.0269, + "step": 234820 + }, + { + "epoch": 1.52, + "learning_rate": 7.265275563616179e-05, + "loss": 0.0241, + "step": 234830 + }, + { + "epoch": 1.52, + "learning_rate": 7.264307428180486e-05, + "loss": 0.0272, + "step": 234840 + }, + { + "epoch": 1.52, + "learning_rate": 7.263339292744792e-05, + "loss": 0.0302, + "step": 234850 + }, + { + "epoch": 1.52, + "learning_rate": 7.262371157309099e-05, + "loss": 0.0251, + "step": 234860 + }, + { + "epoch": 1.52, + "learning_rate": 7.261403021873406e-05, + "loss": 0.0233, + "step": 234870 + }, + { + "epoch": 1.52, + "learning_rate": 7.260434886437712e-05, + "loss": 0.0266, + "step": 234880 + }, + { + "epoch": 1.52, + "learning_rate": 7.259466751002019e-05, + "loss": 0.0351, + "step": 234890 + }, + { + "epoch": 1.52, + "learning_rate": 7.258498615566327e-05, + "loss": 0.0327, + "step": 234900 + }, + { + "epoch": 1.52, + "learning_rate": 7.257530480130633e-05, + "loss": 0.026, + "step": 234910 + }, + { + "epoch": 1.52, + "learning_rate": 7.25656234469494e-05, + "loss": 0.0254, + "step": 234920 + }, + { + "epoch": 1.52, + "learning_rate": 7.255594209259247e-05, + "loss": 0.0276, + "step": 234930 + }, + { + "epoch": 1.52, + "learning_rate": 7.254626073823553e-05, + "loss": 0.0296, + "step": 234940 + }, + { + "epoch": 1.52, + "learning_rate": 7.25365793838786e-05, + "loss": 0.0263, + "step": 234950 + }, + { + "epoch": 1.52, + "learning_rate": 7.252689802952167e-05, + "loss": 0.0282, + "step": 234960 + }, + { + "epoch": 1.52, + "learning_rate": 7.251721667516475e-05, + "loss": 0.0293, + "step": 234970 + }, + { + "epoch": 1.52, + "learning_rate": 7.25075353208078e-05, + "loss": 0.0327, + "step": 234980 + }, + { + "epoch": 1.52, + "learning_rate": 7.249785396645086e-05, + "loss": 0.0232, + "step": 234990 + }, + { + "epoch": 1.52, + "learning_rate": 7.248817261209394e-05, + "loss": 0.0258, + "step": 235000 + }, + { + "epoch": 1.52, + "eval_cer": 0.9198888261213423, + "eval_loss": 0.019709018990397453, + "eval_runtime": 120.2635, + "eval_samples_per_second": 16.63, + "eval_steps_per_second": 4.158, + "step": 235000 + }, + { + "epoch": 1.52, + "learning_rate": 7.247849125773701e-05, + "loss": 0.0354, + "step": 235010 + }, + { + "epoch": 1.52, + "learning_rate": 7.246880990338008e-05, + "loss": 0.0305, + "step": 235020 + }, + { + "epoch": 1.52, + "learning_rate": 7.245912854902314e-05, + "loss": 0.0266, + "step": 235030 + }, + { + "epoch": 1.52, + "learning_rate": 7.244944719466621e-05, + "loss": 0.0355, + "step": 235040 + }, + { + "epoch": 1.52, + "learning_rate": 7.243976584030928e-05, + "loss": 0.0263, + "step": 235050 + }, + { + "epoch": 1.52, + "learning_rate": 7.243008448595234e-05, + "loss": 0.0246, + "step": 235060 + }, + { + "epoch": 1.52, + "learning_rate": 7.242040313159542e-05, + "loss": 0.031, + "step": 235070 + }, + { + "epoch": 1.52, + "learning_rate": 7.241072177723847e-05, + "loss": 0.0277, + "step": 235080 + }, + { + "epoch": 1.52, + "learning_rate": 7.240104042288155e-05, + "loss": 0.0258, + "step": 235090 + }, + { + "epoch": 1.52, + "learning_rate": 7.239135906852462e-05, + "loss": 0.0264, + "step": 235100 + }, + { + "epoch": 1.52, + "learning_rate": 7.238167771416769e-05, + "loss": 0.0276, + "step": 235110 + }, + { + "epoch": 1.52, + "learning_rate": 7.237199635981075e-05, + "loss": 0.026, + "step": 235120 + }, + { + "epoch": 1.52, + "learning_rate": 7.236231500545382e-05, + "loss": 0.0277, + "step": 235130 + }, + { + "epoch": 1.52, + "learning_rate": 7.235263365109689e-05, + "loss": 0.0246, + "step": 235140 + }, + { + "epoch": 1.52, + "learning_rate": 7.234295229673995e-05, + "loss": 0.028, + "step": 235150 + }, + { + "epoch": 1.52, + "learning_rate": 7.233327094238303e-05, + "loss": 0.0241, + "step": 235160 + }, + { + "epoch": 1.52, + "learning_rate": 7.23235895880261e-05, + "loss": 0.0272, + "step": 235170 + }, + { + "epoch": 1.52, + "learning_rate": 7.231390823366916e-05, + "loss": 0.0267, + "step": 235180 + }, + { + "epoch": 1.52, + "learning_rate": 7.230422687931223e-05, + "loss": 0.0297, + "step": 235190 + }, + { + "epoch": 1.52, + "learning_rate": 7.22945455249553e-05, + "loss": 0.029, + "step": 235200 + }, + { + "epoch": 1.52, + "learning_rate": 7.228486417059836e-05, + "loss": 0.0283, + "step": 235210 + }, + { + "epoch": 1.52, + "learning_rate": 7.227518281624143e-05, + "loss": 0.0279, + "step": 235220 + }, + { + "epoch": 1.52, + "learning_rate": 7.226550146188451e-05, + "loss": 0.0269, + "step": 235230 + }, + { + "epoch": 1.52, + "learning_rate": 7.225582010752756e-05, + "loss": 0.0249, + "step": 235240 + }, + { + "epoch": 1.52, + "learning_rate": 7.224613875317064e-05, + "loss": 0.0221, + "step": 235250 + }, + { + "epoch": 1.52, + "learning_rate": 7.223645739881371e-05, + "loss": 0.0298, + "step": 235260 + }, + { + "epoch": 1.52, + "learning_rate": 7.222677604445677e-05, + "loss": 0.0286, + "step": 235270 + }, + { + "epoch": 1.52, + "learning_rate": 7.221709469009984e-05, + "loss": 0.0275, + "step": 235280 + }, + { + "epoch": 1.52, + "learning_rate": 7.22074133357429e-05, + "loss": 0.0252, + "step": 235290 + }, + { + "epoch": 1.52, + "learning_rate": 7.219773198138597e-05, + "loss": 0.0231, + "step": 235300 + }, + { + "epoch": 1.52, + "learning_rate": 7.218805062702904e-05, + "loss": 0.0276, + "step": 235310 + }, + { + "epoch": 1.52, + "learning_rate": 7.217836927267212e-05, + "loss": 0.0253, + "step": 235320 + }, + { + "epoch": 1.52, + "learning_rate": 7.216868791831518e-05, + "loss": 0.03, + "step": 235330 + }, + { + "epoch": 1.52, + "learning_rate": 7.215900656395824e-05, + "loss": 0.0285, + "step": 235340 + }, + { + "epoch": 1.52, + "learning_rate": 7.214932520960132e-05, + "loss": 0.028, + "step": 235350 + }, + { + "epoch": 1.52, + "learning_rate": 7.213964385524438e-05, + "loss": 0.0255, + "step": 235360 + }, + { + "epoch": 1.52, + "learning_rate": 7.212996250088745e-05, + "loss": 0.0258, + "step": 235370 + }, + { + "epoch": 1.52, + "learning_rate": 7.212028114653052e-05, + "loss": 0.0357, + "step": 235380 + }, + { + "epoch": 1.52, + "learning_rate": 7.21105997921736e-05, + "loss": 0.0245, + "step": 235390 + }, + { + "epoch": 1.52, + "learning_rate": 7.210091843781665e-05, + "loss": 0.027, + "step": 235400 + }, + { + "epoch": 1.52, + "learning_rate": 7.209123708345971e-05, + "loss": 0.0265, + "step": 235410 + }, + { + "epoch": 1.52, + "learning_rate": 7.20815557291028e-05, + "loss": 0.0254, + "step": 235420 + }, + { + "epoch": 1.52, + "learning_rate": 7.207187437474586e-05, + "loss": 0.0253, + "step": 235430 + }, + { + "epoch": 1.52, + "learning_rate": 7.206219302038893e-05, + "loss": 0.0281, + "step": 235440 + }, + { + "epoch": 1.52, + "learning_rate": 7.205251166603199e-05, + "loss": 0.0265, + "step": 235450 + }, + { + "epoch": 1.52, + "learning_rate": 7.204283031167506e-05, + "loss": 0.0304, + "step": 235460 + }, + { + "epoch": 1.52, + "learning_rate": 7.203314895731813e-05, + "loss": 0.0254, + "step": 235470 + }, + { + "epoch": 1.52, + "learning_rate": 7.202346760296119e-05, + "loss": 0.0294, + "step": 235480 + }, + { + "epoch": 1.52, + "learning_rate": 7.201378624860427e-05, + "loss": 0.025, + "step": 235490 + }, + { + "epoch": 1.52, + "learning_rate": 7.200410489424732e-05, + "loss": 0.0204, + "step": 235500 + }, + { + "epoch": 1.52, + "learning_rate": 7.19944235398904e-05, + "loss": 0.0311, + "step": 235510 + }, + { + "epoch": 1.52, + "learning_rate": 7.198474218553347e-05, + "loss": 0.0213, + "step": 235520 + }, + { + "epoch": 1.52, + "learning_rate": 7.197506083117654e-05, + "loss": 0.0293, + "step": 235530 + }, + { + "epoch": 1.52, + "learning_rate": 7.19653794768196e-05, + "loss": 0.0272, + "step": 235540 + }, + { + "epoch": 1.52, + "learning_rate": 7.195569812246267e-05, + "loss": 0.0243, + "step": 235550 + }, + { + "epoch": 1.52, + "learning_rate": 7.194601676810574e-05, + "loss": 0.0291, + "step": 235560 + }, + { + "epoch": 1.52, + "learning_rate": 7.19363354137488e-05, + "loss": 0.0251, + "step": 235570 + }, + { + "epoch": 1.52, + "learning_rate": 7.192665405939188e-05, + "loss": 0.0224, + "step": 235580 + }, + { + "epoch": 1.52, + "learning_rate": 7.191697270503495e-05, + "loss": 0.0244, + "step": 235590 + }, + { + "epoch": 1.52, + "learning_rate": 7.190729135067801e-05, + "loss": 0.026, + "step": 235600 + }, + { + "epoch": 1.52, + "learning_rate": 7.189760999632108e-05, + "loss": 0.029, + "step": 235610 + }, + { + "epoch": 1.52, + "learning_rate": 7.188792864196415e-05, + "loss": 0.025, + "step": 235620 + }, + { + "epoch": 1.52, + "learning_rate": 7.187824728760721e-05, + "loss": 0.0283, + "step": 235630 + }, + { + "epoch": 1.52, + "learning_rate": 7.186856593325028e-05, + "loss": 0.0265, + "step": 235640 + }, + { + "epoch": 1.52, + "learning_rate": 7.185888457889336e-05, + "loss": 0.0256, + "step": 235650 + }, + { + "epoch": 1.52, + "learning_rate": 7.184920322453641e-05, + "loss": 0.0335, + "step": 235660 + }, + { + "epoch": 1.52, + "learning_rate": 7.183952187017949e-05, + "loss": 0.0282, + "step": 235670 + }, + { + "epoch": 1.52, + "learning_rate": 7.182984051582256e-05, + "loss": 0.0278, + "step": 235680 + }, + { + "epoch": 1.52, + "learning_rate": 7.182015916146562e-05, + "loss": 0.0302, + "step": 235690 + }, + { + "epoch": 1.52, + "learning_rate": 7.181047780710869e-05, + "loss": 0.0334, + "step": 235700 + }, + { + "epoch": 1.52, + "learning_rate": 7.180079645275176e-05, + "loss": 0.0333, + "step": 235710 + }, + { + "epoch": 1.52, + "learning_rate": 7.179111509839482e-05, + "loss": 0.0231, + "step": 235720 + }, + { + "epoch": 1.52, + "learning_rate": 7.178143374403789e-05, + "loss": 0.0255, + "step": 235730 + }, + { + "epoch": 1.52, + "learning_rate": 7.177175238968097e-05, + "loss": 0.0273, + "step": 235740 + }, + { + "epoch": 1.52, + "learning_rate": 7.176207103532403e-05, + "loss": 0.0282, + "step": 235750 + }, + { + "epoch": 1.52, + "learning_rate": 7.175238968096709e-05, + "loss": 0.0268, + "step": 235760 + }, + { + "epoch": 1.52, + "learning_rate": 7.174270832661017e-05, + "loss": 0.0263, + "step": 235770 + }, + { + "epoch": 1.52, + "learning_rate": 7.173302697225323e-05, + "loss": 0.0243, + "step": 235780 + }, + { + "epoch": 1.52, + "learning_rate": 7.17233456178963e-05, + "loss": 0.0288, + "step": 235790 + }, + { + "epoch": 1.52, + "learning_rate": 7.171366426353937e-05, + "loss": 0.0269, + "step": 235800 + }, + { + "epoch": 1.52, + "learning_rate": 7.170398290918245e-05, + "loss": 0.028, + "step": 235810 + }, + { + "epoch": 1.52, + "learning_rate": 7.16943015548255e-05, + "loss": 0.0267, + "step": 235820 + }, + { + "epoch": 1.52, + "learning_rate": 7.168462020046856e-05, + "loss": 0.027, + "step": 235830 + }, + { + "epoch": 1.52, + "learning_rate": 7.167493884611164e-05, + "loss": 0.03, + "step": 235840 + }, + { + "epoch": 1.52, + "learning_rate": 7.166525749175471e-05, + "loss": 0.0349, + "step": 235850 + }, + { + "epoch": 1.52, + "learning_rate": 7.165557613739778e-05, + "loss": 0.0247, + "step": 235860 + }, + { + "epoch": 1.52, + "learning_rate": 7.164589478304084e-05, + "loss": 0.0303, + "step": 235870 + }, + { + "epoch": 1.52, + "learning_rate": 7.163621342868391e-05, + "loss": 0.025, + "step": 235880 + }, + { + "epoch": 1.52, + "learning_rate": 7.162653207432698e-05, + "loss": 0.0253, + "step": 235890 + }, + { + "epoch": 1.52, + "learning_rate": 7.161685071997004e-05, + "loss": 0.0267, + "step": 235900 + }, + { + "epoch": 1.52, + "learning_rate": 7.160716936561312e-05, + "loss": 0.0204, + "step": 235910 + }, + { + "epoch": 1.52, + "learning_rate": 7.159748801125617e-05, + "loss": 0.0288, + "step": 235920 + }, + { + "epoch": 1.52, + "learning_rate": 7.158780665689925e-05, + "loss": 0.0274, + "step": 235930 + }, + { + "epoch": 1.52, + "learning_rate": 7.157812530254232e-05, + "loss": 0.0242, + "step": 235940 + }, + { + "epoch": 1.52, + "learning_rate": 7.156844394818539e-05, + "loss": 0.0281, + "step": 235950 + }, + { + "epoch": 1.52, + "learning_rate": 7.155876259382845e-05, + "loss": 0.0266, + "step": 235960 + }, + { + "epoch": 1.52, + "learning_rate": 7.154908123947152e-05, + "loss": 0.0235, + "step": 235970 + }, + { + "epoch": 1.52, + "learning_rate": 7.153939988511459e-05, + "loss": 0.028, + "step": 235980 + }, + { + "epoch": 1.52, + "learning_rate": 7.152971853075765e-05, + "loss": 0.0279, + "step": 235990 + }, + { + "epoch": 1.52, + "learning_rate": 7.152003717640073e-05, + "loss": 0.0272, + "step": 236000 + }, + { + "epoch": 1.52, + "eval_cer": 0.9198336911083493, + "eval_loss": 0.019630778580904007, + "eval_runtime": 120.0957, + "eval_samples_per_second": 16.653, + "eval_steps_per_second": 4.163, + "step": 236000 + }, + { + "epoch": 1.52, + "learning_rate": 7.15103558220438e-05, + "loss": 0.0283, + "step": 236010 + }, + { + "epoch": 1.52, + "learning_rate": 7.150067446768686e-05, + "loss": 0.0277, + "step": 236020 + }, + { + "epoch": 1.52, + "learning_rate": 7.149099311332993e-05, + "loss": 0.031, + "step": 236030 + }, + { + "epoch": 1.52, + "learning_rate": 7.1481311758973e-05, + "loss": 0.025, + "step": 236040 + }, + { + "epoch": 1.52, + "learning_rate": 7.147163040461606e-05, + "loss": 0.0232, + "step": 236050 + }, + { + "epoch": 1.52, + "learning_rate": 7.146194905025913e-05, + "loss": 0.0339, + "step": 236060 + }, + { + "epoch": 1.52, + "learning_rate": 7.145226769590221e-05, + "loss": 0.0262, + "step": 236070 + }, + { + "epoch": 1.52, + "learning_rate": 7.144258634154526e-05, + "loss": 0.0252, + "step": 236080 + }, + { + "epoch": 1.52, + "learning_rate": 7.143290498718834e-05, + "loss": 0.0237, + "step": 236090 + }, + { + "epoch": 1.52, + "learning_rate": 7.142322363283141e-05, + "loss": 0.0231, + "step": 236100 + }, + { + "epoch": 1.52, + "learning_rate": 7.141354227847447e-05, + "loss": 0.026, + "step": 236110 + }, + { + "epoch": 1.52, + "learning_rate": 7.140386092411754e-05, + "loss": 0.0261, + "step": 236120 + }, + { + "epoch": 1.52, + "learning_rate": 7.13941795697606e-05, + "loss": 0.0294, + "step": 236130 + }, + { + "epoch": 1.52, + "learning_rate": 7.138449821540367e-05, + "loss": 0.0245, + "step": 236140 + }, + { + "epoch": 1.52, + "learning_rate": 7.137481686104674e-05, + "loss": 0.0246, + "step": 236150 + }, + { + "epoch": 1.52, + "learning_rate": 7.136513550668982e-05, + "loss": 0.0305, + "step": 236160 + }, + { + "epoch": 1.52, + "learning_rate": 7.135545415233288e-05, + "loss": 0.0268, + "step": 236170 + }, + { + "epoch": 1.52, + "learning_rate": 7.134577279797594e-05, + "loss": 0.0203, + "step": 236180 + }, + { + "epoch": 1.52, + "learning_rate": 7.133609144361902e-05, + "loss": 0.0296, + "step": 236190 + }, + { + "epoch": 1.52, + "learning_rate": 7.132641008926208e-05, + "loss": 0.0235, + "step": 236200 + }, + { + "epoch": 1.52, + "learning_rate": 7.131672873490515e-05, + "loss": 0.0232, + "step": 236210 + }, + { + "epoch": 1.52, + "learning_rate": 7.130704738054822e-05, + "loss": 0.024, + "step": 236220 + }, + { + "epoch": 1.52, + "learning_rate": 7.129736602619128e-05, + "loss": 0.0299, + "step": 236230 + }, + { + "epoch": 1.52, + "learning_rate": 7.128768467183435e-05, + "loss": 0.0297, + "step": 236240 + }, + { + "epoch": 1.52, + "learning_rate": 7.127800331747741e-05, + "loss": 0.0258, + "step": 236250 + }, + { + "epoch": 1.52, + "learning_rate": 7.12683219631205e-05, + "loss": 0.0217, + "step": 236260 + }, + { + "epoch": 1.52, + "learning_rate": 7.125864060876356e-05, + "loss": 0.0261, + "step": 236270 + }, + { + "epoch": 1.53, + "learning_rate": 7.124895925440663e-05, + "loss": 0.0255, + "step": 236280 + }, + { + "epoch": 1.53, + "learning_rate": 7.123927790004969e-05, + "loss": 0.0259, + "step": 236290 + }, + { + "epoch": 1.53, + "learning_rate": 7.122959654569276e-05, + "loss": 0.0256, + "step": 236300 + }, + { + "epoch": 1.53, + "learning_rate": 7.121991519133583e-05, + "loss": 0.025, + "step": 236310 + }, + { + "epoch": 1.53, + "learning_rate": 7.121023383697889e-05, + "loss": 0.0297, + "step": 236320 + }, + { + "epoch": 1.53, + "learning_rate": 7.120055248262196e-05, + "loss": 0.0287, + "step": 236330 + }, + { + "epoch": 1.53, + "learning_rate": 7.119087112826502e-05, + "loss": 0.0225, + "step": 236340 + }, + { + "epoch": 1.53, + "learning_rate": 7.11811897739081e-05, + "loss": 0.0262, + "step": 236350 + }, + { + "epoch": 1.53, + "learning_rate": 7.117150841955117e-05, + "loss": 0.0282, + "step": 236360 + }, + { + "epoch": 1.53, + "learning_rate": 7.116182706519424e-05, + "loss": 0.0268, + "step": 236370 + }, + { + "epoch": 1.53, + "learning_rate": 7.11521457108373e-05, + "loss": 0.0323, + "step": 236380 + }, + { + "epoch": 1.53, + "learning_rate": 7.114246435648037e-05, + "loss": 0.0275, + "step": 236390 + }, + { + "epoch": 1.53, + "learning_rate": 7.113278300212343e-05, + "loss": 0.0237, + "step": 236400 + }, + { + "epoch": 1.53, + "learning_rate": 7.11231016477665e-05, + "loss": 0.0258, + "step": 236410 + }, + { + "epoch": 1.53, + "learning_rate": 7.111342029340958e-05, + "loss": 0.0333, + "step": 236420 + }, + { + "epoch": 1.53, + "learning_rate": 7.110373893905263e-05, + "loss": 0.0258, + "step": 236430 + }, + { + "epoch": 1.53, + "learning_rate": 7.109405758469571e-05, + "loss": 0.029, + "step": 236440 + }, + { + "epoch": 1.53, + "learning_rate": 7.108437623033878e-05, + "loss": 0.0298, + "step": 236450 + }, + { + "epoch": 1.53, + "learning_rate": 7.107469487598185e-05, + "loss": 0.0223, + "step": 236460 + }, + { + "epoch": 1.53, + "learning_rate": 7.106501352162491e-05, + "loss": 0.0266, + "step": 236470 + }, + { + "epoch": 1.53, + "learning_rate": 7.105533216726798e-05, + "loss": 0.0339, + "step": 236480 + }, + { + "epoch": 1.53, + "learning_rate": 7.104565081291104e-05, + "loss": 0.0274, + "step": 236490 + }, + { + "epoch": 1.53, + "learning_rate": 7.103596945855411e-05, + "loss": 0.0248, + "step": 236500 + }, + { + "epoch": 1.53, + "learning_rate": 7.102628810419719e-05, + "loss": 0.0351, + "step": 236510 + }, + { + "epoch": 1.53, + "learning_rate": 7.101660674984026e-05, + "loss": 0.0202, + "step": 236520 + }, + { + "epoch": 1.53, + "learning_rate": 7.100692539548331e-05, + "loss": 0.0248, + "step": 236530 + }, + { + "epoch": 1.53, + "learning_rate": 7.099724404112639e-05, + "loss": 0.0258, + "step": 236540 + }, + { + "epoch": 1.53, + "learning_rate": 7.098756268676946e-05, + "loss": 0.026, + "step": 236550 + }, + { + "epoch": 1.53, + "learning_rate": 7.097788133241252e-05, + "loss": 0.0295, + "step": 236560 + }, + { + "epoch": 1.53, + "learning_rate": 7.096819997805559e-05, + "loss": 0.0334, + "step": 236570 + }, + { + "epoch": 1.53, + "learning_rate": 7.095851862369867e-05, + "loss": 0.0221, + "step": 236580 + }, + { + "epoch": 1.53, + "learning_rate": 7.094883726934172e-05, + "loss": 0.0213, + "step": 236590 + }, + { + "epoch": 1.53, + "learning_rate": 7.093915591498479e-05, + "loss": 0.0252, + "step": 236600 + }, + { + "epoch": 1.53, + "learning_rate": 7.092947456062787e-05, + "loss": 0.0262, + "step": 236610 + }, + { + "epoch": 1.53, + "learning_rate": 7.091979320627093e-05, + "loss": 0.0272, + "step": 236620 + }, + { + "epoch": 1.53, + "learning_rate": 7.0910111851914e-05, + "loss": 0.0295, + "step": 236630 + }, + { + "epoch": 1.53, + "learning_rate": 7.090043049755707e-05, + "loss": 0.0291, + "step": 236640 + }, + { + "epoch": 1.53, + "learning_rate": 7.089074914320013e-05, + "loss": 0.0263, + "step": 236650 + }, + { + "epoch": 1.53, + "learning_rate": 7.08810677888432e-05, + "loss": 0.0257, + "step": 236660 + }, + { + "epoch": 1.53, + "learning_rate": 7.087138643448626e-05, + "loss": 0.0221, + "step": 236670 + }, + { + "epoch": 1.53, + "learning_rate": 7.086170508012934e-05, + "loss": 0.024, + "step": 236680 + }, + { + "epoch": 1.53, + "learning_rate": 7.08520237257724e-05, + "loss": 0.0314, + "step": 236690 + }, + { + "epoch": 1.53, + "learning_rate": 7.084234237141548e-05, + "loss": 0.0249, + "step": 236700 + }, + { + "epoch": 1.53, + "learning_rate": 7.083266101705854e-05, + "loss": 0.0234, + "step": 236710 + }, + { + "epoch": 1.53, + "learning_rate": 7.082297966270161e-05, + "loss": 0.0315, + "step": 236720 + }, + { + "epoch": 1.53, + "learning_rate": 7.081329830834467e-05, + "loss": 0.0263, + "step": 236730 + }, + { + "epoch": 1.53, + "learning_rate": 7.080361695398774e-05, + "loss": 0.023, + "step": 236740 + }, + { + "epoch": 1.53, + "learning_rate": 7.079393559963081e-05, + "loss": 0.0326, + "step": 236750 + }, + { + "epoch": 1.53, + "learning_rate": 7.078425424527387e-05, + "loss": 0.0284, + "step": 236760 + }, + { + "epoch": 1.53, + "learning_rate": 7.077457289091695e-05, + "loss": 0.026, + "step": 236770 + }, + { + "epoch": 1.53, + "learning_rate": 7.076489153656002e-05, + "loss": 0.0279, + "step": 236780 + }, + { + "epoch": 1.53, + "learning_rate": 7.075521018220307e-05, + "loss": 0.0267, + "step": 236790 + }, + { + "epoch": 1.53, + "learning_rate": 7.074552882784615e-05, + "loss": 0.0241, + "step": 236800 + }, + { + "epoch": 1.53, + "learning_rate": 7.073584747348922e-05, + "loss": 0.0266, + "step": 236810 + }, + { + "epoch": 1.53, + "learning_rate": 7.072616611913228e-05, + "loss": 0.0242, + "step": 236820 + }, + { + "epoch": 1.53, + "learning_rate": 7.071648476477535e-05, + "loss": 0.0279, + "step": 236830 + }, + { + "epoch": 1.53, + "learning_rate": 7.070680341041843e-05, + "loss": 0.0278, + "step": 236840 + }, + { + "epoch": 1.53, + "learning_rate": 7.069712205606148e-05, + "loss": 0.0312, + "step": 236850 + }, + { + "epoch": 1.53, + "learning_rate": 7.068744070170455e-05, + "loss": 0.0274, + "step": 236860 + }, + { + "epoch": 1.53, + "learning_rate": 7.067775934734763e-05, + "loss": 0.0298, + "step": 236870 + }, + { + "epoch": 1.53, + "learning_rate": 7.06680779929907e-05, + "loss": 0.0268, + "step": 236880 + }, + { + "epoch": 1.53, + "learning_rate": 7.065839663863376e-05, + "loss": 0.028, + "step": 236890 + }, + { + "epoch": 1.53, + "learning_rate": 7.064871528427683e-05, + "loss": 0.024, + "step": 236900 + }, + { + "epoch": 1.53, + "learning_rate": 7.06390339299199e-05, + "loss": 0.0265, + "step": 236910 + }, + { + "epoch": 1.53, + "learning_rate": 7.062935257556296e-05, + "loss": 0.0288, + "step": 236920 + }, + { + "epoch": 1.53, + "learning_rate": 7.061967122120603e-05, + "loss": 0.0278, + "step": 236930 + }, + { + "epoch": 1.53, + "learning_rate": 7.06099898668491e-05, + "loss": 0.0253, + "step": 236940 + }, + { + "epoch": 1.53, + "learning_rate": 7.060030851249216e-05, + "loss": 0.028, + "step": 236950 + }, + { + "epoch": 1.53, + "learning_rate": 7.059062715813524e-05, + "loss": 0.0237, + "step": 236960 + }, + { + "epoch": 1.53, + "learning_rate": 7.05809458037783e-05, + "loss": 0.0352, + "step": 236970 + }, + { + "epoch": 1.53, + "learning_rate": 7.057126444942137e-05, + "loss": 0.0235, + "step": 236980 + }, + { + "epoch": 1.53, + "learning_rate": 7.056158309506444e-05, + "loss": 0.031, + "step": 236990 + }, + { + "epoch": 1.53, + "learning_rate": 7.05519017407075e-05, + "loss": 0.0261, + "step": 237000 + }, + { + "epoch": 1.53, + "eval_cer": 0.9198870184159982, + "eval_loss": 0.019820256158709526, + "eval_runtime": 120.3827, + "eval_samples_per_second": 16.614, + "eval_steps_per_second": 4.153, + "step": 237000 + }, + { + "epoch": 1.53, + "learning_rate": 7.054222038635057e-05, + "loss": 0.0272, + "step": 237010 + }, + { + "epoch": 1.53, + "learning_rate": 7.053253903199364e-05, + "loss": 0.02, + "step": 237020 + }, + { + "epoch": 1.53, + "learning_rate": 7.052285767763672e-05, + "loss": 0.0271, + "step": 237030 + }, + { + "epoch": 1.53, + "learning_rate": 7.051317632327978e-05, + "loss": 0.0267, + "step": 237040 + }, + { + "epoch": 1.53, + "learning_rate": 7.050349496892285e-05, + "loss": 0.025, + "step": 237050 + }, + { + "epoch": 1.53, + "learning_rate": 7.049381361456592e-05, + "loss": 0.0304, + "step": 237060 + }, + { + "epoch": 1.53, + "learning_rate": 7.048413226020898e-05, + "loss": 0.0261, + "step": 237070 + }, + { + "epoch": 1.53, + "learning_rate": 7.047445090585205e-05, + "loss": 0.0267, + "step": 237080 + }, + { + "epoch": 1.53, + "learning_rate": 7.046476955149511e-05, + "loss": 0.0262, + "step": 237090 + }, + { + "epoch": 1.53, + "learning_rate": 7.04550881971382e-05, + "loss": 0.03, + "step": 237100 + }, + { + "epoch": 1.53, + "learning_rate": 7.044540684278125e-05, + "loss": 0.0267, + "step": 237110 + }, + { + "epoch": 1.53, + "learning_rate": 7.043572548842433e-05, + "loss": 0.0261, + "step": 237120 + }, + { + "epoch": 1.53, + "learning_rate": 7.042604413406739e-05, + "loss": 0.0239, + "step": 237130 + }, + { + "epoch": 1.53, + "learning_rate": 7.041636277971046e-05, + "loss": 0.0301, + "step": 237140 + }, + { + "epoch": 1.53, + "learning_rate": 7.040668142535352e-05, + "loss": 0.0271, + "step": 237150 + }, + { + "epoch": 1.53, + "learning_rate": 7.039700007099659e-05, + "loss": 0.0273, + "step": 237160 + }, + { + "epoch": 1.53, + "learning_rate": 7.038731871663966e-05, + "loss": 0.0273, + "step": 237170 + }, + { + "epoch": 1.53, + "learning_rate": 7.037763736228272e-05, + "loss": 0.0282, + "step": 237180 + }, + { + "epoch": 1.53, + "learning_rate": 7.03679560079258e-05, + "loss": 0.0268, + "step": 237190 + }, + { + "epoch": 1.53, + "learning_rate": 7.035827465356887e-05, + "loss": 0.0291, + "step": 237200 + }, + { + "epoch": 1.53, + "learning_rate": 7.034859329921192e-05, + "loss": 0.029, + "step": 237210 + }, + { + "epoch": 1.53, + "learning_rate": 7.0338911944855e-05, + "loss": 0.0234, + "step": 237220 + }, + { + "epoch": 1.53, + "learning_rate": 7.032923059049807e-05, + "loss": 0.0284, + "step": 237230 + }, + { + "epoch": 1.53, + "learning_rate": 7.031954923614113e-05, + "loss": 0.0262, + "step": 237240 + }, + { + "epoch": 1.53, + "learning_rate": 7.03098678817842e-05, + "loss": 0.0293, + "step": 237250 + }, + { + "epoch": 1.53, + "learning_rate": 7.030018652742728e-05, + "loss": 0.025, + "step": 237260 + }, + { + "epoch": 1.53, + "learning_rate": 7.029050517307033e-05, + "loss": 0.0286, + "step": 237270 + }, + { + "epoch": 1.53, + "learning_rate": 7.02808238187134e-05, + "loss": 0.0269, + "step": 237280 + }, + { + "epoch": 1.53, + "learning_rate": 7.027114246435648e-05, + "loss": 0.0324, + "step": 237290 + }, + { + "epoch": 1.53, + "learning_rate": 7.026146110999955e-05, + "loss": 0.03, + "step": 237300 + }, + { + "epoch": 1.53, + "learning_rate": 7.025177975564261e-05, + "loss": 0.0237, + "step": 237310 + }, + { + "epoch": 1.53, + "learning_rate": 7.024209840128568e-05, + "loss": 0.0279, + "step": 237320 + }, + { + "epoch": 1.53, + "learning_rate": 7.023241704692874e-05, + "loss": 0.0241, + "step": 237330 + }, + { + "epoch": 1.53, + "learning_rate": 7.022273569257181e-05, + "loss": 0.0247, + "step": 237340 + }, + { + "epoch": 1.53, + "learning_rate": 7.021305433821488e-05, + "loss": 0.0319, + "step": 237350 + }, + { + "epoch": 1.53, + "learning_rate": 7.020337298385796e-05, + "loss": 0.0274, + "step": 237360 + }, + { + "epoch": 1.53, + "learning_rate": 7.019369162950101e-05, + "loss": 0.0251, + "step": 237370 + }, + { + "epoch": 1.53, + "learning_rate": 7.018401027514409e-05, + "loss": 0.0287, + "step": 237380 + }, + { + "epoch": 1.53, + "learning_rate": 7.017432892078716e-05, + "loss": 0.0265, + "step": 237390 + }, + { + "epoch": 1.53, + "learning_rate": 7.016464756643022e-05, + "loss": 0.0239, + "step": 237400 + }, + { + "epoch": 1.53, + "learning_rate": 7.015496621207329e-05, + "loss": 0.0237, + "step": 237410 + }, + { + "epoch": 1.53, + "learning_rate": 7.014528485771635e-05, + "loss": 0.0235, + "step": 237420 + }, + { + "epoch": 1.53, + "learning_rate": 7.013560350335942e-05, + "loss": 0.0343, + "step": 237430 + }, + { + "epoch": 1.53, + "learning_rate": 7.012592214900249e-05, + "loss": 0.0257, + "step": 237440 + }, + { + "epoch": 1.53, + "learning_rate": 7.011624079464557e-05, + "loss": 0.0274, + "step": 237450 + }, + { + "epoch": 1.53, + "learning_rate": 7.010655944028863e-05, + "loss": 0.0279, + "step": 237460 + }, + { + "epoch": 1.53, + "learning_rate": 7.00968780859317e-05, + "loss": 0.0258, + "step": 237470 + }, + { + "epoch": 1.53, + "learning_rate": 7.008719673157476e-05, + "loss": 0.0273, + "step": 237480 + }, + { + "epoch": 1.53, + "learning_rate": 7.007751537721783e-05, + "loss": 0.0235, + "step": 237490 + }, + { + "epoch": 1.53, + "learning_rate": 7.00678340228609e-05, + "loss": 0.0249, + "step": 237500 + }, + { + "epoch": 1.53, + "learning_rate": 7.005815266850396e-05, + "loss": 0.0255, + "step": 237510 + }, + { + "epoch": 1.53, + "learning_rate": 7.004847131414703e-05, + "loss": 0.021, + "step": 237520 + }, + { + "epoch": 1.53, + "learning_rate": 7.00387899597901e-05, + "loss": 0.0256, + "step": 237530 + }, + { + "epoch": 1.53, + "learning_rate": 7.002910860543318e-05, + "loss": 0.0254, + "step": 237540 + }, + { + "epoch": 1.53, + "learning_rate": 7.001942725107624e-05, + "loss": 0.0267, + "step": 237550 + }, + { + "epoch": 1.53, + "learning_rate": 7.000974589671931e-05, + "loss": 0.0257, + "step": 237560 + }, + { + "epoch": 1.53, + "learning_rate": 7.000006454236237e-05, + "loss": 0.023, + "step": 237570 + }, + { + "epoch": 1.53, + "learning_rate": 6.999038318800544e-05, + "loss": 0.0257, + "step": 237580 + }, + { + "epoch": 1.53, + "learning_rate": 6.998070183364851e-05, + "loss": 0.024, + "step": 237590 + }, + { + "epoch": 1.53, + "learning_rate": 6.997102047929157e-05, + "loss": 0.0232, + "step": 237600 + }, + { + "epoch": 1.53, + "learning_rate": 6.996133912493465e-05, + "loss": 0.0291, + "step": 237610 + }, + { + "epoch": 1.53, + "learning_rate": 6.995165777057772e-05, + "loss": 0.0233, + "step": 237620 + }, + { + "epoch": 1.53, + "learning_rate": 6.994197641622077e-05, + "loss": 0.0261, + "step": 237630 + }, + { + "epoch": 1.53, + "learning_rate": 6.993229506186385e-05, + "loss": 0.0333, + "step": 237640 + }, + { + "epoch": 1.53, + "learning_rate": 6.992261370750692e-05, + "loss": 0.0323, + "step": 237650 + }, + { + "epoch": 1.53, + "learning_rate": 6.991293235314998e-05, + "loss": 0.0299, + "step": 237660 + }, + { + "epoch": 1.53, + "learning_rate": 6.990325099879305e-05, + "loss": 0.0265, + "step": 237670 + }, + { + "epoch": 1.53, + "learning_rate": 6.989356964443612e-05, + "loss": 0.0221, + "step": 237680 + }, + { + "epoch": 1.53, + "learning_rate": 6.988388829007918e-05, + "loss": 0.0288, + "step": 237690 + }, + { + "epoch": 1.53, + "learning_rate": 6.987420693572225e-05, + "loss": 0.03, + "step": 237700 + }, + { + "epoch": 1.53, + "learning_rate": 6.986452558136533e-05, + "loss": 0.0289, + "step": 237710 + }, + { + "epoch": 1.53, + "learning_rate": 6.98548442270084e-05, + "loss": 0.0265, + "step": 237720 + }, + { + "epoch": 1.53, + "learning_rate": 6.984516287265146e-05, + "loss": 0.0309, + "step": 237730 + }, + { + "epoch": 1.53, + "learning_rate": 6.983548151829453e-05, + "loss": 0.0219, + "step": 237740 + }, + { + "epoch": 1.53, + "learning_rate": 6.98258001639376e-05, + "loss": 0.0247, + "step": 237750 + }, + { + "epoch": 1.53, + "learning_rate": 6.981611880958066e-05, + "loss": 0.026, + "step": 237760 + }, + { + "epoch": 1.53, + "learning_rate": 6.980643745522373e-05, + "loss": 0.0238, + "step": 237770 + }, + { + "epoch": 1.53, + "learning_rate": 6.979675610086679e-05, + "loss": 0.0269, + "step": 237780 + }, + { + "epoch": 1.53, + "learning_rate": 6.978707474650986e-05, + "loss": 0.0297, + "step": 237790 + }, + { + "epoch": 1.53, + "learning_rate": 6.977739339215294e-05, + "loss": 0.0259, + "step": 237800 + }, + { + "epoch": 1.53, + "learning_rate": 6.9767712037796e-05, + "loss": 0.0236, + "step": 237810 + }, + { + "epoch": 1.53, + "learning_rate": 6.975803068343907e-05, + "loss": 0.0273, + "step": 237820 + }, + { + "epoch": 1.54, + "learning_rate": 6.974834932908214e-05, + "loss": 0.0258, + "step": 237830 + }, + { + "epoch": 1.54, + "learning_rate": 6.97386679747252e-05, + "loss": 0.027, + "step": 237840 + }, + { + "epoch": 1.54, + "learning_rate": 6.972898662036827e-05, + "loss": 0.0259, + "step": 237850 + }, + { + "epoch": 1.54, + "learning_rate": 6.971930526601134e-05, + "loss": 0.0246, + "step": 237860 + }, + { + "epoch": 1.54, + "learning_rate": 6.970962391165442e-05, + "loss": 0.0232, + "step": 237870 + }, + { + "epoch": 1.54, + "learning_rate": 6.969994255729747e-05, + "loss": 0.0337, + "step": 237880 + }, + { + "epoch": 1.54, + "learning_rate": 6.969026120294055e-05, + "loss": 0.0248, + "step": 237890 + }, + { + "epoch": 1.54, + "learning_rate": 6.968057984858361e-05, + "loss": 0.0283, + "step": 237900 + }, + { + "epoch": 1.54, + "learning_rate": 6.967089849422668e-05, + "loss": 0.0264, + "step": 237910 + }, + { + "epoch": 1.54, + "learning_rate": 6.966121713986975e-05, + "loss": 0.0254, + "step": 237920 + }, + { + "epoch": 1.54, + "learning_rate": 6.965153578551281e-05, + "loss": 0.0285, + "step": 237930 + }, + { + "epoch": 1.54, + "learning_rate": 6.964185443115588e-05, + "loss": 0.0219, + "step": 237940 + }, + { + "epoch": 1.54, + "learning_rate": 6.963217307679895e-05, + "loss": 0.021, + "step": 237950 + }, + { + "epoch": 1.54, + "learning_rate": 6.962249172244203e-05, + "loss": 0.0253, + "step": 237960 + }, + { + "epoch": 1.54, + "learning_rate": 6.961281036808509e-05, + "loss": 0.028, + "step": 237970 + }, + { + "epoch": 1.54, + "learning_rate": 6.960312901372814e-05, + "loss": 0.0326, + "step": 237980 + }, + { + "epoch": 1.54, + "learning_rate": 6.959344765937122e-05, + "loss": 0.0261, + "step": 237990 + }, + { + "epoch": 1.54, + "learning_rate": 6.958376630501429e-05, + "loss": 0.0222, + "step": 238000 + }, + { + "epoch": 1.54, + "eval_cer": 0.9198617105411818, + "eval_loss": 0.019788194447755814, + "eval_runtime": 119.9476, + "eval_samples_per_second": 16.674, + "eval_steps_per_second": 4.168, + "step": 238000 + }, + { + "epoch": 1.54, + "learning_rate": 6.957408495065736e-05, + "loss": 0.0316, + "step": 238010 + }, + { + "epoch": 1.54, + "learning_rate": 6.956440359630042e-05, + "loss": 0.0366, + "step": 238020 + }, + { + "epoch": 1.54, + "learning_rate": 6.95547222419435e-05, + "loss": 0.03, + "step": 238030 + }, + { + "epoch": 1.54, + "learning_rate": 6.954504088758656e-05, + "loss": 0.027, + "step": 238040 + }, + { + "epoch": 1.54, + "learning_rate": 6.953535953322962e-05, + "loss": 0.0266, + "step": 238050 + }, + { + "epoch": 1.54, + "learning_rate": 6.95256781788727e-05, + "loss": 0.0316, + "step": 238060 + }, + { + "epoch": 1.54, + "learning_rate": 6.951599682451577e-05, + "loss": 0.0262, + "step": 238070 + }, + { + "epoch": 1.54, + "learning_rate": 6.950631547015883e-05, + "loss": 0.0263, + "step": 238080 + }, + { + "epoch": 1.54, + "learning_rate": 6.94966341158019e-05, + "loss": 0.024, + "step": 238090 + }, + { + "epoch": 1.54, + "learning_rate": 6.948695276144497e-05, + "loss": 0.0264, + "step": 238100 + }, + { + "epoch": 1.54, + "learning_rate": 6.947727140708803e-05, + "loss": 0.0243, + "step": 238110 + }, + { + "epoch": 1.54, + "learning_rate": 6.94675900527311e-05, + "loss": 0.0293, + "step": 238120 + }, + { + "epoch": 1.54, + "learning_rate": 6.945790869837418e-05, + "loss": 0.0283, + "step": 238130 + }, + { + "epoch": 1.54, + "learning_rate": 6.944822734401723e-05, + "loss": 0.0283, + "step": 238140 + }, + { + "epoch": 1.54, + "learning_rate": 6.943854598966031e-05, + "loss": 0.0255, + "step": 238150 + }, + { + "epoch": 1.54, + "learning_rate": 6.942886463530338e-05, + "loss": 0.0241, + "step": 238160 + }, + { + "epoch": 1.54, + "learning_rate": 6.941918328094644e-05, + "loss": 0.0327, + "step": 238170 + }, + { + "epoch": 1.54, + "learning_rate": 6.940950192658951e-05, + "loss": 0.0263, + "step": 238180 + }, + { + "epoch": 1.54, + "learning_rate": 6.939982057223258e-05, + "loss": 0.0242, + "step": 238190 + }, + { + "epoch": 1.54, + "learning_rate": 6.939013921787564e-05, + "loss": 0.0268, + "step": 238200 + }, + { + "epoch": 1.54, + "learning_rate": 6.938045786351871e-05, + "loss": 0.0256, + "step": 238210 + }, + { + "epoch": 1.54, + "learning_rate": 6.937077650916179e-05, + "loss": 0.0255, + "step": 238220 + }, + { + "epoch": 1.54, + "learning_rate": 6.936109515480485e-05, + "loss": 0.0274, + "step": 238230 + }, + { + "epoch": 1.54, + "learning_rate": 6.935141380044792e-05, + "loss": 0.0228, + "step": 238240 + }, + { + "epoch": 1.54, + "learning_rate": 6.934173244609099e-05, + "loss": 0.0229, + "step": 238250 + }, + { + "epoch": 1.54, + "learning_rate": 6.933205109173405e-05, + "loss": 0.0234, + "step": 238260 + }, + { + "epoch": 1.54, + "learning_rate": 6.932236973737712e-05, + "loss": 0.025, + "step": 238270 + }, + { + "epoch": 1.54, + "learning_rate": 6.931268838302019e-05, + "loss": 0.0219, + "step": 238280 + }, + { + "epoch": 1.54, + "learning_rate": 6.930300702866327e-05, + "loss": 0.0251, + "step": 238290 + }, + { + "epoch": 1.54, + "learning_rate": 6.929332567430632e-05, + "loss": 0.0272, + "step": 238300 + }, + { + "epoch": 1.54, + "learning_rate": 6.92836443199494e-05, + "loss": 0.0254, + "step": 238310 + }, + { + "epoch": 1.54, + "learning_rate": 6.927396296559246e-05, + "loss": 0.0272, + "step": 238320 + }, + { + "epoch": 1.54, + "learning_rate": 6.926428161123553e-05, + "loss": 0.0263, + "step": 238330 + }, + { + "epoch": 1.54, + "learning_rate": 6.92546002568786e-05, + "loss": 0.0298, + "step": 238340 + }, + { + "epoch": 1.54, + "learning_rate": 6.924491890252166e-05, + "loss": 0.0269, + "step": 238350 + }, + { + "epoch": 1.54, + "learning_rate": 6.923523754816473e-05, + "loss": 0.0211, + "step": 238360 + }, + { + "epoch": 1.54, + "learning_rate": 6.92255561938078e-05, + "loss": 0.0259, + "step": 238370 + }, + { + "epoch": 1.54, + "learning_rate": 6.921587483945088e-05, + "loss": 0.0329, + "step": 238380 + }, + { + "epoch": 1.54, + "learning_rate": 6.920619348509394e-05, + "loss": 0.0252, + "step": 238390 + }, + { + "epoch": 1.54, + "learning_rate": 6.9196512130737e-05, + "loss": 0.0241, + "step": 238400 + }, + { + "epoch": 1.54, + "learning_rate": 6.918683077638007e-05, + "loss": 0.0268, + "step": 238410 + }, + { + "epoch": 1.54, + "learning_rate": 6.917714942202314e-05, + "loss": 0.0321, + "step": 238420 + }, + { + "epoch": 1.54, + "learning_rate": 6.91674680676662e-05, + "loss": 0.0274, + "step": 238430 + }, + { + "epoch": 1.54, + "learning_rate": 6.915778671330927e-05, + "loss": 0.0241, + "step": 238440 + }, + { + "epoch": 1.54, + "learning_rate": 6.914810535895234e-05, + "loss": 0.027, + "step": 238450 + }, + { + "epoch": 1.54, + "learning_rate": 6.91384240045954e-05, + "loss": 0.0212, + "step": 238460 + }, + { + "epoch": 1.54, + "learning_rate": 6.912874265023847e-05, + "loss": 0.0292, + "step": 238470 + }, + { + "epoch": 1.54, + "learning_rate": 6.911906129588155e-05, + "loss": 0.029, + "step": 238480 + }, + { + "epoch": 1.54, + "learning_rate": 6.910937994152462e-05, + "loss": 0.0268, + "step": 238490 + }, + { + "epoch": 1.54, + "learning_rate": 6.909969858716768e-05, + "loss": 0.0252, + "step": 238500 + }, + { + "epoch": 1.54, + "learning_rate": 6.909001723281075e-05, + "loss": 0.0309, + "step": 238510 + }, + { + "epoch": 1.54, + "learning_rate": 6.908033587845382e-05, + "loss": 0.0229, + "step": 238520 + }, + { + "epoch": 1.54, + "learning_rate": 6.907065452409688e-05, + "loss": 0.0264, + "step": 238530 + }, + { + "epoch": 1.54, + "learning_rate": 6.906097316973995e-05, + "loss": 0.0291, + "step": 238540 + }, + { + "epoch": 1.54, + "learning_rate": 6.905129181538303e-05, + "loss": 0.0274, + "step": 238550 + }, + { + "epoch": 1.54, + "learning_rate": 6.904161046102608e-05, + "loss": 0.0273, + "step": 238560 + }, + { + "epoch": 1.54, + "learning_rate": 6.903192910666916e-05, + "loss": 0.0233, + "step": 238570 + }, + { + "epoch": 1.54, + "learning_rate": 6.902224775231223e-05, + "loss": 0.0274, + "step": 238580 + }, + { + "epoch": 1.54, + "learning_rate": 6.90125663979553e-05, + "loss": 0.0241, + "step": 238590 + }, + { + "epoch": 1.54, + "learning_rate": 6.900288504359836e-05, + "loss": 0.0268, + "step": 238600 + }, + { + "epoch": 1.54, + "learning_rate": 6.899320368924143e-05, + "loss": 0.0301, + "step": 238610 + }, + { + "epoch": 1.54, + "learning_rate": 6.898352233488449e-05, + "loss": 0.0342, + "step": 238620 + }, + { + "epoch": 1.54, + "learning_rate": 6.897384098052756e-05, + "loss": 0.0277, + "step": 238630 + }, + { + "epoch": 1.54, + "learning_rate": 6.896415962617064e-05, + "loss": 0.0246, + "step": 238640 + }, + { + "epoch": 1.54, + "learning_rate": 6.89544782718137e-05, + "loss": 0.0284, + "step": 238650 + }, + { + "epoch": 1.54, + "learning_rate": 6.894479691745676e-05, + "loss": 0.0279, + "step": 238660 + }, + { + "epoch": 1.54, + "learning_rate": 6.893511556309984e-05, + "loss": 0.0266, + "step": 238670 + }, + { + "epoch": 1.54, + "learning_rate": 6.89254342087429e-05, + "loss": 0.0265, + "step": 238680 + }, + { + "epoch": 1.54, + "learning_rate": 6.891575285438597e-05, + "loss": 0.0242, + "step": 238690 + }, + { + "epoch": 1.54, + "learning_rate": 6.890607150002904e-05, + "loss": 0.0256, + "step": 238700 + }, + { + "epoch": 1.54, + "learning_rate": 6.889639014567212e-05, + "loss": 0.0264, + "step": 238710 + }, + { + "epoch": 1.54, + "learning_rate": 6.888670879131517e-05, + "loss": 0.034, + "step": 238720 + }, + { + "epoch": 1.54, + "learning_rate": 6.887702743695823e-05, + "loss": 0.0308, + "step": 238730 + }, + { + "epoch": 1.54, + "learning_rate": 6.886734608260131e-05, + "loss": 0.0241, + "step": 238740 + }, + { + "epoch": 1.54, + "learning_rate": 6.885766472824438e-05, + "loss": 0.0249, + "step": 238750 + }, + { + "epoch": 1.54, + "learning_rate": 6.884798337388745e-05, + "loss": 0.026, + "step": 238760 + }, + { + "epoch": 1.54, + "learning_rate": 6.883830201953051e-05, + "loss": 0.0293, + "step": 238770 + }, + { + "epoch": 1.54, + "learning_rate": 6.882862066517358e-05, + "loss": 0.0233, + "step": 238780 + }, + { + "epoch": 1.54, + "learning_rate": 6.881893931081665e-05, + "loss": 0.0305, + "step": 238790 + }, + { + "epoch": 1.54, + "learning_rate": 6.880925795645971e-05, + "loss": 0.0276, + "step": 238800 + }, + { + "epoch": 1.54, + "learning_rate": 6.879957660210279e-05, + "loss": 0.0278, + "step": 238810 + }, + { + "epoch": 1.54, + "learning_rate": 6.878989524774584e-05, + "loss": 0.0307, + "step": 238820 + }, + { + "epoch": 1.54, + "learning_rate": 6.878021389338892e-05, + "loss": 0.0278, + "step": 238830 + }, + { + "epoch": 1.54, + "learning_rate": 6.877053253903199e-05, + "loss": 0.0227, + "step": 238840 + }, + { + "epoch": 1.54, + "learning_rate": 6.876085118467506e-05, + "loss": 0.0295, + "step": 238850 + }, + { + "epoch": 1.54, + "learning_rate": 6.875116983031812e-05, + "loss": 0.025, + "step": 238860 + }, + { + "epoch": 1.54, + "learning_rate": 6.874148847596119e-05, + "loss": 0.026, + "step": 238870 + }, + { + "epoch": 1.54, + "learning_rate": 6.873180712160426e-05, + "loss": 0.0286, + "step": 238880 + }, + { + "epoch": 1.54, + "learning_rate": 6.872212576724732e-05, + "loss": 0.0244, + "step": 238890 + }, + { + "epoch": 1.54, + "learning_rate": 6.87124444128904e-05, + "loss": 0.0311, + "step": 238900 + }, + { + "epoch": 1.54, + "learning_rate": 6.870276305853347e-05, + "loss": 0.029, + "step": 238910 + }, + { + "epoch": 1.54, + "learning_rate": 6.869308170417653e-05, + "loss": 0.0288, + "step": 238920 + }, + { + "epoch": 1.54, + "learning_rate": 6.86834003498196e-05, + "loss": 0.029, + "step": 238930 + }, + { + "epoch": 1.54, + "learning_rate": 6.867371899546267e-05, + "loss": 0.0269, + "step": 238940 + }, + { + "epoch": 1.54, + "learning_rate": 6.866403764110573e-05, + "loss": 0.0261, + "step": 238950 + }, + { + "epoch": 1.54, + "learning_rate": 6.86543562867488e-05, + "loss": 0.0299, + "step": 238960 + }, + { + "epoch": 1.54, + "learning_rate": 6.864467493239186e-05, + "loss": 0.0264, + "step": 238970 + }, + { + "epoch": 1.54, + "learning_rate": 6.863499357803493e-05, + "loss": 0.0289, + "step": 238980 + }, + { + "epoch": 1.54, + "learning_rate": 6.862531222367801e-05, + "loss": 0.0246, + "step": 238990 + }, + { + "epoch": 1.54, + "learning_rate": 6.861563086932108e-05, + "loss": 0.0259, + "step": 239000 + }, + { + "epoch": 1.54, + "eval_cer": 0.9199050954694384, + "eval_loss": 0.01946895383298397, + "eval_runtime": 120.4017, + "eval_samples_per_second": 16.611, + "eval_steps_per_second": 4.153, + "step": 239000 + }, + { + "epoch": 1.54, + "learning_rate": 6.860594951496414e-05, + "loss": 0.0281, + "step": 239010 + }, + { + "epoch": 1.54, + "learning_rate": 6.859626816060721e-05, + "loss": 0.0324, + "step": 239020 + }, + { + "epoch": 1.54, + "learning_rate": 6.858658680625028e-05, + "loss": 0.0294, + "step": 239030 + }, + { + "epoch": 1.54, + "learning_rate": 6.857690545189334e-05, + "loss": 0.0236, + "step": 239040 + }, + { + "epoch": 1.54, + "learning_rate": 6.856722409753641e-05, + "loss": 0.024, + "step": 239050 + }, + { + "epoch": 1.54, + "learning_rate": 6.855754274317949e-05, + "loss": 0.0266, + "step": 239060 + }, + { + "epoch": 1.54, + "learning_rate": 6.854786138882254e-05, + "loss": 0.0255, + "step": 239070 + }, + { + "epoch": 1.54, + "learning_rate": 6.853818003446561e-05, + "loss": 0.0267, + "step": 239080 + }, + { + "epoch": 1.54, + "learning_rate": 6.852849868010869e-05, + "loss": 0.0257, + "step": 239090 + }, + { + "epoch": 1.54, + "learning_rate": 6.851881732575175e-05, + "loss": 0.0272, + "step": 239100 + }, + { + "epoch": 1.54, + "learning_rate": 6.850913597139482e-05, + "loss": 0.0257, + "step": 239110 + }, + { + "epoch": 1.54, + "learning_rate": 6.849945461703789e-05, + "loss": 0.0258, + "step": 239120 + }, + { + "epoch": 1.54, + "learning_rate": 6.848977326268095e-05, + "loss": 0.0322, + "step": 239130 + }, + { + "epoch": 1.54, + "learning_rate": 6.848009190832402e-05, + "loss": 0.0296, + "step": 239140 + }, + { + "epoch": 1.54, + "learning_rate": 6.847041055396708e-05, + "loss": 0.0258, + "step": 239150 + }, + { + "epoch": 1.54, + "learning_rate": 6.846072919961016e-05, + "loss": 0.0289, + "step": 239160 + }, + { + "epoch": 1.54, + "learning_rate": 6.845104784525322e-05, + "loss": 0.0268, + "step": 239170 + }, + { + "epoch": 1.54, + "learning_rate": 6.84413664908963e-05, + "loss": 0.0251, + "step": 239180 + }, + { + "epoch": 1.54, + "learning_rate": 6.843168513653936e-05, + "loss": 0.0223, + "step": 239190 + }, + { + "epoch": 1.54, + "learning_rate": 6.842200378218243e-05, + "loss": 0.0296, + "step": 239200 + }, + { + "epoch": 1.54, + "learning_rate": 6.84123224278255e-05, + "loss": 0.0242, + "step": 239210 + }, + { + "epoch": 1.54, + "learning_rate": 6.840264107346856e-05, + "loss": 0.024, + "step": 239220 + }, + { + "epoch": 1.54, + "learning_rate": 6.839295971911163e-05, + "loss": 0.0302, + "step": 239230 + }, + { + "epoch": 1.54, + "learning_rate": 6.83832783647547e-05, + "loss": 0.026, + "step": 239240 + }, + { + "epoch": 1.54, + "learning_rate": 6.837359701039777e-05, + "loss": 0.027, + "step": 239250 + }, + { + "epoch": 1.54, + "learning_rate": 6.836391565604084e-05, + "loss": 0.0254, + "step": 239260 + }, + { + "epoch": 1.54, + "learning_rate": 6.83542343016839e-05, + "loss": 0.0294, + "step": 239270 + }, + { + "epoch": 1.54, + "learning_rate": 6.834455294732697e-05, + "loss": 0.0243, + "step": 239280 + }, + { + "epoch": 1.54, + "learning_rate": 6.833487159297004e-05, + "loss": 0.0295, + "step": 239290 + }, + { + "epoch": 1.54, + "learning_rate": 6.83251902386131e-05, + "loss": 0.0286, + "step": 239300 + }, + { + "epoch": 1.54, + "learning_rate": 6.831550888425617e-05, + "loss": 0.0199, + "step": 239310 + }, + { + "epoch": 1.54, + "learning_rate": 6.830582752989925e-05, + "loss": 0.0238, + "step": 239320 + }, + { + "epoch": 1.54, + "learning_rate": 6.82961461755423e-05, + "loss": 0.0231, + "step": 239330 + }, + { + "epoch": 1.54, + "learning_rate": 6.828646482118538e-05, + "loss": 0.0212, + "step": 239340 + }, + { + "epoch": 1.54, + "learning_rate": 6.827678346682845e-05, + "loss": 0.025, + "step": 239350 + }, + { + "epoch": 1.54, + "learning_rate": 6.826710211247152e-05, + "loss": 0.0214, + "step": 239360 + }, + { + "epoch": 1.54, + "learning_rate": 6.825742075811458e-05, + "loss": 0.0248, + "step": 239370 + }, + { + "epoch": 1.55, + "learning_rate": 6.824773940375765e-05, + "loss": 0.029, + "step": 239380 + }, + { + "epoch": 1.55, + "learning_rate": 6.823805804940071e-05, + "loss": 0.0274, + "step": 239390 + }, + { + "epoch": 1.55, + "learning_rate": 6.822837669504378e-05, + "loss": 0.03, + "step": 239400 + }, + { + "epoch": 1.55, + "learning_rate": 6.821869534068686e-05, + "loss": 0.0247, + "step": 239410 + }, + { + "epoch": 1.55, + "learning_rate": 6.820901398632993e-05, + "loss": 0.0254, + "step": 239420 + }, + { + "epoch": 1.55, + "learning_rate": 6.819933263197298e-05, + "loss": 0.0238, + "step": 239430 + }, + { + "epoch": 1.55, + "learning_rate": 6.818965127761606e-05, + "loss": 0.0272, + "step": 239440 + }, + { + "epoch": 1.55, + "learning_rate": 6.817996992325913e-05, + "loss": 0.0262, + "step": 239450 + }, + { + "epoch": 1.55, + "learning_rate": 6.817028856890219e-05, + "loss": 0.0239, + "step": 239460 + }, + { + "epoch": 1.55, + "learning_rate": 6.816060721454526e-05, + "loss": 0.0265, + "step": 239470 + }, + { + "epoch": 1.55, + "learning_rate": 6.815092586018834e-05, + "loss": 0.0303, + "step": 239480 + }, + { + "epoch": 1.55, + "learning_rate": 6.814124450583139e-05, + "loss": 0.027, + "step": 239490 + }, + { + "epoch": 1.55, + "learning_rate": 6.813156315147446e-05, + "loss": 0.0299, + "step": 239500 + }, + { + "epoch": 1.55, + "learning_rate": 6.812188179711754e-05, + "loss": 0.0265, + "step": 239510 + }, + { + "epoch": 1.55, + "learning_rate": 6.81122004427606e-05, + "loss": 0.0287, + "step": 239520 + }, + { + "epoch": 1.55, + "learning_rate": 6.810251908840367e-05, + "loss": 0.0312, + "step": 239530 + }, + { + "epoch": 1.55, + "learning_rate": 6.809283773404674e-05, + "loss": 0.0265, + "step": 239540 + }, + { + "epoch": 1.55, + "learning_rate": 6.80831563796898e-05, + "loss": 0.0223, + "step": 239550 + }, + { + "epoch": 1.55, + "learning_rate": 6.807347502533287e-05, + "loss": 0.025, + "step": 239560 + }, + { + "epoch": 1.55, + "learning_rate": 6.806379367097593e-05, + "loss": 0.0291, + "step": 239570 + }, + { + "epoch": 1.55, + "learning_rate": 6.805411231661901e-05, + "loss": 0.0272, + "step": 239580 + }, + { + "epoch": 1.55, + "learning_rate": 6.804443096226207e-05, + "loss": 0.027, + "step": 239590 + }, + { + "epoch": 1.55, + "learning_rate": 6.803474960790515e-05, + "loss": 0.0283, + "step": 239600 + }, + { + "epoch": 1.55, + "learning_rate": 6.802506825354821e-05, + "loss": 0.0326, + "step": 239610 + }, + { + "epoch": 1.55, + "learning_rate": 6.801538689919128e-05, + "loss": 0.028, + "step": 239620 + }, + { + "epoch": 1.55, + "learning_rate": 6.800570554483435e-05, + "loss": 0.029, + "step": 239630 + }, + { + "epoch": 1.55, + "learning_rate": 6.799602419047741e-05, + "loss": 0.0261, + "step": 239640 + }, + { + "epoch": 1.55, + "learning_rate": 6.798634283612048e-05, + "loss": 0.0259, + "step": 239650 + }, + { + "epoch": 1.55, + "learning_rate": 6.797666148176354e-05, + "loss": 0.025, + "step": 239660 + }, + { + "epoch": 1.55, + "learning_rate": 6.796698012740662e-05, + "loss": 0.0219, + "step": 239670 + }, + { + "epoch": 1.55, + "learning_rate": 6.795729877304969e-05, + "loss": 0.03, + "step": 239680 + }, + { + "epoch": 1.55, + "learning_rate": 6.794761741869276e-05, + "loss": 0.0316, + "step": 239690 + }, + { + "epoch": 1.55, + "learning_rate": 6.793793606433582e-05, + "loss": 0.0281, + "step": 239700 + }, + { + "epoch": 1.55, + "learning_rate": 6.792825470997889e-05, + "loss": 0.03, + "step": 239710 + }, + { + "epoch": 1.55, + "learning_rate": 6.791857335562195e-05, + "loss": 0.0317, + "step": 239720 + }, + { + "epoch": 1.55, + "learning_rate": 6.790889200126502e-05, + "loss": 0.0226, + "step": 239730 + }, + { + "epoch": 1.55, + "learning_rate": 6.78992106469081e-05, + "loss": 0.0252, + "step": 239740 + }, + { + "epoch": 1.55, + "learning_rate": 6.788952929255115e-05, + "loss": 0.0306, + "step": 239750 + }, + { + "epoch": 1.55, + "learning_rate": 6.787984793819423e-05, + "loss": 0.0223, + "step": 239760 + }, + { + "epoch": 1.55, + "learning_rate": 6.78701665838373e-05, + "loss": 0.0374, + "step": 239770 + }, + { + "epoch": 1.55, + "learning_rate": 6.786048522948037e-05, + "loss": 0.0278, + "step": 239780 + }, + { + "epoch": 1.55, + "learning_rate": 6.785080387512343e-05, + "loss": 0.0286, + "step": 239790 + }, + { + "epoch": 1.55, + "learning_rate": 6.78411225207665e-05, + "loss": 0.0277, + "step": 239800 + }, + { + "epoch": 1.55, + "learning_rate": 6.783144116640956e-05, + "loss": 0.0283, + "step": 239810 + }, + { + "epoch": 1.55, + "learning_rate": 6.782175981205263e-05, + "loss": 0.0312, + "step": 239820 + }, + { + "epoch": 1.55, + "learning_rate": 6.781207845769571e-05, + "loss": 0.0268, + "step": 239830 + }, + { + "epoch": 1.55, + "learning_rate": 6.780239710333878e-05, + "loss": 0.0295, + "step": 239840 + }, + { + "epoch": 1.55, + "learning_rate": 6.779271574898183e-05, + "loss": 0.0264, + "step": 239850 + }, + { + "epoch": 1.55, + "learning_rate": 6.778303439462491e-05, + "loss": 0.0325, + "step": 239860 + }, + { + "epoch": 1.55, + "learning_rate": 6.777335304026798e-05, + "loss": 0.0221, + "step": 239870 + }, + { + "epoch": 1.55, + "learning_rate": 6.776367168591104e-05, + "loss": 0.0192, + "step": 239880 + }, + { + "epoch": 1.55, + "learning_rate": 6.775399033155411e-05, + "loss": 0.0299, + "step": 239890 + }, + { + "epoch": 1.55, + "learning_rate": 6.774430897719719e-05, + "loss": 0.0274, + "step": 239900 + }, + { + "epoch": 1.55, + "learning_rate": 6.773462762284024e-05, + "loss": 0.0217, + "step": 239910 + }, + { + "epoch": 1.55, + "learning_rate": 6.77249462684833e-05, + "loss": 0.03, + "step": 239920 + }, + { + "epoch": 1.55, + "learning_rate": 6.771526491412639e-05, + "loss": 0.0288, + "step": 239930 + }, + { + "epoch": 1.55, + "learning_rate": 6.770558355976945e-05, + "loss": 0.0378, + "step": 239940 + }, + { + "epoch": 1.55, + "learning_rate": 6.769590220541252e-05, + "loss": 0.0326, + "step": 239950 + }, + { + "epoch": 1.55, + "learning_rate": 6.768622085105559e-05, + "loss": 0.0275, + "step": 239960 + }, + { + "epoch": 1.55, + "learning_rate": 6.767653949669865e-05, + "loss": 0.0236, + "step": 239970 + }, + { + "epoch": 1.55, + "learning_rate": 6.766685814234172e-05, + "loss": 0.0212, + "step": 239980 + }, + { + "epoch": 1.55, + "learning_rate": 6.765717678798478e-05, + "loss": 0.0237, + "step": 239990 + }, + { + "epoch": 1.55, + "learning_rate": 6.764749543362786e-05, + "loss": 0.0317, + "step": 240000 + }, + { + "epoch": 1.55, + "eval_cer": 0.9198644220991978, + "eval_loss": 0.019400835037231445, + "eval_runtime": 119.9567, + "eval_samples_per_second": 16.673, + "eval_steps_per_second": 4.168, + "step": 240000 + }, + { + "epoch": 1.55, + "learning_rate": 6.763781407927092e-05, + "loss": 0.0272, + "step": 240010 + }, + { + "epoch": 1.55, + "learning_rate": 6.7628132724914e-05, + "loss": 0.0224, + "step": 240020 + }, + { + "epoch": 1.55, + "learning_rate": 6.761845137055706e-05, + "loss": 0.0265, + "step": 240030 + }, + { + "epoch": 1.55, + "learning_rate": 6.760877001620013e-05, + "loss": 0.0284, + "step": 240040 + }, + { + "epoch": 1.55, + "learning_rate": 6.75990886618432e-05, + "loss": 0.0278, + "step": 240050 + }, + { + "epoch": 1.55, + "learning_rate": 6.758940730748626e-05, + "loss": 0.0267, + "step": 240060 + }, + { + "epoch": 1.55, + "learning_rate": 6.757972595312933e-05, + "loss": 0.025, + "step": 240070 + }, + { + "epoch": 1.55, + "learning_rate": 6.75700445987724e-05, + "loss": 0.0245, + "step": 240080 + }, + { + "epoch": 1.55, + "learning_rate": 6.756036324441547e-05, + "loss": 0.0335, + "step": 240090 + }, + { + "epoch": 1.55, + "learning_rate": 6.755068189005854e-05, + "loss": 0.0251, + "step": 240100 + }, + { + "epoch": 1.55, + "learning_rate": 6.75410005357016e-05, + "loss": 0.0252, + "step": 240110 + }, + { + "epoch": 1.55, + "learning_rate": 6.753131918134467e-05, + "loss": 0.0224, + "step": 240120 + }, + { + "epoch": 1.55, + "learning_rate": 6.752163782698774e-05, + "loss": 0.0321, + "step": 240130 + }, + { + "epoch": 1.55, + "learning_rate": 6.75119564726308e-05, + "loss": 0.0261, + "step": 240140 + }, + { + "epoch": 1.55, + "learning_rate": 6.750227511827387e-05, + "loss": 0.0305, + "step": 240150 + }, + { + "epoch": 1.55, + "learning_rate": 6.749259376391695e-05, + "loss": 0.0251, + "step": 240160 + }, + { + "epoch": 1.55, + "learning_rate": 6.748291240956e-05, + "loss": 0.0275, + "step": 240170 + }, + { + "epoch": 1.55, + "learning_rate": 6.747323105520307e-05, + "loss": 0.0246, + "step": 240180 + }, + { + "epoch": 1.55, + "learning_rate": 6.746354970084615e-05, + "loss": 0.0233, + "step": 240190 + }, + { + "epoch": 1.55, + "learning_rate": 6.745386834648922e-05, + "loss": 0.0296, + "step": 240200 + }, + { + "epoch": 1.55, + "learning_rate": 6.744418699213228e-05, + "loss": 0.0255, + "step": 240210 + }, + { + "epoch": 1.55, + "learning_rate": 6.743450563777535e-05, + "loss": 0.0295, + "step": 240220 + }, + { + "epoch": 1.55, + "learning_rate": 6.742482428341841e-05, + "loss": 0.0232, + "step": 240230 + }, + { + "epoch": 1.55, + "learning_rate": 6.741514292906148e-05, + "loss": 0.0234, + "step": 240240 + }, + { + "epoch": 1.55, + "learning_rate": 6.740546157470455e-05, + "loss": 0.0247, + "step": 240250 + }, + { + "epoch": 1.55, + "learning_rate": 6.739578022034763e-05, + "loss": 0.0245, + "step": 240260 + }, + { + "epoch": 1.55, + "learning_rate": 6.738609886599068e-05, + "loss": 0.0372, + "step": 240270 + }, + { + "epoch": 1.55, + "learning_rate": 6.737641751163376e-05, + "loss": 0.0258, + "step": 240280 + }, + { + "epoch": 1.55, + "learning_rate": 6.736673615727683e-05, + "loss": 0.0293, + "step": 240290 + }, + { + "epoch": 1.55, + "learning_rate": 6.735705480291989e-05, + "loss": 0.0224, + "step": 240300 + }, + { + "epoch": 1.55, + "learning_rate": 6.734737344856296e-05, + "loss": 0.0274, + "step": 240310 + }, + { + "epoch": 1.55, + "learning_rate": 6.733769209420602e-05, + "loss": 0.0275, + "step": 240320 + }, + { + "epoch": 1.55, + "learning_rate": 6.732801073984909e-05, + "loss": 0.0292, + "step": 240330 + }, + { + "epoch": 1.55, + "learning_rate": 6.731832938549216e-05, + "loss": 0.0231, + "step": 240340 + }, + { + "epoch": 1.55, + "learning_rate": 6.730864803113524e-05, + "loss": 0.0287, + "step": 240350 + }, + { + "epoch": 1.55, + "learning_rate": 6.72989666767783e-05, + "loss": 0.0289, + "step": 240360 + }, + { + "epoch": 1.55, + "learning_rate": 6.728928532242137e-05, + "loss": 0.0278, + "step": 240370 + }, + { + "epoch": 1.55, + "learning_rate": 6.727960396806444e-05, + "loss": 0.0237, + "step": 240380 + }, + { + "epoch": 1.55, + "learning_rate": 6.72699226137075e-05, + "loss": 0.0288, + "step": 240390 + }, + { + "epoch": 1.55, + "learning_rate": 6.726024125935057e-05, + "loss": 0.0232, + "step": 240400 + }, + { + "epoch": 1.55, + "learning_rate": 6.725055990499363e-05, + "loss": 0.026, + "step": 240410 + }, + { + "epoch": 1.55, + "learning_rate": 6.72408785506367e-05, + "loss": 0.0271, + "step": 240420 + }, + { + "epoch": 1.55, + "learning_rate": 6.723119719627977e-05, + "loss": 0.0276, + "step": 240430 + }, + { + "epoch": 1.55, + "learning_rate": 6.722151584192285e-05, + "loss": 0.026, + "step": 240440 + }, + { + "epoch": 1.55, + "learning_rate": 6.721183448756591e-05, + "loss": 0.0264, + "step": 240450 + }, + { + "epoch": 1.55, + "learning_rate": 6.720215313320898e-05, + "loss": 0.0235, + "step": 240460 + }, + { + "epoch": 1.55, + "learning_rate": 6.719247177885204e-05, + "loss": 0.0252, + "step": 240470 + }, + { + "epoch": 1.55, + "learning_rate": 6.718279042449511e-05, + "loss": 0.0264, + "step": 240480 + }, + { + "epoch": 1.55, + "learning_rate": 6.717310907013818e-05, + "loss": 0.0256, + "step": 240490 + }, + { + "epoch": 1.55, + "learning_rate": 6.716342771578124e-05, + "loss": 0.0278, + "step": 240500 + }, + { + "epoch": 1.55, + "learning_rate": 6.715374636142432e-05, + "loss": 0.026, + "step": 240510 + }, + { + "epoch": 1.55, + "learning_rate": 6.714406500706738e-05, + "loss": 0.0243, + "step": 240520 + }, + { + "epoch": 1.55, + "learning_rate": 6.713438365271044e-05, + "loss": 0.0289, + "step": 240530 + }, + { + "epoch": 1.55, + "learning_rate": 6.712470229835352e-05, + "loss": 0.0239, + "step": 240540 + }, + { + "epoch": 1.55, + "learning_rate": 6.711502094399659e-05, + "loss": 0.0212, + "step": 240550 + }, + { + "epoch": 1.55, + "learning_rate": 6.710533958963965e-05, + "loss": 0.0237, + "step": 240560 + }, + { + "epoch": 1.55, + "learning_rate": 6.709565823528272e-05, + "loss": 0.0235, + "step": 240570 + }, + { + "epoch": 1.55, + "learning_rate": 6.708597688092579e-05, + "loss": 0.0287, + "step": 240580 + }, + { + "epoch": 1.55, + "learning_rate": 6.707629552656885e-05, + "loss": 0.0319, + "step": 240590 + }, + { + "epoch": 1.55, + "learning_rate": 6.706661417221192e-05, + "loss": 0.0251, + "step": 240600 + }, + { + "epoch": 1.55, + "learning_rate": 6.7056932817855e-05, + "loss": 0.0211, + "step": 240610 + }, + { + "epoch": 1.55, + "learning_rate": 6.704725146349805e-05, + "loss": 0.0233, + "step": 240620 + }, + { + "epoch": 1.55, + "learning_rate": 6.703757010914113e-05, + "loss": 0.0247, + "step": 240630 + }, + { + "epoch": 1.55, + "learning_rate": 6.70278887547842e-05, + "loss": 0.0283, + "step": 240640 + }, + { + "epoch": 1.55, + "learning_rate": 6.701820740042726e-05, + "loss": 0.0253, + "step": 240650 + }, + { + "epoch": 1.55, + "learning_rate": 6.700852604607033e-05, + "loss": 0.0293, + "step": 240660 + }, + { + "epoch": 1.55, + "learning_rate": 6.69988446917134e-05, + "loss": 0.0266, + "step": 240670 + }, + { + "epoch": 1.55, + "learning_rate": 6.698916333735646e-05, + "loss": 0.025, + "step": 240680 + }, + { + "epoch": 1.55, + "learning_rate": 6.697948198299953e-05, + "loss": 0.0231, + "step": 240690 + }, + { + "epoch": 1.55, + "learning_rate": 6.696980062864261e-05, + "loss": 0.0259, + "step": 240700 + }, + { + "epoch": 1.55, + "learning_rate": 6.696011927428568e-05, + "loss": 0.0275, + "step": 240710 + }, + { + "epoch": 1.55, + "learning_rate": 6.695043791992874e-05, + "loss": 0.0251, + "step": 240720 + }, + { + "epoch": 1.55, + "learning_rate": 6.694075656557181e-05, + "loss": 0.0256, + "step": 240730 + }, + { + "epoch": 1.55, + "learning_rate": 6.693107521121487e-05, + "loss": 0.0255, + "step": 240740 + }, + { + "epoch": 1.55, + "learning_rate": 6.692139385685794e-05, + "loss": 0.0203, + "step": 240750 + }, + { + "epoch": 1.55, + "learning_rate": 6.6911712502501e-05, + "loss": 0.0251, + "step": 240760 + }, + { + "epoch": 1.55, + "learning_rate": 6.690203114814409e-05, + "loss": 0.0225, + "step": 240770 + }, + { + "epoch": 1.55, + "learning_rate": 6.689234979378714e-05, + "loss": 0.0271, + "step": 240780 + }, + { + "epoch": 1.55, + "learning_rate": 6.688266843943022e-05, + "loss": 0.0268, + "step": 240790 + }, + { + "epoch": 1.55, + "learning_rate": 6.687298708507328e-05, + "loss": 0.023, + "step": 240800 + }, + { + "epoch": 1.55, + "learning_rate": 6.686330573071635e-05, + "loss": 0.0233, + "step": 240810 + }, + { + "epoch": 1.55, + "learning_rate": 6.685362437635942e-05, + "loss": 0.0258, + "step": 240820 + }, + { + "epoch": 1.55, + "learning_rate": 6.684394302200248e-05, + "loss": 0.0276, + "step": 240830 + }, + { + "epoch": 1.55, + "learning_rate": 6.683426166764555e-05, + "loss": 0.0215, + "step": 240840 + }, + { + "epoch": 1.55, + "learning_rate": 6.682458031328862e-05, + "loss": 0.0225, + "step": 240850 + }, + { + "epoch": 1.55, + "learning_rate": 6.68148989589317e-05, + "loss": 0.0265, + "step": 240860 + }, + { + "epoch": 1.55, + "learning_rate": 6.680521760457476e-05, + "loss": 0.0247, + "step": 240870 + }, + { + "epoch": 1.55, + "learning_rate": 6.679553625021781e-05, + "loss": 0.0268, + "step": 240880 + }, + { + "epoch": 1.55, + "learning_rate": 6.67858548958609e-05, + "loss": 0.0299, + "step": 240890 + }, + { + "epoch": 1.55, + "learning_rate": 6.677617354150396e-05, + "loss": 0.0254, + "step": 240900 + }, + { + "epoch": 1.55, + "learning_rate": 6.676649218714703e-05, + "loss": 0.0252, + "step": 240910 + }, + { + "epoch": 1.55, + "learning_rate": 6.67568108327901e-05, + "loss": 0.0302, + "step": 240920 + }, + { + "epoch": 1.56, + "learning_rate": 6.674712947843317e-05, + "loss": 0.0227, + "step": 240930 + }, + { + "epoch": 1.56, + "learning_rate": 6.673744812407623e-05, + "loss": 0.0259, + "step": 240940 + }, + { + "epoch": 1.56, + "learning_rate": 6.672776676971929e-05, + "loss": 0.023, + "step": 240950 + }, + { + "epoch": 1.56, + "learning_rate": 6.671808541536237e-05, + "loss": 0.0256, + "step": 240960 + }, + { + "epoch": 1.56, + "learning_rate": 6.670840406100544e-05, + "loss": 0.0271, + "step": 240970 + }, + { + "epoch": 1.56, + "learning_rate": 6.66987227066485e-05, + "loss": 0.0295, + "step": 240980 + }, + { + "epoch": 1.56, + "learning_rate": 6.668904135229157e-05, + "loss": 0.0253, + "step": 240990 + }, + { + "epoch": 1.56, + "learning_rate": 6.667935999793464e-05, + "loss": 0.0266, + "step": 241000 + }, + { + "epoch": 1.56, + "eval_cer": 0.9198906338266862, + "eval_loss": 0.019124064594507217, + "eval_runtime": 120.0034, + "eval_samples_per_second": 16.666, + "eval_steps_per_second": 4.167, + "step": 241000 + }, + { + "epoch": 1.56, + "learning_rate": 6.66696786435777e-05, + "loss": 0.0262, + "step": 241010 + }, + { + "epoch": 1.56, + "learning_rate": 6.665999728922077e-05, + "loss": 0.025, + "step": 241020 + }, + { + "epoch": 1.56, + "learning_rate": 6.665031593486385e-05, + "loss": 0.0251, + "step": 241030 + }, + { + "epoch": 1.56, + "learning_rate": 6.66406345805069e-05, + "loss": 0.0287, + "step": 241040 + }, + { + "epoch": 1.56, + "learning_rate": 6.663095322614998e-05, + "loss": 0.0262, + "step": 241050 + }, + { + "epoch": 1.56, + "learning_rate": 6.662127187179305e-05, + "loss": 0.0244, + "step": 241060 + }, + { + "epoch": 1.56, + "learning_rate": 6.661159051743611e-05, + "loss": 0.0248, + "step": 241070 + }, + { + "epoch": 1.56, + "learning_rate": 6.660190916307918e-05, + "loss": 0.0241, + "step": 241080 + }, + { + "epoch": 1.56, + "learning_rate": 6.659222780872225e-05, + "loss": 0.0257, + "step": 241090 + }, + { + "epoch": 1.56, + "learning_rate": 6.658254645436531e-05, + "loss": 0.0322, + "step": 241100 + }, + { + "epoch": 1.56, + "learning_rate": 6.657286510000838e-05, + "loss": 0.0252, + "step": 241110 + }, + { + "epoch": 1.56, + "learning_rate": 6.656318374565146e-05, + "loss": 0.0274, + "step": 241120 + }, + { + "epoch": 1.56, + "learning_rate": 6.655350239129452e-05, + "loss": 0.0268, + "step": 241130 + }, + { + "epoch": 1.56, + "learning_rate": 6.654382103693759e-05, + "loss": 0.0257, + "step": 241140 + }, + { + "epoch": 1.56, + "learning_rate": 6.653413968258066e-05, + "loss": 0.034, + "step": 241150 + }, + { + "epoch": 1.56, + "learning_rate": 6.652445832822372e-05, + "loss": 0.0275, + "step": 241160 + }, + { + "epoch": 1.56, + "learning_rate": 6.651477697386679e-05, + "loss": 0.0226, + "step": 241170 + }, + { + "epoch": 1.56, + "learning_rate": 6.650509561950986e-05, + "loss": 0.0254, + "step": 241180 + }, + { + "epoch": 1.56, + "learning_rate": 6.649541426515294e-05, + "loss": 0.022, + "step": 241190 + }, + { + "epoch": 1.56, + "learning_rate": 6.648573291079599e-05, + "loss": 0.0255, + "step": 241200 + }, + { + "epoch": 1.56, + "learning_rate": 6.647605155643907e-05, + "loss": 0.029, + "step": 241210 + }, + { + "epoch": 1.56, + "learning_rate": 6.646637020208213e-05, + "loss": 0.0261, + "step": 241220 + }, + { + "epoch": 1.56, + "learning_rate": 6.64566888477252e-05, + "loss": 0.0249, + "step": 241230 + }, + { + "epoch": 1.56, + "learning_rate": 6.644700749336827e-05, + "loss": 0.0261, + "step": 241240 + }, + { + "epoch": 1.56, + "learning_rate": 6.643732613901133e-05, + "loss": 0.0258, + "step": 241250 + }, + { + "epoch": 1.56, + "learning_rate": 6.64276447846544e-05, + "loss": 0.0266, + "step": 241260 + }, + { + "epoch": 1.56, + "learning_rate": 6.641796343029747e-05, + "loss": 0.035, + "step": 241270 + }, + { + "epoch": 1.56, + "learning_rate": 6.640828207594055e-05, + "loss": 0.0283, + "step": 241280 + }, + { + "epoch": 1.56, + "learning_rate": 6.639860072158361e-05, + "loss": 0.0234, + "step": 241290 + }, + { + "epoch": 1.56, + "learning_rate": 6.638891936722666e-05, + "loss": 0.0254, + "step": 241300 + }, + { + "epoch": 1.56, + "learning_rate": 6.637923801286974e-05, + "loss": 0.0296, + "step": 241310 + }, + { + "epoch": 1.56, + "learning_rate": 6.636955665851281e-05, + "loss": 0.027, + "step": 241320 + }, + { + "epoch": 1.56, + "learning_rate": 6.635987530415588e-05, + "loss": 0.029, + "step": 241330 + }, + { + "epoch": 1.56, + "learning_rate": 6.635019394979894e-05, + "loss": 0.0282, + "step": 241340 + }, + { + "epoch": 1.56, + "learning_rate": 6.634051259544202e-05, + "loss": 0.0281, + "step": 241350 + }, + { + "epoch": 1.56, + "learning_rate": 6.633083124108508e-05, + "loss": 0.0261, + "step": 241360 + }, + { + "epoch": 1.56, + "learning_rate": 6.632114988672814e-05, + "loss": 0.0317, + "step": 241370 + }, + { + "epoch": 1.56, + "learning_rate": 6.631146853237122e-05, + "loss": 0.0203, + "step": 241380 + }, + { + "epoch": 1.56, + "learning_rate": 6.630178717801429e-05, + "loss": 0.0291, + "step": 241390 + }, + { + "epoch": 1.56, + "learning_rate": 6.629210582365735e-05, + "loss": 0.0252, + "step": 241400 + }, + { + "epoch": 1.56, + "learning_rate": 6.628242446930042e-05, + "loss": 0.0245, + "step": 241410 + }, + { + "epoch": 1.56, + "learning_rate": 6.627274311494349e-05, + "loss": 0.0221, + "step": 241420 + }, + { + "epoch": 1.56, + "learning_rate": 6.626306176058655e-05, + "loss": 0.0273, + "step": 241430 + }, + { + "epoch": 1.56, + "learning_rate": 6.625338040622962e-05, + "loss": 0.0325, + "step": 241440 + }, + { + "epoch": 1.56, + "learning_rate": 6.62436990518727e-05, + "loss": 0.024, + "step": 241450 + }, + { + "epoch": 1.56, + "learning_rate": 6.623401769751575e-05, + "loss": 0.0215, + "step": 241460 + }, + { + "epoch": 1.56, + "learning_rate": 6.622433634315883e-05, + "loss": 0.0244, + "step": 241470 + }, + { + "epoch": 1.56, + "learning_rate": 6.62146549888019e-05, + "loss": 0.0291, + "step": 241480 + }, + { + "epoch": 1.56, + "learning_rate": 6.620497363444496e-05, + "loss": 0.0261, + "step": 241490 + }, + { + "epoch": 1.56, + "learning_rate": 6.619529228008803e-05, + "loss": 0.026, + "step": 241500 + }, + { + "epoch": 1.56, + "learning_rate": 6.61856109257311e-05, + "loss": 0.0307, + "step": 241510 + }, + { + "epoch": 1.56, + "learning_rate": 6.617592957137416e-05, + "loss": 0.0251, + "step": 241520 + }, + { + "epoch": 1.56, + "learning_rate": 6.616624821701723e-05, + "loss": 0.0254, + "step": 241530 + }, + { + "epoch": 1.56, + "learning_rate": 6.615656686266031e-05, + "loss": 0.0247, + "step": 241540 + }, + { + "epoch": 1.56, + "learning_rate": 6.614688550830337e-05, + "loss": 0.0313, + "step": 241550 + }, + { + "epoch": 1.56, + "learning_rate": 6.613720415394644e-05, + "loss": 0.0287, + "step": 241560 + }, + { + "epoch": 1.56, + "learning_rate": 6.612752279958951e-05, + "loss": 0.0305, + "step": 241570 + }, + { + "epoch": 1.56, + "learning_rate": 6.611784144523257e-05, + "loss": 0.0292, + "step": 241580 + }, + { + "epoch": 1.56, + "learning_rate": 6.610816009087564e-05, + "loss": 0.0256, + "step": 241590 + }, + { + "epoch": 1.56, + "learning_rate": 6.60984787365187e-05, + "loss": 0.024, + "step": 241600 + }, + { + "epoch": 1.56, + "learning_rate": 6.608879738216177e-05, + "loss": 0.0245, + "step": 241610 + }, + { + "epoch": 1.56, + "learning_rate": 6.607911602780484e-05, + "loss": 0.0253, + "step": 241620 + }, + { + "epoch": 1.56, + "learning_rate": 6.606943467344792e-05, + "loss": 0.0272, + "step": 241630 + }, + { + "epoch": 1.56, + "learning_rate": 6.605975331909098e-05, + "loss": 0.0239, + "step": 241640 + }, + { + "epoch": 1.56, + "learning_rate": 6.605007196473405e-05, + "loss": 0.0275, + "step": 241650 + }, + { + "epoch": 1.56, + "learning_rate": 6.604039061037712e-05, + "loss": 0.0318, + "step": 241660 + }, + { + "epoch": 1.56, + "learning_rate": 6.603070925602018e-05, + "loss": 0.0317, + "step": 241670 + }, + { + "epoch": 1.56, + "learning_rate": 6.602102790166325e-05, + "loss": 0.0278, + "step": 241680 + }, + { + "epoch": 1.56, + "learning_rate": 6.601134654730632e-05, + "loss": 0.0251, + "step": 241690 + }, + { + "epoch": 1.56, + "learning_rate": 6.60016651929494e-05, + "loss": 0.0247, + "step": 241700 + }, + { + "epoch": 1.56, + "learning_rate": 6.599198383859245e-05, + "loss": 0.0278, + "step": 241710 + }, + { + "epoch": 1.56, + "learning_rate": 6.598230248423551e-05, + "loss": 0.0265, + "step": 241720 + }, + { + "epoch": 1.56, + "learning_rate": 6.59726211298786e-05, + "loss": 0.026, + "step": 241730 + }, + { + "epoch": 1.56, + "learning_rate": 6.596293977552166e-05, + "loss": 0.0256, + "step": 241740 + }, + { + "epoch": 1.56, + "learning_rate": 6.595325842116473e-05, + "loss": 0.0298, + "step": 241750 + }, + { + "epoch": 1.56, + "learning_rate": 6.594357706680779e-05, + "loss": 0.0293, + "step": 241760 + }, + { + "epoch": 1.56, + "learning_rate": 6.593389571245086e-05, + "loss": 0.026, + "step": 241770 + }, + { + "epoch": 1.56, + "learning_rate": 6.592421435809393e-05, + "loss": 0.0241, + "step": 241780 + }, + { + "epoch": 1.56, + "learning_rate": 6.591453300373699e-05, + "loss": 0.0281, + "step": 241790 + }, + { + "epoch": 1.56, + "learning_rate": 6.590485164938007e-05, + "loss": 0.0221, + "step": 241800 + }, + { + "epoch": 1.56, + "learning_rate": 6.589517029502312e-05, + "loss": 0.0288, + "step": 241810 + }, + { + "epoch": 1.56, + "learning_rate": 6.58854889406662e-05, + "loss": 0.0316, + "step": 241820 + }, + { + "epoch": 1.56, + "learning_rate": 6.587580758630927e-05, + "loss": 0.0322, + "step": 241830 + }, + { + "epoch": 1.56, + "learning_rate": 6.586612623195234e-05, + "loss": 0.0256, + "step": 241840 + }, + { + "epoch": 1.56, + "learning_rate": 6.58564448775954e-05, + "loss": 0.0237, + "step": 241850 + }, + { + "epoch": 1.56, + "learning_rate": 6.584676352323847e-05, + "loss": 0.0236, + "step": 241860 + }, + { + "epoch": 1.56, + "learning_rate": 6.583708216888154e-05, + "loss": 0.0247, + "step": 241870 + }, + { + "epoch": 1.56, + "learning_rate": 6.58274008145246e-05, + "loss": 0.0235, + "step": 241880 + }, + { + "epoch": 1.56, + "learning_rate": 6.581771946016768e-05, + "loss": 0.0248, + "step": 241890 + }, + { + "epoch": 1.56, + "learning_rate": 6.580803810581075e-05, + "loss": 0.0278, + "step": 241900 + }, + { + "epoch": 1.56, + "learning_rate": 6.579835675145381e-05, + "loss": 0.0271, + "step": 241910 + }, + { + "epoch": 1.56, + "learning_rate": 6.578867539709688e-05, + "loss": 0.0288, + "step": 241920 + }, + { + "epoch": 1.56, + "learning_rate": 6.577899404273995e-05, + "loss": 0.0286, + "step": 241930 + }, + { + "epoch": 1.56, + "learning_rate": 6.576931268838301e-05, + "loss": 0.0279, + "step": 241940 + }, + { + "epoch": 1.56, + "learning_rate": 6.575963133402608e-05, + "loss": 0.0279, + "step": 241950 + }, + { + "epoch": 1.56, + "learning_rate": 6.574994997966916e-05, + "loss": 0.0262, + "step": 241960 + }, + { + "epoch": 1.56, + "learning_rate": 6.574026862531221e-05, + "loss": 0.0244, + "step": 241970 + }, + { + "epoch": 1.56, + "learning_rate": 6.573058727095528e-05, + "loss": 0.0287, + "step": 241980 + }, + { + "epoch": 1.56, + "learning_rate": 6.572090591659836e-05, + "loss": 0.0228, + "step": 241990 + }, + { + "epoch": 1.56, + "learning_rate": 6.571122456224142e-05, + "loss": 0.0272, + "step": 242000 + }, + { + "epoch": 1.56, + "eval_cer": 0.9198599028358377, + "eval_loss": 0.019341401755809784, + "eval_runtime": 120.0186, + "eval_samples_per_second": 16.664, + "eval_steps_per_second": 4.166, + "step": 242000 + }, + { + "epoch": 1.56, + "learning_rate": 6.570154320788449e-05, + "loss": 0.0295, + "step": 242010 + }, + { + "epoch": 1.56, + "learning_rate": 6.569186185352756e-05, + "loss": 0.0279, + "step": 242020 + }, + { + "epoch": 1.56, + "learning_rate": 6.568218049917062e-05, + "loss": 0.0264, + "step": 242030 + }, + { + "epoch": 1.56, + "learning_rate": 6.567249914481369e-05, + "loss": 0.0254, + "step": 242040 + }, + { + "epoch": 1.56, + "learning_rate": 6.566281779045675e-05, + "loss": 0.0301, + "step": 242050 + }, + { + "epoch": 1.56, + "learning_rate": 6.565313643609983e-05, + "loss": 0.0256, + "step": 242060 + }, + { + "epoch": 1.56, + "learning_rate": 6.564345508174289e-05, + "loss": 0.0276, + "step": 242070 + }, + { + "epoch": 1.56, + "learning_rate": 6.563377372738597e-05, + "loss": 0.0284, + "step": 242080 + }, + { + "epoch": 1.56, + "learning_rate": 6.562409237302903e-05, + "loss": 0.0275, + "step": 242090 + }, + { + "epoch": 1.56, + "learning_rate": 6.56144110186721e-05, + "loss": 0.0287, + "step": 242100 + }, + { + "epoch": 1.56, + "learning_rate": 6.560472966431517e-05, + "loss": 0.0259, + "step": 242110 + }, + { + "epoch": 1.56, + "learning_rate": 6.559504830995823e-05, + "loss": 0.0223, + "step": 242120 + }, + { + "epoch": 1.56, + "learning_rate": 6.55853669556013e-05, + "loss": 0.0262, + "step": 242130 + }, + { + "epoch": 1.56, + "learning_rate": 6.557568560124436e-05, + "loss": 0.0265, + "step": 242140 + }, + { + "epoch": 1.56, + "learning_rate": 6.556600424688744e-05, + "loss": 0.0251, + "step": 242150 + }, + { + "epoch": 1.56, + "learning_rate": 6.555632289253051e-05, + "loss": 0.0257, + "step": 242160 + }, + { + "epoch": 1.56, + "learning_rate": 6.554664153817358e-05, + "loss": 0.0243, + "step": 242170 + }, + { + "epoch": 1.56, + "learning_rate": 6.553696018381664e-05, + "loss": 0.0242, + "step": 242180 + }, + { + "epoch": 1.56, + "learning_rate": 6.552727882945971e-05, + "loss": 0.0243, + "step": 242190 + }, + { + "epoch": 1.56, + "learning_rate": 6.551759747510278e-05, + "loss": 0.0227, + "step": 242200 + }, + { + "epoch": 1.56, + "learning_rate": 6.550791612074584e-05, + "loss": 0.0239, + "step": 242210 + }, + { + "epoch": 1.56, + "learning_rate": 6.549823476638892e-05, + "loss": 0.0246, + "step": 242220 + }, + { + "epoch": 1.56, + "learning_rate": 6.548855341203197e-05, + "loss": 0.0286, + "step": 242230 + }, + { + "epoch": 1.56, + "learning_rate": 6.547887205767505e-05, + "loss": 0.0305, + "step": 242240 + }, + { + "epoch": 1.56, + "learning_rate": 6.546919070331812e-05, + "loss": 0.0253, + "step": 242250 + }, + { + "epoch": 1.56, + "learning_rate": 6.545950934896119e-05, + "loss": 0.0286, + "step": 242260 + }, + { + "epoch": 1.56, + "learning_rate": 6.544982799460425e-05, + "loss": 0.0257, + "step": 242270 + }, + { + "epoch": 1.56, + "learning_rate": 6.544014664024732e-05, + "loss": 0.0255, + "step": 242280 + }, + { + "epoch": 1.56, + "learning_rate": 6.543046528589038e-05, + "loss": 0.0253, + "step": 242290 + }, + { + "epoch": 1.56, + "learning_rate": 6.542078393153345e-05, + "loss": 0.0254, + "step": 242300 + }, + { + "epoch": 1.56, + "learning_rate": 6.541110257717653e-05, + "loss": 0.026, + "step": 242310 + }, + { + "epoch": 1.56, + "learning_rate": 6.54014212228196e-05, + "loss": 0.0243, + "step": 242320 + }, + { + "epoch": 1.56, + "learning_rate": 6.539173986846265e-05, + "loss": 0.0233, + "step": 242330 + }, + { + "epoch": 1.56, + "learning_rate": 6.538205851410573e-05, + "loss": 0.0259, + "step": 242340 + }, + { + "epoch": 1.56, + "learning_rate": 6.53723771597488e-05, + "loss": 0.0253, + "step": 242350 + }, + { + "epoch": 1.56, + "learning_rate": 6.536269580539186e-05, + "loss": 0.0253, + "step": 242360 + }, + { + "epoch": 1.56, + "learning_rate": 6.535301445103493e-05, + "loss": 0.0282, + "step": 242370 + }, + { + "epoch": 1.56, + "learning_rate": 6.534333309667801e-05, + "loss": 0.0236, + "step": 242380 + }, + { + "epoch": 1.56, + "learning_rate": 6.533365174232106e-05, + "loss": 0.0241, + "step": 242390 + }, + { + "epoch": 1.56, + "learning_rate": 6.532397038796413e-05, + "loss": 0.0274, + "step": 242400 + }, + { + "epoch": 1.56, + "learning_rate": 6.531428903360721e-05, + "loss": 0.0231, + "step": 242410 + }, + { + "epoch": 1.56, + "learning_rate": 6.530460767925027e-05, + "loss": 0.0295, + "step": 242420 + }, + { + "epoch": 1.56, + "learning_rate": 6.529492632489334e-05, + "loss": 0.0267, + "step": 242430 + }, + { + "epoch": 1.56, + "learning_rate": 6.52852449705364e-05, + "loss": 0.0269, + "step": 242440 + }, + { + "epoch": 1.56, + "learning_rate": 6.527556361617947e-05, + "loss": 0.0259, + "step": 242450 + }, + { + "epoch": 1.56, + "learning_rate": 6.526588226182254e-05, + "loss": 0.0313, + "step": 242460 + }, + { + "epoch": 1.56, + "learning_rate": 6.52562009074656e-05, + "loss": 0.0229, + "step": 242470 + }, + { + "epoch": 1.57, + "learning_rate": 6.524651955310868e-05, + "loss": 0.0303, + "step": 242480 + }, + { + "epoch": 1.57, + "learning_rate": 6.523683819875174e-05, + "loss": 0.0268, + "step": 242490 + }, + { + "epoch": 1.57, + "learning_rate": 6.522715684439482e-05, + "loss": 0.0307, + "step": 242500 + }, + { + "epoch": 1.57, + "learning_rate": 6.521747549003788e-05, + "loss": 0.0301, + "step": 242510 + }, + { + "epoch": 1.57, + "learning_rate": 6.520779413568095e-05, + "loss": 0.0324, + "step": 242520 + }, + { + "epoch": 1.57, + "learning_rate": 6.519811278132402e-05, + "loss": 0.0251, + "step": 242530 + }, + { + "epoch": 1.57, + "learning_rate": 6.518843142696708e-05, + "loss": 0.0276, + "step": 242540 + }, + { + "epoch": 1.57, + "learning_rate": 6.517875007261015e-05, + "loss": 0.0233, + "step": 242550 + }, + { + "epoch": 1.57, + "learning_rate": 6.516906871825321e-05, + "loss": 0.0261, + "step": 242560 + }, + { + "epoch": 1.57, + "learning_rate": 6.51593873638963e-05, + "loss": 0.0302, + "step": 242570 + }, + { + "epoch": 1.57, + "learning_rate": 6.514970600953936e-05, + "loss": 0.0335, + "step": 242580 + }, + { + "epoch": 1.57, + "learning_rate": 6.514002465518243e-05, + "loss": 0.0288, + "step": 242590 + }, + { + "epoch": 1.57, + "learning_rate": 6.513034330082549e-05, + "loss": 0.0378, + "step": 242600 + }, + { + "epoch": 1.57, + "learning_rate": 6.512066194646856e-05, + "loss": 0.0269, + "step": 242610 + }, + { + "epoch": 1.57, + "learning_rate": 6.511098059211162e-05, + "loss": 0.0266, + "step": 242620 + }, + { + "epoch": 1.57, + "learning_rate": 6.510129923775469e-05, + "loss": 0.0253, + "step": 242630 + }, + { + "epoch": 1.57, + "learning_rate": 6.509161788339777e-05, + "loss": 0.0278, + "step": 242640 + }, + { + "epoch": 1.57, + "learning_rate": 6.508193652904082e-05, + "loss": 0.023, + "step": 242650 + }, + { + "epoch": 1.57, + "learning_rate": 6.50722551746839e-05, + "loss": 0.0278, + "step": 242660 + }, + { + "epoch": 1.57, + "learning_rate": 6.506257382032697e-05, + "loss": 0.0246, + "step": 242670 + }, + { + "epoch": 1.57, + "learning_rate": 6.505289246597004e-05, + "loss": 0.0223, + "step": 242680 + }, + { + "epoch": 1.57, + "learning_rate": 6.50432111116131e-05, + "loss": 0.0275, + "step": 242690 + }, + { + "epoch": 1.57, + "learning_rate": 6.503352975725617e-05, + "loss": 0.0235, + "step": 242700 + }, + { + "epoch": 1.57, + "learning_rate": 6.502384840289923e-05, + "loss": 0.0265, + "step": 242710 + }, + { + "epoch": 1.57, + "learning_rate": 6.50141670485423e-05, + "loss": 0.0268, + "step": 242720 + }, + { + "epoch": 1.57, + "learning_rate": 6.500448569418538e-05, + "loss": 0.0322, + "step": 242730 + }, + { + "epoch": 1.57, + "learning_rate": 6.499480433982845e-05, + "loss": 0.0224, + "step": 242740 + }, + { + "epoch": 1.57, + "learning_rate": 6.49851229854715e-05, + "loss": 0.032, + "step": 242750 + }, + { + "epoch": 1.57, + "learning_rate": 6.497544163111458e-05, + "loss": 0.0293, + "step": 242760 + }, + { + "epoch": 1.57, + "learning_rate": 6.496576027675765e-05, + "loss": 0.0321, + "step": 242770 + }, + { + "epoch": 1.57, + "learning_rate": 6.495607892240071e-05, + "loss": 0.0272, + "step": 242780 + }, + { + "epoch": 1.57, + "learning_rate": 6.494639756804378e-05, + "loss": 0.0237, + "step": 242790 + }, + { + "epoch": 1.57, + "learning_rate": 6.493671621368686e-05, + "loss": 0.03, + "step": 242800 + }, + { + "epoch": 1.57, + "learning_rate": 6.492703485932991e-05, + "loss": 0.0276, + "step": 242810 + }, + { + "epoch": 1.57, + "learning_rate": 6.491735350497298e-05, + "loss": 0.0261, + "step": 242820 + }, + { + "epoch": 1.57, + "learning_rate": 6.490767215061606e-05, + "loss": 0.0278, + "step": 242830 + }, + { + "epoch": 1.57, + "learning_rate": 6.489799079625912e-05, + "loss": 0.0292, + "step": 242840 + }, + { + "epoch": 1.57, + "learning_rate": 6.488830944190219e-05, + "loss": 0.0245, + "step": 242850 + }, + { + "epoch": 1.57, + "learning_rate": 6.487862808754526e-05, + "loss": 0.0264, + "step": 242860 + }, + { + "epoch": 1.57, + "learning_rate": 6.486894673318832e-05, + "loss": 0.0326, + "step": 242870 + }, + { + "epoch": 1.57, + "learning_rate": 6.485926537883139e-05, + "loss": 0.0243, + "step": 242880 + }, + { + "epoch": 1.57, + "learning_rate": 6.484958402447445e-05, + "loss": 0.0238, + "step": 242890 + }, + { + "epoch": 1.57, + "learning_rate": 6.483990267011753e-05, + "loss": 0.0261, + "step": 242900 + }, + { + "epoch": 1.57, + "learning_rate": 6.483022131576059e-05, + "loss": 0.0279, + "step": 242910 + }, + { + "epoch": 1.57, + "learning_rate": 6.482053996140367e-05, + "loss": 0.0286, + "step": 242920 + }, + { + "epoch": 1.57, + "learning_rate": 6.481085860704673e-05, + "loss": 0.0312, + "step": 242930 + }, + { + "epoch": 1.57, + "learning_rate": 6.48011772526898e-05, + "loss": 0.0362, + "step": 242940 + }, + { + "epoch": 1.57, + "learning_rate": 6.479149589833287e-05, + "loss": 0.0275, + "step": 242950 + }, + { + "epoch": 1.57, + "learning_rate": 6.478181454397593e-05, + "loss": 0.0343, + "step": 242960 + }, + { + "epoch": 1.57, + "learning_rate": 6.4772133189619e-05, + "loss": 0.0283, + "step": 242970 + }, + { + "epoch": 1.57, + "learning_rate": 6.476245183526206e-05, + "loss": 0.0279, + "step": 242980 + }, + { + "epoch": 1.57, + "learning_rate": 6.475277048090514e-05, + "loss": 0.0267, + "step": 242990 + }, + { + "epoch": 1.57, + "learning_rate": 6.474308912654821e-05, + "loss": 0.0236, + "step": 243000 + }, + { + "epoch": 1.57, + "eval_cer": 0.9198508643091177, + "eval_loss": 0.019448544830083847, + "eval_runtime": 120.0183, + "eval_samples_per_second": 16.664, + "eval_steps_per_second": 4.166, + "step": 243000 + }, + { + "epoch": 1.57, + "learning_rate": 6.473340777219128e-05, + "loss": 0.0247, + "step": 243010 + }, + { + "epoch": 1.57, + "learning_rate": 6.472372641783434e-05, + "loss": 0.0266, + "step": 243020 + }, + { + "epoch": 1.57, + "learning_rate": 6.471404506347741e-05, + "loss": 0.0275, + "step": 243030 + }, + { + "epoch": 1.57, + "learning_rate": 6.470436370912047e-05, + "loss": 0.0265, + "step": 243040 + }, + { + "epoch": 1.57, + "learning_rate": 6.469468235476354e-05, + "loss": 0.0346, + "step": 243050 + }, + { + "epoch": 1.57, + "learning_rate": 6.468500100040661e-05, + "loss": 0.0299, + "step": 243060 + }, + { + "epoch": 1.57, + "learning_rate": 6.467531964604967e-05, + "loss": 0.0315, + "step": 243070 + }, + { + "epoch": 1.57, + "learning_rate": 6.466563829169275e-05, + "loss": 0.0286, + "step": 243080 + }, + { + "epoch": 1.57, + "learning_rate": 6.465595693733582e-05, + "loss": 0.0229, + "step": 243090 + }, + { + "epoch": 1.57, + "learning_rate": 6.464627558297889e-05, + "loss": 0.0295, + "step": 243100 + }, + { + "epoch": 1.57, + "learning_rate": 6.463659422862195e-05, + "loss": 0.0272, + "step": 243110 + }, + { + "epoch": 1.57, + "learning_rate": 6.462691287426502e-05, + "loss": 0.0256, + "step": 243120 + }, + { + "epoch": 1.57, + "learning_rate": 6.461723151990808e-05, + "loss": 0.0239, + "step": 243130 + }, + { + "epoch": 1.57, + "learning_rate": 6.460755016555115e-05, + "loss": 0.0243, + "step": 243140 + }, + { + "epoch": 1.57, + "learning_rate": 6.459786881119423e-05, + "loss": 0.0243, + "step": 243150 + }, + { + "epoch": 1.57, + "learning_rate": 6.458818745683728e-05, + "loss": 0.0251, + "step": 243160 + }, + { + "epoch": 1.57, + "learning_rate": 6.457850610248035e-05, + "loss": 0.0302, + "step": 243170 + }, + { + "epoch": 1.57, + "learning_rate": 6.456882474812343e-05, + "loss": 0.0311, + "step": 243180 + }, + { + "epoch": 1.57, + "learning_rate": 6.45591433937665e-05, + "loss": 0.0279, + "step": 243190 + }, + { + "epoch": 1.57, + "learning_rate": 6.454946203940956e-05, + "loss": 0.026, + "step": 243200 + }, + { + "epoch": 1.57, + "learning_rate": 6.453978068505263e-05, + "loss": 0.0248, + "step": 243210 + }, + { + "epoch": 1.57, + "learning_rate": 6.45300993306957e-05, + "loss": 0.0273, + "step": 243220 + }, + { + "epoch": 1.57, + "learning_rate": 6.452041797633876e-05, + "loss": 0.0283, + "step": 243230 + }, + { + "epoch": 1.57, + "learning_rate": 6.451073662198183e-05, + "loss": 0.0413, + "step": 243240 + }, + { + "epoch": 1.57, + "learning_rate": 6.45010552676249e-05, + "loss": 0.0299, + "step": 243250 + }, + { + "epoch": 1.57, + "learning_rate": 6.449137391326796e-05, + "loss": 0.0197, + "step": 243260 + }, + { + "epoch": 1.57, + "learning_rate": 6.448169255891104e-05, + "loss": 0.0242, + "step": 243270 + }, + { + "epoch": 1.57, + "learning_rate": 6.44720112045541e-05, + "loss": 0.0261, + "step": 243280 + }, + { + "epoch": 1.57, + "learning_rate": 6.446232985019717e-05, + "loss": 0.0304, + "step": 243290 + }, + { + "epoch": 1.57, + "learning_rate": 6.445264849584024e-05, + "loss": 0.0242, + "step": 243300 + }, + { + "epoch": 1.57, + "learning_rate": 6.44429671414833e-05, + "loss": 0.0299, + "step": 243310 + }, + { + "epoch": 1.57, + "learning_rate": 6.443328578712637e-05, + "loss": 0.0285, + "step": 243320 + }, + { + "epoch": 1.57, + "learning_rate": 6.442360443276944e-05, + "loss": 0.0228, + "step": 243330 + }, + { + "epoch": 1.57, + "learning_rate": 6.441392307841252e-05, + "loss": 0.0249, + "step": 243340 + }, + { + "epoch": 1.57, + "learning_rate": 6.440424172405558e-05, + "loss": 0.0263, + "step": 243350 + }, + { + "epoch": 1.57, + "learning_rate": 6.439456036969865e-05, + "loss": 0.0267, + "step": 243360 + }, + { + "epoch": 1.57, + "learning_rate": 6.438487901534171e-05, + "loss": 0.0242, + "step": 243370 + }, + { + "epoch": 1.57, + "learning_rate": 6.437519766098478e-05, + "loss": 0.027, + "step": 243380 + }, + { + "epoch": 1.57, + "learning_rate": 6.436551630662785e-05, + "loss": 0.0325, + "step": 243390 + }, + { + "epoch": 1.57, + "learning_rate": 6.435583495227091e-05, + "loss": 0.0242, + "step": 243400 + }, + { + "epoch": 1.57, + "learning_rate": 6.4346153597914e-05, + "loss": 0.0312, + "step": 243410 + }, + { + "epoch": 1.57, + "learning_rate": 6.433647224355705e-05, + "loss": 0.029, + "step": 243420 + }, + { + "epoch": 1.57, + "learning_rate": 6.432679088920013e-05, + "loss": 0.0227, + "step": 243430 + }, + { + "epoch": 1.57, + "learning_rate": 6.431710953484319e-05, + "loss": 0.023, + "step": 243440 + }, + { + "epoch": 1.57, + "learning_rate": 6.430742818048626e-05, + "loss": 0.0213, + "step": 243450 + }, + { + "epoch": 1.57, + "learning_rate": 6.429774682612932e-05, + "loss": 0.0329, + "step": 243460 + }, + { + "epoch": 1.57, + "learning_rate": 6.428806547177239e-05, + "loss": 0.0279, + "step": 243470 + }, + { + "epoch": 1.57, + "learning_rate": 6.427838411741546e-05, + "loss": 0.0322, + "step": 243480 + }, + { + "epoch": 1.57, + "learning_rate": 6.426870276305852e-05, + "loss": 0.0228, + "step": 243490 + }, + { + "epoch": 1.57, + "learning_rate": 6.42590214087016e-05, + "loss": 0.0244, + "step": 243500 + }, + { + "epoch": 1.57, + "learning_rate": 6.424934005434467e-05, + "loss": 0.0247, + "step": 243510 + }, + { + "epoch": 1.57, + "learning_rate": 6.423965869998772e-05, + "loss": 0.0286, + "step": 243520 + }, + { + "epoch": 1.57, + "learning_rate": 6.42299773456308e-05, + "loss": 0.0274, + "step": 243530 + }, + { + "epoch": 1.57, + "learning_rate": 6.422029599127387e-05, + "loss": 0.026, + "step": 243540 + }, + { + "epoch": 1.57, + "learning_rate": 6.421061463691693e-05, + "loss": 0.0314, + "step": 243550 + }, + { + "epoch": 1.57, + "learning_rate": 6.420093328256e-05, + "loss": 0.0262, + "step": 243560 + }, + { + "epoch": 1.57, + "learning_rate": 6.419125192820308e-05, + "loss": 0.024, + "step": 243570 + }, + { + "epoch": 1.57, + "learning_rate": 6.418157057384613e-05, + "loss": 0.0274, + "step": 243580 + }, + { + "epoch": 1.57, + "learning_rate": 6.41718892194892e-05, + "loss": 0.0247, + "step": 243590 + }, + { + "epoch": 1.57, + "learning_rate": 6.416220786513228e-05, + "loss": 0.027, + "step": 243600 + }, + { + "epoch": 1.57, + "learning_rate": 6.415252651077535e-05, + "loss": 0.025, + "step": 243610 + }, + { + "epoch": 1.57, + "learning_rate": 6.414284515641841e-05, + "loss": 0.0257, + "step": 243620 + }, + { + "epoch": 1.57, + "learning_rate": 6.413316380206148e-05, + "loss": 0.0268, + "step": 243630 + }, + { + "epoch": 1.57, + "learning_rate": 6.412348244770454e-05, + "loss": 0.0235, + "step": 243640 + }, + { + "epoch": 1.57, + "learning_rate": 6.411380109334761e-05, + "loss": 0.0317, + "step": 243650 + }, + { + "epoch": 1.57, + "learning_rate": 6.410411973899068e-05, + "loss": 0.025, + "step": 243660 + }, + { + "epoch": 1.57, + "learning_rate": 6.409443838463376e-05, + "loss": 0.0255, + "step": 243670 + }, + { + "epoch": 1.57, + "learning_rate": 6.408475703027681e-05, + "loss": 0.0269, + "step": 243680 + }, + { + "epoch": 1.57, + "learning_rate": 6.407507567591989e-05, + "loss": 0.0219, + "step": 243690 + }, + { + "epoch": 1.57, + "learning_rate": 6.406539432156295e-05, + "loss": 0.0237, + "step": 243700 + }, + { + "epoch": 1.57, + "learning_rate": 6.405571296720602e-05, + "loss": 0.0219, + "step": 243710 + }, + { + "epoch": 1.57, + "learning_rate": 6.404603161284909e-05, + "loss": 0.0265, + "step": 243720 + }, + { + "epoch": 1.57, + "learning_rate": 6.403635025849215e-05, + "loss": 0.0218, + "step": 243730 + }, + { + "epoch": 1.57, + "learning_rate": 6.402666890413522e-05, + "loss": 0.0298, + "step": 243740 + }, + { + "epoch": 1.57, + "learning_rate": 6.401698754977829e-05, + "loss": 0.0238, + "step": 243750 + }, + { + "epoch": 1.57, + "learning_rate": 6.400730619542137e-05, + "loss": 0.0298, + "step": 243760 + }, + { + "epoch": 1.57, + "learning_rate": 6.399762484106443e-05, + "loss": 0.0219, + "step": 243770 + }, + { + "epoch": 1.57, + "learning_rate": 6.398794348670748e-05, + "loss": 0.0242, + "step": 243780 + }, + { + "epoch": 1.57, + "learning_rate": 6.397826213235056e-05, + "loss": 0.0282, + "step": 243790 + }, + { + "epoch": 1.57, + "learning_rate": 6.396858077799363e-05, + "loss": 0.0224, + "step": 243800 + }, + { + "epoch": 1.57, + "learning_rate": 6.39588994236367e-05, + "loss": 0.0275, + "step": 243810 + }, + { + "epoch": 1.57, + "learning_rate": 6.394921806927976e-05, + "loss": 0.026, + "step": 243820 + }, + { + "epoch": 1.57, + "learning_rate": 6.393953671492284e-05, + "loss": 0.0276, + "step": 243830 + }, + { + "epoch": 1.57, + "learning_rate": 6.39298553605659e-05, + "loss": 0.0288, + "step": 243840 + }, + { + "epoch": 1.57, + "learning_rate": 6.392017400620896e-05, + "loss": 0.0267, + "step": 243850 + }, + { + "epoch": 1.57, + "learning_rate": 6.391049265185204e-05, + "loss": 0.028, + "step": 243860 + }, + { + "epoch": 1.57, + "learning_rate": 6.390081129749511e-05, + "loss": 0.0217, + "step": 243870 + }, + { + "epoch": 1.57, + "learning_rate": 6.389112994313817e-05, + "loss": 0.0274, + "step": 243880 + }, + { + "epoch": 1.57, + "learning_rate": 6.388144858878124e-05, + "loss": 0.0291, + "step": 243890 + }, + { + "epoch": 1.57, + "learning_rate": 6.387176723442431e-05, + "loss": 0.0252, + "step": 243900 + }, + { + "epoch": 1.57, + "learning_rate": 6.386208588006737e-05, + "loss": 0.0269, + "step": 243910 + }, + { + "epoch": 1.57, + "learning_rate": 6.385240452571044e-05, + "loss": 0.0253, + "step": 243920 + }, + { + "epoch": 1.57, + "learning_rate": 6.384272317135352e-05, + "loss": 0.0232, + "step": 243930 + }, + { + "epoch": 1.57, + "learning_rate": 6.383304181699657e-05, + "loss": 0.0255, + "step": 243940 + }, + { + "epoch": 1.57, + "learning_rate": 6.382336046263965e-05, + "loss": 0.026, + "step": 243950 + }, + { + "epoch": 1.57, + "learning_rate": 6.381367910828272e-05, + "loss": 0.0305, + "step": 243960 + }, + { + "epoch": 1.57, + "learning_rate": 6.380399775392578e-05, + "loss": 0.0273, + "step": 243970 + }, + { + "epoch": 1.57, + "learning_rate": 6.379431639956885e-05, + "loss": 0.0213, + "step": 243980 + }, + { + "epoch": 1.57, + "learning_rate": 6.378463504521192e-05, + "loss": 0.0256, + "step": 243990 + }, + { + "epoch": 1.57, + "learning_rate": 6.377495369085498e-05, + "loss": 0.0266, + "step": 244000 + }, + { + "epoch": 1.57, + "eval_cer": 0.9198400180770534, + "eval_loss": 0.019307343289256096, + "eval_runtime": 120.042, + "eval_samples_per_second": 16.661, + "eval_steps_per_second": 4.165, + "step": 244000 + }, + { + "epoch": 1.57, + "learning_rate": 6.376527233649805e-05, + "loss": 0.0235, + "step": 244010 + }, + { + "epoch": 1.57, + "learning_rate": 6.375559098214113e-05, + "loss": 0.0252, + "step": 244020 + }, + { + "epoch": 1.58, + "learning_rate": 6.37459096277842e-05, + "loss": 0.0287, + "step": 244030 + }, + { + "epoch": 1.58, + "learning_rate": 6.373622827342726e-05, + "loss": 0.035, + "step": 244040 + }, + { + "epoch": 1.58, + "learning_rate": 6.372654691907033e-05, + "loss": 0.0262, + "step": 244050 + }, + { + "epoch": 1.58, + "learning_rate": 6.37168655647134e-05, + "loss": 0.0305, + "step": 244060 + }, + { + "epoch": 1.58, + "learning_rate": 6.370718421035646e-05, + "loss": 0.0224, + "step": 244070 + }, + { + "epoch": 1.58, + "learning_rate": 6.369750285599953e-05, + "loss": 0.0272, + "step": 244080 + }, + { + "epoch": 1.58, + "learning_rate": 6.36878215016426e-05, + "loss": 0.0239, + "step": 244090 + }, + { + "epoch": 1.58, + "learning_rate": 6.367814014728566e-05, + "loss": 0.0223, + "step": 244100 + }, + { + "epoch": 1.58, + "learning_rate": 6.366845879292874e-05, + "loss": 0.0264, + "step": 244110 + }, + { + "epoch": 1.58, + "learning_rate": 6.36587774385718e-05, + "loss": 0.0255, + "step": 244120 + }, + { + "epoch": 1.58, + "learning_rate": 6.364909608421487e-05, + "loss": 0.0236, + "step": 244130 + }, + { + "epoch": 1.58, + "learning_rate": 6.363941472985794e-05, + "loss": 0.0275, + "step": 244140 + }, + { + "epoch": 1.58, + "learning_rate": 6.3629733375501e-05, + "loss": 0.0298, + "step": 244150 + }, + { + "epoch": 1.58, + "learning_rate": 6.362005202114407e-05, + "loss": 0.027, + "step": 244160 + }, + { + "epoch": 1.58, + "learning_rate": 6.361037066678714e-05, + "loss": 0.0215, + "step": 244170 + }, + { + "epoch": 1.58, + "learning_rate": 6.360068931243022e-05, + "loss": 0.0251, + "step": 244180 + }, + { + "epoch": 1.58, + "learning_rate": 6.359100795807328e-05, + "loss": 0.0255, + "step": 244190 + }, + { + "epoch": 1.58, + "learning_rate": 6.358132660371633e-05, + "loss": 0.0225, + "step": 244200 + }, + { + "epoch": 1.58, + "learning_rate": 6.357164524935941e-05, + "loss": 0.0273, + "step": 244210 + }, + { + "epoch": 1.58, + "learning_rate": 6.356196389500248e-05, + "loss": 0.0285, + "step": 244220 + }, + { + "epoch": 1.58, + "learning_rate": 6.355228254064555e-05, + "loss": 0.0205, + "step": 244230 + }, + { + "epoch": 1.58, + "learning_rate": 6.354260118628861e-05, + "loss": 0.0337, + "step": 244240 + }, + { + "epoch": 1.58, + "learning_rate": 6.353291983193168e-05, + "loss": 0.03, + "step": 244250 + }, + { + "epoch": 1.58, + "learning_rate": 6.352323847757475e-05, + "loss": 0.0247, + "step": 244260 + }, + { + "epoch": 1.58, + "learning_rate": 6.351355712321781e-05, + "loss": 0.0275, + "step": 244270 + }, + { + "epoch": 1.58, + "learning_rate": 6.350387576886089e-05, + "loss": 0.0254, + "step": 244280 + }, + { + "epoch": 1.58, + "learning_rate": 6.349419441450396e-05, + "loss": 0.0276, + "step": 244290 + }, + { + "epoch": 1.58, + "learning_rate": 6.348451306014702e-05, + "loss": 0.0265, + "step": 244300 + }, + { + "epoch": 1.58, + "learning_rate": 6.347483170579009e-05, + "loss": 0.0244, + "step": 244310 + }, + { + "epoch": 1.58, + "learning_rate": 6.346515035143316e-05, + "loss": 0.0261, + "step": 244320 + }, + { + "epoch": 1.58, + "learning_rate": 6.345546899707622e-05, + "loss": 0.025, + "step": 244330 + }, + { + "epoch": 1.58, + "learning_rate": 6.344578764271929e-05, + "loss": 0.0238, + "step": 244340 + }, + { + "epoch": 1.58, + "learning_rate": 6.343610628836237e-05, + "loss": 0.0266, + "step": 244350 + }, + { + "epoch": 1.58, + "learning_rate": 6.342642493400542e-05, + "loss": 0.0249, + "step": 244360 + }, + { + "epoch": 1.58, + "learning_rate": 6.34167435796485e-05, + "loss": 0.028, + "step": 244370 + }, + { + "epoch": 1.58, + "learning_rate": 6.340706222529157e-05, + "loss": 0.0261, + "step": 244380 + }, + { + "epoch": 1.58, + "learning_rate": 6.339738087093463e-05, + "loss": 0.0286, + "step": 244390 + }, + { + "epoch": 1.58, + "learning_rate": 6.33876995165777e-05, + "loss": 0.0236, + "step": 244400 + }, + { + "epoch": 1.58, + "learning_rate": 6.337801816222077e-05, + "loss": 0.0271, + "step": 244410 + }, + { + "epoch": 1.58, + "learning_rate": 6.336833680786383e-05, + "loss": 0.0255, + "step": 244420 + }, + { + "epoch": 1.58, + "learning_rate": 6.33586554535069e-05, + "loss": 0.0226, + "step": 244430 + }, + { + "epoch": 1.58, + "learning_rate": 6.334897409914998e-05, + "loss": 0.0298, + "step": 244440 + }, + { + "epoch": 1.58, + "learning_rate": 6.333929274479304e-05, + "loss": 0.0296, + "step": 244450 + }, + { + "epoch": 1.58, + "learning_rate": 6.332961139043611e-05, + "loss": 0.0223, + "step": 244460 + }, + { + "epoch": 1.58, + "learning_rate": 6.331993003607918e-05, + "loss": 0.0267, + "step": 244470 + }, + { + "epoch": 1.58, + "learning_rate": 6.331024868172224e-05, + "loss": 0.0249, + "step": 244480 + }, + { + "epoch": 1.58, + "learning_rate": 6.330056732736531e-05, + "loss": 0.0225, + "step": 244490 + }, + { + "epoch": 1.58, + "learning_rate": 6.329088597300838e-05, + "loss": 0.0303, + "step": 244500 + }, + { + "epoch": 1.58, + "learning_rate": 6.328120461865144e-05, + "loss": 0.0277, + "step": 244510 + }, + { + "epoch": 1.58, + "learning_rate": 6.327152326429451e-05, + "loss": 0.028, + "step": 244520 + }, + { + "epoch": 1.58, + "learning_rate": 6.326184190993759e-05, + "loss": 0.0251, + "step": 244530 + }, + { + "epoch": 1.58, + "learning_rate": 6.325216055558065e-05, + "loss": 0.0282, + "step": 244540 + }, + { + "epoch": 1.58, + "learning_rate": 6.324247920122372e-05, + "loss": 0.0226, + "step": 244550 + }, + { + "epoch": 1.58, + "learning_rate": 6.323279784686679e-05, + "loss": 0.0229, + "step": 244560 + }, + { + "epoch": 1.58, + "learning_rate": 6.322311649250985e-05, + "loss": 0.0288, + "step": 244570 + }, + { + "epoch": 1.58, + "learning_rate": 6.321343513815292e-05, + "loss": 0.0276, + "step": 244580 + }, + { + "epoch": 1.58, + "learning_rate": 6.320375378379599e-05, + "loss": 0.0261, + "step": 244590 + }, + { + "epoch": 1.58, + "learning_rate": 6.319407242943907e-05, + "loss": 0.0316, + "step": 244600 + }, + { + "epoch": 1.58, + "learning_rate": 6.318439107508212e-05, + "loss": 0.0322, + "step": 244610 + }, + { + "epoch": 1.58, + "learning_rate": 6.317470972072518e-05, + "loss": 0.0228, + "step": 244620 + }, + { + "epoch": 1.58, + "learning_rate": 6.316502836636826e-05, + "loss": 0.028, + "step": 244630 + }, + { + "epoch": 1.58, + "learning_rate": 6.315534701201133e-05, + "loss": 0.0325, + "step": 244640 + }, + { + "epoch": 1.58, + "learning_rate": 6.31456656576544e-05, + "loss": 0.03, + "step": 244650 + }, + { + "epoch": 1.58, + "learning_rate": 6.313598430329746e-05, + "loss": 0.0275, + "step": 244660 + }, + { + "epoch": 1.58, + "learning_rate": 6.312630294894053e-05, + "loss": 0.0266, + "step": 244670 + }, + { + "epoch": 1.58, + "learning_rate": 6.31166215945836e-05, + "loss": 0.0244, + "step": 244680 + }, + { + "epoch": 1.58, + "learning_rate": 6.310694024022666e-05, + "loss": 0.0255, + "step": 244690 + }, + { + "epoch": 1.58, + "learning_rate": 6.309725888586974e-05, + "loss": 0.0231, + "step": 244700 + }, + { + "epoch": 1.58, + "learning_rate": 6.30875775315128e-05, + "loss": 0.0251, + "step": 244710 + }, + { + "epoch": 1.58, + "learning_rate": 6.307789617715587e-05, + "loss": 0.0286, + "step": 244720 + }, + { + "epoch": 1.58, + "learning_rate": 6.306821482279894e-05, + "loss": 0.0266, + "step": 244730 + }, + { + "epoch": 1.58, + "learning_rate": 6.3058533468442e-05, + "loss": 0.0293, + "step": 244740 + }, + { + "epoch": 1.58, + "learning_rate": 6.304885211408507e-05, + "loss": 0.0271, + "step": 244750 + }, + { + "epoch": 1.58, + "learning_rate": 6.303917075972814e-05, + "loss": 0.0235, + "step": 244760 + }, + { + "epoch": 1.58, + "learning_rate": 6.30294894053712e-05, + "loss": 0.0203, + "step": 244770 + }, + { + "epoch": 1.58, + "learning_rate": 6.301980805101427e-05, + "loss": 0.0238, + "step": 244780 + }, + { + "epoch": 1.58, + "learning_rate": 6.301012669665735e-05, + "loss": 0.0304, + "step": 244790 + }, + { + "epoch": 1.58, + "learning_rate": 6.300044534230042e-05, + "loss": 0.0302, + "step": 244800 + }, + { + "epoch": 1.58, + "learning_rate": 6.299076398794348e-05, + "loss": 0.0314, + "step": 244810 + }, + { + "epoch": 1.58, + "learning_rate": 6.298108263358655e-05, + "loss": 0.0246, + "step": 244820 + }, + { + "epoch": 1.58, + "learning_rate": 6.297140127922962e-05, + "loss": 0.0286, + "step": 244830 + }, + { + "epoch": 1.58, + "learning_rate": 6.296171992487268e-05, + "loss": 0.019, + "step": 244840 + }, + { + "epoch": 1.58, + "learning_rate": 6.295203857051575e-05, + "loss": 0.0223, + "step": 244850 + }, + { + "epoch": 1.58, + "learning_rate": 6.294235721615883e-05, + "loss": 0.0254, + "step": 244860 + }, + { + "epoch": 1.58, + "learning_rate": 6.293267586180188e-05, + "loss": 0.0255, + "step": 244870 + }, + { + "epoch": 1.58, + "learning_rate": 6.292299450744496e-05, + "loss": 0.02, + "step": 244880 + }, + { + "epoch": 1.58, + "learning_rate": 6.291331315308803e-05, + "loss": 0.0227, + "step": 244890 + }, + { + "epoch": 1.58, + "learning_rate": 6.29036317987311e-05, + "loss": 0.0278, + "step": 244900 + }, + { + "epoch": 1.58, + "learning_rate": 6.289395044437416e-05, + "loss": 0.0246, + "step": 244910 + }, + { + "epoch": 1.58, + "learning_rate": 6.288426909001723e-05, + "loss": 0.034, + "step": 244920 + }, + { + "epoch": 1.58, + "learning_rate": 6.287458773566029e-05, + "loss": 0.029, + "step": 244930 + }, + { + "epoch": 1.58, + "learning_rate": 6.286490638130336e-05, + "loss": 0.0276, + "step": 244940 + }, + { + "epoch": 1.58, + "learning_rate": 6.285522502694644e-05, + "loss": 0.0233, + "step": 244950 + }, + { + "epoch": 1.58, + "learning_rate": 6.28455436725895e-05, + "loss": 0.0215, + "step": 244960 + }, + { + "epoch": 1.58, + "learning_rate": 6.283586231823256e-05, + "loss": 0.024, + "step": 244970 + }, + { + "epoch": 1.58, + "learning_rate": 6.282618096387564e-05, + "loss": 0.0269, + "step": 244980 + }, + { + "epoch": 1.58, + "learning_rate": 6.28164996095187e-05, + "loss": 0.0255, + "step": 244990 + }, + { + "epoch": 1.58, + "learning_rate": 6.280681825516177e-05, + "loss": 0.027, + "step": 245000 + }, + { + "epoch": 1.58, + "eval_cer": 0.9198960569427184, + "eval_loss": 0.01949627697467804, + "eval_runtime": 120.0652, + "eval_samples_per_second": 16.658, + "eval_steps_per_second": 4.164, + "step": 245000 + }, + { + "epoch": 1.58, + "learning_rate": 6.279713690080484e-05, + "loss": 0.0205, + "step": 245010 + }, + { + "epoch": 1.58, + "learning_rate": 6.278745554644792e-05, + "loss": 0.0261, + "step": 245020 + }, + { + "epoch": 1.58, + "learning_rate": 6.277777419209097e-05, + "loss": 0.028, + "step": 245030 + }, + { + "epoch": 1.58, + "learning_rate": 6.276809283773403e-05, + "loss": 0.0325, + "step": 245040 + }, + { + "epoch": 1.58, + "learning_rate": 6.275841148337711e-05, + "loss": 0.0253, + "step": 245050 + }, + { + "epoch": 1.58, + "learning_rate": 6.274873012902018e-05, + "loss": 0.0254, + "step": 245060 + }, + { + "epoch": 1.58, + "learning_rate": 6.273904877466325e-05, + "loss": 0.0289, + "step": 245070 + }, + { + "epoch": 1.58, + "learning_rate": 6.272936742030631e-05, + "loss": 0.0265, + "step": 245080 + }, + { + "epoch": 1.58, + "learning_rate": 6.271968606594938e-05, + "loss": 0.0293, + "step": 245090 + }, + { + "epoch": 1.58, + "learning_rate": 6.271000471159245e-05, + "loss": 0.0266, + "step": 245100 + }, + { + "epoch": 1.58, + "learning_rate": 6.270032335723551e-05, + "loss": 0.025, + "step": 245110 + }, + { + "epoch": 1.58, + "learning_rate": 6.269064200287859e-05, + "loss": 0.0307, + "step": 245120 + }, + { + "epoch": 1.58, + "learning_rate": 6.268096064852164e-05, + "loss": 0.0271, + "step": 245130 + }, + { + "epoch": 1.58, + "learning_rate": 6.267127929416472e-05, + "loss": 0.0267, + "step": 245140 + }, + { + "epoch": 1.58, + "learning_rate": 6.266159793980779e-05, + "loss": 0.0281, + "step": 245150 + }, + { + "epoch": 1.58, + "learning_rate": 6.265191658545086e-05, + "loss": 0.0277, + "step": 245160 + }, + { + "epoch": 1.58, + "learning_rate": 6.264223523109392e-05, + "loss": 0.0236, + "step": 245170 + }, + { + "epoch": 1.58, + "learning_rate": 6.263255387673699e-05, + "loss": 0.0302, + "step": 245180 + }, + { + "epoch": 1.58, + "learning_rate": 6.262287252238006e-05, + "loss": 0.0255, + "step": 245190 + }, + { + "epoch": 1.58, + "learning_rate": 6.261319116802312e-05, + "loss": 0.035, + "step": 245200 + }, + { + "epoch": 1.58, + "learning_rate": 6.26035098136662e-05, + "loss": 0.0223, + "step": 245210 + }, + { + "epoch": 1.58, + "learning_rate": 6.259382845930927e-05, + "loss": 0.0279, + "step": 245220 + }, + { + "epoch": 1.58, + "learning_rate": 6.258414710495233e-05, + "loss": 0.0283, + "step": 245230 + }, + { + "epoch": 1.58, + "learning_rate": 6.25744657505954e-05, + "loss": 0.0236, + "step": 245240 + }, + { + "epoch": 1.58, + "learning_rate": 6.256478439623847e-05, + "loss": 0.0271, + "step": 245250 + }, + { + "epoch": 1.58, + "learning_rate": 6.255510304188153e-05, + "loss": 0.0239, + "step": 245260 + }, + { + "epoch": 1.58, + "learning_rate": 6.25454216875246e-05, + "loss": 0.0248, + "step": 245270 + }, + { + "epoch": 1.58, + "learning_rate": 6.253574033316768e-05, + "loss": 0.0255, + "step": 245280 + }, + { + "epoch": 1.58, + "learning_rate": 6.252605897881073e-05, + "loss": 0.027, + "step": 245290 + }, + { + "epoch": 1.58, + "learning_rate": 6.251637762445381e-05, + "loss": 0.0258, + "step": 245300 + }, + { + "epoch": 1.58, + "learning_rate": 6.250669627009688e-05, + "loss": 0.0267, + "step": 245310 + }, + { + "epoch": 1.58, + "learning_rate": 6.249701491573994e-05, + "loss": 0.0318, + "step": 245320 + }, + { + "epoch": 1.58, + "learning_rate": 6.248733356138301e-05, + "loss": 0.0264, + "step": 245330 + }, + { + "epoch": 1.58, + "learning_rate": 6.247765220702608e-05, + "loss": 0.027, + "step": 245340 + }, + { + "epoch": 1.58, + "learning_rate": 6.246797085266914e-05, + "loss": 0.0248, + "step": 245350 + }, + { + "epoch": 1.58, + "learning_rate": 6.245828949831221e-05, + "loss": 0.0276, + "step": 245360 + }, + { + "epoch": 1.58, + "learning_rate": 6.244860814395527e-05, + "loss": 0.0263, + "step": 245370 + }, + { + "epoch": 1.58, + "learning_rate": 6.243892678959835e-05, + "loss": 0.0266, + "step": 245380 + }, + { + "epoch": 1.58, + "learning_rate": 6.242924543524141e-05, + "loss": 0.0254, + "step": 245390 + }, + { + "epoch": 1.58, + "learning_rate": 6.241956408088449e-05, + "loss": 0.029, + "step": 245400 + }, + { + "epoch": 1.58, + "learning_rate": 6.240988272652755e-05, + "loss": 0.0244, + "step": 245410 + }, + { + "epoch": 1.58, + "learning_rate": 6.240020137217062e-05, + "loss": 0.0368, + "step": 245420 + }, + { + "epoch": 1.58, + "learning_rate": 6.239052001781369e-05, + "loss": 0.0287, + "step": 245430 + }, + { + "epoch": 1.58, + "learning_rate": 6.238083866345675e-05, + "loss": 0.0283, + "step": 245440 + }, + { + "epoch": 1.58, + "learning_rate": 6.237115730909982e-05, + "loss": 0.0286, + "step": 245450 + }, + { + "epoch": 1.58, + "learning_rate": 6.236147595474288e-05, + "loss": 0.0279, + "step": 245460 + }, + { + "epoch": 1.58, + "learning_rate": 6.235179460038596e-05, + "loss": 0.0314, + "step": 245470 + }, + { + "epoch": 1.58, + "learning_rate": 6.234211324602903e-05, + "loss": 0.037, + "step": 245480 + }, + { + "epoch": 1.58, + "learning_rate": 6.23324318916721e-05, + "loss": 0.0223, + "step": 245490 + }, + { + "epoch": 1.58, + "learning_rate": 6.232275053731516e-05, + "loss": 0.0257, + "step": 245500 + }, + { + "epoch": 1.58, + "learning_rate": 6.231306918295823e-05, + "loss": 0.0288, + "step": 245510 + }, + { + "epoch": 1.58, + "learning_rate": 6.23033878286013e-05, + "loss": 0.0254, + "step": 245520 + }, + { + "epoch": 1.58, + "learning_rate": 6.229370647424436e-05, + "loss": 0.0336, + "step": 245530 + }, + { + "epoch": 1.58, + "learning_rate": 6.228402511988744e-05, + "loss": 0.0265, + "step": 245540 + }, + { + "epoch": 1.58, + "learning_rate": 6.22743437655305e-05, + "loss": 0.0264, + "step": 245550 + }, + { + "epoch": 1.58, + "learning_rate": 6.226466241117357e-05, + "loss": 0.0288, + "step": 245560 + }, + { + "epoch": 1.58, + "learning_rate": 6.225498105681664e-05, + "loss": 0.0239, + "step": 245570 + }, + { + "epoch": 1.59, + "learning_rate": 6.22452997024597e-05, + "loss": 0.031, + "step": 245580 + }, + { + "epoch": 1.59, + "learning_rate": 6.223561834810277e-05, + "loss": 0.0231, + "step": 245590 + }, + { + "epoch": 1.59, + "learning_rate": 6.222593699374584e-05, + "loss": 0.0242, + "step": 245600 + }, + { + "epoch": 1.59, + "learning_rate": 6.22162556393889e-05, + "loss": 0.0241, + "step": 245610 + }, + { + "epoch": 1.59, + "learning_rate": 6.220657428503197e-05, + "loss": 0.0261, + "step": 245620 + }, + { + "epoch": 1.59, + "learning_rate": 6.219689293067505e-05, + "loss": 0.0272, + "step": 245630 + }, + { + "epoch": 1.59, + "learning_rate": 6.218721157631812e-05, + "loss": 0.0272, + "step": 245640 + }, + { + "epoch": 1.59, + "learning_rate": 6.217753022196117e-05, + "loss": 0.0309, + "step": 245650 + }, + { + "epoch": 1.59, + "learning_rate": 6.216784886760425e-05, + "loss": 0.0272, + "step": 245660 + }, + { + "epoch": 1.59, + "learning_rate": 6.215816751324732e-05, + "loss": 0.0225, + "step": 245670 + }, + { + "epoch": 1.59, + "learning_rate": 6.214848615889038e-05, + "loss": 0.0272, + "step": 245680 + }, + { + "epoch": 1.59, + "learning_rate": 6.213880480453345e-05, + "loss": 0.0256, + "step": 245690 + }, + { + "epoch": 1.59, + "learning_rate": 6.212912345017651e-05, + "loss": 0.0267, + "step": 245700 + }, + { + "epoch": 1.59, + "learning_rate": 6.211944209581958e-05, + "loss": 0.0309, + "step": 245710 + }, + { + "epoch": 1.59, + "learning_rate": 6.210976074146265e-05, + "loss": 0.0295, + "step": 245720 + }, + { + "epoch": 1.59, + "learning_rate": 6.210007938710573e-05, + "loss": 0.0251, + "step": 245730 + }, + { + "epoch": 1.59, + "learning_rate": 6.209039803274879e-05, + "loss": 0.0231, + "step": 245740 + }, + { + "epoch": 1.59, + "learning_rate": 6.208071667839186e-05, + "loss": 0.0286, + "step": 245750 + }, + { + "epoch": 1.59, + "learning_rate": 6.207103532403493e-05, + "loss": 0.0246, + "step": 245760 + }, + { + "epoch": 1.59, + "learning_rate": 6.206135396967799e-05, + "loss": 0.0273, + "step": 245770 + }, + { + "epoch": 1.59, + "learning_rate": 6.205167261532106e-05, + "loss": 0.026, + "step": 245780 + }, + { + "epoch": 1.59, + "learning_rate": 6.204199126096412e-05, + "loss": 0.032, + "step": 245790 + }, + { + "epoch": 1.59, + "learning_rate": 6.203230990660719e-05, + "loss": 0.0247, + "step": 245800 + }, + { + "epoch": 1.59, + "learning_rate": 6.202262855225026e-05, + "loss": 0.0228, + "step": 245810 + }, + { + "epoch": 1.59, + "learning_rate": 6.201294719789334e-05, + "loss": 0.0236, + "step": 245820 + }, + { + "epoch": 1.59, + "learning_rate": 6.20032658435364e-05, + "loss": 0.0227, + "step": 245830 + }, + { + "epoch": 1.59, + "learning_rate": 6.199358448917947e-05, + "loss": 0.024, + "step": 245840 + }, + { + "epoch": 1.59, + "learning_rate": 6.198390313482254e-05, + "loss": 0.0299, + "step": 245850 + }, + { + "epoch": 1.59, + "learning_rate": 6.19742217804656e-05, + "loss": 0.0266, + "step": 245860 + }, + { + "epoch": 1.59, + "learning_rate": 6.196454042610867e-05, + "loss": 0.0315, + "step": 245870 + }, + { + "epoch": 1.59, + "learning_rate": 6.195485907175173e-05, + "loss": 0.0223, + "step": 245880 + }, + { + "epoch": 1.59, + "learning_rate": 6.194517771739481e-05, + "loss": 0.0257, + "step": 245890 + }, + { + "epoch": 1.59, + "learning_rate": 6.193549636303787e-05, + "loss": 0.0261, + "step": 245900 + }, + { + "epoch": 1.59, + "learning_rate": 6.192581500868095e-05, + "loss": 0.0238, + "step": 245910 + }, + { + "epoch": 1.59, + "learning_rate": 6.191613365432401e-05, + "loss": 0.0309, + "step": 245920 + }, + { + "epoch": 1.59, + "learning_rate": 6.190645229996708e-05, + "loss": 0.0247, + "step": 245930 + }, + { + "epoch": 1.59, + "learning_rate": 6.189677094561014e-05, + "loss": 0.0265, + "step": 245940 + }, + { + "epoch": 1.59, + "learning_rate": 6.188708959125321e-05, + "loss": 0.027, + "step": 245950 + }, + { + "epoch": 1.59, + "learning_rate": 6.187740823689628e-05, + "loss": 0.0258, + "step": 245960 + }, + { + "epoch": 1.59, + "learning_rate": 6.186772688253934e-05, + "loss": 0.0269, + "step": 245970 + }, + { + "epoch": 1.59, + "learning_rate": 6.185804552818242e-05, + "loss": 0.0278, + "step": 245980 + }, + { + "epoch": 1.59, + "learning_rate": 6.184836417382549e-05, + "loss": 0.03, + "step": 245990 + }, + { + "epoch": 1.59, + "learning_rate": 6.183868281946854e-05, + "loss": 0.0257, + "step": 246000 + }, + { + "epoch": 1.59, + "eval_cer": 0.9198806914472941, + "eval_loss": 0.01917816512286663, + "eval_runtime": 120.0373, + "eval_samples_per_second": 16.661, + "eval_steps_per_second": 4.165, + "step": 246000 + }, + { + "epoch": 1.59, + "learning_rate": 6.182900146511162e-05, + "loss": 0.028, + "step": 246010 + }, + { + "epoch": 1.59, + "learning_rate": 6.181932011075469e-05, + "loss": 0.026, + "step": 246020 + }, + { + "epoch": 1.59, + "learning_rate": 6.180963875639775e-05, + "loss": 0.0262, + "step": 246030 + }, + { + "epoch": 1.59, + "learning_rate": 6.179995740204082e-05, + "loss": 0.031, + "step": 246040 + }, + { + "epoch": 1.59, + "learning_rate": 6.17902760476839e-05, + "loss": 0.0259, + "step": 246050 + }, + { + "epoch": 1.59, + "learning_rate": 6.178059469332695e-05, + "loss": 0.0288, + "step": 246060 + }, + { + "epoch": 1.59, + "learning_rate": 6.177091333897002e-05, + "loss": 0.0232, + "step": 246070 + }, + { + "epoch": 1.59, + "learning_rate": 6.17612319846131e-05, + "loss": 0.0236, + "step": 246080 + }, + { + "epoch": 1.59, + "learning_rate": 6.175155063025617e-05, + "loss": 0.0278, + "step": 246090 + }, + { + "epoch": 1.59, + "learning_rate": 6.174186927589923e-05, + "loss": 0.0291, + "step": 246100 + }, + { + "epoch": 1.59, + "learning_rate": 6.17321879215423e-05, + "loss": 0.025, + "step": 246110 + }, + { + "epoch": 1.59, + "learning_rate": 6.172250656718536e-05, + "loss": 0.033, + "step": 246120 + }, + { + "epoch": 1.59, + "learning_rate": 6.171282521282843e-05, + "loss": 0.0368, + "step": 246130 + }, + { + "epoch": 1.59, + "learning_rate": 6.17031438584715e-05, + "loss": 0.0261, + "step": 246140 + }, + { + "epoch": 1.59, + "learning_rate": 6.169346250411458e-05, + "loss": 0.0236, + "step": 246150 + }, + { + "epoch": 1.59, + "learning_rate": 6.168378114975763e-05, + "loss": 0.0221, + "step": 246160 + }, + { + "epoch": 1.59, + "learning_rate": 6.167409979540071e-05, + "loss": 0.0229, + "step": 246170 + }, + { + "epoch": 1.59, + "learning_rate": 6.166441844104378e-05, + "loss": 0.03, + "step": 246180 + }, + { + "epoch": 1.59, + "learning_rate": 6.165473708668684e-05, + "loss": 0.0226, + "step": 246190 + }, + { + "epoch": 1.59, + "learning_rate": 6.164505573232991e-05, + "loss": 0.0262, + "step": 246200 + }, + { + "epoch": 1.59, + "learning_rate": 6.163537437797297e-05, + "loss": 0.0236, + "step": 246210 + }, + { + "epoch": 1.59, + "learning_rate": 6.162569302361604e-05, + "loss": 0.026, + "step": 246220 + }, + { + "epoch": 1.59, + "learning_rate": 6.16160116692591e-05, + "loss": 0.025, + "step": 246230 + }, + { + "epoch": 1.59, + "learning_rate": 6.160633031490219e-05, + "loss": 0.0254, + "step": 246240 + }, + { + "epoch": 1.59, + "learning_rate": 6.159664896054525e-05, + "loss": 0.0251, + "step": 246250 + }, + { + "epoch": 1.59, + "learning_rate": 6.158696760618832e-05, + "loss": 0.0325, + "step": 246260 + }, + { + "epoch": 1.59, + "learning_rate": 6.157728625183139e-05, + "loss": 0.03, + "step": 246270 + }, + { + "epoch": 1.59, + "learning_rate": 6.156760489747445e-05, + "loss": 0.0251, + "step": 246280 + }, + { + "epoch": 1.59, + "learning_rate": 6.155792354311752e-05, + "loss": 0.0333, + "step": 246290 + }, + { + "epoch": 1.59, + "learning_rate": 6.154824218876058e-05, + "loss": 0.0289, + "step": 246300 + }, + { + "epoch": 1.59, + "learning_rate": 6.153856083440366e-05, + "loss": 0.027, + "step": 246310 + }, + { + "epoch": 1.59, + "learning_rate": 6.152887948004672e-05, + "loss": 0.0279, + "step": 246320 + }, + { + "epoch": 1.59, + "learning_rate": 6.15191981256898e-05, + "loss": 0.022, + "step": 246330 + }, + { + "epoch": 1.59, + "learning_rate": 6.150951677133286e-05, + "loss": 0.0271, + "step": 246340 + }, + { + "epoch": 1.59, + "learning_rate": 6.149983541697593e-05, + "loss": 0.0288, + "step": 246350 + }, + { + "epoch": 1.59, + "learning_rate": 6.1490154062619e-05, + "loss": 0.0247, + "step": 246360 + }, + { + "epoch": 1.59, + "learning_rate": 6.148047270826206e-05, + "loss": 0.0292, + "step": 246370 + }, + { + "epoch": 1.59, + "learning_rate": 6.147079135390513e-05, + "loss": 0.0227, + "step": 246380 + }, + { + "epoch": 1.59, + "learning_rate": 6.14611099995482e-05, + "loss": 0.0254, + "step": 246390 + }, + { + "epoch": 1.59, + "learning_rate": 6.145142864519127e-05, + "loss": 0.0233, + "step": 246400 + }, + { + "epoch": 1.59, + "learning_rate": 6.144174729083434e-05, + "loss": 0.0263, + "step": 246410 + }, + { + "epoch": 1.59, + "learning_rate": 6.143206593647739e-05, + "loss": 0.0247, + "step": 246420 + }, + { + "epoch": 1.59, + "learning_rate": 6.142238458212047e-05, + "loss": 0.0233, + "step": 246430 + }, + { + "epoch": 1.59, + "learning_rate": 6.141270322776354e-05, + "loss": 0.0254, + "step": 246440 + }, + { + "epoch": 1.59, + "learning_rate": 6.14030218734066e-05, + "loss": 0.0251, + "step": 246450 + }, + { + "epoch": 1.59, + "learning_rate": 6.139334051904967e-05, + "loss": 0.0277, + "step": 246460 + }, + { + "epoch": 1.59, + "learning_rate": 6.138365916469275e-05, + "loss": 0.0256, + "step": 246470 + }, + { + "epoch": 1.59, + "learning_rate": 6.13739778103358e-05, + "loss": 0.0243, + "step": 246480 + }, + { + "epoch": 1.59, + "learning_rate": 6.136429645597887e-05, + "loss": 0.0335, + "step": 246490 + }, + { + "epoch": 1.59, + "learning_rate": 6.135461510162195e-05, + "loss": 0.0247, + "step": 246500 + }, + { + "epoch": 1.59, + "learning_rate": 6.134493374726502e-05, + "loss": 0.0237, + "step": 246510 + }, + { + "epoch": 1.59, + "learning_rate": 6.133525239290808e-05, + "loss": 0.0255, + "step": 246520 + }, + { + "epoch": 1.59, + "learning_rate": 6.132557103855115e-05, + "loss": 0.0252, + "step": 246530 + }, + { + "epoch": 1.59, + "learning_rate": 6.131588968419421e-05, + "loss": 0.0292, + "step": 246540 + }, + { + "epoch": 1.59, + "learning_rate": 6.130620832983728e-05, + "loss": 0.0236, + "step": 246550 + }, + { + "epoch": 1.59, + "learning_rate": 6.129652697548035e-05, + "loss": 0.0243, + "step": 246560 + }, + { + "epoch": 1.59, + "learning_rate": 6.128684562112343e-05, + "loss": 0.0274, + "step": 246570 + }, + { + "epoch": 1.59, + "learning_rate": 6.127716426676648e-05, + "loss": 0.0275, + "step": 246580 + }, + { + "epoch": 1.59, + "learning_rate": 6.126748291240956e-05, + "loss": 0.0246, + "step": 246590 + }, + { + "epoch": 1.59, + "learning_rate": 6.125780155805263e-05, + "loss": 0.0222, + "step": 246600 + }, + { + "epoch": 1.59, + "learning_rate": 6.124812020369569e-05, + "loss": 0.027, + "step": 246610 + }, + { + "epoch": 1.59, + "learning_rate": 6.123843884933876e-05, + "loss": 0.0235, + "step": 246620 + }, + { + "epoch": 1.59, + "learning_rate": 6.122875749498182e-05, + "loss": 0.0283, + "step": 246630 + }, + { + "epoch": 1.59, + "learning_rate": 6.121907614062489e-05, + "loss": 0.0227, + "step": 246640 + }, + { + "epoch": 1.59, + "learning_rate": 6.120939478626796e-05, + "loss": 0.0252, + "step": 246650 + }, + { + "epoch": 1.59, + "learning_rate": 6.119971343191104e-05, + "loss": 0.0241, + "step": 246660 + }, + { + "epoch": 1.59, + "learning_rate": 6.11900320775541e-05, + "loss": 0.0235, + "step": 246670 + }, + { + "epoch": 1.59, + "learning_rate": 6.118035072319717e-05, + "loss": 0.0311, + "step": 246680 + }, + { + "epoch": 1.59, + "learning_rate": 6.117066936884023e-05, + "loss": 0.0279, + "step": 246690 + }, + { + "epoch": 1.59, + "learning_rate": 6.11609880144833e-05, + "loss": 0.0282, + "step": 246700 + }, + { + "epoch": 1.59, + "learning_rate": 6.115130666012637e-05, + "loss": 0.0252, + "step": 246710 + }, + { + "epoch": 1.59, + "learning_rate": 6.114162530576943e-05, + "loss": 0.0223, + "step": 246720 + }, + { + "epoch": 1.59, + "learning_rate": 6.113194395141251e-05, + "loss": 0.0277, + "step": 246730 + }, + { + "epoch": 1.59, + "learning_rate": 6.112226259705557e-05, + "loss": 0.0285, + "step": 246740 + }, + { + "epoch": 1.59, + "learning_rate": 6.111258124269865e-05, + "loss": 0.0362, + "step": 246750 + }, + { + "epoch": 1.59, + "learning_rate": 6.110289988834171e-05, + "loss": 0.0231, + "step": 246760 + }, + { + "epoch": 1.59, + "learning_rate": 6.109321853398478e-05, + "loss": 0.0265, + "step": 246770 + }, + { + "epoch": 1.59, + "learning_rate": 6.108353717962784e-05, + "loss": 0.0333, + "step": 246780 + }, + { + "epoch": 1.59, + "learning_rate": 6.107385582527091e-05, + "loss": 0.0233, + "step": 246790 + }, + { + "epoch": 1.59, + "learning_rate": 6.106417447091398e-05, + "loss": 0.0267, + "step": 246800 + }, + { + "epoch": 1.59, + "learning_rate": 6.105449311655704e-05, + "loss": 0.0253, + "step": 246810 + }, + { + "epoch": 1.59, + "learning_rate": 6.104481176220012e-05, + "loss": 0.023, + "step": 246820 + }, + { + "epoch": 1.59, + "learning_rate": 6.103513040784318e-05, + "loss": 0.0266, + "step": 246830 + }, + { + "epoch": 1.59, + "learning_rate": 6.102544905348625e-05, + "loss": 0.0259, + "step": 246840 + }, + { + "epoch": 1.59, + "learning_rate": 6.101576769912932e-05, + "loss": 0.0254, + "step": 246850 + }, + { + "epoch": 1.59, + "learning_rate": 6.100608634477238e-05, + "loss": 0.0259, + "step": 246860 + }, + { + "epoch": 1.59, + "learning_rate": 6.0996404990415454e-05, + "loss": 0.0286, + "step": 246870 + }, + { + "epoch": 1.59, + "learning_rate": 6.098672363605852e-05, + "loss": 0.0258, + "step": 246880 + }, + { + "epoch": 1.59, + "learning_rate": 6.0977042281701593e-05, + "loss": 0.025, + "step": 246890 + }, + { + "epoch": 1.59, + "learning_rate": 6.096736092734466e-05, + "loss": 0.0263, + "step": 246900 + }, + { + "epoch": 1.59, + "learning_rate": 6.095767957298772e-05, + "loss": 0.0335, + "step": 246910 + }, + { + "epoch": 1.59, + "learning_rate": 6.094799821863079e-05, + "loss": 0.0223, + "step": 246920 + }, + { + "epoch": 1.59, + "learning_rate": 6.093831686427386e-05, + "loss": 0.0256, + "step": 246930 + }, + { + "epoch": 1.59, + "learning_rate": 6.092863550991693e-05, + "loss": 0.0249, + "step": 246940 + }, + { + "epoch": 1.59, + "learning_rate": 6.091895415556e-05, + "loss": 0.0256, + "step": 246950 + }, + { + "epoch": 1.59, + "learning_rate": 6.090927280120307e-05, + "loss": 0.0295, + "step": 246960 + }, + { + "epoch": 1.59, + "learning_rate": 6.089959144684613e-05, + "loss": 0.0235, + "step": 246970 + }, + { + "epoch": 1.59, + "learning_rate": 6.0889910092489196e-05, + "loss": 0.0232, + "step": 246980 + }, + { + "epoch": 1.59, + "learning_rate": 6.088022873813227e-05, + "loss": 0.0253, + "step": 246990 + }, + { + "epoch": 1.59, + "learning_rate": 6.0870547383775336e-05, + "loss": 0.0276, + "step": 247000 + }, + { + "epoch": 1.59, + "eval_cer": 0.9198824991526381, + "eval_loss": 0.019043434411287308, + "eval_runtime": 120.2331, + "eval_samples_per_second": 16.634, + "eval_steps_per_second": 4.159, + "step": 247000 + }, + { + "epoch": 1.59, + "learning_rate": 6.086086602941841e-05, + "loss": 0.0211, + "step": 247010 + }, + { + "epoch": 1.59, + "learning_rate": 6.085118467506147e-05, + "loss": 0.0253, + "step": 247020 + }, + { + "epoch": 1.59, + "learning_rate": 6.084150332070454e-05, + "loss": 0.0319, + "step": 247030 + }, + { + "epoch": 1.59, + "learning_rate": 6.083182196634761e-05, + "loss": 0.024, + "step": 247040 + }, + { + "epoch": 1.59, + "learning_rate": 6.0822140611990674e-05, + "loss": 0.0267, + "step": 247050 + }, + { + "epoch": 1.59, + "learning_rate": 6.081245925763375e-05, + "loss": 0.0268, + "step": 247060 + }, + { + "epoch": 1.59, + "learning_rate": 6.0802777903276806e-05, + "loss": 0.0318, + "step": 247070 + }, + { + "epoch": 1.59, + "learning_rate": 6.079309654891988e-05, + "loss": 0.027, + "step": 247080 + }, + { + "epoch": 1.59, + "learning_rate": 6.0783415194562945e-05, + "loss": 0.0288, + "step": 247090 + }, + { + "epoch": 1.59, + "learning_rate": 6.077373384020601e-05, + "loss": 0.0268, + "step": 247100 + }, + { + "epoch": 1.59, + "learning_rate": 6.0764052485849085e-05, + "loss": 0.0284, + "step": 247110 + }, + { + "epoch": 1.59, + "learning_rate": 6.0754371131492144e-05, + "loss": 0.0286, + "step": 247120 + }, + { + "epoch": 1.6, + "learning_rate": 6.074468977713522e-05, + "loss": 0.0266, + "step": 247130 + }, + { + "epoch": 1.6, + "learning_rate": 6.073500842277828e-05, + "loss": 0.0257, + "step": 247140 + }, + { + "epoch": 1.6, + "learning_rate": 6.0725327068421356e-05, + "loss": 0.021, + "step": 247150 + }, + { + "epoch": 1.6, + "learning_rate": 6.071564571406442e-05, + "loss": 0.026, + "step": 247160 + }, + { + "epoch": 1.6, + "learning_rate": 6.070596435970748e-05, + "loss": 0.0279, + "step": 247170 + }, + { + "epoch": 1.6, + "learning_rate": 6.0696283005350555e-05, + "loss": 0.0213, + "step": 247180 + }, + { + "epoch": 1.6, + "learning_rate": 6.068660165099362e-05, + "loss": 0.0241, + "step": 247190 + }, + { + "epoch": 1.6, + "learning_rate": 6.0676920296636694e-05, + "loss": 0.0249, + "step": 247200 + }, + { + "epoch": 1.6, + "learning_rate": 6.066723894227976e-05, + "loss": 0.0287, + "step": 247210 + }, + { + "epoch": 1.6, + "learning_rate": 6.0657557587922834e-05, + "loss": 0.0276, + "step": 247220 + }, + { + "epoch": 1.6, + "learning_rate": 6.064787623356589e-05, + "loss": 0.0266, + "step": 247230 + }, + { + "epoch": 1.6, + "learning_rate": 6.063819487920896e-05, + "loss": 0.0226, + "step": 247240 + }, + { + "epoch": 1.6, + "learning_rate": 6.062851352485203e-05, + "loss": 0.0257, + "step": 247250 + }, + { + "epoch": 1.6, + "learning_rate": 6.06188321704951e-05, + "loss": 0.0284, + "step": 247260 + }, + { + "epoch": 1.6, + "learning_rate": 6.060915081613817e-05, + "loss": 0.0255, + "step": 247270 + }, + { + "epoch": 1.6, + "learning_rate": 6.059946946178123e-05, + "loss": 0.0211, + "step": 247280 + }, + { + "epoch": 1.6, + "learning_rate": 6.0589788107424304e-05, + "loss": 0.0206, + "step": 247290 + }, + { + "epoch": 1.6, + "learning_rate": 6.058010675306737e-05, + "loss": 0.0205, + "step": 247300 + }, + { + "epoch": 1.6, + "learning_rate": 6.0570425398710437e-05, + "loss": 0.0261, + "step": 247310 + }, + { + "epoch": 1.6, + "learning_rate": 6.056074404435351e-05, + "loss": 0.0262, + "step": 247320 + }, + { + "epoch": 1.6, + "learning_rate": 6.055106268999657e-05, + "loss": 0.0206, + "step": 247330 + }, + { + "epoch": 1.6, + "learning_rate": 6.054138133563964e-05, + "loss": 0.0284, + "step": 247340 + }, + { + "epoch": 1.6, + "learning_rate": 6.053169998128271e-05, + "loss": 0.0247, + "step": 247350 + }, + { + "epoch": 1.6, + "learning_rate": 6.052201862692578e-05, + "loss": 0.0228, + "step": 247360 + }, + { + "epoch": 1.6, + "learning_rate": 6.051233727256885e-05, + "loss": 0.0241, + "step": 247370 + }, + { + "epoch": 1.6, + "learning_rate": 6.050265591821191e-05, + "loss": 0.0237, + "step": 247380 + }, + { + "epoch": 1.6, + "learning_rate": 6.049297456385498e-05, + "loss": 0.0255, + "step": 247390 + }, + { + "epoch": 1.6, + "learning_rate": 6.0483293209498046e-05, + "loss": 0.0312, + "step": 247400 + }, + { + "epoch": 1.6, + "learning_rate": 6.047361185514112e-05, + "loss": 0.0218, + "step": 247410 + }, + { + "epoch": 1.6, + "learning_rate": 6.0463930500784185e-05, + "loss": 0.0271, + "step": 247420 + }, + { + "epoch": 1.6, + "learning_rate": 6.045424914642726e-05, + "loss": 0.0246, + "step": 247430 + }, + { + "epoch": 1.6, + "learning_rate": 6.044456779207032e-05, + "loss": 0.0268, + "step": 247440 + }, + { + "epoch": 1.6, + "learning_rate": 6.0434886437713384e-05, + "loss": 0.0236, + "step": 247450 + }, + { + "epoch": 1.6, + "learning_rate": 6.042520508335646e-05, + "loss": 0.0225, + "step": 247460 + }, + { + "epoch": 1.6, + "learning_rate": 6.0415523728999523e-05, + "loss": 0.0277, + "step": 247470 + }, + { + "epoch": 1.6, + "learning_rate": 6.0405842374642596e-05, + "loss": 0.029, + "step": 247480 + }, + { + "epoch": 1.6, + "learning_rate": 6.0396161020285656e-05, + "loss": 0.0263, + "step": 247490 + }, + { + "epoch": 1.6, + "learning_rate": 6.038647966592873e-05, + "loss": 0.0267, + "step": 247500 + }, + { + "epoch": 1.6, + "learning_rate": 6.0376798311571795e-05, + "loss": 0.0297, + "step": 247510 + }, + { + "epoch": 1.6, + "learning_rate": 6.036711695721486e-05, + "loss": 0.0229, + "step": 247520 + }, + { + "epoch": 1.6, + "learning_rate": 6.0357435602857934e-05, + "loss": 0.024, + "step": 247530 + }, + { + "epoch": 1.6, + "learning_rate": 6.0347754248500994e-05, + "loss": 0.0355, + "step": 247540 + }, + { + "epoch": 1.6, + "learning_rate": 6.033807289414407e-05, + "loss": 0.0239, + "step": 247550 + }, + { + "epoch": 1.6, + "learning_rate": 6.032839153978713e-05, + "loss": 0.0246, + "step": 247560 + }, + { + "epoch": 1.6, + "learning_rate": 6.0318710185430206e-05, + "loss": 0.0211, + "step": 247570 + }, + { + "epoch": 1.6, + "learning_rate": 6.030902883107327e-05, + "loss": 0.0333, + "step": 247580 + }, + { + "epoch": 1.6, + "learning_rate": 6.029934747671633e-05, + "loss": 0.0223, + "step": 247590 + }, + { + "epoch": 1.6, + "learning_rate": 6.0289666122359405e-05, + "loss": 0.0241, + "step": 247600 + }, + { + "epoch": 1.6, + "learning_rate": 6.027998476800247e-05, + "loss": 0.0269, + "step": 247610 + }, + { + "epoch": 1.6, + "learning_rate": 6.0270303413645544e-05, + "loss": 0.0242, + "step": 247620 + }, + { + "epoch": 1.6, + "learning_rate": 6.026062205928861e-05, + "loss": 0.0236, + "step": 247630 + }, + { + "epoch": 1.6, + "learning_rate": 6.0250940704931683e-05, + "loss": 0.0293, + "step": 247640 + }, + { + "epoch": 1.6, + "learning_rate": 6.024125935057474e-05, + "loss": 0.0311, + "step": 247650 + }, + { + "epoch": 1.6, + "learning_rate": 6.023157799621781e-05, + "loss": 0.0287, + "step": 247660 + }, + { + "epoch": 1.6, + "learning_rate": 6.022189664186088e-05, + "loss": 0.0267, + "step": 247670 + }, + { + "epoch": 1.6, + "learning_rate": 6.021221528750395e-05, + "loss": 0.0288, + "step": 247680 + }, + { + "epoch": 1.6, + "learning_rate": 6.020253393314702e-05, + "loss": 0.0295, + "step": 247690 + }, + { + "epoch": 1.6, + "learning_rate": 6.019285257879008e-05, + "loss": 0.0223, + "step": 247700 + }, + { + "epoch": 1.6, + "learning_rate": 6.0183171224433154e-05, + "loss": 0.0254, + "step": 247710 + }, + { + "epoch": 1.6, + "learning_rate": 6.017348987007622e-05, + "loss": 0.0195, + "step": 247720 + }, + { + "epoch": 1.6, + "learning_rate": 6.0163808515719286e-05, + "loss": 0.0274, + "step": 247730 + }, + { + "epoch": 1.6, + "learning_rate": 6.015412716136236e-05, + "loss": 0.0237, + "step": 247740 + }, + { + "epoch": 1.6, + "learning_rate": 6.014444580700542e-05, + "loss": 0.0234, + "step": 247750 + }, + { + "epoch": 1.6, + "learning_rate": 6.013476445264849e-05, + "loss": 0.0304, + "step": 247760 + }, + { + "epoch": 1.6, + "learning_rate": 6.012508309829156e-05, + "loss": 0.0275, + "step": 247770 + }, + { + "epoch": 1.6, + "learning_rate": 6.011540174393463e-05, + "loss": 0.03, + "step": 247780 + }, + { + "epoch": 1.6, + "learning_rate": 6.01057203895777e-05, + "loss": 0.0253, + "step": 247790 + }, + { + "epoch": 1.6, + "learning_rate": 6.009603903522076e-05, + "loss": 0.0201, + "step": 247800 + }, + { + "epoch": 1.6, + "learning_rate": 6.008635768086383e-05, + "loss": 0.0211, + "step": 247810 + }, + { + "epoch": 1.6, + "learning_rate": 6.0076676326506896e-05, + "loss": 0.027, + "step": 247820 + }, + { + "epoch": 1.6, + "learning_rate": 6.006699497214997e-05, + "loss": 0.0298, + "step": 247830 + }, + { + "epoch": 1.6, + "learning_rate": 6.0057313617793035e-05, + "loss": 0.021, + "step": 247840 + }, + { + "epoch": 1.6, + "learning_rate": 6.00476322634361e-05, + "loss": 0.0241, + "step": 247850 + }, + { + "epoch": 1.6, + "learning_rate": 6.003795090907917e-05, + "loss": 0.0259, + "step": 247860 + }, + { + "epoch": 1.6, + "learning_rate": 6.0028269554722234e-05, + "loss": 0.0289, + "step": 247870 + }, + { + "epoch": 1.6, + "learning_rate": 6.001858820036531e-05, + "loss": 0.027, + "step": 247880 + }, + { + "epoch": 1.6, + "learning_rate": 6.000890684600837e-05, + "loss": 0.0231, + "step": 247890 + }, + { + "epoch": 1.6, + "learning_rate": 5.999922549165144e-05, + "loss": 0.0254, + "step": 247900 + }, + { + "epoch": 1.6, + "learning_rate": 5.9989544137294506e-05, + "loss": 0.02, + "step": 247910 + }, + { + "epoch": 1.6, + "learning_rate": 5.997986278293758e-05, + "loss": 0.0229, + "step": 247920 + }, + { + "epoch": 1.6, + "learning_rate": 5.9970181428580645e-05, + "loss": 0.0235, + "step": 247930 + }, + { + "epoch": 1.6, + "learning_rate": 5.996050007422371e-05, + "loss": 0.0264, + "step": 247940 + }, + { + "epoch": 1.6, + "learning_rate": 5.995081871986678e-05, + "loss": 0.0303, + "step": 247950 + }, + { + "epoch": 1.6, + "learning_rate": 5.9941137365509844e-05, + "loss": 0.0278, + "step": 247960 + }, + { + "epoch": 1.6, + "learning_rate": 5.993145601115292e-05, + "loss": 0.0273, + "step": 247970 + }, + { + "epoch": 1.6, + "learning_rate": 5.992177465679598e-05, + "loss": 0.0245, + "step": 247980 + }, + { + "epoch": 1.6, + "learning_rate": 5.9912093302439056e-05, + "loss": 0.0282, + "step": 247990 + }, + { + "epoch": 1.6, + "learning_rate": 5.9902411948082115e-05, + "loss": 0.0238, + "step": 248000 + }, + { + "epoch": 1.6, + "eval_cer": 0.9198852107106542, + "eval_loss": 0.01876279152929783, + "eval_runtime": 120.3747, + "eval_samples_per_second": 16.615, + "eval_steps_per_second": 4.154, + "step": 248000 + }, + { + "epoch": 1.6, + "learning_rate": 5.989273059372518e-05, + "loss": 0.025, + "step": 248010 + }, + { + "epoch": 1.6, + "learning_rate": 5.9883049239368255e-05, + "loss": 0.0193, + "step": 248020 + }, + { + "epoch": 1.6, + "learning_rate": 5.987336788501132e-05, + "loss": 0.0249, + "step": 248030 + }, + { + "epoch": 1.6, + "learning_rate": 5.9863686530654394e-05, + "loss": 0.0252, + "step": 248040 + }, + { + "epoch": 1.6, + "learning_rate": 5.9854005176297453e-05, + "loss": 0.0226, + "step": 248050 + }, + { + "epoch": 1.6, + "learning_rate": 5.9844323821940526e-05, + "loss": 0.0258, + "step": 248060 + }, + { + "epoch": 1.6, + "learning_rate": 5.983464246758359e-05, + "loss": 0.0232, + "step": 248070 + }, + { + "epoch": 1.6, + "learning_rate": 5.982496111322666e-05, + "loss": 0.0221, + "step": 248080 + }, + { + "epoch": 1.6, + "learning_rate": 5.981527975886973e-05, + "loss": 0.0266, + "step": 248090 + }, + { + "epoch": 1.6, + "learning_rate": 5.980559840451279e-05, + "loss": 0.0225, + "step": 248100 + }, + { + "epoch": 1.6, + "learning_rate": 5.9795917050155864e-05, + "loss": 0.0248, + "step": 248110 + }, + { + "epoch": 1.6, + "learning_rate": 5.978623569579893e-05, + "loss": 0.0314, + "step": 248120 + }, + { + "epoch": 1.6, + "learning_rate": 5.9776554341442004e-05, + "loss": 0.0252, + "step": 248130 + }, + { + "epoch": 1.6, + "learning_rate": 5.976687298708507e-05, + "loss": 0.0247, + "step": 248140 + }, + { + "epoch": 1.6, + "learning_rate": 5.975719163272813e-05, + "loss": 0.0242, + "step": 248150 + }, + { + "epoch": 1.6, + "learning_rate": 5.97475102783712e-05, + "loss": 0.0312, + "step": 248160 + }, + { + "epoch": 1.6, + "learning_rate": 5.973782892401427e-05, + "loss": 0.0231, + "step": 248170 + }, + { + "epoch": 1.6, + "learning_rate": 5.972814756965734e-05, + "loss": 0.0281, + "step": 248180 + }, + { + "epoch": 1.6, + "learning_rate": 5.971846621530041e-05, + "loss": 0.0241, + "step": 248190 + }, + { + "epoch": 1.6, + "learning_rate": 5.970878486094348e-05, + "loss": 0.0248, + "step": 248200 + }, + { + "epoch": 1.6, + "learning_rate": 5.969910350658654e-05, + "loss": 0.0245, + "step": 248210 + }, + { + "epoch": 1.6, + "learning_rate": 5.9689422152229607e-05, + "loss": 0.0294, + "step": 248220 + }, + { + "epoch": 1.6, + "learning_rate": 5.967974079787268e-05, + "loss": 0.0213, + "step": 248230 + }, + { + "epoch": 1.6, + "learning_rate": 5.9670059443515746e-05, + "loss": 0.0219, + "step": 248240 + }, + { + "epoch": 1.6, + "learning_rate": 5.966037808915882e-05, + "loss": 0.025, + "step": 248250 + }, + { + "epoch": 1.6, + "learning_rate": 5.965069673480188e-05, + "loss": 0.0228, + "step": 248260 + }, + { + "epoch": 1.6, + "learning_rate": 5.964101538044495e-05, + "loss": 0.0263, + "step": 248270 + }, + { + "epoch": 1.6, + "learning_rate": 5.963133402608802e-05, + "loss": 0.0219, + "step": 248280 + }, + { + "epoch": 1.6, + "learning_rate": 5.9621652671731084e-05, + "loss": 0.0305, + "step": 248290 + }, + { + "epoch": 1.6, + "learning_rate": 5.961197131737416e-05, + "loss": 0.0216, + "step": 248300 + }, + { + "epoch": 1.6, + "learning_rate": 5.9602289963017216e-05, + "loss": 0.0239, + "step": 248310 + }, + { + "epoch": 1.6, + "learning_rate": 5.959260860866029e-05, + "loss": 0.0278, + "step": 248320 + }, + { + "epoch": 1.6, + "learning_rate": 5.9582927254303356e-05, + "loss": 0.0279, + "step": 248330 + }, + { + "epoch": 1.6, + "learning_rate": 5.957324589994643e-05, + "loss": 0.0242, + "step": 248340 + }, + { + "epoch": 1.6, + "learning_rate": 5.9563564545589495e-05, + "loss": 0.0281, + "step": 248350 + }, + { + "epoch": 1.6, + "learning_rate": 5.9553883191232554e-05, + "loss": 0.0272, + "step": 248360 + }, + { + "epoch": 1.6, + "learning_rate": 5.954420183687563e-05, + "loss": 0.0258, + "step": 248370 + }, + { + "epoch": 1.6, + "learning_rate": 5.9534520482518694e-05, + "loss": 0.0246, + "step": 248380 + }, + { + "epoch": 1.6, + "learning_rate": 5.9524839128161767e-05, + "loss": 0.0264, + "step": 248390 + }, + { + "epoch": 1.6, + "learning_rate": 5.951515777380483e-05, + "loss": 0.0274, + "step": 248400 + }, + { + "epoch": 1.6, + "learning_rate": 5.9505476419447906e-05, + "loss": 0.0243, + "step": 248410 + }, + { + "epoch": 1.6, + "learning_rate": 5.9495795065090965e-05, + "loss": 0.026, + "step": 248420 + }, + { + "epoch": 1.6, + "learning_rate": 5.948611371073403e-05, + "loss": 0.0249, + "step": 248430 + }, + { + "epoch": 1.6, + "learning_rate": 5.9476432356377105e-05, + "loss": 0.0233, + "step": 248440 + }, + { + "epoch": 1.6, + "learning_rate": 5.946675100202017e-05, + "loss": 0.028, + "step": 248450 + }, + { + "epoch": 1.6, + "learning_rate": 5.9457069647663244e-05, + "loss": 0.0267, + "step": 248460 + }, + { + "epoch": 1.6, + "learning_rate": 5.94473882933063e-05, + "loss": 0.0287, + "step": 248470 + }, + { + "epoch": 1.6, + "learning_rate": 5.9437706938949376e-05, + "loss": 0.0252, + "step": 248480 + }, + { + "epoch": 1.6, + "learning_rate": 5.942802558459244e-05, + "loss": 0.0251, + "step": 248490 + }, + { + "epoch": 1.6, + "learning_rate": 5.941834423023551e-05, + "loss": 0.0239, + "step": 248500 + }, + { + "epoch": 1.6, + "learning_rate": 5.940866287587858e-05, + "loss": 0.0255, + "step": 248510 + }, + { + "epoch": 1.6, + "learning_rate": 5.939898152152164e-05, + "loss": 0.0244, + "step": 248520 + }, + { + "epoch": 1.6, + "learning_rate": 5.9389300167164714e-05, + "loss": 0.0271, + "step": 248530 + }, + { + "epoch": 1.6, + "learning_rate": 5.937961881280778e-05, + "loss": 0.0273, + "step": 248540 + }, + { + "epoch": 1.6, + "learning_rate": 5.9369937458450853e-05, + "loss": 0.0251, + "step": 248550 + }, + { + "epoch": 1.6, + "learning_rate": 5.936025610409392e-05, + "loss": 0.0241, + "step": 248560 + }, + { + "epoch": 1.6, + "learning_rate": 5.935057474973698e-05, + "loss": 0.031, + "step": 248570 + }, + { + "epoch": 1.6, + "learning_rate": 5.934089339538005e-05, + "loss": 0.0264, + "step": 248580 + }, + { + "epoch": 1.6, + "learning_rate": 5.933121204102312e-05, + "loss": 0.0258, + "step": 248590 + }, + { + "epoch": 1.6, + "learning_rate": 5.932153068666619e-05, + "loss": 0.0256, + "step": 248600 + }, + { + "epoch": 1.6, + "learning_rate": 5.931184933230926e-05, + "loss": 0.0262, + "step": 248610 + }, + { + "epoch": 1.6, + "learning_rate": 5.930216797795233e-05, + "loss": 0.0271, + "step": 248620 + }, + { + "epoch": 1.6, + "learning_rate": 5.929248662359539e-05, + "loss": 0.0202, + "step": 248630 + }, + { + "epoch": 1.6, + "learning_rate": 5.9282805269238456e-05, + "loss": 0.0306, + "step": 248640 + }, + { + "epoch": 1.6, + "learning_rate": 5.927312391488153e-05, + "loss": 0.0243, + "step": 248650 + }, + { + "epoch": 1.6, + "learning_rate": 5.9263442560524596e-05, + "loss": 0.0253, + "step": 248660 + }, + { + "epoch": 1.6, + "learning_rate": 5.925376120616767e-05, + "loss": 0.0218, + "step": 248670 + }, + { + "epoch": 1.61, + "learning_rate": 5.924407985181073e-05, + "loss": 0.0228, + "step": 248680 + }, + { + "epoch": 1.61, + "learning_rate": 5.92343984974538e-05, + "loss": 0.0296, + "step": 248690 + }, + { + "epoch": 1.61, + "learning_rate": 5.922471714309687e-05, + "loss": 0.0279, + "step": 248700 + }, + { + "epoch": 1.61, + "learning_rate": 5.9215035788739934e-05, + "loss": 0.0293, + "step": 248710 + }, + { + "epoch": 1.61, + "learning_rate": 5.920535443438301e-05, + "loss": 0.0292, + "step": 248720 + }, + { + "epoch": 1.61, + "learning_rate": 5.9195673080026066e-05, + "loss": 0.0289, + "step": 248730 + }, + { + "epoch": 1.61, + "learning_rate": 5.918599172566914e-05, + "loss": 0.0253, + "step": 248740 + }, + { + "epoch": 1.61, + "learning_rate": 5.9176310371312205e-05, + "loss": 0.0285, + "step": 248750 + }, + { + "epoch": 1.61, + "learning_rate": 5.916662901695527e-05, + "loss": 0.0244, + "step": 248760 + }, + { + "epoch": 1.61, + "learning_rate": 5.9156947662598345e-05, + "loss": 0.025, + "step": 248770 + }, + { + "epoch": 1.61, + "learning_rate": 5.9147266308241404e-05, + "loss": 0.0247, + "step": 248780 + }, + { + "epoch": 1.61, + "learning_rate": 5.913758495388448e-05, + "loss": 0.0284, + "step": 248790 + }, + { + "epoch": 1.61, + "learning_rate": 5.912790359952754e-05, + "loss": 0.0244, + "step": 248800 + }, + { + "epoch": 1.61, + "learning_rate": 5.9118222245170616e-05, + "loss": 0.0254, + "step": 248810 + }, + { + "epoch": 1.61, + "learning_rate": 5.910854089081368e-05, + "loss": 0.0315, + "step": 248820 + }, + { + "epoch": 1.61, + "learning_rate": 5.909885953645674e-05, + "loss": 0.0247, + "step": 248830 + }, + { + "epoch": 1.61, + "learning_rate": 5.9089178182099815e-05, + "loss": 0.0264, + "step": 248840 + }, + { + "epoch": 1.61, + "learning_rate": 5.907949682774288e-05, + "loss": 0.0252, + "step": 248850 + }, + { + "epoch": 1.61, + "learning_rate": 5.9069815473385954e-05, + "loss": 0.027, + "step": 248860 + }, + { + "epoch": 1.61, + "learning_rate": 5.906013411902902e-05, + "loss": 0.0276, + "step": 248870 + }, + { + "epoch": 1.61, + "learning_rate": 5.9050452764672094e-05, + "loss": 0.0283, + "step": 248880 + }, + { + "epoch": 1.61, + "learning_rate": 5.904077141031515e-05, + "loss": 0.0235, + "step": 248890 + }, + { + "epoch": 1.61, + "learning_rate": 5.903109005595822e-05, + "loss": 0.0307, + "step": 248900 + }, + { + "epoch": 1.61, + "learning_rate": 5.902140870160129e-05, + "loss": 0.0244, + "step": 248910 + }, + { + "epoch": 1.61, + "learning_rate": 5.901172734724436e-05, + "loss": 0.0272, + "step": 248920 + }, + { + "epoch": 1.61, + "learning_rate": 5.900204599288743e-05, + "loss": 0.0285, + "step": 248930 + }, + { + "epoch": 1.61, + "learning_rate": 5.899236463853049e-05, + "loss": 0.0246, + "step": 248940 + }, + { + "epoch": 1.61, + "learning_rate": 5.8982683284173564e-05, + "loss": 0.0266, + "step": 248950 + }, + { + "epoch": 1.61, + "learning_rate": 5.897300192981663e-05, + "loss": 0.0287, + "step": 248960 + }, + { + "epoch": 1.61, + "learning_rate": 5.8963320575459696e-05, + "loss": 0.032, + "step": 248970 + }, + { + "epoch": 1.61, + "learning_rate": 5.895363922110277e-05, + "loss": 0.0229, + "step": 248980 + }, + { + "epoch": 1.61, + "learning_rate": 5.894395786674583e-05, + "loss": 0.0233, + "step": 248990 + }, + { + "epoch": 1.61, + "learning_rate": 5.89342765123889e-05, + "loss": 0.0301, + "step": 249000 + }, + { + "epoch": 1.61, + "eval_cer": 0.9198562874251497, + "eval_loss": 0.018836012110114098, + "eval_runtime": 120.0, + "eval_samples_per_second": 16.667, + "eval_steps_per_second": 4.167, + "step": 249000 + }, + { + "epoch": 1.61, + "learning_rate": 5.892459515803197e-05, + "loss": 0.0268, + "step": 249010 + }, + { + "epoch": 1.61, + "learning_rate": 5.891491380367504e-05, + "loss": 0.0318, + "step": 249020 + }, + { + "epoch": 1.61, + "learning_rate": 5.890523244931811e-05, + "loss": 0.024, + "step": 249030 + }, + { + "epoch": 1.61, + "learning_rate": 5.889555109496117e-05, + "loss": 0.0307, + "step": 249040 + }, + { + "epoch": 1.61, + "learning_rate": 5.888586974060424e-05, + "loss": 0.0245, + "step": 249050 + }, + { + "epoch": 1.61, + "learning_rate": 5.8876188386247306e-05, + "loss": 0.0296, + "step": 249060 + }, + { + "epoch": 1.61, + "learning_rate": 5.886650703189038e-05, + "loss": 0.0253, + "step": 249070 + }, + { + "epoch": 1.61, + "learning_rate": 5.8856825677533445e-05, + "loss": 0.03, + "step": 249080 + }, + { + "epoch": 1.61, + "learning_rate": 5.884714432317651e-05, + "loss": 0.0341, + "step": 249090 + }, + { + "epoch": 1.61, + "learning_rate": 5.883746296881958e-05, + "loss": 0.0277, + "step": 249100 + }, + { + "epoch": 1.61, + "learning_rate": 5.8827781614462644e-05, + "loss": 0.0286, + "step": 249110 + }, + { + "epoch": 1.61, + "learning_rate": 5.881810026010572e-05, + "loss": 0.0244, + "step": 249120 + }, + { + "epoch": 1.61, + "learning_rate": 5.8808418905748783e-05, + "loss": 0.0233, + "step": 249130 + }, + { + "epoch": 1.61, + "learning_rate": 5.879873755139185e-05, + "loss": 0.0271, + "step": 249140 + }, + { + "epoch": 1.61, + "learning_rate": 5.8789056197034916e-05, + "loss": 0.0218, + "step": 249150 + }, + { + "epoch": 1.61, + "learning_rate": 5.877937484267799e-05, + "loss": 0.0267, + "step": 249160 + }, + { + "epoch": 1.61, + "learning_rate": 5.8769693488321055e-05, + "loss": 0.0234, + "step": 249170 + }, + { + "epoch": 1.61, + "learning_rate": 5.876001213396412e-05, + "loss": 0.0207, + "step": 249180 + }, + { + "epoch": 1.61, + "learning_rate": 5.875033077960719e-05, + "loss": 0.0216, + "step": 249190 + }, + { + "epoch": 1.61, + "learning_rate": 5.8740649425250254e-05, + "loss": 0.0263, + "step": 249200 + }, + { + "epoch": 1.61, + "learning_rate": 5.873096807089333e-05, + "loss": 0.0251, + "step": 249210 + }, + { + "epoch": 1.61, + "learning_rate": 5.872128671653639e-05, + "loss": 0.0301, + "step": 249220 + }, + { + "epoch": 1.61, + "learning_rate": 5.8711605362179466e-05, + "loss": 0.0243, + "step": 249230 + }, + { + "epoch": 1.61, + "learning_rate": 5.8701924007822526e-05, + "loss": 0.0262, + "step": 249240 + }, + { + "epoch": 1.61, + "learning_rate": 5.869224265346559e-05, + "loss": 0.0205, + "step": 249250 + }, + { + "epoch": 1.61, + "learning_rate": 5.8682561299108665e-05, + "loss": 0.0252, + "step": 249260 + }, + { + "epoch": 1.61, + "learning_rate": 5.867287994475173e-05, + "loss": 0.0258, + "step": 249270 + }, + { + "epoch": 1.61, + "learning_rate": 5.8663198590394804e-05, + "loss": 0.0241, + "step": 249280 + }, + { + "epoch": 1.61, + "learning_rate": 5.8653517236037864e-05, + "loss": 0.0271, + "step": 249290 + }, + { + "epoch": 1.61, + "learning_rate": 5.8643835881680937e-05, + "loss": 0.0286, + "step": 249300 + }, + { + "epoch": 1.61, + "learning_rate": 5.8634154527324e-05, + "loss": 0.0257, + "step": 249310 + }, + { + "epoch": 1.61, + "learning_rate": 5.862447317296707e-05, + "loss": 0.0264, + "step": 249320 + }, + { + "epoch": 1.61, + "learning_rate": 5.861479181861014e-05, + "loss": 0.0234, + "step": 249330 + }, + { + "epoch": 1.61, + "learning_rate": 5.86051104642532e-05, + "loss": 0.0227, + "step": 249340 + }, + { + "epoch": 1.61, + "learning_rate": 5.8595429109896275e-05, + "loss": 0.0315, + "step": 249350 + }, + { + "epoch": 1.61, + "learning_rate": 5.858574775553934e-05, + "loss": 0.0252, + "step": 249360 + }, + { + "epoch": 1.61, + "learning_rate": 5.8576066401182414e-05, + "loss": 0.0272, + "step": 249370 + }, + { + "epoch": 1.61, + "learning_rate": 5.856638504682548e-05, + "loss": 0.0275, + "step": 249380 + }, + { + "epoch": 1.61, + "learning_rate": 5.855670369246854e-05, + "loss": 0.0191, + "step": 249390 + }, + { + "epoch": 1.61, + "learning_rate": 5.854702233811161e-05, + "loss": 0.0282, + "step": 249400 + }, + { + "epoch": 1.61, + "learning_rate": 5.853734098375468e-05, + "loss": 0.0241, + "step": 249410 + }, + { + "epoch": 1.61, + "learning_rate": 5.852765962939775e-05, + "loss": 0.0265, + "step": 249420 + }, + { + "epoch": 1.61, + "learning_rate": 5.851797827504082e-05, + "loss": 0.0268, + "step": 249430 + }, + { + "epoch": 1.61, + "learning_rate": 5.850829692068389e-05, + "loss": 0.022, + "step": 249440 + }, + { + "epoch": 1.61, + "learning_rate": 5.849861556632695e-05, + "loss": 0.0276, + "step": 249450 + }, + { + "epoch": 1.61, + "learning_rate": 5.848893421197002e-05, + "loss": 0.026, + "step": 249460 + }, + { + "epoch": 1.61, + "learning_rate": 5.847925285761309e-05, + "loss": 0.0225, + "step": 249470 + }, + { + "epoch": 1.61, + "learning_rate": 5.8469571503256156e-05, + "loss": 0.0243, + "step": 249480 + }, + { + "epoch": 1.61, + "learning_rate": 5.845989014889923e-05, + "loss": 0.0251, + "step": 249490 + }, + { + "epoch": 1.61, + "learning_rate": 5.845020879454229e-05, + "loss": 0.0257, + "step": 249500 + }, + { + "epoch": 1.61, + "learning_rate": 5.844052744018536e-05, + "loss": 0.0231, + "step": 249510 + }, + { + "epoch": 1.61, + "learning_rate": 5.843084608582843e-05, + "loss": 0.0292, + "step": 249520 + }, + { + "epoch": 1.61, + "learning_rate": 5.8421164731471494e-05, + "loss": 0.0322, + "step": 249530 + }, + { + "epoch": 1.61, + "learning_rate": 5.841148337711457e-05, + "loss": 0.0278, + "step": 249540 + }, + { + "epoch": 1.61, + "learning_rate": 5.8401802022757626e-05, + "loss": 0.0203, + "step": 249550 + }, + { + "epoch": 1.61, + "learning_rate": 5.83921206684007e-05, + "loss": 0.0251, + "step": 249560 + }, + { + "epoch": 1.61, + "learning_rate": 5.8382439314043766e-05, + "loss": 0.0267, + "step": 249570 + }, + { + "epoch": 1.61, + "learning_rate": 5.837275795968684e-05, + "loss": 0.0233, + "step": 249580 + }, + { + "epoch": 1.61, + "learning_rate": 5.8363076605329905e-05, + "loss": 0.0267, + "step": 249590 + }, + { + "epoch": 1.61, + "learning_rate": 5.8353395250972964e-05, + "loss": 0.0229, + "step": 249600 + }, + { + "epoch": 1.61, + "learning_rate": 5.834371389661604e-05, + "loss": 0.0226, + "step": 249610 + }, + { + "epoch": 1.61, + "learning_rate": 5.8334032542259104e-05, + "loss": 0.0343, + "step": 249620 + }, + { + "epoch": 1.61, + "learning_rate": 5.832435118790218e-05, + "loss": 0.0235, + "step": 249630 + }, + { + "epoch": 1.61, + "learning_rate": 5.831466983354524e-05, + "loss": 0.02, + "step": 249640 + }, + { + "epoch": 1.61, + "learning_rate": 5.8304988479188316e-05, + "loss": 0.029, + "step": 249650 + }, + { + "epoch": 1.61, + "learning_rate": 5.8295307124831375e-05, + "loss": 0.0327, + "step": 249660 + }, + { + "epoch": 1.61, + "learning_rate": 5.828562577047444e-05, + "loss": 0.0244, + "step": 249670 + }, + { + "epoch": 1.61, + "learning_rate": 5.8275944416117515e-05, + "loss": 0.0265, + "step": 249680 + }, + { + "epoch": 1.61, + "learning_rate": 5.826626306176058e-05, + "loss": 0.0251, + "step": 249690 + }, + { + "epoch": 1.61, + "learning_rate": 5.8256581707403654e-05, + "loss": 0.028, + "step": 249700 + }, + { + "epoch": 1.61, + "learning_rate": 5.8246900353046713e-05, + "loss": 0.0271, + "step": 249710 + }, + { + "epoch": 1.61, + "learning_rate": 5.8237218998689786e-05, + "loss": 0.0272, + "step": 249720 + }, + { + "epoch": 1.61, + "learning_rate": 5.822753764433285e-05, + "loss": 0.0314, + "step": 249730 + }, + { + "epoch": 1.61, + "learning_rate": 5.821785628997592e-05, + "loss": 0.022, + "step": 249740 + }, + { + "epoch": 1.61, + "learning_rate": 5.820817493561899e-05, + "loss": 0.0237, + "step": 249750 + }, + { + "epoch": 1.61, + "learning_rate": 5.819849358126205e-05, + "loss": 0.0252, + "step": 249760 + }, + { + "epoch": 1.61, + "learning_rate": 5.8188812226905124e-05, + "loss": 0.0224, + "step": 249770 + }, + { + "epoch": 1.61, + "learning_rate": 5.817913087254819e-05, + "loss": 0.0232, + "step": 249780 + }, + { + "epoch": 1.61, + "learning_rate": 5.8169449518191264e-05, + "loss": 0.0285, + "step": 249790 + }, + { + "epoch": 1.61, + "learning_rate": 5.815976816383433e-05, + "loss": 0.0212, + "step": 249800 + }, + { + "epoch": 1.61, + "learning_rate": 5.815008680947739e-05, + "loss": 0.0261, + "step": 249810 + }, + { + "epoch": 1.61, + "learning_rate": 5.814040545512046e-05, + "loss": 0.0232, + "step": 249820 + }, + { + "epoch": 1.61, + "learning_rate": 5.813072410076353e-05, + "loss": 0.0278, + "step": 249830 + }, + { + "epoch": 1.61, + "learning_rate": 5.81210427464066e-05, + "loss": 0.0262, + "step": 249840 + }, + { + "epoch": 1.61, + "learning_rate": 5.811136139204967e-05, + "loss": 0.0271, + "step": 249850 + }, + { + "epoch": 1.61, + "learning_rate": 5.810168003769274e-05, + "loss": 0.0284, + "step": 249860 + }, + { + "epoch": 1.61, + "learning_rate": 5.80919986833358e-05, + "loss": 0.0236, + "step": 249870 + }, + { + "epoch": 1.61, + "learning_rate": 5.8082317328978867e-05, + "loss": 0.0263, + "step": 249880 + }, + { + "epoch": 1.61, + "learning_rate": 5.807263597462194e-05, + "loss": 0.0246, + "step": 249890 + }, + { + "epoch": 1.61, + "learning_rate": 5.8062954620265006e-05, + "loss": 0.0256, + "step": 249900 + }, + { + "epoch": 1.61, + "learning_rate": 5.805327326590808e-05, + "loss": 0.0233, + "step": 249910 + }, + { + "epoch": 1.61, + "learning_rate": 5.804359191155114e-05, + "loss": 0.0235, + "step": 249920 + }, + { + "epoch": 1.61, + "learning_rate": 5.803391055719421e-05, + "loss": 0.0242, + "step": 249930 + }, + { + "epoch": 1.61, + "learning_rate": 5.802422920283728e-05, + "loss": 0.0237, + "step": 249940 + }, + { + "epoch": 1.61, + "learning_rate": 5.8014547848480344e-05, + "loss": 0.03, + "step": 249950 + }, + { + "epoch": 1.61, + "learning_rate": 5.800486649412342e-05, + "loss": 0.0265, + "step": 249960 + }, + { + "epoch": 1.61, + "learning_rate": 5.7995185139766476e-05, + "loss": 0.0331, + "step": 249970 + }, + { + "epoch": 1.61, + "learning_rate": 5.798550378540955e-05, + "loss": 0.0273, + "step": 249980 + }, + { + "epoch": 1.61, + "learning_rate": 5.7975822431052616e-05, + "loss": 0.0246, + "step": 249990 + }, + { + "epoch": 1.61, + "learning_rate": 5.796614107669569e-05, + "loss": 0.0273, + "step": 250000 + }, + { + "epoch": 1.61, + "eval_cer": 0.919873460625918, + "eval_loss": 0.018918007612228394, + "eval_runtime": 119.9798, + "eval_samples_per_second": 16.669, + "eval_steps_per_second": 4.167, + "step": 250000 + }, + { + "epoch": 1.61, + "learning_rate": 5.7956459722338755e-05, + "loss": 0.0251, + "step": 250010 + }, + { + "epoch": 1.61, + "learning_rate": 5.7946778367981814e-05, + "loss": 0.0285, + "step": 250020 + }, + { + "epoch": 1.61, + "learning_rate": 5.793709701362489e-05, + "loss": 0.0237, + "step": 250030 + }, + { + "epoch": 1.61, + "learning_rate": 5.7927415659267953e-05, + "loss": 0.0238, + "step": 250040 + }, + { + "epoch": 1.61, + "learning_rate": 5.7917734304911027e-05, + "loss": 0.0246, + "step": 250050 + }, + { + "epoch": 1.61, + "learning_rate": 5.790805295055409e-05, + "loss": 0.0298, + "step": 250060 + }, + { + "epoch": 1.61, + "learning_rate": 5.7898371596197166e-05, + "loss": 0.0242, + "step": 250070 + }, + { + "epoch": 1.61, + "learning_rate": 5.7888690241840225e-05, + "loss": 0.0295, + "step": 250080 + }, + { + "epoch": 1.61, + "learning_rate": 5.787900888748329e-05, + "loss": 0.0223, + "step": 250090 + }, + { + "epoch": 1.61, + "learning_rate": 5.7869327533126364e-05, + "loss": 0.0229, + "step": 250100 + }, + { + "epoch": 1.61, + "learning_rate": 5.785964617876943e-05, + "loss": 0.0247, + "step": 250110 + }, + { + "epoch": 1.61, + "learning_rate": 5.7849964824412504e-05, + "loss": 0.0257, + "step": 250120 + }, + { + "epoch": 1.61, + "learning_rate": 5.784028347005556e-05, + "loss": 0.0283, + "step": 250130 + }, + { + "epoch": 1.61, + "learning_rate": 5.7830602115698636e-05, + "loss": 0.0261, + "step": 250140 + }, + { + "epoch": 1.61, + "learning_rate": 5.78209207613417e-05, + "loss": 0.0212, + "step": 250150 + }, + { + "epoch": 1.61, + "learning_rate": 5.781123940698477e-05, + "loss": 0.0292, + "step": 250160 + }, + { + "epoch": 1.61, + "learning_rate": 5.780155805262784e-05, + "loss": 0.0293, + "step": 250170 + }, + { + "epoch": 1.61, + "learning_rate": 5.77918766982709e-05, + "loss": 0.0257, + "step": 250180 + }, + { + "epoch": 1.61, + "learning_rate": 5.7782195343913974e-05, + "loss": 0.0288, + "step": 250190 + }, + { + "epoch": 1.61, + "learning_rate": 5.777251398955704e-05, + "loss": 0.0269, + "step": 250200 + }, + { + "epoch": 1.61, + "learning_rate": 5.7762832635200113e-05, + "loss": 0.0229, + "step": 250210 + }, + { + "epoch": 1.61, + "learning_rate": 5.775315128084318e-05, + "loss": 0.0237, + "step": 250220 + }, + { + "epoch": 1.62, + "learning_rate": 5.774346992648624e-05, + "loss": 0.0231, + "step": 250230 + }, + { + "epoch": 1.62, + "learning_rate": 5.773378857212931e-05, + "loss": 0.027, + "step": 250240 + }, + { + "epoch": 1.62, + "learning_rate": 5.772410721777238e-05, + "loss": 0.026, + "step": 250250 + }, + { + "epoch": 1.62, + "learning_rate": 5.771442586341545e-05, + "loss": 0.027, + "step": 250260 + }, + { + "epoch": 1.62, + "learning_rate": 5.770474450905852e-05, + "loss": 0.0259, + "step": 250270 + }, + { + "epoch": 1.62, + "learning_rate": 5.769506315470159e-05, + "loss": 0.0252, + "step": 250280 + }, + { + "epoch": 1.62, + "learning_rate": 5.768538180034465e-05, + "loss": 0.029, + "step": 250290 + }, + { + "epoch": 1.62, + "learning_rate": 5.7675700445987716e-05, + "loss": 0.0275, + "step": 250300 + }, + { + "epoch": 1.62, + "learning_rate": 5.766601909163079e-05, + "loss": 0.0232, + "step": 250310 + }, + { + "epoch": 1.62, + "learning_rate": 5.7656337737273856e-05, + "loss": 0.0222, + "step": 250320 + }, + { + "epoch": 1.62, + "learning_rate": 5.764665638291693e-05, + "loss": 0.0266, + "step": 250330 + }, + { + "epoch": 1.62, + "learning_rate": 5.763697502855999e-05, + "loss": 0.0276, + "step": 250340 + }, + { + "epoch": 1.62, + "learning_rate": 5.762729367420306e-05, + "loss": 0.0255, + "step": 250350 + }, + { + "epoch": 1.62, + "learning_rate": 5.761761231984613e-05, + "loss": 0.0286, + "step": 250360 + }, + { + "epoch": 1.62, + "learning_rate": 5.7607930965489194e-05, + "loss": 0.0262, + "step": 250370 + }, + { + "epoch": 1.62, + "learning_rate": 5.7598249611132267e-05, + "loss": 0.0276, + "step": 250380 + }, + { + "epoch": 1.62, + "learning_rate": 5.7588568256775326e-05, + "loss": 0.0243, + "step": 250390 + }, + { + "epoch": 1.62, + "learning_rate": 5.75788869024184e-05, + "loss": 0.0279, + "step": 250400 + }, + { + "epoch": 1.62, + "learning_rate": 5.7569205548061465e-05, + "loss": 0.0299, + "step": 250410 + }, + { + "epoch": 1.62, + "learning_rate": 5.755952419370454e-05, + "loss": 0.025, + "step": 250420 + }, + { + "epoch": 1.62, + "learning_rate": 5.7549842839347605e-05, + "loss": 0.0247, + "step": 250430 + }, + { + "epoch": 1.62, + "learning_rate": 5.7540161484990664e-05, + "loss": 0.035, + "step": 250440 + }, + { + "epoch": 1.62, + "learning_rate": 5.753048013063374e-05, + "loss": 0.025, + "step": 250450 + }, + { + "epoch": 1.62, + "learning_rate": 5.75207987762768e-05, + "loss": 0.02, + "step": 250460 + }, + { + "epoch": 1.62, + "learning_rate": 5.7511117421919876e-05, + "loss": 0.0279, + "step": 250470 + }, + { + "epoch": 1.62, + "learning_rate": 5.750143606756294e-05, + "loss": 0.0229, + "step": 250480 + }, + { + "epoch": 1.62, + "learning_rate": 5.7491754713206e-05, + "loss": 0.0298, + "step": 250490 + }, + { + "epoch": 1.62, + "learning_rate": 5.7482073358849075e-05, + "loss": 0.0247, + "step": 250500 + }, + { + "epoch": 1.62, + "learning_rate": 5.747239200449214e-05, + "loss": 0.0264, + "step": 250510 + }, + { + "epoch": 1.62, + "learning_rate": 5.7462710650135214e-05, + "loss": 0.0272, + "step": 250520 + }, + { + "epoch": 1.62, + "learning_rate": 5.745302929577828e-05, + "loss": 0.0227, + "step": 250530 + }, + { + "epoch": 1.62, + "learning_rate": 5.744334794142135e-05, + "loss": 0.0225, + "step": 250540 + }, + { + "epoch": 1.62, + "learning_rate": 5.743366658706441e-05, + "loss": 0.022, + "step": 250550 + }, + { + "epoch": 1.62, + "learning_rate": 5.742398523270748e-05, + "loss": 0.0233, + "step": 250560 + }, + { + "epoch": 1.62, + "learning_rate": 5.741430387835055e-05, + "loss": 0.0198, + "step": 250570 + }, + { + "epoch": 1.62, + "learning_rate": 5.740462252399362e-05, + "loss": 0.0212, + "step": 250580 + }, + { + "epoch": 1.62, + "learning_rate": 5.7394941169636685e-05, + "loss": 0.0278, + "step": 250590 + }, + { + "epoch": 1.62, + "learning_rate": 5.738525981527975e-05, + "loss": 0.0266, + "step": 250600 + }, + { + "epoch": 1.62, + "learning_rate": 5.7375578460922824e-05, + "loss": 0.0216, + "step": 250610 + }, + { + "epoch": 1.62, + "learning_rate": 5.736589710656589e-05, + "loss": 0.0235, + "step": 250620 + }, + { + "epoch": 1.62, + "learning_rate": 5.7356215752208956e-05, + "loss": 0.0311, + "step": 250630 + }, + { + "epoch": 1.62, + "learning_rate": 5.734653439785202e-05, + "loss": 0.0232, + "step": 250640 + }, + { + "epoch": 1.62, + "learning_rate": 5.733685304349509e-05, + "loss": 0.0252, + "step": 250650 + }, + { + "epoch": 1.62, + "learning_rate": 5.732717168913816e-05, + "loss": 0.0274, + "step": 250660 + }, + { + "epoch": 1.62, + "learning_rate": 5.731749033478123e-05, + "loss": 0.0232, + "step": 250670 + }, + { + "epoch": 1.62, + "learning_rate": 5.73078089804243e-05, + "loss": 0.0237, + "step": 250680 + }, + { + "epoch": 1.62, + "learning_rate": 5.729812762606736e-05, + "loss": 0.0282, + "step": 250690 + }, + { + "epoch": 1.62, + "learning_rate": 5.728844627171043e-05, + "loss": 0.0239, + "step": 250700 + }, + { + "epoch": 1.62, + "learning_rate": 5.72787649173535e-05, + "loss": 0.0214, + "step": 250710 + }, + { + "epoch": 1.62, + "learning_rate": 5.7269083562996566e-05, + "loss": 0.023, + "step": 250720 + }, + { + "epoch": 1.62, + "learning_rate": 5.725940220863964e-05, + "loss": 0.0275, + "step": 250730 + }, + { + "epoch": 1.62, + "learning_rate": 5.72497208542827e-05, + "loss": 0.0237, + "step": 250740 + }, + { + "epoch": 1.62, + "learning_rate": 5.724003949992577e-05, + "loss": 0.027, + "step": 250750 + }, + { + "epoch": 1.62, + "learning_rate": 5.723035814556884e-05, + "loss": 0.0266, + "step": 250760 + }, + { + "epoch": 1.62, + "learning_rate": 5.7220676791211904e-05, + "loss": 0.0275, + "step": 250770 + }, + { + "epoch": 1.62, + "learning_rate": 5.721099543685498e-05, + "loss": 0.0217, + "step": 250780 + }, + { + "epoch": 1.62, + "learning_rate": 5.720131408249804e-05, + "loss": 0.0263, + "step": 250790 + }, + { + "epoch": 1.62, + "learning_rate": 5.719163272814111e-05, + "loss": 0.0231, + "step": 250800 + }, + { + "epoch": 1.62, + "learning_rate": 5.7181951373784176e-05, + "loss": 0.022, + "step": 250810 + }, + { + "epoch": 1.62, + "learning_rate": 5.717227001942725e-05, + "loss": 0.0286, + "step": 250820 + }, + { + "epoch": 1.62, + "learning_rate": 5.7162588665070315e-05, + "loss": 0.0273, + "step": 250830 + }, + { + "epoch": 1.62, + "learning_rate": 5.7152907310713375e-05, + "loss": 0.0241, + "step": 250840 + }, + { + "epoch": 1.62, + "learning_rate": 5.714322595635645e-05, + "loss": 0.0235, + "step": 250850 + }, + { + "epoch": 1.62, + "learning_rate": 5.7133544601999514e-05, + "loss": 0.0292, + "step": 250860 + }, + { + "epoch": 1.62, + "learning_rate": 5.712386324764259e-05, + "loss": 0.0353, + "step": 250870 + }, + { + "epoch": 1.62, + "learning_rate": 5.711418189328565e-05, + "loss": 0.0231, + "step": 250880 + }, + { + "epoch": 1.62, + "learning_rate": 5.7104500538928726e-05, + "loss": 0.0283, + "step": 250890 + }, + { + "epoch": 1.62, + "learning_rate": 5.7094819184571786e-05, + "loss": 0.0208, + "step": 250900 + }, + { + "epoch": 1.62, + "learning_rate": 5.708513783021485e-05, + "loss": 0.0284, + "step": 250910 + }, + { + "epoch": 1.62, + "learning_rate": 5.7075456475857925e-05, + "loss": 0.0308, + "step": 250920 + }, + { + "epoch": 1.62, + "learning_rate": 5.706577512150099e-05, + "loss": 0.0252, + "step": 250930 + }, + { + "epoch": 1.62, + "learning_rate": 5.7056093767144064e-05, + "loss": 0.027, + "step": 250940 + }, + { + "epoch": 1.62, + "learning_rate": 5.7046412412787124e-05, + "loss": 0.0276, + "step": 250950 + }, + { + "epoch": 1.62, + "learning_rate": 5.7036731058430197e-05, + "loss": 0.0265, + "step": 250960 + }, + { + "epoch": 1.62, + "learning_rate": 5.702704970407326e-05, + "loss": 0.0305, + "step": 250970 + }, + { + "epoch": 1.62, + "learning_rate": 5.701736834971633e-05, + "loss": 0.04, + "step": 250980 + }, + { + "epoch": 1.62, + "learning_rate": 5.70076869953594e-05, + "loss": 0.0228, + "step": 250990 + }, + { + "epoch": 1.62, + "learning_rate": 5.699800564100246e-05, + "loss": 0.0246, + "step": 251000 + }, + { + "epoch": 1.62, + "eval_cer": 0.9198400180770534, + "eval_loss": 0.018709488213062286, + "eval_runtime": 120.2758, + "eval_samples_per_second": 16.628, + "eval_steps_per_second": 4.157, + "step": 251000 + }, + { + "epoch": 1.62, + "learning_rate": 5.6988324286645535e-05, + "loss": 0.0307, + "step": 251010 + }, + { + "epoch": 1.62, + "learning_rate": 5.69786429322886e-05, + "loss": 0.0268, + "step": 251020 + }, + { + "epoch": 1.62, + "learning_rate": 5.6968961577931674e-05, + "loss": 0.022, + "step": 251030 + }, + { + "epoch": 1.62, + "learning_rate": 5.695928022357474e-05, + "loss": 0.0245, + "step": 251040 + }, + { + "epoch": 1.62, + "learning_rate": 5.69495988692178e-05, + "loss": 0.0296, + "step": 251050 + }, + { + "epoch": 1.62, + "learning_rate": 5.693991751486087e-05, + "loss": 0.0287, + "step": 251060 + }, + { + "epoch": 1.62, + "learning_rate": 5.693023616050394e-05, + "loss": 0.0268, + "step": 251070 + }, + { + "epoch": 1.62, + "learning_rate": 5.692055480614701e-05, + "loss": 0.0219, + "step": 251080 + }, + { + "epoch": 1.62, + "learning_rate": 5.691087345179008e-05, + "loss": 0.0243, + "step": 251090 + }, + { + "epoch": 1.62, + "learning_rate": 5.690119209743315e-05, + "loss": 0.0253, + "step": 251100 + }, + { + "epoch": 1.62, + "learning_rate": 5.689151074307621e-05, + "loss": 0.0217, + "step": 251110 + }, + { + "epoch": 1.62, + "learning_rate": 5.688182938871928e-05, + "loss": 0.0251, + "step": 251120 + }, + { + "epoch": 1.62, + "learning_rate": 5.687214803436235e-05, + "loss": 0.0283, + "step": 251130 + }, + { + "epoch": 1.62, + "learning_rate": 5.6862466680005416e-05, + "loss": 0.0257, + "step": 251140 + }, + { + "epoch": 1.62, + "learning_rate": 5.685278532564849e-05, + "loss": 0.0286, + "step": 251150 + }, + { + "epoch": 1.62, + "learning_rate": 5.684310397129155e-05, + "loss": 0.0305, + "step": 251160 + }, + { + "epoch": 1.62, + "learning_rate": 5.683342261693462e-05, + "loss": 0.0265, + "step": 251170 + }, + { + "epoch": 1.62, + "learning_rate": 5.682374126257769e-05, + "loss": 0.0255, + "step": 251180 + }, + { + "epoch": 1.62, + "learning_rate": 5.6814059908220754e-05, + "loss": 0.0232, + "step": 251190 + }, + { + "epoch": 1.62, + "learning_rate": 5.680437855386383e-05, + "loss": 0.0254, + "step": 251200 + }, + { + "epoch": 1.62, + "learning_rate": 5.6794697199506886e-05, + "loss": 0.0214, + "step": 251210 + }, + { + "epoch": 1.62, + "learning_rate": 5.678501584514996e-05, + "loss": 0.0292, + "step": 251220 + }, + { + "epoch": 1.62, + "learning_rate": 5.6775334490793026e-05, + "loss": 0.0237, + "step": 251230 + }, + { + "epoch": 1.62, + "learning_rate": 5.67656531364361e-05, + "loss": 0.0238, + "step": 251240 + }, + { + "epoch": 1.62, + "learning_rate": 5.6755971782079165e-05, + "loss": 0.0291, + "step": 251250 + }, + { + "epoch": 1.62, + "learning_rate": 5.6746290427722224e-05, + "loss": 0.024, + "step": 251260 + }, + { + "epoch": 1.62, + "learning_rate": 5.67366090733653e-05, + "loss": 0.0204, + "step": 251270 + }, + { + "epoch": 1.62, + "learning_rate": 5.6726927719008364e-05, + "loss": 0.024, + "step": 251280 + }, + { + "epoch": 1.62, + "learning_rate": 5.671724636465144e-05, + "loss": 0.0297, + "step": 251290 + }, + { + "epoch": 1.62, + "learning_rate": 5.67075650102945e-05, + "loss": 0.0196, + "step": 251300 + }, + { + "epoch": 1.62, + "learning_rate": 5.6697883655937576e-05, + "loss": 0.0242, + "step": 251310 + }, + { + "epoch": 1.62, + "learning_rate": 5.6688202301580635e-05, + "loss": 0.0251, + "step": 251320 + }, + { + "epoch": 1.62, + "learning_rate": 5.66785209472237e-05, + "loss": 0.027, + "step": 251330 + }, + { + "epoch": 1.62, + "learning_rate": 5.6668839592866775e-05, + "loss": 0.0301, + "step": 251340 + }, + { + "epoch": 1.62, + "learning_rate": 5.665915823850984e-05, + "loss": 0.0227, + "step": 251350 + }, + { + "epoch": 1.62, + "learning_rate": 5.6649476884152914e-05, + "loss": 0.0262, + "step": 251360 + }, + { + "epoch": 1.62, + "learning_rate": 5.663979552979597e-05, + "loss": 0.0278, + "step": 251370 + }, + { + "epoch": 1.62, + "learning_rate": 5.6630114175439046e-05, + "loss": 0.0255, + "step": 251380 + }, + { + "epoch": 1.62, + "learning_rate": 5.662043282108211e-05, + "loss": 0.0242, + "step": 251390 + }, + { + "epoch": 1.62, + "learning_rate": 5.661075146672518e-05, + "loss": 0.0307, + "step": 251400 + }, + { + "epoch": 1.62, + "learning_rate": 5.660107011236825e-05, + "loss": 0.0226, + "step": 251410 + }, + { + "epoch": 1.62, + "learning_rate": 5.659138875801131e-05, + "loss": 0.0293, + "step": 251420 + }, + { + "epoch": 1.62, + "learning_rate": 5.6581707403654384e-05, + "loss": 0.029, + "step": 251430 + }, + { + "epoch": 1.62, + "learning_rate": 5.657202604929745e-05, + "loss": 0.0274, + "step": 251440 + }, + { + "epoch": 1.62, + "learning_rate": 5.6562344694940524e-05, + "loss": 0.024, + "step": 251450 + }, + { + "epoch": 1.62, + "learning_rate": 5.655266334058359e-05, + "loss": 0.0268, + "step": 251460 + }, + { + "epoch": 1.62, + "learning_rate": 5.654298198622665e-05, + "loss": 0.0249, + "step": 251470 + }, + { + "epoch": 1.62, + "learning_rate": 5.653330063186972e-05, + "loss": 0.0313, + "step": 251480 + }, + { + "epoch": 1.62, + "learning_rate": 5.652361927751279e-05, + "loss": 0.0294, + "step": 251490 + }, + { + "epoch": 1.62, + "learning_rate": 5.651393792315586e-05, + "loss": 0.0268, + "step": 251500 + }, + { + "epoch": 1.62, + "learning_rate": 5.650425656879893e-05, + "loss": 0.0214, + "step": 251510 + }, + { + "epoch": 1.62, + "learning_rate": 5.6494575214442e-05, + "loss": 0.0244, + "step": 251520 + }, + { + "epoch": 1.62, + "learning_rate": 5.648489386008506e-05, + "loss": 0.0252, + "step": 251530 + }, + { + "epoch": 1.62, + "learning_rate": 5.6475212505728127e-05, + "loss": 0.0287, + "step": 251540 + }, + { + "epoch": 1.62, + "learning_rate": 5.64655311513712e-05, + "loss": 0.028, + "step": 251550 + }, + { + "epoch": 1.62, + "learning_rate": 5.6455849797014266e-05, + "loss": 0.0264, + "step": 251560 + }, + { + "epoch": 1.62, + "learning_rate": 5.644616844265734e-05, + "loss": 0.0286, + "step": 251570 + }, + { + "epoch": 1.62, + "learning_rate": 5.64364870883004e-05, + "loss": 0.0251, + "step": 251580 + }, + { + "epoch": 1.62, + "learning_rate": 5.642680573394347e-05, + "loss": 0.0267, + "step": 251590 + }, + { + "epoch": 1.62, + "learning_rate": 5.641712437958654e-05, + "loss": 0.0249, + "step": 251600 + }, + { + "epoch": 1.62, + "learning_rate": 5.6407443025229604e-05, + "loss": 0.0267, + "step": 251610 + }, + { + "epoch": 1.62, + "learning_rate": 5.639776167087268e-05, + "loss": 0.0284, + "step": 251620 + }, + { + "epoch": 1.62, + "learning_rate": 5.6388080316515736e-05, + "loss": 0.0279, + "step": 251630 + }, + { + "epoch": 1.62, + "learning_rate": 5.637839896215881e-05, + "loss": 0.0274, + "step": 251640 + }, + { + "epoch": 1.62, + "learning_rate": 5.6368717607801875e-05, + "loss": 0.0261, + "step": 251650 + }, + { + "epoch": 1.62, + "learning_rate": 5.635903625344495e-05, + "loss": 0.0295, + "step": 251660 + }, + { + "epoch": 1.62, + "learning_rate": 5.6349354899088015e-05, + "loss": 0.0272, + "step": 251670 + }, + { + "epoch": 1.62, + "learning_rate": 5.6339673544731074e-05, + "loss": 0.0265, + "step": 251680 + }, + { + "epoch": 1.62, + "learning_rate": 5.632999219037415e-05, + "loss": 0.0235, + "step": 251690 + }, + { + "epoch": 1.62, + "learning_rate": 5.6320310836017213e-05, + "loss": 0.0252, + "step": 251700 + }, + { + "epoch": 1.62, + "learning_rate": 5.6310629481660286e-05, + "loss": 0.0259, + "step": 251710 + }, + { + "epoch": 1.62, + "learning_rate": 5.630094812730335e-05, + "loss": 0.0292, + "step": 251720 + }, + { + "epoch": 1.62, + "learning_rate": 5.629126677294642e-05, + "loss": 0.0332, + "step": 251730 + }, + { + "epoch": 1.62, + "learning_rate": 5.6281585418589485e-05, + "loss": 0.0263, + "step": 251740 + }, + { + "epoch": 1.62, + "learning_rate": 5.627190406423255e-05, + "loss": 0.0327, + "step": 251750 + }, + { + "epoch": 1.62, + "learning_rate": 5.6262222709875624e-05, + "loss": 0.0219, + "step": 251760 + }, + { + "epoch": 1.62, + "learning_rate": 5.625254135551869e-05, + "loss": 0.0295, + "step": 251770 + }, + { + "epoch": 1.63, + "learning_rate": 5.624286000116176e-05, + "loss": 0.0264, + "step": 251780 + }, + { + "epoch": 1.63, + "learning_rate": 5.623317864680482e-05, + "loss": 0.0233, + "step": 251790 + }, + { + "epoch": 1.63, + "learning_rate": 5.6223497292447896e-05, + "loss": 0.0297, + "step": 251800 + }, + { + "epoch": 1.63, + "learning_rate": 5.621381593809096e-05, + "loss": 0.0279, + "step": 251810 + }, + { + "epoch": 1.63, + "learning_rate": 5.620413458373403e-05, + "loss": 0.0285, + "step": 251820 + }, + { + "epoch": 1.63, + "learning_rate": 5.6194453229377095e-05, + "loss": 0.0254, + "step": 251830 + }, + { + "epoch": 1.63, + "learning_rate": 5.618477187502016e-05, + "loss": 0.0267, + "step": 251840 + }, + { + "epoch": 1.63, + "learning_rate": 5.6175090520663234e-05, + "loss": 0.0224, + "step": 251850 + }, + { + "epoch": 1.63, + "learning_rate": 5.61654091663063e-05, + "loss": 0.0204, + "step": 251860 + }, + { + "epoch": 1.63, + "learning_rate": 5.6155727811949373e-05, + "loss": 0.0217, + "step": 251870 + }, + { + "epoch": 1.63, + "learning_rate": 5.614604645759243e-05, + "loss": 0.0258, + "step": 251880 + }, + { + "epoch": 1.63, + "learning_rate": 5.61363651032355e-05, + "loss": 0.0277, + "step": 251890 + }, + { + "epoch": 1.63, + "learning_rate": 5.612668374887857e-05, + "loss": 0.0276, + "step": 251900 + }, + { + "epoch": 1.63, + "learning_rate": 5.611700239452164e-05, + "loss": 0.0194, + "step": 251910 + }, + { + "epoch": 1.63, + "learning_rate": 5.610732104016471e-05, + "loss": 0.0227, + "step": 251920 + }, + { + "epoch": 1.63, + "learning_rate": 5.609763968580778e-05, + "loss": 0.0265, + "step": 251930 + }, + { + "epoch": 1.63, + "learning_rate": 5.6087958331450844e-05, + "loss": 0.0308, + "step": 251940 + }, + { + "epoch": 1.63, + "learning_rate": 5.607827697709391e-05, + "loss": 0.0227, + "step": 251950 + }, + { + "epoch": 1.63, + "learning_rate": 5.6068595622736976e-05, + "loss": 0.0262, + "step": 251960 + }, + { + "epoch": 1.63, + "learning_rate": 5.605891426838005e-05, + "loss": 0.0285, + "step": 251970 + }, + { + "epoch": 1.63, + "learning_rate": 5.6049232914023116e-05, + "loss": 0.0289, + "step": 251980 + }, + { + "epoch": 1.63, + "learning_rate": 5.603955155966618e-05, + "loss": 0.0272, + "step": 251990 + }, + { + "epoch": 1.63, + "learning_rate": 5.602987020530925e-05, + "loss": 0.0309, + "step": 252000 + }, + { + "epoch": 1.63, + "eval_cer": 0.9198192294655971, + "eval_loss": 0.018738944083452225, + "eval_runtime": 120.2162, + "eval_samples_per_second": 16.637, + "eval_steps_per_second": 4.159, + "step": 252000 + }, + { + "epoch": 1.63, + "learning_rate": 5.602018885095232e-05, + "loss": 0.0267, + "step": 252010 + }, + { + "epoch": 1.63, + "learning_rate": 5.601050749659539e-05, + "loss": 0.0254, + "step": 252020 + }, + { + "epoch": 1.63, + "learning_rate": 5.6000826142238454e-05, + "loss": 0.0268, + "step": 252030 + }, + { + "epoch": 1.63, + "learning_rate": 5.599114478788152e-05, + "loss": 0.0209, + "step": 252040 + }, + { + "epoch": 1.63, + "learning_rate": 5.5981463433524586e-05, + "loss": 0.0259, + "step": 252050 + }, + { + "epoch": 1.63, + "learning_rate": 5.597178207916766e-05, + "loss": 0.0269, + "step": 252060 + }, + { + "epoch": 1.63, + "learning_rate": 5.5962100724810725e-05, + "loss": 0.0256, + "step": 252070 + }, + { + "epoch": 1.63, + "learning_rate": 5.59524193704538e-05, + "loss": 0.0279, + "step": 252080 + }, + { + "epoch": 1.63, + "learning_rate": 5.594273801609686e-05, + "loss": 0.0268, + "step": 252090 + }, + { + "epoch": 1.63, + "learning_rate": 5.5933056661739924e-05, + "loss": 0.0254, + "step": 252100 + }, + { + "epoch": 1.63, + "learning_rate": 5.5923375307383e-05, + "loss": 0.03, + "step": 252110 + }, + { + "epoch": 1.63, + "learning_rate": 5.591369395302606e-05, + "loss": 0.0277, + "step": 252120 + }, + { + "epoch": 1.63, + "learning_rate": 5.5904012598669136e-05, + "loss": 0.022, + "step": 252130 + }, + { + "epoch": 1.63, + "learning_rate": 5.5894331244312196e-05, + "loss": 0.0235, + "step": 252140 + }, + { + "epoch": 1.63, + "learning_rate": 5.588464988995527e-05, + "loss": 0.0256, + "step": 252150 + }, + { + "epoch": 1.63, + "learning_rate": 5.5874968535598335e-05, + "loss": 0.0233, + "step": 252160 + }, + { + "epoch": 1.63, + "learning_rate": 5.58652871812414e-05, + "loss": 0.0247, + "step": 252170 + }, + { + "epoch": 1.63, + "learning_rate": 5.5855605826884474e-05, + "loss": 0.0283, + "step": 252180 + }, + { + "epoch": 1.63, + "learning_rate": 5.5845924472527534e-05, + "loss": 0.0329, + "step": 252190 + }, + { + "epoch": 1.63, + "learning_rate": 5.583624311817061e-05, + "loss": 0.0258, + "step": 252200 + }, + { + "epoch": 1.63, + "learning_rate": 5.582656176381367e-05, + "loss": 0.0247, + "step": 252210 + }, + { + "epoch": 1.63, + "learning_rate": 5.581688040945674e-05, + "loss": 0.0244, + "step": 252220 + }, + { + "epoch": 1.63, + "learning_rate": 5.580719905509981e-05, + "loss": 0.0271, + "step": 252230 + }, + { + "epoch": 1.63, + "learning_rate": 5.579751770074287e-05, + "loss": 0.027, + "step": 252240 + }, + { + "epoch": 1.63, + "learning_rate": 5.5787836346385945e-05, + "loss": 0.0259, + "step": 252250 + }, + { + "epoch": 1.63, + "learning_rate": 5.577815499202901e-05, + "loss": 0.0253, + "step": 252260 + }, + { + "epoch": 1.63, + "learning_rate": 5.5768473637672084e-05, + "loss": 0.0321, + "step": 252270 + }, + { + "epoch": 1.63, + "learning_rate": 5.575879228331515e-05, + "loss": 0.0231, + "step": 252280 + }, + { + "epoch": 1.63, + "learning_rate": 5.574911092895821e-05, + "loss": 0.0227, + "step": 252290 + }, + { + "epoch": 1.63, + "learning_rate": 5.573942957460128e-05, + "loss": 0.0248, + "step": 252300 + }, + { + "epoch": 1.63, + "learning_rate": 5.572974822024435e-05, + "loss": 0.0231, + "step": 252310 + }, + { + "epoch": 1.63, + "learning_rate": 5.572006686588742e-05, + "loss": 0.0274, + "step": 252320 + }, + { + "epoch": 1.63, + "learning_rate": 5.571038551153049e-05, + "loss": 0.0276, + "step": 252330 + }, + { + "epoch": 1.63, + "learning_rate": 5.570070415717356e-05, + "loss": 0.0255, + "step": 252340 + }, + { + "epoch": 1.63, + "learning_rate": 5.569102280281662e-05, + "loss": 0.0257, + "step": 252350 + }, + { + "epoch": 1.63, + "learning_rate": 5.568134144845969e-05, + "loss": 0.024, + "step": 252360 + }, + { + "epoch": 1.63, + "learning_rate": 5.567166009410276e-05, + "loss": 0.0258, + "step": 252370 + }, + { + "epoch": 1.63, + "learning_rate": 5.5661978739745826e-05, + "loss": 0.0264, + "step": 252380 + }, + { + "epoch": 1.63, + "learning_rate": 5.56522973853889e-05, + "loss": 0.0244, + "step": 252390 + }, + { + "epoch": 1.63, + "learning_rate": 5.564261603103196e-05, + "loss": 0.0238, + "step": 252400 + }, + { + "epoch": 1.63, + "learning_rate": 5.563293467667503e-05, + "loss": 0.0224, + "step": 252410 + }, + { + "epoch": 1.63, + "learning_rate": 5.56232533223181e-05, + "loss": 0.0337, + "step": 252420 + }, + { + "epoch": 1.63, + "learning_rate": 5.5613571967961164e-05, + "loss": 0.0267, + "step": 252430 + }, + { + "epoch": 1.63, + "learning_rate": 5.560389061360424e-05, + "loss": 0.0269, + "step": 252440 + }, + { + "epoch": 1.63, + "learning_rate": 5.5594209259247297e-05, + "loss": 0.0289, + "step": 252450 + }, + { + "epoch": 1.63, + "learning_rate": 5.558452790489037e-05, + "loss": 0.0216, + "step": 252460 + }, + { + "epoch": 1.63, + "learning_rate": 5.5574846550533436e-05, + "loss": 0.0241, + "step": 252470 + }, + { + "epoch": 1.63, + "learning_rate": 5.556516519617651e-05, + "loss": 0.0261, + "step": 252480 + }, + { + "epoch": 1.63, + "learning_rate": 5.5555483841819575e-05, + "loss": 0.0251, + "step": 252490 + }, + { + "epoch": 1.63, + "learning_rate": 5.5545802487462635e-05, + "loss": 0.0258, + "step": 252500 + }, + { + "epoch": 1.63, + "learning_rate": 5.553612113310571e-05, + "loss": 0.0277, + "step": 252510 + }, + { + "epoch": 1.63, + "learning_rate": 5.5526439778748774e-05, + "loss": 0.0255, + "step": 252520 + }, + { + "epoch": 1.63, + "learning_rate": 5.551675842439185e-05, + "loss": 0.0273, + "step": 252530 + }, + { + "epoch": 1.63, + "learning_rate": 5.550707707003491e-05, + "loss": 0.0253, + "step": 252540 + }, + { + "epoch": 1.63, + "learning_rate": 5.5497395715677986e-05, + "loss": 0.0253, + "step": 252550 + }, + { + "epoch": 1.63, + "learning_rate": 5.5487714361321046e-05, + "loss": 0.024, + "step": 252560 + }, + { + "epoch": 1.63, + "learning_rate": 5.547803300696411e-05, + "loss": 0.0357, + "step": 252570 + }, + { + "epoch": 1.63, + "learning_rate": 5.5468351652607185e-05, + "loss": 0.0196, + "step": 252580 + }, + { + "epoch": 1.63, + "learning_rate": 5.545867029825025e-05, + "loss": 0.0288, + "step": 252590 + }, + { + "epoch": 1.63, + "learning_rate": 5.5448988943893324e-05, + "loss": 0.0281, + "step": 252600 + }, + { + "epoch": 1.63, + "learning_rate": 5.5439307589536384e-05, + "loss": 0.0294, + "step": 252610 + }, + { + "epoch": 1.63, + "learning_rate": 5.5429626235179457e-05, + "loss": 0.0239, + "step": 252620 + }, + { + "epoch": 1.63, + "learning_rate": 5.541994488082252e-05, + "loss": 0.0226, + "step": 252630 + }, + { + "epoch": 1.63, + "learning_rate": 5.541026352646559e-05, + "loss": 0.0251, + "step": 252640 + }, + { + "epoch": 1.63, + "learning_rate": 5.540058217210866e-05, + "loss": 0.0247, + "step": 252650 + }, + { + "epoch": 1.63, + "learning_rate": 5.539090081775172e-05, + "loss": 0.027, + "step": 252660 + }, + { + "epoch": 1.63, + "learning_rate": 5.5381219463394795e-05, + "loss": 0.0227, + "step": 252670 + }, + { + "epoch": 1.63, + "learning_rate": 5.537153810903786e-05, + "loss": 0.0232, + "step": 252680 + }, + { + "epoch": 1.63, + "learning_rate": 5.5361856754680934e-05, + "loss": 0.0238, + "step": 252690 + }, + { + "epoch": 1.63, + "learning_rate": 5.5352175400324e-05, + "loss": 0.0234, + "step": 252700 + }, + { + "epoch": 1.63, + "learning_rate": 5.534249404596706e-05, + "loss": 0.0272, + "step": 252710 + }, + { + "epoch": 1.63, + "learning_rate": 5.533281269161013e-05, + "loss": 0.0227, + "step": 252720 + }, + { + "epoch": 1.63, + "learning_rate": 5.53231313372532e-05, + "loss": 0.0257, + "step": 252730 + }, + { + "epoch": 1.63, + "learning_rate": 5.531344998289627e-05, + "loss": 0.0222, + "step": 252740 + }, + { + "epoch": 1.63, + "learning_rate": 5.530376862853934e-05, + "loss": 0.0218, + "step": 252750 + }, + { + "epoch": 1.63, + "learning_rate": 5.529408727418241e-05, + "loss": 0.0259, + "step": 252760 + }, + { + "epoch": 1.63, + "learning_rate": 5.528440591982547e-05, + "loss": 0.0227, + "step": 252770 + }, + { + "epoch": 1.63, + "learning_rate": 5.527472456546854e-05, + "loss": 0.0309, + "step": 252780 + }, + { + "epoch": 1.63, + "learning_rate": 5.526504321111161e-05, + "loss": 0.0217, + "step": 252790 + }, + { + "epoch": 1.63, + "learning_rate": 5.5255361856754676e-05, + "loss": 0.022, + "step": 252800 + }, + { + "epoch": 1.63, + "learning_rate": 5.524568050239775e-05, + "loss": 0.0231, + "step": 252810 + }, + { + "epoch": 1.63, + "learning_rate": 5.523599914804081e-05, + "loss": 0.0237, + "step": 252820 + }, + { + "epoch": 1.63, + "learning_rate": 5.522631779368388e-05, + "loss": 0.0259, + "step": 252830 + }, + { + "epoch": 1.63, + "learning_rate": 5.521663643932695e-05, + "loss": 0.0266, + "step": 252840 + }, + { + "epoch": 1.63, + "learning_rate": 5.5206955084970014e-05, + "loss": 0.0313, + "step": 252850 + }, + { + "epoch": 1.63, + "learning_rate": 5.519727373061309e-05, + "loss": 0.0228, + "step": 252860 + }, + { + "epoch": 1.63, + "learning_rate": 5.5187592376256146e-05, + "loss": 0.0307, + "step": 252870 + }, + { + "epoch": 1.63, + "learning_rate": 5.517791102189922e-05, + "loss": 0.0219, + "step": 252880 + }, + { + "epoch": 1.63, + "learning_rate": 5.5168229667542286e-05, + "loss": 0.0254, + "step": 252890 + }, + { + "epoch": 1.63, + "learning_rate": 5.515854831318536e-05, + "loss": 0.0263, + "step": 252900 + }, + { + "epoch": 1.63, + "learning_rate": 5.5148866958828425e-05, + "loss": 0.0256, + "step": 252910 + }, + { + "epoch": 1.63, + "learning_rate": 5.5139185604471484e-05, + "loss": 0.024, + "step": 252920 + }, + { + "epoch": 1.63, + "learning_rate": 5.512950425011456e-05, + "loss": 0.0212, + "step": 252930 + }, + { + "epoch": 1.63, + "learning_rate": 5.5119822895757624e-05, + "loss": 0.023, + "step": 252940 + }, + { + "epoch": 1.63, + "learning_rate": 5.51101415414007e-05, + "loss": 0.0353, + "step": 252950 + }, + { + "epoch": 1.63, + "learning_rate": 5.510046018704376e-05, + "loss": 0.027, + "step": 252960 + }, + { + "epoch": 1.63, + "learning_rate": 5.5090778832686836e-05, + "loss": 0.0242, + "step": 252970 + }, + { + "epoch": 1.63, + "learning_rate": 5.5081097478329895e-05, + "loss": 0.0246, + "step": 252980 + }, + { + "epoch": 1.63, + "learning_rate": 5.507141612397296e-05, + "loss": 0.0271, + "step": 252990 + }, + { + "epoch": 1.63, + "learning_rate": 5.5061734769616035e-05, + "loss": 0.0237, + "step": 253000 + }, + { + "epoch": 1.63, + "eval_cer": 0.9198508643091177, + "eval_loss": 0.018802916631102562, + "eval_runtime": 119.9935, + "eval_samples_per_second": 16.668, + "eval_steps_per_second": 4.167, + "step": 253000 + }, + { + "epoch": 1.63, + "learning_rate": 5.50520534152591e-05, + "loss": 0.0292, + "step": 253010 + }, + { + "epoch": 1.63, + "learning_rate": 5.5042372060902174e-05, + "loss": 0.0239, + "step": 253020 + }, + { + "epoch": 1.63, + "learning_rate": 5.503269070654523e-05, + "loss": 0.0221, + "step": 253030 + }, + { + "epoch": 1.63, + "learning_rate": 5.5023009352188306e-05, + "loss": 0.0239, + "step": 253040 + }, + { + "epoch": 1.63, + "learning_rate": 5.501332799783137e-05, + "loss": 0.023, + "step": 253050 + }, + { + "epoch": 1.63, + "learning_rate": 5.500364664347444e-05, + "loss": 0.0234, + "step": 253060 + }, + { + "epoch": 1.63, + "learning_rate": 5.499396528911751e-05, + "loss": 0.0289, + "step": 253070 + }, + { + "epoch": 1.63, + "learning_rate": 5.498428393476057e-05, + "loss": 0.0263, + "step": 253080 + }, + { + "epoch": 1.63, + "learning_rate": 5.4974602580403644e-05, + "loss": 0.0207, + "step": 253090 + }, + { + "epoch": 1.63, + "learning_rate": 5.496492122604671e-05, + "loss": 0.0227, + "step": 253100 + }, + { + "epoch": 1.63, + "learning_rate": 5.4955239871689784e-05, + "loss": 0.0216, + "step": 253110 + }, + { + "epoch": 1.63, + "learning_rate": 5.494555851733285e-05, + "loss": 0.0287, + "step": 253120 + }, + { + "epoch": 1.63, + "learning_rate": 5.493587716297591e-05, + "loss": 0.0237, + "step": 253130 + }, + { + "epoch": 1.63, + "learning_rate": 5.492619580861898e-05, + "loss": 0.0278, + "step": 253140 + }, + { + "epoch": 1.63, + "learning_rate": 5.491651445426205e-05, + "loss": 0.0215, + "step": 253150 + }, + { + "epoch": 1.63, + "learning_rate": 5.490683309990512e-05, + "loss": 0.0302, + "step": 253160 + }, + { + "epoch": 1.63, + "learning_rate": 5.489715174554819e-05, + "loss": 0.0266, + "step": 253170 + }, + { + "epoch": 1.63, + "learning_rate": 5.4887470391191254e-05, + "loss": 0.029, + "step": 253180 + }, + { + "epoch": 1.63, + "learning_rate": 5.487778903683432e-05, + "loss": 0.0227, + "step": 253190 + }, + { + "epoch": 1.63, + "learning_rate": 5.4868107682477387e-05, + "loss": 0.0254, + "step": 253200 + }, + { + "epoch": 1.63, + "learning_rate": 5.485842632812046e-05, + "loss": 0.0245, + "step": 253210 + }, + { + "epoch": 1.63, + "learning_rate": 5.4848744973763526e-05, + "loss": 0.0251, + "step": 253220 + }, + { + "epoch": 1.63, + "learning_rate": 5.483906361940659e-05, + "loss": 0.0233, + "step": 253230 + }, + { + "epoch": 1.63, + "learning_rate": 5.482938226504966e-05, + "loss": 0.0211, + "step": 253240 + }, + { + "epoch": 1.63, + "learning_rate": 5.481970091069273e-05, + "loss": 0.0263, + "step": 253250 + }, + { + "epoch": 1.63, + "learning_rate": 5.48100195563358e-05, + "loss": 0.0246, + "step": 253260 + }, + { + "epoch": 1.63, + "learning_rate": 5.4800338201978864e-05, + "loss": 0.0257, + "step": 253270 + }, + { + "epoch": 1.63, + "learning_rate": 5.479065684762193e-05, + "loss": 0.0238, + "step": 253280 + }, + { + "epoch": 1.63, + "learning_rate": 5.4780975493264996e-05, + "loss": 0.0259, + "step": 253290 + }, + { + "epoch": 1.63, + "learning_rate": 5.477129413890807e-05, + "loss": 0.0283, + "step": 253300 + }, + { + "epoch": 1.63, + "learning_rate": 5.4761612784551135e-05, + "loss": 0.0229, + "step": 253310 + }, + { + "epoch": 1.63, + "learning_rate": 5.475193143019421e-05, + "loss": 0.0334, + "step": 253320 + }, + { + "epoch": 1.64, + "learning_rate": 5.474225007583727e-05, + "loss": 0.0274, + "step": 253330 + }, + { + "epoch": 1.64, + "learning_rate": 5.4732568721480334e-05, + "loss": 0.0244, + "step": 253340 + }, + { + "epoch": 1.64, + "learning_rate": 5.472288736712341e-05, + "loss": 0.0265, + "step": 253350 + }, + { + "epoch": 1.64, + "learning_rate": 5.4713206012766473e-05, + "loss": 0.0249, + "step": 253360 + }, + { + "epoch": 1.64, + "learning_rate": 5.4703524658409546e-05, + "loss": 0.0264, + "step": 253370 + }, + { + "epoch": 1.64, + "learning_rate": 5.4693843304052606e-05, + "loss": 0.0217, + "step": 253380 + }, + { + "epoch": 1.64, + "learning_rate": 5.468416194969568e-05, + "loss": 0.026, + "step": 253390 + }, + { + "epoch": 1.64, + "learning_rate": 5.4674480595338745e-05, + "loss": 0.0224, + "step": 253400 + }, + { + "epoch": 1.64, + "learning_rate": 5.466479924098181e-05, + "loss": 0.0242, + "step": 253410 + }, + { + "epoch": 1.64, + "learning_rate": 5.4655117886624884e-05, + "loss": 0.0252, + "step": 253420 + }, + { + "epoch": 1.64, + "learning_rate": 5.4645436532267944e-05, + "loss": 0.0237, + "step": 253430 + }, + { + "epoch": 1.64, + "learning_rate": 5.463575517791102e-05, + "loss": 0.0317, + "step": 253440 + }, + { + "epoch": 1.64, + "learning_rate": 5.462607382355408e-05, + "loss": 0.0287, + "step": 253450 + }, + { + "epoch": 1.64, + "learning_rate": 5.4616392469197156e-05, + "loss": 0.0237, + "step": 253460 + }, + { + "epoch": 1.64, + "learning_rate": 5.460671111484022e-05, + "loss": 0.0242, + "step": 253470 + }, + { + "epoch": 1.64, + "learning_rate": 5.459702976048328e-05, + "loss": 0.0202, + "step": 253480 + }, + { + "epoch": 1.64, + "learning_rate": 5.4587348406126355e-05, + "loss": 0.027, + "step": 253490 + }, + { + "epoch": 1.64, + "learning_rate": 5.457766705176942e-05, + "loss": 0.0237, + "step": 253500 + }, + { + "epoch": 1.64, + "learning_rate": 5.4567985697412494e-05, + "loss": 0.0231, + "step": 253510 + }, + { + "epoch": 1.64, + "learning_rate": 5.455830434305556e-05, + "loss": 0.0269, + "step": 253520 + }, + { + "epoch": 1.64, + "learning_rate": 5.454862298869863e-05, + "loss": 0.0269, + "step": 253530 + }, + { + "epoch": 1.64, + "learning_rate": 5.453894163434169e-05, + "loss": 0.0237, + "step": 253540 + }, + { + "epoch": 1.64, + "learning_rate": 5.452926027998476e-05, + "loss": 0.0261, + "step": 253550 + }, + { + "epoch": 1.64, + "learning_rate": 5.451957892562783e-05, + "loss": 0.0301, + "step": 253560 + }, + { + "epoch": 1.64, + "learning_rate": 5.45098975712709e-05, + "loss": 0.0238, + "step": 253570 + }, + { + "epoch": 1.64, + "learning_rate": 5.450021621691397e-05, + "loss": 0.0251, + "step": 253580 + }, + { + "epoch": 1.64, + "learning_rate": 5.449053486255703e-05, + "loss": 0.0247, + "step": 253590 + }, + { + "epoch": 1.64, + "learning_rate": 5.4480853508200104e-05, + "loss": 0.0231, + "step": 253600 + }, + { + "epoch": 1.64, + "learning_rate": 5.447117215384317e-05, + "loss": 0.029, + "step": 253610 + }, + { + "epoch": 1.64, + "learning_rate": 5.4461490799486236e-05, + "loss": 0.0263, + "step": 253620 + }, + { + "epoch": 1.64, + "learning_rate": 5.445180944512931e-05, + "loss": 0.025, + "step": 253630 + }, + { + "epoch": 1.64, + "learning_rate": 5.444212809077237e-05, + "loss": 0.0263, + "step": 253640 + }, + { + "epoch": 1.64, + "learning_rate": 5.443244673641544e-05, + "loss": 0.0232, + "step": 253650 + }, + { + "epoch": 1.64, + "learning_rate": 5.442276538205851e-05, + "loss": 0.0269, + "step": 253660 + }, + { + "epoch": 1.64, + "learning_rate": 5.441308402770158e-05, + "loss": 0.0225, + "step": 253670 + }, + { + "epoch": 1.64, + "learning_rate": 5.440340267334465e-05, + "loss": 0.0244, + "step": 253680 + }, + { + "epoch": 1.64, + "learning_rate": 5.439372131898771e-05, + "loss": 0.0224, + "step": 253690 + }, + { + "epoch": 1.64, + "learning_rate": 5.438403996463078e-05, + "loss": 0.0244, + "step": 253700 + }, + { + "epoch": 1.64, + "learning_rate": 5.4374358610273846e-05, + "loss": 0.0271, + "step": 253710 + }, + { + "epoch": 1.64, + "learning_rate": 5.436467725591692e-05, + "loss": 0.0331, + "step": 253720 + }, + { + "epoch": 1.64, + "learning_rate": 5.4354995901559985e-05, + "loss": 0.0212, + "step": 253730 + }, + { + "epoch": 1.64, + "learning_rate": 5.434531454720306e-05, + "loss": 0.0284, + "step": 253740 + }, + { + "epoch": 1.64, + "learning_rate": 5.433563319284612e-05, + "loss": 0.0246, + "step": 253750 + }, + { + "epoch": 1.64, + "learning_rate": 5.4325951838489184e-05, + "loss": 0.026, + "step": 253760 + }, + { + "epoch": 1.64, + "learning_rate": 5.431627048413226e-05, + "loss": 0.0235, + "step": 253770 + }, + { + "epoch": 1.64, + "learning_rate": 5.430658912977532e-05, + "loss": 0.023, + "step": 253780 + }, + { + "epoch": 1.64, + "learning_rate": 5.4296907775418396e-05, + "loss": 0.0242, + "step": 253790 + }, + { + "epoch": 1.64, + "learning_rate": 5.4287226421061456e-05, + "loss": 0.0225, + "step": 253800 + }, + { + "epoch": 1.64, + "learning_rate": 5.427754506670453e-05, + "loss": 0.0262, + "step": 253810 + }, + { + "epoch": 1.64, + "learning_rate": 5.4267863712347595e-05, + "loss": 0.0235, + "step": 253820 + }, + { + "epoch": 1.64, + "learning_rate": 5.425818235799066e-05, + "loss": 0.0251, + "step": 253830 + }, + { + "epoch": 1.64, + "learning_rate": 5.4248501003633734e-05, + "loss": 0.0278, + "step": 253840 + }, + { + "epoch": 1.64, + "learning_rate": 5.4238819649276794e-05, + "loss": 0.0229, + "step": 253850 + }, + { + "epoch": 1.64, + "learning_rate": 5.422913829491987e-05, + "loss": 0.0241, + "step": 253860 + }, + { + "epoch": 1.64, + "learning_rate": 5.421945694056293e-05, + "loss": 0.0286, + "step": 253870 + }, + { + "epoch": 1.64, + "learning_rate": 5.4209775586206006e-05, + "loss": 0.0257, + "step": 253880 + }, + { + "epoch": 1.64, + "learning_rate": 5.420009423184907e-05, + "loss": 0.0224, + "step": 253890 + }, + { + "epoch": 1.64, + "learning_rate": 5.419041287749213e-05, + "loss": 0.0241, + "step": 253900 + }, + { + "epoch": 1.64, + "learning_rate": 5.4180731523135205e-05, + "loss": 0.0294, + "step": 253910 + }, + { + "epoch": 1.64, + "learning_rate": 5.417105016877827e-05, + "loss": 0.0259, + "step": 253920 + }, + { + "epoch": 1.64, + "learning_rate": 5.4161368814421344e-05, + "loss": 0.0233, + "step": 253930 + }, + { + "epoch": 1.64, + "learning_rate": 5.415168746006441e-05, + "loss": 0.0252, + "step": 253940 + }, + { + "epoch": 1.64, + "learning_rate": 5.414200610570747e-05, + "loss": 0.0248, + "step": 253950 + }, + { + "epoch": 1.64, + "learning_rate": 5.413232475135054e-05, + "loss": 0.026, + "step": 253960 + }, + { + "epoch": 1.64, + "learning_rate": 5.412264339699361e-05, + "loss": 0.0242, + "step": 253970 + }, + { + "epoch": 1.64, + "learning_rate": 5.411296204263668e-05, + "loss": 0.027, + "step": 253980 + }, + { + "epoch": 1.64, + "learning_rate": 5.410328068827975e-05, + "loss": 0.0233, + "step": 253990 + }, + { + "epoch": 1.64, + "learning_rate": 5.409359933392282e-05, + "loss": 0.0234, + "step": 254000 + }, + { + "epoch": 1.64, + "eval_cer": 0.9198201333182692, + "eval_loss": 0.01838851161301136, + "eval_runtime": 120.0869, + "eval_samples_per_second": 16.655, + "eval_steps_per_second": 4.164, + "step": 254000 + }, + { + "epoch": 1.64, + "learning_rate": 5.408391797956588e-05, + "loss": 0.0227, + "step": 254010 + }, + { + "epoch": 1.64, + "learning_rate": 5.407423662520895e-05, + "loss": 0.0244, + "step": 254020 + }, + { + "epoch": 1.64, + "learning_rate": 5.406455527085202e-05, + "loss": 0.0237, + "step": 254030 + }, + { + "epoch": 1.64, + "learning_rate": 5.4054873916495086e-05, + "loss": 0.0224, + "step": 254040 + }, + { + "epoch": 1.64, + "learning_rate": 5.404519256213816e-05, + "loss": 0.0221, + "step": 254050 + }, + { + "epoch": 1.64, + "learning_rate": 5.403551120778122e-05, + "loss": 0.0259, + "step": 254060 + }, + { + "epoch": 1.64, + "learning_rate": 5.402582985342429e-05, + "loss": 0.0229, + "step": 254070 + }, + { + "epoch": 1.64, + "learning_rate": 5.401614849906736e-05, + "loss": 0.0246, + "step": 254080 + }, + { + "epoch": 1.64, + "learning_rate": 5.4006467144710424e-05, + "loss": 0.024, + "step": 254090 + }, + { + "epoch": 1.64, + "learning_rate": 5.39967857903535e-05, + "loss": 0.0302, + "step": 254100 + }, + { + "epoch": 1.64, + "learning_rate": 5.3987104435996557e-05, + "loss": 0.0237, + "step": 254110 + }, + { + "epoch": 1.64, + "learning_rate": 5.397742308163963e-05, + "loss": 0.0236, + "step": 254120 + }, + { + "epoch": 1.64, + "learning_rate": 5.3967741727282696e-05, + "loss": 0.0219, + "step": 254130 + }, + { + "epoch": 1.64, + "learning_rate": 5.395806037292577e-05, + "loss": 0.0232, + "step": 254140 + }, + { + "epoch": 1.64, + "learning_rate": 5.3948379018568835e-05, + "loss": 0.0292, + "step": 254150 + }, + { + "epoch": 1.64, + "learning_rate": 5.3938697664211895e-05, + "loss": 0.0238, + "step": 254160 + }, + { + "epoch": 1.64, + "learning_rate": 5.392901630985497e-05, + "loss": 0.0253, + "step": 254170 + }, + { + "epoch": 1.64, + "learning_rate": 5.3919334955498034e-05, + "loss": 0.0259, + "step": 254180 + }, + { + "epoch": 1.64, + "learning_rate": 5.390965360114111e-05, + "loss": 0.0247, + "step": 254190 + }, + { + "epoch": 1.64, + "learning_rate": 5.389997224678417e-05, + "loss": 0.0235, + "step": 254200 + }, + { + "epoch": 1.64, + "learning_rate": 5.3890290892427246e-05, + "loss": 0.0269, + "step": 254210 + }, + { + "epoch": 1.64, + "learning_rate": 5.3880609538070306e-05, + "loss": 0.0279, + "step": 254220 + }, + { + "epoch": 1.64, + "learning_rate": 5.387092818371337e-05, + "loss": 0.03, + "step": 254230 + }, + { + "epoch": 1.64, + "learning_rate": 5.3861246829356445e-05, + "loss": 0.0279, + "step": 254240 + }, + { + "epoch": 1.64, + "learning_rate": 5.385156547499951e-05, + "loss": 0.0247, + "step": 254250 + }, + { + "epoch": 1.64, + "learning_rate": 5.3841884120642584e-05, + "loss": 0.0236, + "step": 254260 + }, + { + "epoch": 1.64, + "learning_rate": 5.3832202766285644e-05, + "loss": 0.0248, + "step": 254270 + }, + { + "epoch": 1.64, + "learning_rate": 5.3822521411928717e-05, + "loss": 0.0212, + "step": 254280 + }, + { + "epoch": 1.64, + "learning_rate": 5.381284005757178e-05, + "loss": 0.0295, + "step": 254290 + }, + { + "epoch": 1.64, + "learning_rate": 5.380315870321485e-05, + "loss": 0.026, + "step": 254300 + }, + { + "epoch": 1.64, + "learning_rate": 5.379347734885792e-05, + "loss": 0.0244, + "step": 254310 + }, + { + "epoch": 1.64, + "learning_rate": 5.378379599450098e-05, + "loss": 0.0253, + "step": 254320 + }, + { + "epoch": 1.64, + "learning_rate": 5.3774114640144054e-05, + "loss": 0.026, + "step": 254330 + }, + { + "epoch": 1.64, + "learning_rate": 5.376443328578712e-05, + "loss": 0.0227, + "step": 254340 + }, + { + "epoch": 1.64, + "learning_rate": 5.3754751931430194e-05, + "loss": 0.0215, + "step": 254350 + }, + { + "epoch": 1.64, + "learning_rate": 5.374507057707326e-05, + "loss": 0.0266, + "step": 254360 + }, + { + "epoch": 1.64, + "learning_rate": 5.373538922271632e-05, + "loss": 0.0266, + "step": 254370 + }, + { + "epoch": 1.64, + "learning_rate": 5.372570786835939e-05, + "loss": 0.0225, + "step": 254380 + }, + { + "epoch": 1.64, + "learning_rate": 5.371602651400246e-05, + "loss": 0.0206, + "step": 254390 + }, + { + "epoch": 1.64, + "learning_rate": 5.370634515964553e-05, + "loss": 0.025, + "step": 254400 + }, + { + "epoch": 1.64, + "learning_rate": 5.36966638052886e-05, + "loss": 0.0263, + "step": 254410 + }, + { + "epoch": 1.64, + "learning_rate": 5.368698245093167e-05, + "loss": 0.0275, + "step": 254420 + }, + { + "epoch": 1.64, + "learning_rate": 5.367730109657473e-05, + "loss": 0.0293, + "step": 254430 + }, + { + "epoch": 1.64, + "learning_rate": 5.36676197422178e-05, + "loss": 0.0231, + "step": 254440 + }, + { + "epoch": 1.64, + "learning_rate": 5.365793838786087e-05, + "loss": 0.0314, + "step": 254450 + }, + { + "epoch": 1.64, + "learning_rate": 5.3648257033503936e-05, + "loss": 0.0325, + "step": 254460 + }, + { + "epoch": 1.64, + "learning_rate": 5.363857567914701e-05, + "loss": 0.0306, + "step": 254470 + }, + { + "epoch": 1.64, + "learning_rate": 5.362889432479007e-05, + "loss": 0.0256, + "step": 254480 + }, + { + "epoch": 1.64, + "learning_rate": 5.361921297043314e-05, + "loss": 0.0277, + "step": 254490 + }, + { + "epoch": 1.64, + "learning_rate": 5.360953161607621e-05, + "loss": 0.025, + "step": 254500 + }, + { + "epoch": 1.64, + "learning_rate": 5.3599850261719274e-05, + "loss": 0.0248, + "step": 254510 + }, + { + "epoch": 1.64, + "learning_rate": 5.359016890736235e-05, + "loss": 0.0259, + "step": 254520 + }, + { + "epoch": 1.64, + "learning_rate": 5.3580487553005406e-05, + "loss": 0.0265, + "step": 254530 + }, + { + "epoch": 1.64, + "learning_rate": 5.357080619864848e-05, + "loss": 0.0194, + "step": 254540 + }, + { + "epoch": 1.64, + "learning_rate": 5.3561124844291546e-05, + "loss": 0.0249, + "step": 254550 + }, + { + "epoch": 1.64, + "learning_rate": 5.355144348993462e-05, + "loss": 0.0244, + "step": 254560 + }, + { + "epoch": 1.64, + "learning_rate": 5.3541762135577685e-05, + "loss": 0.0259, + "step": 254570 + }, + { + "epoch": 1.64, + "learning_rate": 5.3532080781220744e-05, + "loss": 0.0266, + "step": 254580 + }, + { + "epoch": 1.64, + "learning_rate": 5.352239942686382e-05, + "loss": 0.032, + "step": 254590 + }, + { + "epoch": 1.64, + "learning_rate": 5.3512718072506884e-05, + "loss": 0.0216, + "step": 254600 + }, + { + "epoch": 1.64, + "learning_rate": 5.350303671814996e-05, + "loss": 0.0248, + "step": 254610 + }, + { + "epoch": 1.64, + "learning_rate": 5.349335536379302e-05, + "loss": 0.0246, + "step": 254620 + }, + { + "epoch": 1.64, + "learning_rate": 5.348367400943609e-05, + "loss": 0.0252, + "step": 254630 + }, + { + "epoch": 1.64, + "learning_rate": 5.3473992655079155e-05, + "loss": 0.0247, + "step": 254640 + }, + { + "epoch": 1.64, + "learning_rate": 5.346431130072222e-05, + "loss": 0.0242, + "step": 254650 + }, + { + "epoch": 1.64, + "learning_rate": 5.3454629946365295e-05, + "loss": 0.0317, + "step": 254660 + }, + { + "epoch": 1.64, + "learning_rate": 5.344494859200836e-05, + "loss": 0.0231, + "step": 254670 + }, + { + "epoch": 1.64, + "learning_rate": 5.343526723765143e-05, + "loss": 0.0221, + "step": 254680 + }, + { + "epoch": 1.64, + "learning_rate": 5.342558588329449e-05, + "loss": 0.0258, + "step": 254690 + }, + { + "epoch": 1.64, + "learning_rate": 5.3415904528937566e-05, + "loss": 0.0268, + "step": 254700 + }, + { + "epoch": 1.64, + "learning_rate": 5.340622317458063e-05, + "loss": 0.0252, + "step": 254710 + }, + { + "epoch": 1.64, + "learning_rate": 5.33965418202237e-05, + "loss": 0.0228, + "step": 254720 + }, + { + "epoch": 1.64, + "learning_rate": 5.3386860465866765e-05, + "loss": 0.0235, + "step": 254730 + }, + { + "epoch": 1.64, + "learning_rate": 5.337717911150983e-05, + "loss": 0.0282, + "step": 254740 + }, + { + "epoch": 1.64, + "learning_rate": 5.3367497757152904e-05, + "loss": 0.0274, + "step": 254750 + }, + { + "epoch": 1.64, + "learning_rate": 5.335781640279597e-05, + "loss": 0.0251, + "step": 254760 + }, + { + "epoch": 1.64, + "learning_rate": 5.3348135048439044e-05, + "loss": 0.0264, + "step": 254770 + }, + { + "epoch": 1.64, + "learning_rate": 5.33384536940821e-05, + "loss": 0.0232, + "step": 254780 + }, + { + "epoch": 1.64, + "learning_rate": 5.332877233972517e-05, + "loss": 0.025, + "step": 254790 + }, + { + "epoch": 1.64, + "learning_rate": 5.331909098536824e-05, + "loss": 0.0317, + "step": 254800 + }, + { + "epoch": 1.64, + "learning_rate": 5.330940963101131e-05, + "loss": 0.0257, + "step": 254810 + }, + { + "epoch": 1.64, + "learning_rate": 5.329972827665438e-05, + "loss": 0.0372, + "step": 254820 + }, + { + "epoch": 1.64, + "learning_rate": 5.329004692229744e-05, + "loss": 0.0227, + "step": 254830 + }, + { + "epoch": 1.64, + "learning_rate": 5.3280365567940514e-05, + "loss": 0.0203, + "step": 254840 + }, + { + "epoch": 1.64, + "learning_rate": 5.327068421358358e-05, + "loss": 0.0259, + "step": 254850 + }, + { + "epoch": 1.64, + "learning_rate": 5.3261002859226646e-05, + "loss": 0.028, + "step": 254860 + }, + { + "epoch": 1.64, + "learning_rate": 5.325132150486972e-05, + "loss": 0.0316, + "step": 254870 + }, + { + "epoch": 1.65, + "learning_rate": 5.324164015051278e-05, + "loss": 0.0266, + "step": 254880 + }, + { + "epoch": 1.65, + "learning_rate": 5.323195879615585e-05, + "loss": 0.0227, + "step": 254890 + }, + { + "epoch": 1.65, + "learning_rate": 5.322227744179892e-05, + "loss": 0.0244, + "step": 254900 + }, + { + "epoch": 1.65, + "learning_rate": 5.321259608744199e-05, + "loss": 0.0243, + "step": 254910 + }, + { + "epoch": 1.65, + "learning_rate": 5.320291473308506e-05, + "loss": 0.0303, + "step": 254920 + }, + { + "epoch": 1.65, + "learning_rate": 5.319323337872812e-05, + "loss": 0.0243, + "step": 254930 + }, + { + "epoch": 1.65, + "learning_rate": 5.318355202437119e-05, + "loss": 0.0246, + "step": 254940 + }, + { + "epoch": 1.65, + "learning_rate": 5.3173870670014256e-05, + "loss": 0.0264, + "step": 254950 + }, + { + "epoch": 1.65, + "learning_rate": 5.316418931565733e-05, + "loss": 0.0242, + "step": 254960 + }, + { + "epoch": 1.65, + "learning_rate": 5.3154507961300395e-05, + "loss": 0.025, + "step": 254970 + }, + { + "epoch": 1.65, + "learning_rate": 5.314482660694347e-05, + "loss": 0.0258, + "step": 254980 + }, + { + "epoch": 1.65, + "learning_rate": 5.313514525258653e-05, + "loss": 0.0302, + "step": 254990 + }, + { + "epoch": 1.65, + "learning_rate": 5.3125463898229594e-05, + "loss": 0.0246, + "step": 255000 + }, + { + "epoch": 1.65, + "eval_cer": 0.9198255564343012, + "eval_loss": 0.018629562109708786, + "eval_runtime": 120.0069, + "eval_samples_per_second": 16.666, + "eval_steps_per_second": 4.166, + "step": 255000 + }, + { + "epoch": 1.65, + "learning_rate": 5.311578254387267e-05, + "loss": 0.0264, + "step": 255010 + }, + { + "epoch": 1.65, + "learning_rate": 5.3106101189515733e-05, + "loss": 0.0253, + "step": 255020 + }, + { + "epoch": 1.65, + "learning_rate": 5.3096419835158806e-05, + "loss": 0.0293, + "step": 255030 + }, + { + "epoch": 1.65, + "learning_rate": 5.3086738480801866e-05, + "loss": 0.0254, + "step": 255040 + }, + { + "epoch": 1.65, + "learning_rate": 5.307705712644494e-05, + "loss": 0.0287, + "step": 255050 + }, + { + "epoch": 1.65, + "learning_rate": 5.3067375772088005e-05, + "loss": 0.0244, + "step": 255060 + }, + { + "epoch": 1.65, + "learning_rate": 5.305769441773107e-05, + "loss": 0.0248, + "step": 255070 + }, + { + "epoch": 1.65, + "learning_rate": 5.3048013063374144e-05, + "loss": 0.0252, + "step": 255080 + }, + { + "epoch": 1.65, + "learning_rate": 5.3038331709017204e-05, + "loss": 0.0268, + "step": 255090 + }, + { + "epoch": 1.65, + "learning_rate": 5.302865035466028e-05, + "loss": 0.0259, + "step": 255100 + }, + { + "epoch": 1.65, + "learning_rate": 5.301896900030334e-05, + "loss": 0.0274, + "step": 255110 + }, + { + "epoch": 1.65, + "learning_rate": 5.3009287645946416e-05, + "loss": 0.0252, + "step": 255120 + }, + { + "epoch": 1.65, + "learning_rate": 5.299960629158948e-05, + "loss": 0.0216, + "step": 255130 + }, + { + "epoch": 1.65, + "learning_rate": 5.298992493723254e-05, + "loss": 0.0259, + "step": 255140 + }, + { + "epoch": 1.65, + "learning_rate": 5.2980243582875615e-05, + "loss": 0.0232, + "step": 255150 + }, + { + "epoch": 1.65, + "learning_rate": 5.297056222851868e-05, + "loss": 0.0235, + "step": 255160 + }, + { + "epoch": 1.65, + "learning_rate": 5.2960880874161754e-05, + "loss": 0.0254, + "step": 255170 + }, + { + "epoch": 1.65, + "learning_rate": 5.295119951980482e-05, + "loss": 0.0244, + "step": 255180 + }, + { + "epoch": 1.65, + "learning_rate": 5.294151816544789e-05, + "loss": 0.0257, + "step": 255190 + }, + { + "epoch": 1.65, + "learning_rate": 5.293183681109095e-05, + "loss": 0.0261, + "step": 255200 + }, + { + "epoch": 1.65, + "learning_rate": 5.292215545673402e-05, + "loss": 0.0312, + "step": 255210 + }, + { + "epoch": 1.65, + "learning_rate": 5.291247410237709e-05, + "loss": 0.0251, + "step": 255220 + }, + { + "epoch": 1.65, + "learning_rate": 5.290279274802016e-05, + "loss": 0.0275, + "step": 255230 + }, + { + "epoch": 1.65, + "learning_rate": 5.289311139366323e-05, + "loss": 0.0238, + "step": 255240 + }, + { + "epoch": 1.65, + "learning_rate": 5.288343003930629e-05, + "loss": 0.024, + "step": 255250 + }, + { + "epoch": 1.65, + "learning_rate": 5.2873748684949364e-05, + "loss": 0.0272, + "step": 255260 + }, + { + "epoch": 1.65, + "learning_rate": 5.286406733059243e-05, + "loss": 0.0282, + "step": 255270 + }, + { + "epoch": 1.65, + "learning_rate": 5.2854385976235496e-05, + "loss": 0.0259, + "step": 255280 + }, + { + "epoch": 1.65, + "learning_rate": 5.284470462187857e-05, + "loss": 0.0293, + "step": 255290 + }, + { + "epoch": 1.65, + "learning_rate": 5.283502326752163e-05, + "loss": 0.0252, + "step": 255300 + }, + { + "epoch": 1.65, + "learning_rate": 5.28253419131647e-05, + "loss": 0.0227, + "step": 255310 + }, + { + "epoch": 1.65, + "learning_rate": 5.281566055880777e-05, + "loss": 0.0306, + "step": 255320 + }, + { + "epoch": 1.65, + "learning_rate": 5.280597920445084e-05, + "loss": 0.0253, + "step": 255330 + }, + { + "epoch": 1.65, + "learning_rate": 5.279629785009391e-05, + "loss": 0.0273, + "step": 255340 + }, + { + "epoch": 1.65, + "learning_rate": 5.278661649573697e-05, + "loss": 0.0287, + "step": 255350 + }, + { + "epoch": 1.65, + "learning_rate": 5.277693514138004e-05, + "loss": 0.0235, + "step": 255360 + }, + { + "epoch": 1.65, + "learning_rate": 5.2767253787023106e-05, + "loss": 0.022, + "step": 255370 + }, + { + "epoch": 1.65, + "learning_rate": 5.275757243266618e-05, + "loss": 0.0245, + "step": 255380 + }, + { + "epoch": 1.65, + "learning_rate": 5.2747891078309245e-05, + "loss": 0.0211, + "step": 255390 + }, + { + "epoch": 1.65, + "learning_rate": 5.273820972395232e-05, + "loss": 0.0237, + "step": 255400 + }, + { + "epoch": 1.65, + "learning_rate": 5.272852836959538e-05, + "loss": 0.0276, + "step": 255410 + }, + { + "epoch": 1.65, + "learning_rate": 5.2718847015238444e-05, + "loss": 0.0211, + "step": 255420 + }, + { + "epoch": 1.65, + "learning_rate": 5.270916566088152e-05, + "loss": 0.022, + "step": 255430 + }, + { + "epoch": 1.65, + "learning_rate": 5.269948430652458e-05, + "loss": 0.028, + "step": 255440 + }, + { + "epoch": 1.65, + "learning_rate": 5.2689802952167656e-05, + "loss": 0.0282, + "step": 255450 + }, + { + "epoch": 1.65, + "learning_rate": 5.2680121597810716e-05, + "loss": 0.028, + "step": 255460 + }, + { + "epoch": 1.65, + "learning_rate": 5.267044024345379e-05, + "loss": 0.0224, + "step": 255470 + }, + { + "epoch": 1.65, + "learning_rate": 5.2660758889096855e-05, + "loss": 0.0225, + "step": 255480 + }, + { + "epoch": 1.65, + "learning_rate": 5.265107753473992e-05, + "loss": 0.0235, + "step": 255490 + }, + { + "epoch": 1.65, + "learning_rate": 5.2641396180382994e-05, + "loss": 0.0247, + "step": 255500 + }, + { + "epoch": 1.65, + "learning_rate": 5.2631714826026054e-05, + "loss": 0.0225, + "step": 255510 + }, + { + "epoch": 1.65, + "learning_rate": 5.262203347166913e-05, + "loss": 0.0326, + "step": 255520 + }, + { + "epoch": 1.65, + "learning_rate": 5.261235211731219e-05, + "loss": 0.0274, + "step": 255530 + }, + { + "epoch": 1.65, + "learning_rate": 5.2602670762955266e-05, + "loss": 0.0286, + "step": 255540 + }, + { + "epoch": 1.65, + "learning_rate": 5.259298940859833e-05, + "loss": 0.0216, + "step": 255550 + }, + { + "epoch": 1.65, + "learning_rate": 5.258330805424139e-05, + "loss": 0.0238, + "step": 255560 + }, + { + "epoch": 1.65, + "learning_rate": 5.2573626699884465e-05, + "loss": 0.0204, + "step": 255570 + }, + { + "epoch": 1.65, + "learning_rate": 5.256394534552753e-05, + "loss": 0.0242, + "step": 255580 + }, + { + "epoch": 1.65, + "learning_rate": 5.2554263991170604e-05, + "loss": 0.0272, + "step": 255590 + }, + { + "epoch": 1.65, + "learning_rate": 5.254458263681367e-05, + "loss": 0.024, + "step": 255600 + }, + { + "epoch": 1.65, + "learning_rate": 5.253490128245674e-05, + "loss": 0.0243, + "step": 255610 + }, + { + "epoch": 1.65, + "learning_rate": 5.25252199280998e-05, + "loss": 0.023, + "step": 255620 + }, + { + "epoch": 1.65, + "learning_rate": 5.251553857374287e-05, + "loss": 0.022, + "step": 255630 + }, + { + "epoch": 1.65, + "learning_rate": 5.250585721938594e-05, + "loss": 0.0249, + "step": 255640 + }, + { + "epoch": 1.65, + "learning_rate": 5.249617586502901e-05, + "loss": 0.0247, + "step": 255650 + }, + { + "epoch": 1.65, + "learning_rate": 5.248649451067208e-05, + "loss": 0.0223, + "step": 255660 + }, + { + "epoch": 1.65, + "learning_rate": 5.247681315631514e-05, + "loss": 0.0293, + "step": 255670 + }, + { + "epoch": 1.65, + "learning_rate": 5.246713180195821e-05, + "loss": 0.0271, + "step": 255680 + }, + { + "epoch": 1.65, + "learning_rate": 5.245745044760128e-05, + "loss": 0.0226, + "step": 255690 + }, + { + "epoch": 1.65, + "learning_rate": 5.2447769093244346e-05, + "loss": 0.0237, + "step": 255700 + }, + { + "epoch": 1.65, + "learning_rate": 5.243808773888742e-05, + "loss": 0.0227, + "step": 255710 + }, + { + "epoch": 1.65, + "learning_rate": 5.242840638453048e-05, + "loss": 0.0245, + "step": 255720 + }, + { + "epoch": 1.65, + "learning_rate": 5.241872503017355e-05, + "loss": 0.0268, + "step": 255730 + }, + { + "epoch": 1.65, + "learning_rate": 5.240904367581662e-05, + "loss": 0.0264, + "step": 255740 + }, + { + "epoch": 1.65, + "learning_rate": 5.2399362321459684e-05, + "loss": 0.0217, + "step": 255750 + }, + { + "epoch": 1.65, + "learning_rate": 5.238968096710276e-05, + "loss": 0.0281, + "step": 255760 + }, + { + "epoch": 1.65, + "learning_rate": 5.2379999612745817e-05, + "loss": 0.0232, + "step": 255770 + }, + { + "epoch": 1.65, + "learning_rate": 5.237031825838889e-05, + "loss": 0.0208, + "step": 255780 + }, + { + "epoch": 1.65, + "learning_rate": 5.2360636904031956e-05, + "loss": 0.0299, + "step": 255790 + }, + { + "epoch": 1.65, + "learning_rate": 5.235095554967503e-05, + "loss": 0.0237, + "step": 255800 + }, + { + "epoch": 1.65, + "learning_rate": 5.2341274195318095e-05, + "loss": 0.0243, + "step": 255810 + }, + { + "epoch": 1.65, + "learning_rate": 5.2331592840961155e-05, + "loss": 0.0248, + "step": 255820 + }, + { + "epoch": 1.65, + "learning_rate": 5.232191148660423e-05, + "loss": 0.0226, + "step": 255830 + }, + { + "epoch": 1.65, + "learning_rate": 5.2312230132247294e-05, + "loss": 0.0232, + "step": 255840 + }, + { + "epoch": 1.65, + "learning_rate": 5.230254877789037e-05, + "loss": 0.026, + "step": 255850 + }, + { + "epoch": 1.65, + "learning_rate": 5.229286742353343e-05, + "loss": 0.0209, + "step": 255860 + }, + { + "epoch": 1.65, + "learning_rate": 5.22831860691765e-05, + "loss": 0.0185, + "step": 255870 + }, + { + "epoch": 1.65, + "learning_rate": 5.2273504714819566e-05, + "loss": 0.0249, + "step": 255880 + }, + { + "epoch": 1.65, + "learning_rate": 5.226382336046263e-05, + "loss": 0.0215, + "step": 255890 + }, + { + "epoch": 1.65, + "learning_rate": 5.2254142006105705e-05, + "loss": 0.0246, + "step": 255900 + }, + { + "epoch": 1.65, + "learning_rate": 5.224446065174877e-05, + "loss": 0.0265, + "step": 255910 + }, + { + "epoch": 1.65, + "learning_rate": 5.223477929739184e-05, + "loss": 0.0228, + "step": 255920 + }, + { + "epoch": 1.65, + "learning_rate": 5.2225097943034903e-05, + "loss": 0.0235, + "step": 255930 + }, + { + "epoch": 1.65, + "learning_rate": 5.2215416588677976e-05, + "loss": 0.0233, + "step": 255940 + }, + { + "epoch": 1.65, + "learning_rate": 5.220573523432104e-05, + "loss": 0.025, + "step": 255950 + }, + { + "epoch": 1.65, + "learning_rate": 5.219605387996411e-05, + "loss": 0.0236, + "step": 255960 + }, + { + "epoch": 1.65, + "learning_rate": 5.2186372525607175e-05, + "loss": 0.0238, + "step": 255970 + }, + { + "epoch": 1.65, + "learning_rate": 5.217669117125024e-05, + "loss": 0.0246, + "step": 255980 + }, + { + "epoch": 1.65, + "learning_rate": 5.2167009816893314e-05, + "loss": 0.023, + "step": 255990 + }, + { + "epoch": 1.65, + "learning_rate": 5.215732846253638e-05, + "loss": 0.0213, + "step": 256000 + }, + { + "epoch": 1.65, + "eval_cer": 0.9198852107106542, + "eval_loss": 0.018240749835968018, + "eval_runtime": 120.0265, + "eval_samples_per_second": 16.663, + "eval_steps_per_second": 4.166, + "step": 256000 + }, + { + "epoch": 1.65, + "learning_rate": 5.2147647108179454e-05, + "loss": 0.0221, + "step": 256010 + }, + { + "epoch": 1.65, + "learning_rate": 5.213796575382251e-05, + "loss": 0.0277, + "step": 256020 + }, + { + "epoch": 1.65, + "learning_rate": 5.212828439946558e-05, + "loss": 0.0244, + "step": 256030 + }, + { + "epoch": 1.65, + "learning_rate": 5.211860304510865e-05, + "loss": 0.0221, + "step": 256040 + }, + { + "epoch": 1.65, + "learning_rate": 5.210892169075172e-05, + "loss": 0.0308, + "step": 256050 + }, + { + "epoch": 1.65, + "learning_rate": 5.209924033639479e-05, + "loss": 0.0227, + "step": 256060 + }, + { + "epoch": 1.65, + "learning_rate": 5.208955898203785e-05, + "loss": 0.0282, + "step": 256070 + }, + { + "epoch": 1.65, + "learning_rate": 5.2079877627680924e-05, + "loss": 0.0243, + "step": 256080 + }, + { + "epoch": 1.65, + "learning_rate": 5.207019627332399e-05, + "loss": 0.0243, + "step": 256090 + }, + { + "epoch": 1.65, + "learning_rate": 5.206051491896706e-05, + "loss": 0.0246, + "step": 256100 + }, + { + "epoch": 1.65, + "learning_rate": 5.205083356461013e-05, + "loss": 0.0224, + "step": 256110 + }, + { + "epoch": 1.65, + "learning_rate": 5.204115221025319e-05, + "loss": 0.0233, + "step": 256120 + }, + { + "epoch": 1.65, + "learning_rate": 5.203147085589626e-05, + "loss": 0.0204, + "step": 256130 + }, + { + "epoch": 1.65, + "learning_rate": 5.202178950153933e-05, + "loss": 0.0253, + "step": 256140 + }, + { + "epoch": 1.65, + "learning_rate": 5.20121081471824e-05, + "loss": 0.0201, + "step": 256150 + }, + { + "epoch": 1.65, + "learning_rate": 5.200242679282547e-05, + "loss": 0.0241, + "step": 256160 + }, + { + "epoch": 1.65, + "learning_rate": 5.199274543846853e-05, + "loss": 0.028, + "step": 256170 + }, + { + "epoch": 1.65, + "learning_rate": 5.19830640841116e-05, + "loss": 0.0233, + "step": 256180 + }, + { + "epoch": 1.65, + "learning_rate": 5.1973382729754666e-05, + "loss": 0.029, + "step": 256190 + }, + { + "epoch": 1.65, + "learning_rate": 5.196370137539774e-05, + "loss": 0.031, + "step": 256200 + }, + { + "epoch": 1.65, + "learning_rate": 5.1954020021040806e-05, + "loss": 0.0274, + "step": 256210 + }, + { + "epoch": 1.65, + "learning_rate": 5.194433866668388e-05, + "loss": 0.0261, + "step": 256220 + }, + { + "epoch": 1.65, + "learning_rate": 5.193465731232694e-05, + "loss": 0.0257, + "step": 256230 + }, + { + "epoch": 1.65, + "learning_rate": 5.1924975957970004e-05, + "loss": 0.0277, + "step": 256240 + }, + { + "epoch": 1.65, + "learning_rate": 5.191529460361308e-05, + "loss": 0.0307, + "step": 256250 + }, + { + "epoch": 1.65, + "learning_rate": 5.1905613249256144e-05, + "loss": 0.0229, + "step": 256260 + }, + { + "epoch": 1.65, + "learning_rate": 5.1895931894899217e-05, + "loss": 0.0226, + "step": 256270 + }, + { + "epoch": 1.65, + "learning_rate": 5.1886250540542276e-05, + "loss": 0.0218, + "step": 256280 + }, + { + "epoch": 1.65, + "learning_rate": 5.187656918618535e-05, + "loss": 0.0256, + "step": 256290 + }, + { + "epoch": 1.65, + "learning_rate": 5.1866887831828415e-05, + "loss": 0.024, + "step": 256300 + }, + { + "epoch": 1.65, + "learning_rate": 5.185720647747148e-05, + "loss": 0.0236, + "step": 256310 + }, + { + "epoch": 1.65, + "learning_rate": 5.1847525123114555e-05, + "loss": 0.0238, + "step": 256320 + }, + { + "epoch": 1.65, + "learning_rate": 5.1837843768757614e-05, + "loss": 0.0225, + "step": 256330 + }, + { + "epoch": 1.65, + "learning_rate": 5.182816241440069e-05, + "loss": 0.0232, + "step": 256340 + }, + { + "epoch": 1.65, + "learning_rate": 5.181848106004375e-05, + "loss": 0.0231, + "step": 256350 + }, + { + "epoch": 1.65, + "learning_rate": 5.1808799705686826e-05, + "loss": 0.0253, + "step": 256360 + }, + { + "epoch": 1.65, + "learning_rate": 5.179911835132989e-05, + "loss": 0.0269, + "step": 256370 + }, + { + "epoch": 1.65, + "learning_rate": 5.178943699697295e-05, + "loss": 0.0256, + "step": 256380 + }, + { + "epoch": 1.65, + "learning_rate": 5.1779755642616025e-05, + "loss": 0.0227, + "step": 256390 + }, + { + "epoch": 1.65, + "learning_rate": 5.177007428825909e-05, + "loss": 0.0213, + "step": 256400 + }, + { + "epoch": 1.65, + "learning_rate": 5.1760392933902164e-05, + "loss": 0.0261, + "step": 256410 + }, + { + "epoch": 1.65, + "learning_rate": 5.175071157954523e-05, + "loss": 0.0254, + "step": 256420 + }, + { + "epoch": 1.66, + "learning_rate": 5.1741030225188304e-05, + "loss": 0.0246, + "step": 256430 + }, + { + "epoch": 1.66, + "learning_rate": 5.173134887083136e-05, + "loss": 0.0212, + "step": 256440 + }, + { + "epoch": 1.66, + "learning_rate": 5.172166751647443e-05, + "loss": 0.0241, + "step": 256450 + }, + { + "epoch": 1.66, + "learning_rate": 5.17119861621175e-05, + "loss": 0.0231, + "step": 256460 + }, + { + "epoch": 1.66, + "learning_rate": 5.170230480776057e-05, + "loss": 0.0272, + "step": 256470 + }, + { + "epoch": 1.66, + "learning_rate": 5.169262345340364e-05, + "loss": 0.0256, + "step": 256480 + }, + { + "epoch": 1.66, + "learning_rate": 5.16829420990467e-05, + "loss": 0.0263, + "step": 256490 + }, + { + "epoch": 1.66, + "learning_rate": 5.1673260744689774e-05, + "loss": 0.0216, + "step": 256500 + }, + { + "epoch": 1.66, + "learning_rate": 5.166357939033284e-05, + "loss": 0.0302, + "step": 256510 + }, + { + "epoch": 1.66, + "learning_rate": 5.1653898035975906e-05, + "loss": 0.0285, + "step": 256520 + }, + { + "epoch": 1.66, + "learning_rate": 5.164421668161898e-05, + "loss": 0.0324, + "step": 256530 + }, + { + "epoch": 1.66, + "learning_rate": 5.163453532726204e-05, + "loss": 0.0252, + "step": 256540 + }, + { + "epoch": 1.66, + "learning_rate": 5.162485397290511e-05, + "loss": 0.0209, + "step": 256550 + }, + { + "epoch": 1.66, + "learning_rate": 5.161517261854818e-05, + "loss": 0.0251, + "step": 256560 + }, + { + "epoch": 1.66, + "learning_rate": 5.160549126419125e-05, + "loss": 0.0247, + "step": 256570 + }, + { + "epoch": 1.66, + "learning_rate": 5.159580990983432e-05, + "loss": 0.0272, + "step": 256580 + }, + { + "epoch": 1.66, + "learning_rate": 5.158612855547738e-05, + "loss": 0.0256, + "step": 256590 + }, + { + "epoch": 1.66, + "learning_rate": 5.157644720112045e-05, + "loss": 0.0202, + "step": 256600 + }, + { + "epoch": 1.66, + "learning_rate": 5.1566765846763516e-05, + "loss": 0.031, + "step": 256610 + }, + { + "epoch": 1.66, + "learning_rate": 5.155708449240659e-05, + "loss": 0.0253, + "step": 256620 + }, + { + "epoch": 1.66, + "learning_rate": 5.1547403138049655e-05, + "loss": 0.026, + "step": 256630 + }, + { + "epoch": 1.66, + "learning_rate": 5.153772178369273e-05, + "loss": 0.026, + "step": 256640 + }, + { + "epoch": 1.66, + "learning_rate": 5.152804042933579e-05, + "loss": 0.023, + "step": 256650 + }, + { + "epoch": 1.66, + "learning_rate": 5.1518359074978854e-05, + "loss": 0.0238, + "step": 256660 + }, + { + "epoch": 1.66, + "learning_rate": 5.150867772062193e-05, + "loss": 0.0229, + "step": 256670 + }, + { + "epoch": 1.66, + "learning_rate": 5.149899636626499e-05, + "loss": 0.025, + "step": 256680 + }, + { + "epoch": 1.66, + "learning_rate": 5.1489315011908066e-05, + "loss": 0.0276, + "step": 256690 + }, + { + "epoch": 1.66, + "learning_rate": 5.1479633657551126e-05, + "loss": 0.0275, + "step": 256700 + }, + { + "epoch": 1.66, + "learning_rate": 5.14699523031942e-05, + "loss": 0.0288, + "step": 256710 + }, + { + "epoch": 1.66, + "learning_rate": 5.1460270948837265e-05, + "loss": 0.0208, + "step": 256720 + }, + { + "epoch": 1.66, + "learning_rate": 5.145058959448033e-05, + "loss": 0.0225, + "step": 256730 + }, + { + "epoch": 1.66, + "learning_rate": 5.1440908240123404e-05, + "loss": 0.0244, + "step": 256740 + }, + { + "epoch": 1.66, + "learning_rate": 5.1431226885766464e-05, + "loss": 0.0228, + "step": 256750 + }, + { + "epoch": 1.66, + "learning_rate": 5.142154553140954e-05, + "loss": 0.0252, + "step": 256760 + }, + { + "epoch": 1.66, + "learning_rate": 5.14118641770526e-05, + "loss": 0.0229, + "step": 256770 + }, + { + "epoch": 1.66, + "learning_rate": 5.1402182822695676e-05, + "loss": 0.0254, + "step": 256780 + }, + { + "epoch": 1.66, + "learning_rate": 5.139250146833874e-05, + "loss": 0.0196, + "step": 256790 + }, + { + "epoch": 1.66, + "learning_rate": 5.13828201139818e-05, + "loss": 0.0284, + "step": 256800 + }, + { + "epoch": 1.66, + "learning_rate": 5.1373138759624875e-05, + "loss": 0.0244, + "step": 256810 + }, + { + "epoch": 1.66, + "learning_rate": 5.136345740526794e-05, + "loss": 0.0243, + "step": 256820 + }, + { + "epoch": 1.66, + "learning_rate": 5.1353776050911014e-05, + "loss": 0.0291, + "step": 256830 + }, + { + "epoch": 1.66, + "learning_rate": 5.134409469655408e-05, + "loss": 0.0254, + "step": 256840 + }, + { + "epoch": 1.66, + "learning_rate": 5.133441334219715e-05, + "loss": 0.0201, + "step": 256850 + }, + { + "epoch": 1.66, + "learning_rate": 5.132473198784021e-05, + "loss": 0.0275, + "step": 256860 + }, + { + "epoch": 1.66, + "learning_rate": 5.131505063348328e-05, + "loss": 0.0202, + "step": 256870 + }, + { + "epoch": 1.66, + "learning_rate": 5.130536927912635e-05, + "loss": 0.02, + "step": 256880 + }, + { + "epoch": 1.66, + "learning_rate": 5.129568792476942e-05, + "loss": 0.0234, + "step": 256890 + }, + { + "epoch": 1.66, + "learning_rate": 5.128600657041249e-05, + "loss": 0.0211, + "step": 256900 + }, + { + "epoch": 1.66, + "learning_rate": 5.127632521605555e-05, + "loss": 0.0208, + "step": 256910 + }, + { + "epoch": 1.66, + "learning_rate": 5.1266643861698624e-05, + "loss": 0.0257, + "step": 256920 + }, + { + "epoch": 1.66, + "learning_rate": 5.125696250734169e-05, + "loss": 0.0256, + "step": 256930 + }, + { + "epoch": 1.66, + "learning_rate": 5.1247281152984756e-05, + "loss": 0.0203, + "step": 256940 + }, + { + "epoch": 1.66, + "learning_rate": 5.123759979862783e-05, + "loss": 0.03, + "step": 256950 + }, + { + "epoch": 1.66, + "learning_rate": 5.122791844427089e-05, + "loss": 0.0251, + "step": 256960 + }, + { + "epoch": 1.66, + "learning_rate": 5.121823708991396e-05, + "loss": 0.0238, + "step": 256970 + }, + { + "epoch": 1.66, + "learning_rate": 5.120855573555703e-05, + "loss": 0.024, + "step": 256980 + }, + { + "epoch": 1.66, + "learning_rate": 5.11988743812001e-05, + "loss": 0.0221, + "step": 256990 + }, + { + "epoch": 1.66, + "learning_rate": 5.118919302684317e-05, + "loss": 0.0251, + "step": 257000 + }, + { + "epoch": 1.66, + "eval_cer": 0.9198481527511015, + "eval_loss": 0.018239615485072136, + "eval_runtime": 120.1756, + "eval_samples_per_second": 16.642, + "eval_steps_per_second": 4.161, + "step": 257000 + }, + { + "epoch": 1.66, + "learning_rate": 5.117951167248623e-05, + "loss": 0.0253, + "step": 257010 + }, + { + "epoch": 1.66, + "learning_rate": 5.11698303181293e-05, + "loss": 0.0239, + "step": 257020 + }, + { + "epoch": 1.66, + "learning_rate": 5.1160148963772366e-05, + "loss": 0.0207, + "step": 257030 + }, + { + "epoch": 1.66, + "learning_rate": 5.115046760941544e-05, + "loss": 0.0246, + "step": 257040 + }, + { + "epoch": 1.66, + "learning_rate": 5.1140786255058505e-05, + "loss": 0.031, + "step": 257050 + }, + { + "epoch": 1.66, + "learning_rate": 5.113110490070158e-05, + "loss": 0.0264, + "step": 257060 + }, + { + "epoch": 1.66, + "learning_rate": 5.112142354634464e-05, + "loss": 0.0231, + "step": 257070 + }, + { + "epoch": 1.66, + "learning_rate": 5.1111742191987704e-05, + "loss": 0.0209, + "step": 257080 + }, + { + "epoch": 1.66, + "learning_rate": 5.110206083763078e-05, + "loss": 0.0233, + "step": 257090 + }, + { + "epoch": 1.66, + "learning_rate": 5.109237948327384e-05, + "loss": 0.0229, + "step": 257100 + }, + { + "epoch": 1.66, + "learning_rate": 5.1082698128916916e-05, + "loss": 0.0223, + "step": 257110 + }, + { + "epoch": 1.66, + "learning_rate": 5.1073016774559976e-05, + "loss": 0.0279, + "step": 257120 + }, + { + "epoch": 1.66, + "learning_rate": 5.106333542020305e-05, + "loss": 0.0223, + "step": 257130 + }, + { + "epoch": 1.66, + "learning_rate": 5.1053654065846115e-05, + "loss": 0.0272, + "step": 257140 + }, + { + "epoch": 1.66, + "learning_rate": 5.104397271148918e-05, + "loss": 0.0284, + "step": 257150 + }, + { + "epoch": 1.66, + "learning_rate": 5.1034291357132254e-05, + "loss": 0.0212, + "step": 257160 + }, + { + "epoch": 1.66, + "learning_rate": 5.1024610002775314e-05, + "loss": 0.0253, + "step": 257170 + }, + { + "epoch": 1.66, + "learning_rate": 5.101492864841839e-05, + "loss": 0.0214, + "step": 257180 + }, + { + "epoch": 1.66, + "learning_rate": 5.100524729406145e-05, + "loss": 0.0284, + "step": 257190 + }, + { + "epoch": 1.66, + "learning_rate": 5.0995565939704526e-05, + "loss": 0.0224, + "step": 257200 + }, + { + "epoch": 1.66, + "learning_rate": 5.098588458534759e-05, + "loss": 0.0243, + "step": 257210 + }, + { + "epoch": 1.66, + "learning_rate": 5.097620323099065e-05, + "loss": 0.0263, + "step": 257220 + }, + { + "epoch": 1.66, + "learning_rate": 5.0966521876633725e-05, + "loss": 0.0223, + "step": 257230 + }, + { + "epoch": 1.66, + "learning_rate": 5.095684052227679e-05, + "loss": 0.0283, + "step": 257240 + }, + { + "epoch": 1.66, + "learning_rate": 5.0947159167919864e-05, + "loss": 0.0261, + "step": 257250 + }, + { + "epoch": 1.66, + "learning_rate": 5.093747781356293e-05, + "loss": 0.0231, + "step": 257260 + }, + { + "epoch": 1.66, + "learning_rate": 5.0927796459205996e-05, + "loss": 0.0238, + "step": 257270 + }, + { + "epoch": 1.66, + "learning_rate": 5.091811510484906e-05, + "loss": 0.0238, + "step": 257280 + }, + { + "epoch": 1.66, + "learning_rate": 5.090843375049213e-05, + "loss": 0.0261, + "step": 257290 + }, + { + "epoch": 1.66, + "learning_rate": 5.08987523961352e-05, + "loss": 0.0235, + "step": 257300 + }, + { + "epoch": 1.66, + "learning_rate": 5.088907104177827e-05, + "loss": 0.0233, + "step": 257310 + }, + { + "epoch": 1.66, + "learning_rate": 5.0879389687421334e-05, + "loss": 0.03, + "step": 257320 + }, + { + "epoch": 1.66, + "learning_rate": 5.08697083330644e-05, + "loss": 0.0264, + "step": 257330 + }, + { + "epoch": 1.66, + "learning_rate": 5.0860026978707474e-05, + "loss": 0.0261, + "step": 257340 + }, + { + "epoch": 1.66, + "learning_rate": 5.085034562435054e-05, + "loss": 0.0286, + "step": 257350 + }, + { + "epoch": 1.66, + "learning_rate": 5.0840664269993606e-05, + "loss": 0.0285, + "step": 257360 + }, + { + "epoch": 1.66, + "learning_rate": 5.083098291563667e-05, + "loss": 0.0258, + "step": 257370 + }, + { + "epoch": 1.66, + "learning_rate": 5.082130156127974e-05, + "loss": 0.0223, + "step": 257380 + }, + { + "epoch": 1.66, + "learning_rate": 5.081162020692281e-05, + "loss": 0.0285, + "step": 257390 + }, + { + "epoch": 1.66, + "learning_rate": 5.080193885256588e-05, + "loss": 0.0267, + "step": 257400 + }, + { + "epoch": 1.66, + "learning_rate": 5.0792257498208944e-05, + "loss": 0.0285, + "step": 257410 + }, + { + "epoch": 1.66, + "learning_rate": 5.078257614385201e-05, + "loss": 0.0194, + "step": 257420 + }, + { + "epoch": 1.66, + "learning_rate": 5.0772894789495077e-05, + "loss": 0.0314, + "step": 257430 + }, + { + "epoch": 1.66, + "learning_rate": 5.076321343513815e-05, + "loss": 0.0273, + "step": 257440 + }, + { + "epoch": 1.66, + "learning_rate": 5.0753532080781216e-05, + "loss": 0.0293, + "step": 257450 + }, + { + "epoch": 1.66, + "learning_rate": 5.074385072642429e-05, + "loss": 0.0219, + "step": 257460 + }, + { + "epoch": 1.66, + "learning_rate": 5.073416937206735e-05, + "loss": 0.0265, + "step": 257470 + }, + { + "epoch": 1.66, + "learning_rate": 5.0724488017710414e-05, + "loss": 0.0227, + "step": 257480 + }, + { + "epoch": 1.66, + "learning_rate": 5.071480666335349e-05, + "loss": 0.0225, + "step": 257490 + }, + { + "epoch": 1.66, + "learning_rate": 5.0705125308996554e-05, + "loss": 0.0217, + "step": 257500 + }, + { + "epoch": 1.66, + "learning_rate": 5.069544395463963e-05, + "loss": 0.0259, + "step": 257510 + }, + { + "epoch": 1.66, + "learning_rate": 5.0685762600282686e-05, + "loss": 0.0256, + "step": 257520 + }, + { + "epoch": 1.66, + "learning_rate": 5.067608124592576e-05, + "loss": 0.0295, + "step": 257530 + }, + { + "epoch": 1.66, + "learning_rate": 5.0666399891568825e-05, + "loss": 0.0217, + "step": 257540 + }, + { + "epoch": 1.66, + "learning_rate": 5.065671853721189e-05, + "loss": 0.0292, + "step": 257550 + }, + { + "epoch": 1.66, + "learning_rate": 5.0647037182854965e-05, + "loss": 0.0207, + "step": 257560 + }, + { + "epoch": 1.66, + "learning_rate": 5.0637355828498024e-05, + "loss": 0.0243, + "step": 257570 + }, + { + "epoch": 1.66, + "learning_rate": 5.06276744741411e-05, + "loss": 0.026, + "step": 257580 + }, + { + "epoch": 1.66, + "learning_rate": 5.0617993119784163e-05, + "loss": 0.0215, + "step": 257590 + }, + { + "epoch": 1.66, + "learning_rate": 5.0608311765427236e-05, + "loss": 0.0289, + "step": 257600 + }, + { + "epoch": 1.66, + "learning_rate": 5.05986304110703e-05, + "loss": 0.0292, + "step": 257610 + }, + { + "epoch": 1.66, + "learning_rate": 5.058894905671336e-05, + "loss": 0.0268, + "step": 257620 + }, + { + "epoch": 1.66, + "learning_rate": 5.0579267702356435e-05, + "loss": 0.0269, + "step": 257630 + }, + { + "epoch": 1.66, + "learning_rate": 5.05695863479995e-05, + "loss": 0.0237, + "step": 257640 + }, + { + "epoch": 1.66, + "learning_rate": 5.0559904993642574e-05, + "loss": 0.0307, + "step": 257650 + }, + { + "epoch": 1.66, + "learning_rate": 5.055022363928564e-05, + "loss": 0.0245, + "step": 257660 + }, + { + "epoch": 1.66, + "learning_rate": 5.0540542284928714e-05, + "loss": 0.023, + "step": 257670 + }, + { + "epoch": 1.66, + "learning_rate": 5.053086093057177e-05, + "loss": 0.0202, + "step": 257680 + }, + { + "epoch": 1.66, + "learning_rate": 5.052117957621484e-05, + "loss": 0.0255, + "step": 257690 + }, + { + "epoch": 1.66, + "learning_rate": 5.051149822185791e-05, + "loss": 0.0224, + "step": 257700 + }, + { + "epoch": 1.66, + "learning_rate": 5.050181686750098e-05, + "loss": 0.0279, + "step": 257710 + }, + { + "epoch": 1.66, + "learning_rate": 5.049213551314405e-05, + "loss": 0.0235, + "step": 257720 + }, + { + "epoch": 1.66, + "learning_rate": 5.048245415878711e-05, + "loss": 0.0264, + "step": 257730 + }, + { + "epoch": 1.66, + "learning_rate": 5.0472772804430184e-05, + "loss": 0.0275, + "step": 257740 + }, + { + "epoch": 1.66, + "learning_rate": 5.046309145007325e-05, + "loss": 0.0275, + "step": 257750 + }, + { + "epoch": 1.66, + "learning_rate": 5.045341009571632e-05, + "loss": 0.0242, + "step": 257760 + }, + { + "epoch": 1.66, + "learning_rate": 5.044372874135939e-05, + "loss": 0.0223, + "step": 257770 + }, + { + "epoch": 1.66, + "learning_rate": 5.043404738700245e-05, + "loss": 0.0265, + "step": 257780 + }, + { + "epoch": 1.66, + "learning_rate": 5.042436603264552e-05, + "loss": 0.0277, + "step": 257790 + }, + { + "epoch": 1.66, + "learning_rate": 5.041468467828859e-05, + "loss": 0.0235, + "step": 257800 + }, + { + "epoch": 1.66, + "learning_rate": 5.040500332393166e-05, + "loss": 0.0216, + "step": 257810 + }, + { + "epoch": 1.66, + "learning_rate": 5.039532196957473e-05, + "loss": 0.0241, + "step": 257820 + }, + { + "epoch": 1.66, + "learning_rate": 5.038564061521779e-05, + "loss": 0.0264, + "step": 257830 + }, + { + "epoch": 1.66, + "learning_rate": 5.037595926086086e-05, + "loss": 0.0254, + "step": 257840 + }, + { + "epoch": 1.66, + "learning_rate": 5.0366277906503926e-05, + "loss": 0.0212, + "step": 257850 + }, + { + "epoch": 1.66, + "learning_rate": 5.0356596552147e-05, + "loss": 0.0246, + "step": 257860 + }, + { + "epoch": 1.66, + "learning_rate": 5.0346915197790066e-05, + "loss": 0.0274, + "step": 257870 + }, + { + "epoch": 1.66, + "learning_rate": 5.033723384343314e-05, + "loss": 0.0232, + "step": 257880 + }, + { + "epoch": 1.66, + "learning_rate": 5.03275524890762e-05, + "loss": 0.0216, + "step": 257890 + }, + { + "epoch": 1.66, + "learning_rate": 5.0317871134719264e-05, + "loss": 0.0229, + "step": 257900 + }, + { + "epoch": 1.66, + "learning_rate": 5.030818978036234e-05, + "loss": 0.0341, + "step": 257910 + }, + { + "epoch": 1.66, + "learning_rate": 5.0298508426005404e-05, + "loss": 0.0236, + "step": 257920 + }, + { + "epoch": 1.66, + "learning_rate": 5.0288827071648477e-05, + "loss": 0.0238, + "step": 257930 + }, + { + "epoch": 1.66, + "learning_rate": 5.0279145717291536e-05, + "loss": 0.0234, + "step": 257940 + }, + { + "epoch": 1.66, + "learning_rate": 5.026946436293461e-05, + "loss": 0.0226, + "step": 257950 + }, + { + "epoch": 1.66, + "learning_rate": 5.0259783008577675e-05, + "loss": 0.0212, + "step": 257960 + }, + { + "epoch": 1.66, + "learning_rate": 5.025010165422074e-05, + "loss": 0.025, + "step": 257970 + }, + { + "epoch": 1.67, + "learning_rate": 5.0240420299863815e-05, + "loss": 0.0282, + "step": 257980 + }, + { + "epoch": 1.67, + "learning_rate": 5.0230738945506874e-05, + "loss": 0.0277, + "step": 257990 + }, + { + "epoch": 1.67, + "learning_rate": 5.022105759114995e-05, + "loss": 0.0236, + "step": 258000 + }, + { + "epoch": 1.67, + "eval_cer": 0.9198228448762852, + "eval_loss": 0.018363136798143387, + "eval_runtime": 120.066, + "eval_samples_per_second": 16.658, + "eval_steps_per_second": 4.164, + "step": 258000 + }, + { + "epoch": 1.67, + "learning_rate": 5.021137623679301e-05, + "loss": 0.0231, + "step": 258010 + }, + { + "epoch": 1.67, + "learning_rate": 5.0201694882436086e-05, + "loss": 0.0217, + "step": 258020 + }, + { + "epoch": 1.67, + "learning_rate": 5.019201352807915e-05, + "loss": 0.0247, + "step": 258030 + }, + { + "epoch": 1.67, + "learning_rate": 5.018233217372221e-05, + "loss": 0.0248, + "step": 258040 + }, + { + "epoch": 1.67, + "learning_rate": 5.0172650819365285e-05, + "loss": 0.0276, + "step": 258050 + }, + { + "epoch": 1.67, + "learning_rate": 5.016296946500835e-05, + "loss": 0.0213, + "step": 258060 + }, + { + "epoch": 1.67, + "learning_rate": 5.0153288110651424e-05, + "loss": 0.0285, + "step": 258070 + }, + { + "epoch": 1.67, + "learning_rate": 5.014360675629449e-05, + "loss": 0.0236, + "step": 258080 + }, + { + "epoch": 1.67, + "learning_rate": 5.0133925401937564e-05, + "loss": 0.029, + "step": 258090 + }, + { + "epoch": 1.67, + "learning_rate": 5.012424404758062e-05, + "loss": 0.0282, + "step": 258100 + }, + { + "epoch": 1.67, + "learning_rate": 5.011456269322369e-05, + "loss": 0.0244, + "step": 258110 + }, + { + "epoch": 1.67, + "learning_rate": 5.010488133886676e-05, + "loss": 0.0251, + "step": 258120 + }, + { + "epoch": 1.67, + "learning_rate": 5.009519998450983e-05, + "loss": 0.0268, + "step": 258130 + }, + { + "epoch": 1.67, + "learning_rate": 5.00855186301529e-05, + "loss": 0.0268, + "step": 258140 + }, + { + "epoch": 1.67, + "learning_rate": 5.007583727579596e-05, + "loss": 0.021, + "step": 258150 + }, + { + "epoch": 1.67, + "learning_rate": 5.0066155921439034e-05, + "loss": 0.0272, + "step": 258160 + }, + { + "epoch": 1.67, + "learning_rate": 5.00564745670821e-05, + "loss": 0.0218, + "step": 258170 + }, + { + "epoch": 1.67, + "learning_rate": 5.0046793212725166e-05, + "loss": 0.0211, + "step": 258180 + }, + { + "epoch": 1.67, + "learning_rate": 5.003711185836824e-05, + "loss": 0.0262, + "step": 258190 + }, + { + "epoch": 1.67, + "learning_rate": 5.00274305040113e-05, + "loss": 0.0314, + "step": 258200 + }, + { + "epoch": 1.67, + "learning_rate": 5.001774914965437e-05, + "loss": 0.022, + "step": 258210 + }, + { + "epoch": 1.67, + "learning_rate": 5.000806779529744e-05, + "loss": 0.0269, + "step": 258220 + }, + { + "epoch": 1.67, + "learning_rate": 4.999838644094051e-05, + "loss": 0.0252, + "step": 258230 + }, + { + "epoch": 1.67, + "learning_rate": 4.998870508658358e-05, + "loss": 0.0305, + "step": 258240 + }, + { + "epoch": 1.67, + "learning_rate": 4.997902373222664e-05, + "loss": 0.0223, + "step": 258250 + }, + { + "epoch": 1.67, + "learning_rate": 4.996934237786971e-05, + "loss": 0.027, + "step": 258260 + }, + { + "epoch": 1.67, + "learning_rate": 4.9959661023512776e-05, + "loss": 0.0249, + "step": 258270 + }, + { + "epoch": 1.67, + "learning_rate": 4.994997966915585e-05, + "loss": 0.0279, + "step": 258280 + }, + { + "epoch": 1.67, + "learning_rate": 4.9940298314798915e-05, + "loss": 0.0271, + "step": 258290 + }, + { + "epoch": 1.67, + "learning_rate": 4.993061696044199e-05, + "loss": 0.0249, + "step": 258300 + }, + { + "epoch": 1.67, + "learning_rate": 4.992093560608505e-05, + "loss": 0.0224, + "step": 258310 + }, + { + "epoch": 1.67, + "learning_rate": 4.9911254251728114e-05, + "loss": 0.0253, + "step": 258320 + }, + { + "epoch": 1.67, + "learning_rate": 4.990157289737119e-05, + "loss": 0.0244, + "step": 258330 + }, + { + "epoch": 1.67, + "learning_rate": 4.989189154301425e-05, + "loss": 0.0198, + "step": 258340 + }, + { + "epoch": 1.67, + "learning_rate": 4.9882210188657326e-05, + "loss": 0.0225, + "step": 258350 + }, + { + "epoch": 1.67, + "learning_rate": 4.9872528834300386e-05, + "loss": 0.0259, + "step": 258360 + }, + { + "epoch": 1.67, + "learning_rate": 4.986284747994346e-05, + "loss": 0.0225, + "step": 258370 + }, + { + "epoch": 1.67, + "learning_rate": 4.9853166125586525e-05, + "loss": 0.025, + "step": 258380 + }, + { + "epoch": 1.67, + "learning_rate": 4.984348477122959e-05, + "loss": 0.0277, + "step": 258390 + }, + { + "epoch": 1.67, + "learning_rate": 4.9833803416872664e-05, + "loss": 0.0241, + "step": 258400 + }, + { + "epoch": 1.67, + "learning_rate": 4.9824122062515724e-05, + "loss": 0.0199, + "step": 258410 + }, + { + "epoch": 1.67, + "learning_rate": 4.98144407081588e-05, + "loss": 0.0266, + "step": 258420 + }, + { + "epoch": 1.67, + "learning_rate": 4.980475935380186e-05, + "loss": 0.0311, + "step": 258430 + }, + { + "epoch": 1.67, + "learning_rate": 4.9795077999444936e-05, + "loss": 0.023, + "step": 258440 + }, + { + "epoch": 1.67, + "learning_rate": 4.9785396645088e-05, + "loss": 0.0227, + "step": 258450 + }, + { + "epoch": 1.67, + "learning_rate": 4.977571529073106e-05, + "loss": 0.0229, + "step": 258460 + }, + { + "epoch": 1.67, + "learning_rate": 4.9766033936374135e-05, + "loss": 0.023, + "step": 258470 + }, + { + "epoch": 1.67, + "learning_rate": 4.97563525820172e-05, + "loss": 0.0265, + "step": 258480 + }, + { + "epoch": 1.67, + "learning_rate": 4.9746671227660274e-05, + "loss": 0.0224, + "step": 258490 + }, + { + "epoch": 1.67, + "learning_rate": 4.973698987330334e-05, + "loss": 0.0288, + "step": 258500 + }, + { + "epoch": 1.67, + "learning_rate": 4.9727308518946407e-05, + "loss": 0.0257, + "step": 258510 + }, + { + "epoch": 1.67, + "learning_rate": 4.971762716458947e-05, + "loss": 0.0226, + "step": 258520 + }, + { + "epoch": 1.67, + "learning_rate": 4.970794581023254e-05, + "loss": 0.0279, + "step": 258530 + }, + { + "epoch": 1.67, + "learning_rate": 4.969826445587561e-05, + "loss": 0.0219, + "step": 258540 + }, + { + "epoch": 1.67, + "learning_rate": 4.968858310151868e-05, + "loss": 0.0259, + "step": 258550 + }, + { + "epoch": 1.67, + "learning_rate": 4.9678901747161745e-05, + "loss": 0.0225, + "step": 258560 + }, + { + "epoch": 1.67, + "learning_rate": 4.966922039280481e-05, + "loss": 0.0251, + "step": 258570 + }, + { + "epoch": 1.67, + "learning_rate": 4.9659539038447884e-05, + "loss": 0.0198, + "step": 258580 + }, + { + "epoch": 1.67, + "learning_rate": 4.964985768409095e-05, + "loss": 0.0239, + "step": 258590 + }, + { + "epoch": 1.67, + "learning_rate": 4.9640176329734016e-05, + "loss": 0.0308, + "step": 258600 + }, + { + "epoch": 1.67, + "learning_rate": 4.963049497537708e-05, + "loss": 0.0219, + "step": 258610 + }, + { + "epoch": 1.67, + "learning_rate": 4.962081362102015e-05, + "loss": 0.027, + "step": 258620 + }, + { + "epoch": 1.67, + "learning_rate": 4.961113226666322e-05, + "loss": 0.027, + "step": 258630 + }, + { + "epoch": 1.67, + "learning_rate": 4.960145091230629e-05, + "loss": 0.0333, + "step": 258640 + }, + { + "epoch": 1.67, + "learning_rate": 4.959176955794936e-05, + "loss": 0.0237, + "step": 258650 + }, + { + "epoch": 1.67, + "learning_rate": 4.958208820359243e-05, + "loss": 0.024, + "step": 258660 + }, + { + "epoch": 1.67, + "learning_rate": 4.957240684923549e-05, + "loss": 0.0245, + "step": 258670 + }, + { + "epoch": 1.67, + "learning_rate": 4.956272549487856e-05, + "loss": 0.029, + "step": 258680 + }, + { + "epoch": 1.67, + "learning_rate": 4.9553044140521626e-05, + "loss": 0.02, + "step": 258690 + }, + { + "epoch": 1.67, + "learning_rate": 4.95433627861647e-05, + "loss": 0.0243, + "step": 258700 + }, + { + "epoch": 1.67, + "learning_rate": 4.9533681431807765e-05, + "loss": 0.0325, + "step": 258710 + }, + { + "epoch": 1.67, + "learning_rate": 4.952400007745083e-05, + "loss": 0.0234, + "step": 258720 + }, + { + "epoch": 1.67, + "learning_rate": 4.95143187230939e-05, + "loss": 0.0287, + "step": 258730 + }, + { + "epoch": 1.67, + "learning_rate": 4.9504637368736964e-05, + "loss": 0.0238, + "step": 258740 + }, + { + "epoch": 1.67, + "learning_rate": 4.949495601438004e-05, + "loss": 0.0244, + "step": 258750 + }, + { + "epoch": 1.67, + "learning_rate": 4.94852746600231e-05, + "loss": 0.0255, + "step": 258760 + }, + { + "epoch": 1.67, + "learning_rate": 4.947559330566617e-05, + "loss": 0.0196, + "step": 258770 + }, + { + "epoch": 1.67, + "learning_rate": 4.9465911951309236e-05, + "loss": 0.0203, + "step": 258780 + }, + { + "epoch": 1.67, + "learning_rate": 4.945623059695231e-05, + "loss": 0.0263, + "step": 258790 + }, + { + "epoch": 1.67, + "learning_rate": 4.9446549242595375e-05, + "loss": 0.0233, + "step": 258800 + }, + { + "epoch": 1.67, + "learning_rate": 4.943686788823844e-05, + "loss": 0.0249, + "step": 258810 + }, + { + "epoch": 1.67, + "learning_rate": 4.942718653388151e-05, + "loss": 0.0279, + "step": 258820 + }, + { + "epoch": 1.67, + "learning_rate": 4.9417505179524574e-05, + "loss": 0.0273, + "step": 258830 + }, + { + "epoch": 1.67, + "learning_rate": 4.940782382516765e-05, + "loss": 0.0263, + "step": 258840 + }, + { + "epoch": 1.67, + "learning_rate": 4.939814247081071e-05, + "loss": 0.0254, + "step": 258850 + }, + { + "epoch": 1.67, + "learning_rate": 4.9388461116453786e-05, + "loss": 0.0247, + "step": 258860 + }, + { + "epoch": 1.67, + "learning_rate": 4.9378779762096845e-05, + "loss": 0.0267, + "step": 258870 + }, + { + "epoch": 1.67, + "learning_rate": 4.936909840773991e-05, + "loss": 0.0255, + "step": 258880 + }, + { + "epoch": 1.67, + "learning_rate": 4.9359417053382985e-05, + "loss": 0.0194, + "step": 258890 + }, + { + "epoch": 1.67, + "learning_rate": 4.934973569902605e-05, + "loss": 0.0205, + "step": 258900 + }, + { + "epoch": 1.67, + "learning_rate": 4.9340054344669124e-05, + "loss": 0.0238, + "step": 258910 + }, + { + "epoch": 1.67, + "learning_rate": 4.933037299031218e-05, + "loss": 0.0268, + "step": 258920 + }, + { + "epoch": 1.67, + "learning_rate": 4.9320691635955256e-05, + "loss": 0.0248, + "step": 258930 + }, + { + "epoch": 1.67, + "learning_rate": 4.931101028159832e-05, + "loss": 0.0222, + "step": 258940 + }, + { + "epoch": 1.67, + "learning_rate": 4.930132892724139e-05, + "loss": 0.0219, + "step": 258950 + }, + { + "epoch": 1.67, + "learning_rate": 4.929164757288446e-05, + "loss": 0.0255, + "step": 258960 + }, + { + "epoch": 1.67, + "learning_rate": 4.928196621852752e-05, + "loss": 0.026, + "step": 258970 + }, + { + "epoch": 1.67, + "learning_rate": 4.9272284864170594e-05, + "loss": 0.0208, + "step": 258980 + }, + { + "epoch": 1.67, + "learning_rate": 4.926260350981366e-05, + "loss": 0.0239, + "step": 258990 + }, + { + "epoch": 1.67, + "learning_rate": 4.9252922155456734e-05, + "loss": 0.0276, + "step": 259000 + }, + { + "epoch": 1.67, + "eval_cer": 0.9198409219297254, + "eval_loss": 0.018455343320965767, + "eval_runtime": 120.0636, + "eval_samples_per_second": 16.658, + "eval_steps_per_second": 4.164, + "step": 259000 + }, + { + "epoch": 1.67, + "learning_rate": 4.92432408010998e-05, + "loss": 0.0202, + "step": 259010 + }, + { + "epoch": 1.67, + "learning_rate": 4.923355944674286e-05, + "loss": 0.0241, + "step": 259020 + }, + { + "epoch": 1.67, + "learning_rate": 4.922387809238593e-05, + "loss": 0.0316, + "step": 259030 + }, + { + "epoch": 1.67, + "learning_rate": 4.9214196738029e-05, + "loss": 0.0258, + "step": 259040 + }, + { + "epoch": 1.67, + "learning_rate": 4.920451538367207e-05, + "loss": 0.0275, + "step": 259050 + }, + { + "epoch": 1.67, + "learning_rate": 4.919483402931514e-05, + "loss": 0.0228, + "step": 259060 + }, + { + "epoch": 1.67, + "learning_rate": 4.918515267495821e-05, + "loss": 0.024, + "step": 259070 + }, + { + "epoch": 1.67, + "learning_rate": 4.917547132060127e-05, + "loss": 0.0237, + "step": 259080 + }, + { + "epoch": 1.67, + "learning_rate": 4.9165789966244336e-05, + "loss": 0.0252, + "step": 259090 + }, + { + "epoch": 1.67, + "learning_rate": 4.915610861188741e-05, + "loss": 0.0263, + "step": 259100 + }, + { + "epoch": 1.67, + "learning_rate": 4.9146427257530476e-05, + "loss": 0.0264, + "step": 259110 + }, + { + "epoch": 1.67, + "learning_rate": 4.913674590317355e-05, + "loss": 0.0225, + "step": 259120 + }, + { + "epoch": 1.67, + "learning_rate": 4.912706454881661e-05, + "loss": 0.0285, + "step": 259130 + }, + { + "epoch": 1.67, + "learning_rate": 4.9117383194459674e-05, + "loss": 0.0228, + "step": 259140 + }, + { + "epoch": 1.67, + "learning_rate": 4.910770184010275e-05, + "loss": 0.0208, + "step": 259150 + }, + { + "epoch": 1.67, + "learning_rate": 4.9098020485745814e-05, + "loss": 0.0213, + "step": 259160 + }, + { + "epoch": 1.67, + "learning_rate": 4.908833913138889e-05, + "loss": 0.0222, + "step": 259170 + }, + { + "epoch": 1.67, + "learning_rate": 4.9078657777031946e-05, + "loss": 0.0243, + "step": 259180 + }, + { + "epoch": 1.67, + "learning_rate": 4.906897642267502e-05, + "loss": 0.0233, + "step": 259190 + }, + { + "epoch": 1.67, + "learning_rate": 4.9059295068318085e-05, + "loss": 0.0256, + "step": 259200 + }, + { + "epoch": 1.67, + "learning_rate": 4.904961371396115e-05, + "loss": 0.0223, + "step": 259210 + }, + { + "epoch": 1.67, + "learning_rate": 4.9039932359604225e-05, + "loss": 0.0238, + "step": 259220 + }, + { + "epoch": 1.67, + "learning_rate": 4.9030251005247284e-05, + "loss": 0.024, + "step": 259230 + }, + { + "epoch": 1.67, + "learning_rate": 4.902056965089036e-05, + "loss": 0.0273, + "step": 259240 + }, + { + "epoch": 1.67, + "learning_rate": 4.9010888296533423e-05, + "loss": 0.0265, + "step": 259250 + }, + { + "epoch": 1.67, + "learning_rate": 4.9001206942176496e-05, + "loss": 0.0264, + "step": 259260 + }, + { + "epoch": 1.67, + "learning_rate": 4.899152558781956e-05, + "loss": 0.023, + "step": 259270 + }, + { + "epoch": 1.67, + "learning_rate": 4.898184423346262e-05, + "loss": 0.0259, + "step": 259280 + }, + { + "epoch": 1.67, + "learning_rate": 4.8972162879105695e-05, + "loss": 0.0282, + "step": 259290 + }, + { + "epoch": 1.67, + "learning_rate": 4.896248152474876e-05, + "loss": 0.0212, + "step": 259300 + }, + { + "epoch": 1.67, + "learning_rate": 4.8952800170391834e-05, + "loss": 0.026, + "step": 259310 + }, + { + "epoch": 1.67, + "learning_rate": 4.89431188160349e-05, + "loss": 0.027, + "step": 259320 + }, + { + "epoch": 1.67, + "learning_rate": 4.8933437461677974e-05, + "loss": 0.0243, + "step": 259330 + }, + { + "epoch": 1.67, + "learning_rate": 4.892375610732103e-05, + "loss": 0.0214, + "step": 259340 + }, + { + "epoch": 1.67, + "learning_rate": 4.89140747529641e-05, + "loss": 0.0286, + "step": 259350 + }, + { + "epoch": 1.67, + "learning_rate": 4.890439339860717e-05, + "loss": 0.0276, + "step": 259360 + }, + { + "epoch": 1.67, + "learning_rate": 4.889471204425024e-05, + "loss": 0.0244, + "step": 259370 + }, + { + "epoch": 1.67, + "learning_rate": 4.888503068989331e-05, + "loss": 0.0191, + "step": 259380 + }, + { + "epoch": 1.67, + "learning_rate": 4.887534933553637e-05, + "loss": 0.0289, + "step": 259390 + }, + { + "epoch": 1.67, + "learning_rate": 4.8865667981179444e-05, + "loss": 0.0225, + "step": 259400 + }, + { + "epoch": 1.67, + "learning_rate": 4.885598662682251e-05, + "loss": 0.0231, + "step": 259410 + }, + { + "epoch": 1.67, + "learning_rate": 4.8846305272465577e-05, + "loss": 0.0264, + "step": 259420 + }, + { + "epoch": 1.67, + "learning_rate": 4.883662391810865e-05, + "loss": 0.0237, + "step": 259430 + }, + { + "epoch": 1.67, + "learning_rate": 4.882694256375171e-05, + "loss": 0.0242, + "step": 259440 + }, + { + "epoch": 1.67, + "learning_rate": 4.881726120939478e-05, + "loss": 0.0199, + "step": 259450 + }, + { + "epoch": 1.67, + "learning_rate": 4.880757985503785e-05, + "loss": 0.0208, + "step": 259460 + }, + { + "epoch": 1.67, + "learning_rate": 4.879789850068092e-05, + "loss": 0.0239, + "step": 259470 + }, + { + "epoch": 1.67, + "learning_rate": 4.878821714632399e-05, + "loss": 0.0227, + "step": 259480 + }, + { + "epoch": 1.67, + "learning_rate": 4.877853579196705e-05, + "loss": 0.0253, + "step": 259490 + }, + { + "epoch": 1.67, + "learning_rate": 4.876885443761012e-05, + "loss": 0.0242, + "step": 259500 + }, + { + "epoch": 1.67, + "learning_rate": 4.8759173083253186e-05, + "loss": 0.0275, + "step": 259510 + }, + { + "epoch": 1.67, + "learning_rate": 4.874949172889626e-05, + "loss": 0.0233, + "step": 259520 + }, + { + "epoch": 1.68, + "learning_rate": 4.8739810374539326e-05, + "loss": 0.0242, + "step": 259530 + }, + { + "epoch": 1.68, + "learning_rate": 4.87301290201824e-05, + "loss": 0.0265, + "step": 259540 + }, + { + "epoch": 1.68, + "learning_rate": 4.872044766582546e-05, + "loss": 0.0222, + "step": 259550 + }, + { + "epoch": 1.68, + "learning_rate": 4.8710766311468524e-05, + "loss": 0.0262, + "step": 259560 + }, + { + "epoch": 1.68, + "learning_rate": 4.87010849571116e-05, + "loss": 0.0209, + "step": 259570 + }, + { + "epoch": 1.68, + "learning_rate": 4.8691403602754664e-05, + "loss": 0.0215, + "step": 259580 + }, + { + "epoch": 1.68, + "learning_rate": 4.8681722248397737e-05, + "loss": 0.0303, + "step": 259590 + }, + { + "epoch": 1.68, + "learning_rate": 4.8672040894040796e-05, + "loss": 0.0254, + "step": 259600 + }, + { + "epoch": 1.68, + "learning_rate": 4.866235953968387e-05, + "loss": 0.0268, + "step": 259610 + }, + { + "epoch": 1.68, + "learning_rate": 4.8652678185326935e-05, + "loss": 0.0224, + "step": 259620 + }, + { + "epoch": 1.68, + "learning_rate": 4.864299683097e-05, + "loss": 0.0215, + "step": 259630 + }, + { + "epoch": 1.68, + "learning_rate": 4.8633315476613075e-05, + "loss": 0.024, + "step": 259640 + }, + { + "epoch": 1.68, + "learning_rate": 4.8623634122256134e-05, + "loss": 0.0235, + "step": 259650 + }, + { + "epoch": 1.68, + "learning_rate": 4.861395276789921e-05, + "loss": 0.0247, + "step": 259660 + }, + { + "epoch": 1.68, + "learning_rate": 4.860427141354227e-05, + "loss": 0.028, + "step": 259670 + }, + { + "epoch": 1.68, + "learning_rate": 4.8594590059185346e-05, + "loss": 0.0244, + "step": 259680 + }, + { + "epoch": 1.68, + "learning_rate": 4.858490870482841e-05, + "loss": 0.0223, + "step": 259690 + }, + { + "epoch": 1.68, + "learning_rate": 4.857522735047147e-05, + "loss": 0.0264, + "step": 259700 + }, + { + "epoch": 1.68, + "learning_rate": 4.8565545996114545e-05, + "loss": 0.0249, + "step": 259710 + }, + { + "epoch": 1.68, + "learning_rate": 4.855586464175761e-05, + "loss": 0.0239, + "step": 259720 + }, + { + "epoch": 1.68, + "learning_rate": 4.8546183287400684e-05, + "loss": 0.0242, + "step": 259730 + }, + { + "epoch": 1.68, + "learning_rate": 4.853650193304375e-05, + "loss": 0.0244, + "step": 259740 + }, + { + "epoch": 1.68, + "learning_rate": 4.8526820578686823e-05, + "loss": 0.0273, + "step": 259750 + }, + { + "epoch": 1.68, + "learning_rate": 4.851713922432988e-05, + "loss": 0.0288, + "step": 259760 + }, + { + "epoch": 1.68, + "learning_rate": 4.850745786997295e-05, + "loss": 0.0242, + "step": 259770 + }, + { + "epoch": 1.68, + "learning_rate": 4.849777651561602e-05, + "loss": 0.0219, + "step": 259780 + }, + { + "epoch": 1.68, + "learning_rate": 4.848809516125909e-05, + "loss": 0.0287, + "step": 259790 + }, + { + "epoch": 1.68, + "learning_rate": 4.847841380690216e-05, + "loss": 0.0286, + "step": 259800 + }, + { + "epoch": 1.68, + "learning_rate": 4.846873245254522e-05, + "loss": 0.0283, + "step": 259810 + }, + { + "epoch": 1.68, + "learning_rate": 4.8459051098188294e-05, + "loss": 0.0226, + "step": 259820 + }, + { + "epoch": 1.68, + "learning_rate": 4.844936974383136e-05, + "loss": 0.0278, + "step": 259830 + }, + { + "epoch": 1.68, + "learning_rate": 4.8439688389474426e-05, + "loss": 0.0253, + "step": 259840 + }, + { + "epoch": 1.68, + "learning_rate": 4.84300070351175e-05, + "loss": 0.0227, + "step": 259850 + }, + { + "epoch": 1.68, + "learning_rate": 4.842032568076056e-05, + "loss": 0.0229, + "step": 259860 + }, + { + "epoch": 1.68, + "learning_rate": 4.841064432640363e-05, + "loss": 0.0218, + "step": 259870 + }, + { + "epoch": 1.68, + "learning_rate": 4.84009629720467e-05, + "loss": 0.0292, + "step": 259880 + }, + { + "epoch": 1.68, + "learning_rate": 4.839128161768977e-05, + "loss": 0.0256, + "step": 259890 + }, + { + "epoch": 1.68, + "learning_rate": 4.838160026333284e-05, + "loss": 0.0299, + "step": 259900 + }, + { + "epoch": 1.68, + "learning_rate": 4.83719189089759e-05, + "loss": 0.0241, + "step": 259910 + }, + { + "epoch": 1.68, + "learning_rate": 4.836223755461897e-05, + "loss": 0.0316, + "step": 259920 + }, + { + "epoch": 1.68, + "learning_rate": 4.8352556200262036e-05, + "loss": 0.0271, + "step": 259930 + }, + { + "epoch": 1.68, + "learning_rate": 4.834287484590511e-05, + "loss": 0.0249, + "step": 259940 + }, + { + "epoch": 1.68, + "learning_rate": 4.8333193491548175e-05, + "loss": 0.0227, + "step": 259950 + }, + { + "epoch": 1.68, + "learning_rate": 4.832351213719124e-05, + "loss": 0.0259, + "step": 259960 + }, + { + "epoch": 1.68, + "learning_rate": 4.831383078283431e-05, + "loss": 0.0235, + "step": 259970 + }, + { + "epoch": 1.68, + "learning_rate": 4.8304149428477374e-05, + "loss": 0.0284, + "step": 259980 + }, + { + "epoch": 1.68, + "learning_rate": 4.829446807412045e-05, + "loss": 0.0224, + "step": 259990 + }, + { + "epoch": 1.68, + "learning_rate": 4.828478671976351e-05, + "loss": 0.0233, + "step": 260000 + }, + { + "epoch": 1.68, + "eval_cer": 0.9198653259518699, + "eval_loss": 0.018204906955361366, + "eval_runtime": 119.9898, + "eval_samples_per_second": 16.668, + "eval_steps_per_second": 4.167, + "step": 260000 + }, + { + "epoch": 1.68, + "learning_rate": 4.827510536540658e-05, + "loss": 0.0275, + "step": 260010 + }, + { + "epoch": 1.68, + "learning_rate": 4.8265424011049646e-05, + "loss": 0.0224, + "step": 260020 + }, + { + "epoch": 1.68, + "learning_rate": 4.825574265669272e-05, + "loss": 0.0241, + "step": 260030 + }, + { + "epoch": 1.68, + "learning_rate": 4.8246061302335785e-05, + "loss": 0.0214, + "step": 260040 + }, + { + "epoch": 1.68, + "learning_rate": 4.823637994797885e-05, + "loss": 0.0222, + "step": 260050 + }, + { + "epoch": 1.68, + "learning_rate": 4.822669859362192e-05, + "loss": 0.022, + "step": 260060 + }, + { + "epoch": 1.68, + "learning_rate": 4.8217017239264984e-05, + "loss": 0.0247, + "step": 260070 + }, + { + "epoch": 1.68, + "learning_rate": 4.820733588490806e-05, + "loss": 0.0288, + "step": 260080 + }, + { + "epoch": 1.68, + "learning_rate": 4.819765453055112e-05, + "loss": 0.0286, + "step": 260090 + }, + { + "epoch": 1.68, + "learning_rate": 4.8187973176194196e-05, + "loss": 0.025, + "step": 260100 + }, + { + "epoch": 1.68, + "learning_rate": 4.8178291821837256e-05, + "loss": 0.0235, + "step": 260110 + }, + { + "epoch": 1.68, + "learning_rate": 4.816861046748032e-05, + "loss": 0.0249, + "step": 260120 + }, + { + "epoch": 1.68, + "learning_rate": 4.8158929113123395e-05, + "loss": 0.0222, + "step": 260130 + }, + { + "epoch": 1.68, + "learning_rate": 4.814924775876646e-05, + "loss": 0.0282, + "step": 260140 + }, + { + "epoch": 1.68, + "learning_rate": 4.8139566404409534e-05, + "loss": 0.0264, + "step": 260150 + }, + { + "epoch": 1.68, + "learning_rate": 4.8129885050052593e-05, + "loss": 0.0257, + "step": 260160 + }, + { + "epoch": 1.68, + "learning_rate": 4.8120203695695667e-05, + "loss": 0.0275, + "step": 260170 + }, + { + "epoch": 1.68, + "learning_rate": 4.811052234133873e-05, + "loss": 0.0241, + "step": 260180 + }, + { + "epoch": 1.68, + "learning_rate": 4.81008409869818e-05, + "loss": 0.0224, + "step": 260190 + }, + { + "epoch": 1.68, + "learning_rate": 4.809115963262487e-05, + "loss": 0.0258, + "step": 260200 + }, + { + "epoch": 1.68, + "learning_rate": 4.808147827826793e-05, + "loss": 0.0234, + "step": 260210 + }, + { + "epoch": 1.68, + "learning_rate": 4.8071796923911004e-05, + "loss": 0.0241, + "step": 260220 + }, + { + "epoch": 1.68, + "learning_rate": 4.806211556955407e-05, + "loss": 0.0231, + "step": 260230 + }, + { + "epoch": 1.68, + "learning_rate": 4.8052434215197144e-05, + "loss": 0.0283, + "step": 260240 + }, + { + "epoch": 1.68, + "learning_rate": 4.804275286084021e-05, + "loss": 0.0231, + "step": 260250 + }, + { + "epoch": 1.68, + "learning_rate": 4.803307150648327e-05, + "loss": 0.023, + "step": 260260 + }, + { + "epoch": 1.68, + "learning_rate": 4.802339015212634e-05, + "loss": 0.0274, + "step": 260270 + }, + { + "epoch": 1.68, + "learning_rate": 4.801370879776941e-05, + "loss": 0.0231, + "step": 260280 + }, + { + "epoch": 1.68, + "learning_rate": 4.800402744341248e-05, + "loss": 0.0222, + "step": 260290 + }, + { + "epoch": 1.68, + "learning_rate": 4.799434608905555e-05, + "loss": 0.024, + "step": 260300 + }, + { + "epoch": 1.68, + "learning_rate": 4.798466473469862e-05, + "loss": 0.0248, + "step": 260310 + }, + { + "epoch": 1.68, + "learning_rate": 4.797498338034168e-05, + "loss": 0.0262, + "step": 260320 + }, + { + "epoch": 1.68, + "learning_rate": 4.796530202598475e-05, + "loss": 0.0217, + "step": 260330 + }, + { + "epoch": 1.68, + "learning_rate": 4.795562067162782e-05, + "loss": 0.0253, + "step": 260340 + }, + { + "epoch": 1.68, + "learning_rate": 4.7945939317270886e-05, + "loss": 0.0248, + "step": 260350 + }, + { + "epoch": 1.68, + "learning_rate": 4.793625796291396e-05, + "loss": 0.0306, + "step": 260360 + }, + { + "epoch": 1.68, + "learning_rate": 4.792657660855702e-05, + "loss": 0.0234, + "step": 260370 + }, + { + "epoch": 1.68, + "learning_rate": 4.791689525420009e-05, + "loss": 0.0229, + "step": 260380 + }, + { + "epoch": 1.68, + "learning_rate": 4.790721389984316e-05, + "loss": 0.0204, + "step": 260390 + }, + { + "epoch": 1.68, + "learning_rate": 4.7897532545486224e-05, + "loss": 0.0246, + "step": 260400 + }, + { + "epoch": 1.68, + "learning_rate": 4.78878511911293e-05, + "loss": 0.0205, + "step": 260410 + }, + { + "epoch": 1.68, + "learning_rate": 4.7878169836772356e-05, + "loss": 0.029, + "step": 260420 + }, + { + "epoch": 1.68, + "learning_rate": 4.786848848241543e-05, + "loss": 0.0236, + "step": 260430 + }, + { + "epoch": 1.68, + "learning_rate": 4.7858807128058496e-05, + "loss": 0.0227, + "step": 260440 + }, + { + "epoch": 1.68, + "learning_rate": 4.784912577370157e-05, + "loss": 0.0229, + "step": 260450 + }, + { + "epoch": 1.68, + "learning_rate": 4.7839444419344635e-05, + "loss": 0.0278, + "step": 260460 + }, + { + "epoch": 1.68, + "learning_rate": 4.7829763064987694e-05, + "loss": 0.0264, + "step": 260470 + }, + { + "epoch": 1.68, + "learning_rate": 4.782008171063077e-05, + "loss": 0.0228, + "step": 260480 + }, + { + "epoch": 1.68, + "learning_rate": 4.7810400356273834e-05, + "loss": 0.026, + "step": 260490 + }, + { + "epoch": 1.68, + "learning_rate": 4.7800719001916907e-05, + "loss": 0.028, + "step": 260500 + }, + { + "epoch": 1.68, + "learning_rate": 4.779103764755997e-05, + "loss": 0.0246, + "step": 260510 + }, + { + "epoch": 1.68, + "learning_rate": 4.7781356293203046e-05, + "loss": 0.0248, + "step": 260520 + }, + { + "epoch": 1.68, + "learning_rate": 4.7771674938846105e-05, + "loss": 0.0241, + "step": 260530 + }, + { + "epoch": 1.68, + "learning_rate": 4.776199358448917e-05, + "loss": 0.0224, + "step": 260540 + }, + { + "epoch": 1.68, + "learning_rate": 4.7752312230132245e-05, + "loss": 0.0253, + "step": 260550 + }, + { + "epoch": 1.68, + "learning_rate": 4.774263087577531e-05, + "loss": 0.0272, + "step": 260560 + }, + { + "epoch": 1.68, + "learning_rate": 4.7732949521418384e-05, + "loss": 0.0272, + "step": 260570 + }, + { + "epoch": 1.68, + "learning_rate": 4.772326816706144e-05, + "loss": 0.0284, + "step": 260580 + }, + { + "epoch": 1.68, + "learning_rate": 4.7713586812704516e-05, + "loss": 0.0215, + "step": 260590 + }, + { + "epoch": 1.68, + "learning_rate": 4.770390545834758e-05, + "loss": 0.0219, + "step": 260600 + }, + { + "epoch": 1.68, + "learning_rate": 4.769422410399065e-05, + "loss": 0.0244, + "step": 260610 + }, + { + "epoch": 1.68, + "learning_rate": 4.768454274963372e-05, + "loss": 0.0213, + "step": 260620 + }, + { + "epoch": 1.68, + "learning_rate": 4.767486139527678e-05, + "loss": 0.0295, + "step": 260630 + }, + { + "epoch": 1.68, + "learning_rate": 4.7665180040919854e-05, + "loss": 0.0205, + "step": 260640 + }, + { + "epoch": 1.68, + "learning_rate": 4.765549868656292e-05, + "loss": 0.0241, + "step": 260650 + }, + { + "epoch": 1.68, + "learning_rate": 4.7645817332205994e-05, + "loss": 0.0254, + "step": 260660 + }, + { + "epoch": 1.68, + "learning_rate": 4.763613597784906e-05, + "loss": 0.0249, + "step": 260670 + }, + { + "epoch": 1.68, + "learning_rate": 4.762645462349212e-05, + "loss": 0.0217, + "step": 260680 + }, + { + "epoch": 1.68, + "learning_rate": 4.761677326913519e-05, + "loss": 0.0233, + "step": 260690 + }, + { + "epoch": 1.68, + "learning_rate": 4.760709191477826e-05, + "loss": 0.0219, + "step": 260700 + }, + { + "epoch": 1.68, + "learning_rate": 4.759741056042133e-05, + "loss": 0.0287, + "step": 260710 + }, + { + "epoch": 1.68, + "learning_rate": 4.75877292060644e-05, + "loss": 0.0231, + "step": 260720 + }, + { + "epoch": 1.68, + "learning_rate": 4.757804785170747e-05, + "loss": 0.0236, + "step": 260730 + }, + { + "epoch": 1.68, + "learning_rate": 4.756836649735053e-05, + "loss": 0.0219, + "step": 260740 + }, + { + "epoch": 1.68, + "learning_rate": 4.7558685142993596e-05, + "loss": 0.0277, + "step": 260750 + }, + { + "epoch": 1.68, + "learning_rate": 4.754900378863667e-05, + "loss": 0.0254, + "step": 260760 + }, + { + "epoch": 1.68, + "learning_rate": 4.7539322434279736e-05, + "loss": 0.0252, + "step": 260770 + }, + { + "epoch": 1.68, + "learning_rate": 4.752964107992281e-05, + "loss": 0.0226, + "step": 260780 + }, + { + "epoch": 1.68, + "learning_rate": 4.751995972556587e-05, + "loss": 0.0253, + "step": 260790 + }, + { + "epoch": 1.68, + "learning_rate": 4.751027837120894e-05, + "loss": 0.0246, + "step": 260800 + }, + { + "epoch": 1.68, + "learning_rate": 4.750059701685201e-05, + "loss": 0.0216, + "step": 260810 + }, + { + "epoch": 1.68, + "learning_rate": 4.7490915662495074e-05, + "loss": 0.0217, + "step": 260820 + }, + { + "epoch": 1.68, + "learning_rate": 4.748123430813815e-05, + "loss": 0.0196, + "step": 260830 + }, + { + "epoch": 1.68, + "learning_rate": 4.7471552953781206e-05, + "loss": 0.026, + "step": 260840 + }, + { + "epoch": 1.68, + "learning_rate": 4.746187159942428e-05, + "loss": 0.0252, + "step": 260850 + }, + { + "epoch": 1.68, + "learning_rate": 4.7452190245067345e-05, + "loss": 0.0214, + "step": 260860 + }, + { + "epoch": 1.68, + "learning_rate": 4.744250889071041e-05, + "loss": 0.0235, + "step": 260870 + }, + { + "epoch": 1.68, + "learning_rate": 4.7432827536353485e-05, + "loss": 0.0242, + "step": 260880 + }, + { + "epoch": 1.68, + "learning_rate": 4.7423146181996544e-05, + "loss": 0.0235, + "step": 260890 + }, + { + "epoch": 1.68, + "learning_rate": 4.741346482763962e-05, + "loss": 0.0246, + "step": 260900 + }, + { + "epoch": 1.68, + "learning_rate": 4.7403783473282683e-05, + "loss": 0.0241, + "step": 260910 + }, + { + "epoch": 1.68, + "learning_rate": 4.7394102118925756e-05, + "loss": 0.0234, + "step": 260920 + }, + { + "epoch": 1.68, + "learning_rate": 4.738442076456882e-05, + "loss": 0.0261, + "step": 260930 + }, + { + "epoch": 1.68, + "learning_rate": 4.737473941021188e-05, + "loss": 0.0269, + "step": 260940 + }, + { + "epoch": 1.68, + "learning_rate": 4.7365058055854955e-05, + "loss": 0.0301, + "step": 260950 + }, + { + "epoch": 1.68, + "learning_rate": 4.735537670149802e-05, + "loss": 0.0247, + "step": 260960 + }, + { + "epoch": 1.68, + "learning_rate": 4.7345695347141094e-05, + "loss": 0.0272, + "step": 260970 + }, + { + "epoch": 1.68, + "learning_rate": 4.733601399278416e-05, + "loss": 0.0261, + "step": 260980 + }, + { + "epoch": 1.68, + "learning_rate": 4.7326332638427234e-05, + "loss": 0.0291, + "step": 260990 + }, + { + "epoch": 1.68, + "learning_rate": 4.731665128407029e-05, + "loss": 0.0205, + "step": 261000 + }, + { + "epoch": 1.68, + "eval_cer": 0.919811998644221, + "eval_loss": 0.01825707219541073, + "eval_runtime": 120.0532, + "eval_samples_per_second": 16.659, + "eval_steps_per_second": 4.165, + "step": 261000 + }, + { + "epoch": 1.68, + "learning_rate": 4.730696992971336e-05, + "loss": 0.022, + "step": 261010 + }, + { + "epoch": 1.68, + "learning_rate": 4.729728857535643e-05, + "loss": 0.0277, + "step": 261020 + }, + { + "epoch": 1.68, + "learning_rate": 4.72876072209995e-05, + "loss": 0.0285, + "step": 261030 + }, + { + "epoch": 1.68, + "learning_rate": 4.727792586664257e-05, + "loss": 0.0276, + "step": 261040 + }, + { + "epoch": 1.68, + "learning_rate": 4.726824451228563e-05, + "loss": 0.0256, + "step": 261050 + }, + { + "epoch": 1.68, + "learning_rate": 4.7258563157928704e-05, + "loss": 0.0254, + "step": 261060 + }, + { + "epoch": 1.69, + "learning_rate": 4.724888180357177e-05, + "loss": 0.0299, + "step": 261070 + }, + { + "epoch": 1.69, + "learning_rate": 4.7239200449214837e-05, + "loss": 0.0303, + "step": 261080 + }, + { + "epoch": 1.69, + "learning_rate": 4.722951909485791e-05, + "loss": 0.025, + "step": 261090 + }, + { + "epoch": 1.69, + "learning_rate": 4.721983774050097e-05, + "loss": 0.0265, + "step": 261100 + }, + { + "epoch": 1.69, + "learning_rate": 4.721015638614404e-05, + "loss": 0.025, + "step": 261110 + }, + { + "epoch": 1.69, + "learning_rate": 4.720047503178711e-05, + "loss": 0.0245, + "step": 261120 + }, + { + "epoch": 1.69, + "learning_rate": 4.719079367743018e-05, + "loss": 0.0268, + "step": 261130 + }, + { + "epoch": 1.69, + "learning_rate": 4.718111232307325e-05, + "loss": 0.0267, + "step": 261140 + }, + { + "epoch": 1.69, + "learning_rate": 4.717143096871631e-05, + "loss": 0.024, + "step": 261150 + }, + { + "epoch": 1.69, + "learning_rate": 4.716174961435938e-05, + "loss": 0.0222, + "step": 261160 + }, + { + "epoch": 1.69, + "learning_rate": 4.7152068260002446e-05, + "loss": 0.0251, + "step": 261170 + }, + { + "epoch": 1.69, + "learning_rate": 4.714238690564552e-05, + "loss": 0.0275, + "step": 261180 + }, + { + "epoch": 1.69, + "learning_rate": 4.7132705551288586e-05, + "loss": 0.0285, + "step": 261190 + }, + { + "epoch": 1.69, + "learning_rate": 4.712302419693166e-05, + "loss": 0.0219, + "step": 261200 + }, + { + "epoch": 1.69, + "learning_rate": 4.711334284257472e-05, + "loss": 0.0244, + "step": 261210 + }, + { + "epoch": 1.69, + "learning_rate": 4.7103661488217784e-05, + "loss": 0.027, + "step": 261220 + }, + { + "epoch": 1.69, + "learning_rate": 4.709398013386086e-05, + "loss": 0.0301, + "step": 261230 + }, + { + "epoch": 1.69, + "learning_rate": 4.7084298779503924e-05, + "loss": 0.0251, + "step": 261240 + }, + { + "epoch": 1.69, + "learning_rate": 4.7074617425146997e-05, + "loss": 0.0255, + "step": 261250 + }, + { + "epoch": 1.69, + "learning_rate": 4.7064936070790056e-05, + "loss": 0.0224, + "step": 261260 + }, + { + "epoch": 1.69, + "learning_rate": 4.705525471643313e-05, + "loss": 0.0299, + "step": 261270 + }, + { + "epoch": 1.69, + "learning_rate": 4.7045573362076195e-05, + "loss": 0.0256, + "step": 261280 + }, + { + "epoch": 1.69, + "learning_rate": 4.703589200771926e-05, + "loss": 0.0254, + "step": 261290 + }, + { + "epoch": 1.69, + "learning_rate": 4.7026210653362334e-05, + "loss": 0.0216, + "step": 261300 + }, + { + "epoch": 1.69, + "learning_rate": 4.7016529299005394e-05, + "loss": 0.026, + "step": 261310 + }, + { + "epoch": 1.69, + "learning_rate": 4.700684794464847e-05, + "loss": 0.0246, + "step": 261320 + }, + { + "epoch": 1.69, + "learning_rate": 4.699716659029153e-05, + "loss": 0.0241, + "step": 261330 + }, + { + "epoch": 1.69, + "learning_rate": 4.6987485235934606e-05, + "loss": 0.0299, + "step": 261340 + }, + { + "epoch": 1.69, + "learning_rate": 4.697780388157767e-05, + "loss": 0.0217, + "step": 261350 + }, + { + "epoch": 1.69, + "learning_rate": 4.696812252722073e-05, + "loss": 0.0246, + "step": 261360 + }, + { + "epoch": 1.69, + "learning_rate": 4.6958441172863805e-05, + "loss": 0.0252, + "step": 261370 + }, + { + "epoch": 1.69, + "learning_rate": 4.694875981850687e-05, + "loss": 0.0218, + "step": 261380 + }, + { + "epoch": 1.69, + "learning_rate": 4.6939078464149944e-05, + "loss": 0.0217, + "step": 261390 + }, + { + "epoch": 1.69, + "learning_rate": 4.692939710979301e-05, + "loss": 0.0274, + "step": 261400 + }, + { + "epoch": 1.69, + "learning_rate": 4.691971575543608e-05, + "loss": 0.025, + "step": 261410 + }, + { + "epoch": 1.69, + "learning_rate": 4.691003440107914e-05, + "loss": 0.0226, + "step": 261420 + }, + { + "epoch": 1.69, + "learning_rate": 4.690035304672221e-05, + "loss": 0.0241, + "step": 261430 + }, + { + "epoch": 1.69, + "learning_rate": 4.689067169236528e-05, + "loss": 0.0233, + "step": 261440 + }, + { + "epoch": 1.69, + "learning_rate": 4.688099033800835e-05, + "loss": 0.0299, + "step": 261450 + }, + { + "epoch": 1.69, + "learning_rate": 4.6871308983651415e-05, + "loss": 0.0215, + "step": 261460 + }, + { + "epoch": 1.69, + "learning_rate": 4.686162762929448e-05, + "loss": 0.0244, + "step": 261470 + }, + { + "epoch": 1.69, + "learning_rate": 4.6851946274937554e-05, + "loss": 0.0232, + "step": 261480 + }, + { + "epoch": 1.69, + "learning_rate": 4.684226492058062e-05, + "loss": 0.0224, + "step": 261490 + }, + { + "epoch": 1.69, + "learning_rate": 4.6832583566223686e-05, + "loss": 0.0236, + "step": 261500 + }, + { + "epoch": 1.69, + "learning_rate": 4.682290221186675e-05, + "loss": 0.0227, + "step": 261510 + }, + { + "epoch": 1.69, + "learning_rate": 4.681322085750982e-05, + "loss": 0.027, + "step": 261520 + }, + { + "epoch": 1.69, + "learning_rate": 4.680353950315289e-05, + "loss": 0.0248, + "step": 261530 + }, + { + "epoch": 1.69, + "learning_rate": 4.679385814879596e-05, + "loss": 0.0261, + "step": 261540 + }, + { + "epoch": 1.69, + "learning_rate": 4.678417679443903e-05, + "loss": 0.0228, + "step": 261550 + }, + { + "epoch": 1.69, + "learning_rate": 4.677449544008209e-05, + "loss": 0.0226, + "step": 261560 + }, + { + "epoch": 1.69, + "learning_rate": 4.676481408572516e-05, + "loss": 0.0227, + "step": 261570 + }, + { + "epoch": 1.69, + "learning_rate": 4.675513273136823e-05, + "loss": 0.0272, + "step": 261580 + }, + { + "epoch": 1.69, + "learning_rate": 4.6745451377011296e-05, + "loss": 0.0249, + "step": 261590 + }, + { + "epoch": 1.69, + "learning_rate": 4.673577002265437e-05, + "loss": 0.0257, + "step": 261600 + }, + { + "epoch": 1.69, + "learning_rate": 4.672608866829743e-05, + "loss": 0.0225, + "step": 261610 + }, + { + "epoch": 1.69, + "learning_rate": 4.67164073139405e-05, + "loss": 0.024, + "step": 261620 + }, + { + "epoch": 1.69, + "learning_rate": 4.670672595958357e-05, + "loss": 0.0253, + "step": 261630 + }, + { + "epoch": 1.69, + "learning_rate": 4.6697044605226634e-05, + "loss": 0.0248, + "step": 261640 + }, + { + "epoch": 1.69, + "learning_rate": 4.668736325086971e-05, + "loss": 0.0255, + "step": 261650 + }, + { + "epoch": 1.69, + "learning_rate": 4.6677681896512767e-05, + "loss": 0.0208, + "step": 261660 + }, + { + "epoch": 1.69, + "learning_rate": 4.666800054215584e-05, + "loss": 0.0263, + "step": 261670 + }, + { + "epoch": 1.69, + "learning_rate": 4.6658319187798906e-05, + "loss": 0.0259, + "step": 261680 + }, + { + "epoch": 1.69, + "learning_rate": 4.664863783344198e-05, + "loss": 0.0376, + "step": 261690 + }, + { + "epoch": 1.69, + "learning_rate": 4.6638956479085045e-05, + "loss": 0.0238, + "step": 261700 + }, + { + "epoch": 1.69, + "learning_rate": 4.6629275124728105e-05, + "loss": 0.0229, + "step": 261710 + }, + { + "epoch": 1.69, + "learning_rate": 4.661959377037118e-05, + "loss": 0.0356, + "step": 261720 + }, + { + "epoch": 1.69, + "learning_rate": 4.6609912416014244e-05, + "loss": 0.0321, + "step": 261730 + }, + { + "epoch": 1.69, + "learning_rate": 4.660023106165732e-05, + "loss": 0.0251, + "step": 261740 + }, + { + "epoch": 1.69, + "learning_rate": 4.659054970730038e-05, + "loss": 0.0241, + "step": 261750 + }, + { + "epoch": 1.69, + "learning_rate": 4.6580868352943456e-05, + "loss": 0.027, + "step": 261760 + }, + { + "epoch": 1.69, + "learning_rate": 4.6571186998586515e-05, + "loss": 0.0228, + "step": 261770 + }, + { + "epoch": 1.69, + "learning_rate": 4.656150564422958e-05, + "loss": 0.0266, + "step": 261780 + }, + { + "epoch": 1.69, + "learning_rate": 4.6551824289872655e-05, + "loss": 0.0249, + "step": 261790 + }, + { + "epoch": 1.69, + "learning_rate": 4.654214293551572e-05, + "loss": 0.0235, + "step": 261800 + }, + { + "epoch": 1.69, + "learning_rate": 4.6532461581158794e-05, + "loss": 0.0236, + "step": 261810 + }, + { + "epoch": 1.69, + "learning_rate": 4.6522780226801853e-05, + "loss": 0.0263, + "step": 261820 + }, + { + "epoch": 1.69, + "learning_rate": 4.6513098872444926e-05, + "loss": 0.021, + "step": 261830 + }, + { + "epoch": 1.69, + "learning_rate": 4.650341751808799e-05, + "loss": 0.0234, + "step": 261840 + }, + { + "epoch": 1.69, + "learning_rate": 4.649373616373106e-05, + "loss": 0.0247, + "step": 261850 + }, + { + "epoch": 1.69, + "learning_rate": 4.648405480937413e-05, + "loss": 0.0272, + "step": 261860 + }, + { + "epoch": 1.69, + "learning_rate": 4.647437345501719e-05, + "loss": 0.0306, + "step": 261870 + }, + { + "epoch": 1.69, + "learning_rate": 4.6464692100660264e-05, + "loss": 0.0244, + "step": 261880 + }, + { + "epoch": 1.69, + "learning_rate": 4.645501074630333e-05, + "loss": 0.0208, + "step": 261890 + }, + { + "epoch": 1.69, + "learning_rate": 4.6445329391946404e-05, + "loss": 0.0235, + "step": 261900 + }, + { + "epoch": 1.69, + "learning_rate": 4.643564803758947e-05, + "loss": 0.0287, + "step": 261910 + }, + { + "epoch": 1.69, + "learning_rate": 4.642596668323253e-05, + "loss": 0.0271, + "step": 261920 + }, + { + "epoch": 1.69, + "learning_rate": 4.64162853288756e-05, + "loss": 0.0216, + "step": 261930 + }, + { + "epoch": 1.69, + "learning_rate": 4.640660397451867e-05, + "loss": 0.0293, + "step": 261940 + }, + { + "epoch": 1.69, + "learning_rate": 4.639692262016174e-05, + "loss": 0.0269, + "step": 261950 + }, + { + "epoch": 1.69, + "learning_rate": 4.638724126580481e-05, + "loss": 0.0255, + "step": 261960 + }, + { + "epoch": 1.69, + "learning_rate": 4.637755991144788e-05, + "loss": 0.0223, + "step": 261970 + }, + { + "epoch": 1.69, + "learning_rate": 4.636787855709094e-05, + "loss": 0.0286, + "step": 261980 + }, + { + "epoch": 1.69, + "learning_rate": 4.635819720273401e-05, + "loss": 0.026, + "step": 261990 + }, + { + "epoch": 1.69, + "learning_rate": 4.634851584837708e-05, + "loss": 0.0253, + "step": 262000 + }, + { + "epoch": 1.69, + "eval_cer": 0.9198499604564456, + "eval_loss": 0.018117111176252365, + "eval_runtime": 120.1178, + "eval_samples_per_second": 16.65, + "eval_steps_per_second": 4.163, + "step": 262000 + }, + { + "epoch": 1.69, + "learning_rate": 4.6338834494020146e-05, + "loss": 0.0266, + "step": 262010 + }, + { + "epoch": 1.69, + "learning_rate": 4.632915313966322e-05, + "loss": 0.0256, + "step": 262020 + }, + { + "epoch": 1.69, + "learning_rate": 4.631947178530628e-05, + "loss": 0.0262, + "step": 262030 + }, + { + "epoch": 1.69, + "learning_rate": 4.630979043094935e-05, + "loss": 0.027, + "step": 262040 + }, + { + "epoch": 1.69, + "learning_rate": 4.630010907659242e-05, + "loss": 0.0222, + "step": 262050 + }, + { + "epoch": 1.69, + "learning_rate": 4.6290427722235484e-05, + "loss": 0.0248, + "step": 262060 + }, + { + "epoch": 1.69, + "learning_rate": 4.628074636787856e-05, + "loss": 0.0236, + "step": 262070 + }, + { + "epoch": 1.69, + "learning_rate": 4.6271065013521616e-05, + "loss": 0.0251, + "step": 262080 + }, + { + "epoch": 1.69, + "learning_rate": 4.626138365916469e-05, + "loss": 0.0252, + "step": 262090 + }, + { + "epoch": 1.69, + "learning_rate": 4.6251702304807756e-05, + "loss": 0.0216, + "step": 262100 + }, + { + "epoch": 1.69, + "learning_rate": 4.624202095045083e-05, + "loss": 0.0248, + "step": 262110 + }, + { + "epoch": 1.69, + "learning_rate": 4.6232339596093895e-05, + "loss": 0.0227, + "step": 262120 + }, + { + "epoch": 1.69, + "learning_rate": 4.6222658241736954e-05, + "loss": 0.0279, + "step": 262130 + }, + { + "epoch": 1.69, + "learning_rate": 4.621297688738003e-05, + "loss": 0.0247, + "step": 262140 + }, + { + "epoch": 1.69, + "learning_rate": 4.6203295533023094e-05, + "loss": 0.0248, + "step": 262150 + }, + { + "epoch": 1.69, + "learning_rate": 4.6193614178666167e-05, + "loss": 0.0263, + "step": 262160 + }, + { + "epoch": 1.69, + "learning_rate": 4.618393282430923e-05, + "loss": 0.0225, + "step": 262170 + }, + { + "epoch": 1.69, + "learning_rate": 4.6174251469952306e-05, + "loss": 0.0214, + "step": 262180 + }, + { + "epoch": 1.69, + "learning_rate": 4.6164570115595365e-05, + "loss": 0.0259, + "step": 262190 + }, + { + "epoch": 1.69, + "learning_rate": 4.615488876123843e-05, + "loss": 0.0313, + "step": 262200 + }, + { + "epoch": 1.69, + "learning_rate": 4.6145207406881505e-05, + "loss": 0.0223, + "step": 262210 + }, + { + "epoch": 1.69, + "learning_rate": 4.613552605252457e-05, + "loss": 0.0242, + "step": 262220 + }, + { + "epoch": 1.69, + "learning_rate": 4.6125844698167644e-05, + "loss": 0.0224, + "step": 262230 + }, + { + "epoch": 1.69, + "learning_rate": 4.61161633438107e-05, + "loss": 0.0232, + "step": 262240 + }, + { + "epoch": 1.69, + "learning_rate": 4.6106481989453776e-05, + "loss": 0.029, + "step": 262250 + }, + { + "epoch": 1.69, + "learning_rate": 4.609680063509684e-05, + "loss": 0.0205, + "step": 262260 + }, + { + "epoch": 1.69, + "learning_rate": 4.608711928073991e-05, + "loss": 0.0252, + "step": 262270 + }, + { + "epoch": 1.69, + "learning_rate": 4.607743792638298e-05, + "loss": 0.0243, + "step": 262280 + }, + { + "epoch": 1.69, + "learning_rate": 4.606775657202604e-05, + "loss": 0.0242, + "step": 262290 + }, + { + "epoch": 1.69, + "learning_rate": 4.6058075217669114e-05, + "loss": 0.0278, + "step": 262300 + }, + { + "epoch": 1.69, + "learning_rate": 4.604839386331218e-05, + "loss": 0.0243, + "step": 262310 + }, + { + "epoch": 1.69, + "learning_rate": 4.6038712508955254e-05, + "loss": 0.0265, + "step": 262320 + }, + { + "epoch": 1.69, + "learning_rate": 4.602903115459832e-05, + "loss": 0.0239, + "step": 262330 + }, + { + "epoch": 1.69, + "learning_rate": 4.601934980024138e-05, + "loss": 0.0205, + "step": 262340 + }, + { + "epoch": 1.69, + "learning_rate": 4.600966844588445e-05, + "loss": 0.019, + "step": 262350 + }, + { + "epoch": 1.69, + "learning_rate": 4.599998709152752e-05, + "loss": 0.0271, + "step": 262360 + }, + { + "epoch": 1.69, + "learning_rate": 4.599030573717059e-05, + "loss": 0.0227, + "step": 262370 + }, + { + "epoch": 1.69, + "learning_rate": 4.598062438281366e-05, + "loss": 0.0204, + "step": 262380 + }, + { + "epoch": 1.69, + "learning_rate": 4.597094302845673e-05, + "loss": 0.026, + "step": 262390 + }, + { + "epoch": 1.69, + "learning_rate": 4.596126167409979e-05, + "loss": 0.0242, + "step": 262400 + }, + { + "epoch": 1.69, + "learning_rate": 4.5951580319742856e-05, + "loss": 0.0271, + "step": 262410 + }, + { + "epoch": 1.69, + "learning_rate": 4.594189896538593e-05, + "loss": 0.0277, + "step": 262420 + }, + { + "epoch": 1.69, + "learning_rate": 4.5932217611028996e-05, + "loss": 0.0297, + "step": 262430 + }, + { + "epoch": 1.69, + "learning_rate": 4.592253625667207e-05, + "loss": 0.0233, + "step": 262440 + }, + { + "epoch": 1.69, + "learning_rate": 4.591285490231513e-05, + "loss": 0.0213, + "step": 262450 + }, + { + "epoch": 1.69, + "learning_rate": 4.59031735479582e-05, + "loss": 0.0269, + "step": 262460 + }, + { + "epoch": 1.69, + "learning_rate": 4.589349219360127e-05, + "loss": 0.0266, + "step": 262470 + }, + { + "epoch": 1.69, + "learning_rate": 4.5883810839244334e-05, + "loss": 0.024, + "step": 262480 + }, + { + "epoch": 1.69, + "learning_rate": 4.587412948488741e-05, + "loss": 0.036, + "step": 262490 + }, + { + "epoch": 1.69, + "learning_rate": 4.5864448130530466e-05, + "loss": 0.0239, + "step": 262500 + }, + { + "epoch": 1.69, + "learning_rate": 4.585476677617354e-05, + "loss": 0.022, + "step": 262510 + }, + { + "epoch": 1.69, + "learning_rate": 4.5845085421816605e-05, + "loss": 0.0194, + "step": 262520 + }, + { + "epoch": 1.69, + "learning_rate": 4.583540406745968e-05, + "loss": 0.0249, + "step": 262530 + }, + { + "epoch": 1.69, + "learning_rate": 4.5825722713102745e-05, + "loss": 0.022, + "step": 262540 + }, + { + "epoch": 1.69, + "learning_rate": 4.5816041358745804e-05, + "loss": 0.0263, + "step": 262550 + }, + { + "epoch": 1.69, + "learning_rate": 4.580636000438888e-05, + "loss": 0.0241, + "step": 262560 + }, + { + "epoch": 1.69, + "learning_rate": 4.579667865003194e-05, + "loss": 0.0268, + "step": 262570 + }, + { + "epoch": 1.69, + "learning_rate": 4.5786997295675016e-05, + "loss": 0.029, + "step": 262580 + }, + { + "epoch": 1.69, + "learning_rate": 4.577731594131808e-05, + "loss": 0.0226, + "step": 262590 + }, + { + "epoch": 1.69, + "learning_rate": 4.576763458696114e-05, + "loss": 0.0292, + "step": 262600 + }, + { + "epoch": 1.69, + "learning_rate": 4.5757953232604215e-05, + "loss": 0.0278, + "step": 262610 + }, + { + "epoch": 1.7, + "learning_rate": 4.574827187824728e-05, + "loss": 0.0263, + "step": 262620 + }, + { + "epoch": 1.7, + "learning_rate": 4.5738590523890354e-05, + "loss": 0.0224, + "step": 262630 + }, + { + "epoch": 1.7, + "learning_rate": 4.572890916953342e-05, + "loss": 0.022, + "step": 262640 + }, + { + "epoch": 1.7, + "learning_rate": 4.571922781517649e-05, + "loss": 0.0252, + "step": 262650 + }, + { + "epoch": 1.7, + "learning_rate": 4.570954646081955e-05, + "loss": 0.0262, + "step": 262660 + }, + { + "epoch": 1.7, + "learning_rate": 4.569986510646262e-05, + "loss": 0.0214, + "step": 262670 + }, + { + "epoch": 1.7, + "learning_rate": 4.569018375210569e-05, + "loss": 0.0205, + "step": 262680 + }, + { + "epoch": 1.7, + "learning_rate": 4.568050239774876e-05, + "loss": 0.0263, + "step": 262690 + }, + { + "epoch": 1.7, + "learning_rate": 4.5670821043391825e-05, + "loss": 0.0234, + "step": 262700 + }, + { + "epoch": 1.7, + "learning_rate": 4.566113968903489e-05, + "loss": 0.026, + "step": 262710 + }, + { + "epoch": 1.7, + "learning_rate": 4.5651458334677964e-05, + "loss": 0.0239, + "step": 262720 + }, + { + "epoch": 1.7, + "learning_rate": 4.564177698032103e-05, + "loss": 0.021, + "step": 262730 + }, + { + "epoch": 1.7, + "learning_rate": 4.5632095625964097e-05, + "loss": 0.0267, + "step": 262740 + }, + { + "epoch": 1.7, + "learning_rate": 4.562241427160716e-05, + "loss": 0.0247, + "step": 262750 + }, + { + "epoch": 1.7, + "learning_rate": 4.561273291725023e-05, + "loss": 0.0239, + "step": 262760 + }, + { + "epoch": 1.7, + "learning_rate": 4.56030515628933e-05, + "loss": 0.0233, + "step": 262770 + }, + { + "epoch": 1.7, + "learning_rate": 4.559337020853637e-05, + "loss": 0.0308, + "step": 262780 + }, + { + "epoch": 1.7, + "learning_rate": 4.558368885417944e-05, + "loss": 0.0232, + "step": 262790 + }, + { + "epoch": 1.7, + "learning_rate": 4.55740074998225e-05, + "loss": 0.029, + "step": 262800 + }, + { + "epoch": 1.7, + "learning_rate": 4.556432614546557e-05, + "loss": 0.0323, + "step": 262810 + }, + { + "epoch": 1.7, + "learning_rate": 4.555464479110864e-05, + "loss": 0.0262, + "step": 262820 + }, + { + "epoch": 1.7, + "learning_rate": 4.5544963436751706e-05, + "loss": 0.0236, + "step": 262830 + }, + { + "epoch": 1.7, + "learning_rate": 4.553528208239478e-05, + "loss": 0.0197, + "step": 262840 + }, + { + "epoch": 1.7, + "learning_rate": 4.552560072803784e-05, + "loss": 0.0265, + "step": 262850 + }, + { + "epoch": 1.7, + "learning_rate": 4.551591937368091e-05, + "loss": 0.0235, + "step": 262860 + }, + { + "epoch": 1.7, + "learning_rate": 4.550623801932398e-05, + "loss": 0.0236, + "step": 262870 + }, + { + "epoch": 1.7, + "learning_rate": 4.5496556664967044e-05, + "loss": 0.0209, + "step": 262880 + }, + { + "epoch": 1.7, + "learning_rate": 4.548687531061012e-05, + "loss": 0.0257, + "step": 262890 + }, + { + "epoch": 1.7, + "learning_rate": 4.547719395625318e-05, + "loss": 0.0253, + "step": 262900 + }, + { + "epoch": 1.7, + "learning_rate": 4.546751260189625e-05, + "loss": 0.0265, + "step": 262910 + }, + { + "epoch": 1.7, + "learning_rate": 4.5457831247539316e-05, + "loss": 0.0237, + "step": 262920 + }, + { + "epoch": 1.7, + "learning_rate": 4.544814989318239e-05, + "loss": 0.0254, + "step": 262930 + }, + { + "epoch": 1.7, + "learning_rate": 4.5438468538825455e-05, + "loss": 0.0326, + "step": 262940 + }, + { + "epoch": 1.7, + "learning_rate": 4.542878718446852e-05, + "loss": 0.0304, + "step": 262950 + }, + { + "epoch": 1.7, + "learning_rate": 4.541910583011159e-05, + "loss": 0.0236, + "step": 262960 + }, + { + "epoch": 1.7, + "learning_rate": 4.5409424475754654e-05, + "loss": 0.0271, + "step": 262970 + }, + { + "epoch": 1.7, + "learning_rate": 4.539974312139773e-05, + "loss": 0.0261, + "step": 262980 + }, + { + "epoch": 1.7, + "learning_rate": 4.539006176704079e-05, + "loss": 0.027, + "step": 262990 + }, + { + "epoch": 1.7, + "learning_rate": 4.5380380412683866e-05, + "loss": 0.0221, + "step": 263000 + }, + { + "epoch": 1.7, + "eval_cer": 0.9198345949610214, + "eval_loss": 0.018028145655989647, + "eval_runtime": 120.064, + "eval_samples_per_second": 16.658, + "eval_steps_per_second": 4.164, + "step": 263000 + }, + { + "epoch": 1.7, + "learning_rate": 4.5370699058326926e-05, + "loss": 0.0251, + "step": 263010 + }, + { + "epoch": 1.7, + "learning_rate": 4.536101770396999e-05, + "loss": 0.0274, + "step": 263020 + }, + { + "epoch": 1.7, + "learning_rate": 4.5351336349613065e-05, + "loss": 0.0202, + "step": 263030 + }, + { + "epoch": 1.7, + "learning_rate": 4.534165499525613e-05, + "loss": 0.0232, + "step": 263040 + }, + { + "epoch": 1.7, + "learning_rate": 4.5331973640899204e-05, + "loss": 0.0253, + "step": 263050 + }, + { + "epoch": 1.7, + "learning_rate": 4.5322292286542264e-05, + "loss": 0.0236, + "step": 263060 + }, + { + "epoch": 1.7, + "learning_rate": 4.531261093218534e-05, + "loss": 0.0263, + "step": 263070 + }, + { + "epoch": 1.7, + "learning_rate": 4.53029295778284e-05, + "loss": 0.0239, + "step": 263080 + }, + { + "epoch": 1.7, + "learning_rate": 4.529324822347147e-05, + "loss": 0.0228, + "step": 263090 + }, + { + "epoch": 1.7, + "learning_rate": 4.528356686911454e-05, + "loss": 0.0256, + "step": 263100 + }, + { + "epoch": 1.7, + "learning_rate": 4.52738855147576e-05, + "loss": 0.025, + "step": 263110 + }, + { + "epoch": 1.7, + "learning_rate": 4.5264204160400675e-05, + "loss": 0.027, + "step": 263120 + }, + { + "epoch": 1.7, + "learning_rate": 4.525452280604374e-05, + "loss": 0.0267, + "step": 263130 + }, + { + "epoch": 1.7, + "learning_rate": 4.5244841451686814e-05, + "loss": 0.0283, + "step": 263140 + }, + { + "epoch": 1.7, + "learning_rate": 4.523516009732988e-05, + "loss": 0.0278, + "step": 263150 + }, + { + "epoch": 1.7, + "learning_rate": 4.522547874297294e-05, + "loss": 0.0275, + "step": 263160 + }, + { + "epoch": 1.7, + "learning_rate": 4.521579738861601e-05, + "loss": 0.0202, + "step": 263170 + }, + { + "epoch": 1.7, + "learning_rate": 4.520611603425908e-05, + "loss": 0.0275, + "step": 263180 + }, + { + "epoch": 1.7, + "learning_rate": 4.519643467990215e-05, + "loss": 0.0259, + "step": 263190 + }, + { + "epoch": 1.7, + "learning_rate": 4.518675332554522e-05, + "loss": 0.0273, + "step": 263200 + }, + { + "epoch": 1.7, + "learning_rate": 4.517707197118829e-05, + "loss": 0.0271, + "step": 263210 + }, + { + "epoch": 1.7, + "learning_rate": 4.516739061683135e-05, + "loss": 0.0214, + "step": 263220 + }, + { + "epoch": 1.7, + "learning_rate": 4.515770926247442e-05, + "loss": 0.027, + "step": 263230 + }, + { + "epoch": 1.7, + "learning_rate": 4.514802790811749e-05, + "loss": 0.0262, + "step": 263240 + }, + { + "epoch": 1.7, + "learning_rate": 4.5138346553760556e-05, + "loss": 0.0253, + "step": 263250 + }, + { + "epoch": 1.7, + "learning_rate": 4.512866519940363e-05, + "loss": 0.0201, + "step": 263260 + }, + { + "epoch": 1.7, + "learning_rate": 4.511898384504669e-05, + "loss": 0.0281, + "step": 263270 + }, + { + "epoch": 1.7, + "learning_rate": 4.510930249068976e-05, + "loss": 0.0262, + "step": 263280 + }, + { + "epoch": 1.7, + "learning_rate": 4.509962113633283e-05, + "loss": 0.0228, + "step": 263290 + }, + { + "epoch": 1.7, + "learning_rate": 4.5089939781975894e-05, + "loss": 0.0293, + "step": 263300 + }, + { + "epoch": 1.7, + "learning_rate": 4.508025842761897e-05, + "loss": 0.0234, + "step": 263310 + }, + { + "epoch": 1.7, + "learning_rate": 4.5070577073262027e-05, + "loss": 0.0295, + "step": 263320 + }, + { + "epoch": 1.7, + "learning_rate": 4.50608957189051e-05, + "loss": 0.0273, + "step": 263330 + }, + { + "epoch": 1.7, + "learning_rate": 4.5051214364548166e-05, + "loss": 0.0231, + "step": 263340 + }, + { + "epoch": 1.7, + "learning_rate": 4.504153301019124e-05, + "loss": 0.0236, + "step": 263350 + }, + { + "epoch": 1.7, + "learning_rate": 4.5031851655834305e-05, + "loss": 0.0254, + "step": 263360 + }, + { + "epoch": 1.7, + "learning_rate": 4.5022170301477364e-05, + "loss": 0.0255, + "step": 263370 + }, + { + "epoch": 1.7, + "learning_rate": 4.501248894712044e-05, + "loss": 0.022, + "step": 263380 + }, + { + "epoch": 1.7, + "learning_rate": 4.5002807592763504e-05, + "loss": 0.0267, + "step": 263390 + }, + { + "epoch": 1.7, + "learning_rate": 4.499312623840658e-05, + "loss": 0.0256, + "step": 263400 + }, + { + "epoch": 1.7, + "learning_rate": 4.498344488404964e-05, + "loss": 0.028, + "step": 263410 + }, + { + "epoch": 1.7, + "learning_rate": 4.4973763529692716e-05, + "loss": 0.0282, + "step": 263420 + }, + { + "epoch": 1.7, + "learning_rate": 4.4964082175335775e-05, + "loss": 0.0244, + "step": 263430 + }, + { + "epoch": 1.7, + "learning_rate": 4.495440082097884e-05, + "loss": 0.0263, + "step": 263440 + }, + { + "epoch": 1.7, + "learning_rate": 4.4944719466621915e-05, + "loss": 0.0243, + "step": 263450 + }, + { + "epoch": 1.7, + "learning_rate": 4.493503811226498e-05, + "loss": 0.024, + "step": 263460 + }, + { + "epoch": 1.7, + "learning_rate": 4.4925356757908054e-05, + "loss": 0.0237, + "step": 263470 + }, + { + "epoch": 1.7, + "learning_rate": 4.4915675403551113e-05, + "loss": 0.0261, + "step": 263480 + }, + { + "epoch": 1.7, + "learning_rate": 4.4905994049194186e-05, + "loss": 0.0316, + "step": 263490 + }, + { + "epoch": 1.7, + "learning_rate": 4.489631269483725e-05, + "loss": 0.0239, + "step": 263500 + }, + { + "epoch": 1.7, + "learning_rate": 4.488663134048032e-05, + "loss": 0.0214, + "step": 263510 + }, + { + "epoch": 1.7, + "learning_rate": 4.487694998612339e-05, + "loss": 0.0223, + "step": 263520 + }, + { + "epoch": 1.7, + "learning_rate": 4.486726863176645e-05, + "loss": 0.0248, + "step": 263530 + }, + { + "epoch": 1.7, + "learning_rate": 4.4857587277409524e-05, + "loss": 0.0253, + "step": 263540 + }, + { + "epoch": 1.7, + "learning_rate": 4.484790592305259e-05, + "loss": 0.0244, + "step": 263550 + }, + { + "epoch": 1.7, + "learning_rate": 4.4838224568695664e-05, + "loss": 0.026, + "step": 263560 + }, + { + "epoch": 1.7, + "learning_rate": 4.482854321433873e-05, + "loss": 0.0229, + "step": 263570 + }, + { + "epoch": 1.7, + "learning_rate": 4.481886185998179e-05, + "loss": 0.0211, + "step": 263580 + }, + { + "epoch": 1.7, + "learning_rate": 4.480918050562486e-05, + "loss": 0.0245, + "step": 263590 + }, + { + "epoch": 1.7, + "learning_rate": 4.479949915126793e-05, + "loss": 0.0215, + "step": 263600 + }, + { + "epoch": 1.7, + "learning_rate": 4.4789817796911e-05, + "loss": 0.0235, + "step": 263610 + }, + { + "epoch": 1.7, + "learning_rate": 4.478013644255407e-05, + "loss": 0.0251, + "step": 263620 + }, + { + "epoch": 1.7, + "learning_rate": 4.477045508819714e-05, + "loss": 0.0297, + "step": 263630 + }, + { + "epoch": 1.7, + "learning_rate": 4.47607737338402e-05, + "loss": 0.0249, + "step": 263640 + }, + { + "epoch": 1.7, + "learning_rate": 4.4751092379483267e-05, + "loss": 0.0305, + "step": 263650 + }, + { + "epoch": 1.7, + "learning_rate": 4.474141102512634e-05, + "loss": 0.0243, + "step": 263660 + }, + { + "epoch": 1.7, + "learning_rate": 4.4731729670769406e-05, + "loss": 0.0225, + "step": 263670 + }, + { + "epoch": 1.7, + "learning_rate": 4.472204831641248e-05, + "loss": 0.0205, + "step": 263680 + }, + { + "epoch": 1.7, + "learning_rate": 4.471236696205554e-05, + "loss": 0.0315, + "step": 263690 + }, + { + "epoch": 1.7, + "learning_rate": 4.470268560769861e-05, + "loss": 0.0242, + "step": 263700 + }, + { + "epoch": 1.7, + "learning_rate": 4.469300425334168e-05, + "loss": 0.0213, + "step": 263710 + }, + { + "epoch": 1.7, + "learning_rate": 4.4683322898984744e-05, + "loss": 0.0243, + "step": 263720 + }, + { + "epoch": 1.7, + "learning_rate": 4.467364154462782e-05, + "loss": 0.0212, + "step": 263730 + }, + { + "epoch": 1.7, + "learning_rate": 4.4663960190270876e-05, + "loss": 0.0268, + "step": 263740 + }, + { + "epoch": 1.7, + "learning_rate": 4.465427883591395e-05, + "loss": 0.023, + "step": 263750 + }, + { + "epoch": 1.7, + "learning_rate": 4.4644597481557016e-05, + "loss": 0.0248, + "step": 263760 + }, + { + "epoch": 1.7, + "learning_rate": 4.463491612720009e-05, + "loss": 0.0237, + "step": 263770 + }, + { + "epoch": 1.7, + "learning_rate": 4.4625234772843155e-05, + "loss": 0.0257, + "step": 263780 + }, + { + "epoch": 1.7, + "learning_rate": 4.4615553418486214e-05, + "loss": 0.0209, + "step": 263790 + }, + { + "epoch": 1.7, + "learning_rate": 4.460587206412929e-05, + "loss": 0.0283, + "step": 263800 + }, + { + "epoch": 1.7, + "learning_rate": 4.4596190709772354e-05, + "loss": 0.0213, + "step": 263810 + }, + { + "epoch": 1.7, + "learning_rate": 4.4586509355415427e-05, + "loss": 0.0241, + "step": 263820 + }, + { + "epoch": 1.7, + "learning_rate": 4.457682800105849e-05, + "loss": 0.0241, + "step": 263830 + }, + { + "epoch": 1.7, + "learning_rate": 4.4567146646701566e-05, + "loss": 0.0247, + "step": 263840 + }, + { + "epoch": 1.7, + "learning_rate": 4.4557465292344625e-05, + "loss": 0.0199, + "step": 263850 + }, + { + "epoch": 1.7, + "learning_rate": 4.454778393798769e-05, + "loss": 0.0223, + "step": 263860 + }, + { + "epoch": 1.7, + "learning_rate": 4.4538102583630765e-05, + "loss": 0.0197, + "step": 263870 + }, + { + "epoch": 1.7, + "learning_rate": 4.452842122927383e-05, + "loss": 0.0223, + "step": 263880 + }, + { + "epoch": 1.7, + "learning_rate": 4.4518739874916904e-05, + "loss": 0.0225, + "step": 263890 + }, + { + "epoch": 1.7, + "learning_rate": 4.450905852055996e-05, + "loss": 0.0207, + "step": 263900 + }, + { + "epoch": 1.7, + "learning_rate": 4.4499377166203036e-05, + "loss": 0.0226, + "step": 263910 + }, + { + "epoch": 1.7, + "learning_rate": 4.44896958118461e-05, + "loss": 0.0219, + "step": 263920 + }, + { + "epoch": 1.7, + "learning_rate": 4.448001445748917e-05, + "loss": 0.0193, + "step": 263930 + }, + { + "epoch": 1.7, + "learning_rate": 4.447033310313224e-05, + "loss": 0.0266, + "step": 263940 + }, + { + "epoch": 1.7, + "learning_rate": 4.44606517487753e-05, + "loss": 0.0194, + "step": 263950 + }, + { + "epoch": 1.7, + "learning_rate": 4.4450970394418374e-05, + "loss": 0.0268, + "step": 263960 + }, + { + "epoch": 1.7, + "learning_rate": 4.444128904006144e-05, + "loss": 0.0301, + "step": 263970 + }, + { + "epoch": 1.7, + "learning_rate": 4.4431607685704513e-05, + "loss": 0.0208, + "step": 263980 + }, + { + "epoch": 1.7, + "learning_rate": 4.442192633134758e-05, + "loss": 0.0207, + "step": 263990 + }, + { + "epoch": 1.7, + "learning_rate": 4.441224497699064e-05, + "loss": 0.0228, + "step": 264000 + }, + { + "epoch": 1.7, + "eval_cer": 0.9198797875946221, + "eval_loss": 0.01815461367368698, + "eval_runtime": 120.0874, + "eval_samples_per_second": 16.655, + "eval_steps_per_second": 4.164, + "step": 264000 + }, + { + "epoch": 1.7, + "learning_rate": 4.440256362263371e-05, + "loss": 0.024, + "step": 264010 + }, + { + "epoch": 1.7, + "learning_rate": 4.439288226827678e-05, + "loss": 0.0251, + "step": 264020 + }, + { + "epoch": 1.7, + "learning_rate": 4.438320091391985e-05, + "loss": 0.0223, + "step": 264030 + }, + { + "epoch": 1.7, + "learning_rate": 4.437351955956292e-05, + "loss": 0.0225, + "step": 264040 + }, + { + "epoch": 1.7, + "learning_rate": 4.4363838205205984e-05, + "loss": 0.025, + "step": 264050 + }, + { + "epoch": 1.7, + "learning_rate": 4.435415685084905e-05, + "loss": 0.0219, + "step": 264060 + }, + { + "epoch": 1.7, + "learning_rate": 4.4344475496492116e-05, + "loss": 0.0256, + "step": 264070 + }, + { + "epoch": 1.7, + "learning_rate": 4.433479414213519e-05, + "loss": 0.0216, + "step": 264080 + }, + { + "epoch": 1.7, + "learning_rate": 4.4325112787778256e-05, + "loss": 0.0231, + "step": 264090 + }, + { + "epoch": 1.7, + "learning_rate": 4.431543143342132e-05, + "loss": 0.0198, + "step": 264100 + }, + { + "epoch": 1.7, + "learning_rate": 4.430575007906439e-05, + "loss": 0.0195, + "step": 264110 + }, + { + "epoch": 1.7, + "learning_rate": 4.429606872470746e-05, + "loss": 0.0259, + "step": 264120 + }, + { + "epoch": 1.7, + "learning_rate": 4.428638737035053e-05, + "loss": 0.024, + "step": 264130 + }, + { + "epoch": 1.7, + "learning_rate": 4.4276706015993594e-05, + "loss": 0.0262, + "step": 264140 + }, + { + "epoch": 1.7, + "learning_rate": 4.426702466163666e-05, + "loss": 0.022, + "step": 264150 + }, + { + "epoch": 1.7, + "learning_rate": 4.4257343307279726e-05, + "loss": 0.0241, + "step": 264160 + }, + { + "epoch": 1.71, + "learning_rate": 4.42476619529228e-05, + "loss": 0.0208, + "step": 264170 + }, + { + "epoch": 1.71, + "learning_rate": 4.4237980598565865e-05, + "loss": 0.0248, + "step": 264180 + }, + { + "epoch": 1.71, + "learning_rate": 4.422829924420894e-05, + "loss": 0.0246, + "step": 264190 + }, + { + "epoch": 1.71, + "learning_rate": 4.4218617889852e-05, + "loss": 0.0293, + "step": 264200 + }, + { + "epoch": 1.71, + "learning_rate": 4.4208936535495064e-05, + "loss": 0.0271, + "step": 264210 + }, + { + "epoch": 1.71, + "learning_rate": 4.419925518113814e-05, + "loss": 0.0206, + "step": 264220 + }, + { + "epoch": 1.71, + "learning_rate": 4.41895738267812e-05, + "loss": 0.0246, + "step": 264230 + }, + { + "epoch": 1.71, + "learning_rate": 4.4179892472424276e-05, + "loss": 0.0264, + "step": 264240 + }, + { + "epoch": 1.71, + "learning_rate": 4.4170211118067336e-05, + "loss": 0.022, + "step": 264250 + }, + { + "epoch": 1.71, + "learning_rate": 4.41605297637104e-05, + "loss": 0.0266, + "step": 264260 + }, + { + "epoch": 1.71, + "learning_rate": 4.4150848409353475e-05, + "loss": 0.025, + "step": 264270 + }, + { + "epoch": 1.71, + "learning_rate": 4.414116705499654e-05, + "loss": 0.0262, + "step": 264280 + }, + { + "epoch": 1.71, + "learning_rate": 4.4131485700639614e-05, + "loss": 0.0256, + "step": 264290 + }, + { + "epoch": 1.71, + "learning_rate": 4.4121804346282674e-05, + "loss": 0.0241, + "step": 264300 + }, + { + "epoch": 1.71, + "learning_rate": 4.411212299192575e-05, + "loss": 0.0264, + "step": 264310 + }, + { + "epoch": 1.71, + "learning_rate": 4.410244163756881e-05, + "loss": 0.0257, + "step": 264320 + }, + { + "epoch": 1.71, + "learning_rate": 4.409276028321188e-05, + "loss": 0.0235, + "step": 264330 + }, + { + "epoch": 1.71, + "learning_rate": 4.408307892885495e-05, + "loss": 0.0249, + "step": 264340 + }, + { + "epoch": 1.71, + "learning_rate": 4.407339757449801e-05, + "loss": 0.0226, + "step": 264350 + }, + { + "epoch": 1.71, + "learning_rate": 4.4063716220141085e-05, + "loss": 0.0245, + "step": 264360 + }, + { + "epoch": 1.71, + "learning_rate": 4.405403486578415e-05, + "loss": 0.0294, + "step": 264370 + }, + { + "epoch": 1.71, + "learning_rate": 4.4044353511427224e-05, + "loss": 0.0229, + "step": 264380 + }, + { + "epoch": 1.71, + "learning_rate": 4.403467215707029e-05, + "loss": 0.0252, + "step": 264390 + }, + { + "epoch": 1.71, + "learning_rate": 4.402499080271335e-05, + "loss": 0.025, + "step": 264400 + }, + { + "epoch": 1.71, + "learning_rate": 4.401530944835642e-05, + "loss": 0.0246, + "step": 264410 + }, + { + "epoch": 1.71, + "learning_rate": 4.400562809399949e-05, + "loss": 0.0235, + "step": 264420 + }, + { + "epoch": 1.71, + "learning_rate": 4.399594673964256e-05, + "loss": 0.0261, + "step": 264430 + }, + { + "epoch": 1.71, + "learning_rate": 4.398626538528563e-05, + "loss": 0.0275, + "step": 264440 + }, + { + "epoch": 1.71, + "learning_rate": 4.39765840309287e-05, + "loss": 0.0247, + "step": 264450 + }, + { + "epoch": 1.71, + "learning_rate": 4.396690267657176e-05, + "loss": 0.0229, + "step": 264460 + }, + { + "epoch": 1.71, + "learning_rate": 4.395722132221483e-05, + "loss": 0.0245, + "step": 264470 + }, + { + "epoch": 1.71, + "learning_rate": 4.39475399678579e-05, + "loss": 0.024, + "step": 264480 + }, + { + "epoch": 1.71, + "learning_rate": 4.3937858613500966e-05, + "loss": 0.0251, + "step": 264490 + }, + { + "epoch": 1.71, + "learning_rate": 4.392817725914404e-05, + "loss": 0.0235, + "step": 264500 + }, + { + "epoch": 1.71, + "learning_rate": 4.39184959047871e-05, + "loss": 0.023, + "step": 264510 + }, + { + "epoch": 1.71, + "learning_rate": 4.390881455043017e-05, + "loss": 0.0233, + "step": 264520 + }, + { + "epoch": 1.71, + "learning_rate": 4.389913319607324e-05, + "loss": 0.026, + "step": 264530 + }, + { + "epoch": 1.71, + "learning_rate": 4.3889451841716304e-05, + "loss": 0.0195, + "step": 264540 + }, + { + "epoch": 1.71, + "learning_rate": 4.387977048735938e-05, + "loss": 0.0224, + "step": 264550 + }, + { + "epoch": 1.71, + "learning_rate": 4.387008913300244e-05, + "loss": 0.0276, + "step": 264560 + }, + { + "epoch": 1.71, + "learning_rate": 4.386040777864551e-05, + "loss": 0.0199, + "step": 264570 + }, + { + "epoch": 1.71, + "learning_rate": 4.3850726424288576e-05, + "loss": 0.0247, + "step": 264580 + }, + { + "epoch": 1.71, + "learning_rate": 4.384104506993165e-05, + "loss": 0.0244, + "step": 264590 + }, + { + "epoch": 1.71, + "learning_rate": 4.3831363715574715e-05, + "loss": 0.0253, + "step": 264600 + }, + { + "epoch": 1.71, + "learning_rate": 4.3821682361217775e-05, + "loss": 0.0218, + "step": 264610 + }, + { + "epoch": 1.71, + "learning_rate": 4.381200100686085e-05, + "loss": 0.0231, + "step": 264620 + }, + { + "epoch": 1.71, + "learning_rate": 4.3802319652503914e-05, + "loss": 0.0281, + "step": 264630 + }, + { + "epoch": 1.71, + "learning_rate": 4.379263829814699e-05, + "loss": 0.0254, + "step": 264640 + }, + { + "epoch": 1.71, + "learning_rate": 4.378295694379005e-05, + "loss": 0.022, + "step": 264650 + }, + { + "epoch": 1.71, + "learning_rate": 4.3773275589433126e-05, + "loss": 0.028, + "step": 264660 + }, + { + "epoch": 1.71, + "learning_rate": 4.3763594235076186e-05, + "loss": 0.0219, + "step": 264670 + }, + { + "epoch": 1.71, + "learning_rate": 4.375391288071925e-05, + "loss": 0.025, + "step": 264680 + }, + { + "epoch": 1.71, + "learning_rate": 4.3744231526362325e-05, + "loss": 0.0285, + "step": 264690 + }, + { + "epoch": 1.71, + "learning_rate": 4.373455017200539e-05, + "loss": 0.023, + "step": 264700 + }, + { + "epoch": 1.71, + "learning_rate": 4.3724868817648464e-05, + "loss": 0.0234, + "step": 264710 + }, + { + "epoch": 1.71, + "learning_rate": 4.3715187463291524e-05, + "loss": 0.0245, + "step": 264720 + }, + { + "epoch": 1.71, + "learning_rate": 4.37055061089346e-05, + "loss": 0.0213, + "step": 264730 + }, + { + "epoch": 1.71, + "learning_rate": 4.369582475457766e-05, + "loss": 0.0228, + "step": 264740 + }, + { + "epoch": 1.71, + "learning_rate": 4.368614340022073e-05, + "loss": 0.0252, + "step": 264750 + }, + { + "epoch": 1.71, + "learning_rate": 4.36764620458638e-05, + "loss": 0.0201, + "step": 264760 + }, + { + "epoch": 1.71, + "learning_rate": 4.366678069150686e-05, + "loss": 0.0198, + "step": 264770 + }, + { + "epoch": 1.71, + "learning_rate": 4.3657099337149935e-05, + "loss": 0.028, + "step": 264780 + }, + { + "epoch": 1.71, + "learning_rate": 4.3647417982793e-05, + "loss": 0.0224, + "step": 264790 + }, + { + "epoch": 1.71, + "learning_rate": 4.3637736628436074e-05, + "loss": 0.0264, + "step": 264800 + }, + { + "epoch": 1.71, + "learning_rate": 4.362805527407914e-05, + "loss": 0.0201, + "step": 264810 + }, + { + "epoch": 1.71, + "learning_rate": 4.36183739197222e-05, + "loss": 0.0208, + "step": 264820 + }, + { + "epoch": 1.71, + "learning_rate": 4.360869256536527e-05, + "loss": 0.0259, + "step": 264830 + }, + { + "epoch": 1.71, + "learning_rate": 4.359901121100834e-05, + "loss": 0.0214, + "step": 264840 + }, + { + "epoch": 1.71, + "learning_rate": 4.358932985665141e-05, + "loss": 0.0228, + "step": 264850 + }, + { + "epoch": 1.71, + "learning_rate": 4.357964850229448e-05, + "loss": 0.0249, + "step": 264860 + }, + { + "epoch": 1.71, + "learning_rate": 4.356996714793755e-05, + "loss": 0.0225, + "step": 264870 + }, + { + "epoch": 1.71, + "learning_rate": 4.356028579358061e-05, + "loss": 0.0281, + "step": 264880 + }, + { + "epoch": 1.71, + "learning_rate": 4.355060443922368e-05, + "loss": 0.0195, + "step": 264890 + }, + { + "epoch": 1.71, + "learning_rate": 4.354092308486675e-05, + "loss": 0.0258, + "step": 264900 + }, + { + "epoch": 1.71, + "learning_rate": 4.3531241730509816e-05, + "loss": 0.0251, + "step": 264910 + }, + { + "epoch": 1.71, + "learning_rate": 4.352156037615289e-05, + "loss": 0.0218, + "step": 264920 + }, + { + "epoch": 1.71, + "learning_rate": 4.351187902179595e-05, + "loss": 0.025, + "step": 264930 + }, + { + "epoch": 1.71, + "learning_rate": 4.350219766743902e-05, + "loss": 0.0327, + "step": 264940 + }, + { + "epoch": 1.71, + "learning_rate": 4.349251631308209e-05, + "loss": 0.0228, + "step": 264950 + }, + { + "epoch": 1.71, + "learning_rate": 4.3482834958725154e-05, + "loss": 0.0219, + "step": 264960 + }, + { + "epoch": 1.71, + "learning_rate": 4.347315360436823e-05, + "loss": 0.0227, + "step": 264970 + }, + { + "epoch": 1.71, + "learning_rate": 4.3463472250011286e-05, + "loss": 0.0253, + "step": 264980 + }, + { + "epoch": 1.71, + "learning_rate": 4.345379089565436e-05, + "loss": 0.0188, + "step": 264990 + }, + { + "epoch": 1.71, + "learning_rate": 4.3444109541297426e-05, + "loss": 0.0209, + "step": 265000 + }, + { + "epoch": 1.71, + "eval_cer": 0.9198490566037736, + "eval_loss": 0.01810065098106861, + "eval_runtime": 120.1229, + "eval_samples_per_second": 16.65, + "eval_steps_per_second": 4.162, + "step": 265000 + }, + { + "epoch": 1.71, + "learning_rate": 4.34344281869405e-05, + "loss": 0.0271, + "step": 265010 + }, + { + "epoch": 1.71, + "learning_rate": 4.3424746832583565e-05, + "loss": 0.0219, + "step": 265020 + }, + { + "epoch": 1.71, + "learning_rate": 4.3415065478226624e-05, + "loss": 0.023, + "step": 265030 + }, + { + "epoch": 1.71, + "learning_rate": 4.34053841238697e-05, + "loss": 0.025, + "step": 265040 + }, + { + "epoch": 1.71, + "learning_rate": 4.3395702769512764e-05, + "loss": 0.0251, + "step": 265050 + }, + { + "epoch": 1.71, + "learning_rate": 4.338602141515584e-05, + "loss": 0.0246, + "step": 265060 + }, + { + "epoch": 1.71, + "learning_rate": 4.33763400607989e-05, + "loss": 0.0183, + "step": 265070 + }, + { + "epoch": 1.71, + "learning_rate": 4.3366658706441976e-05, + "loss": 0.0234, + "step": 265080 + }, + { + "epoch": 1.71, + "learning_rate": 4.3356977352085035e-05, + "loss": 0.0269, + "step": 265090 + }, + { + "epoch": 1.71, + "learning_rate": 4.33472959977281e-05, + "loss": 0.0266, + "step": 265100 + }, + { + "epoch": 1.71, + "learning_rate": 4.3337614643371175e-05, + "loss": 0.0239, + "step": 265110 + }, + { + "epoch": 1.71, + "learning_rate": 4.332793328901424e-05, + "loss": 0.0254, + "step": 265120 + }, + { + "epoch": 1.71, + "learning_rate": 4.3318251934657314e-05, + "loss": 0.025, + "step": 265130 + }, + { + "epoch": 1.71, + "learning_rate": 4.3308570580300373e-05, + "loss": 0.0273, + "step": 265140 + }, + { + "epoch": 1.71, + "learning_rate": 4.3298889225943446e-05, + "loss": 0.0241, + "step": 265150 + }, + { + "epoch": 1.71, + "learning_rate": 4.328920787158651e-05, + "loss": 0.0256, + "step": 265160 + }, + { + "epoch": 1.71, + "learning_rate": 4.327952651722958e-05, + "loss": 0.0199, + "step": 265170 + }, + { + "epoch": 1.71, + "learning_rate": 4.326984516287265e-05, + "loss": 0.0198, + "step": 265180 + }, + { + "epoch": 1.71, + "learning_rate": 4.326016380851571e-05, + "loss": 0.026, + "step": 265190 + }, + { + "epoch": 1.71, + "learning_rate": 4.3250482454158784e-05, + "loss": 0.0249, + "step": 265200 + }, + { + "epoch": 1.71, + "learning_rate": 4.324080109980185e-05, + "loss": 0.0226, + "step": 265210 + }, + { + "epoch": 1.71, + "learning_rate": 4.3231119745444924e-05, + "loss": 0.0243, + "step": 265220 + }, + { + "epoch": 1.71, + "learning_rate": 4.322143839108799e-05, + "loss": 0.0259, + "step": 265230 + }, + { + "epoch": 1.71, + "learning_rate": 4.321175703673105e-05, + "loss": 0.0205, + "step": 265240 + }, + { + "epoch": 1.71, + "learning_rate": 4.320207568237412e-05, + "loss": 0.0208, + "step": 265250 + }, + { + "epoch": 1.71, + "learning_rate": 4.319239432801719e-05, + "loss": 0.0211, + "step": 265260 + }, + { + "epoch": 1.71, + "learning_rate": 4.318271297366026e-05, + "loss": 0.0222, + "step": 265270 + }, + { + "epoch": 1.71, + "learning_rate": 4.317303161930333e-05, + "loss": 0.0235, + "step": 265280 + }, + { + "epoch": 1.71, + "learning_rate": 4.3163350264946394e-05, + "loss": 0.0245, + "step": 265290 + }, + { + "epoch": 1.71, + "learning_rate": 4.315366891058946e-05, + "loss": 0.0261, + "step": 265300 + }, + { + "epoch": 1.71, + "learning_rate": 4.3143987556232527e-05, + "loss": 0.0222, + "step": 265310 + }, + { + "epoch": 1.71, + "learning_rate": 4.31343062018756e-05, + "loss": 0.0271, + "step": 265320 + }, + { + "epoch": 1.71, + "learning_rate": 4.3124624847518666e-05, + "loss": 0.0281, + "step": 265330 + }, + { + "epoch": 1.71, + "learning_rate": 4.311494349316174e-05, + "loss": 0.0247, + "step": 265340 + }, + { + "epoch": 1.71, + "learning_rate": 4.31052621388048e-05, + "loss": 0.0238, + "step": 265350 + }, + { + "epoch": 1.71, + "learning_rate": 4.309558078444787e-05, + "loss": 0.0272, + "step": 265360 + }, + { + "epoch": 1.71, + "learning_rate": 4.308589943009094e-05, + "loss": 0.0272, + "step": 265370 + }, + { + "epoch": 1.71, + "learning_rate": 4.3076218075734004e-05, + "loss": 0.0248, + "step": 265380 + }, + { + "epoch": 1.71, + "learning_rate": 4.306653672137708e-05, + "loss": 0.0204, + "step": 265390 + }, + { + "epoch": 1.71, + "learning_rate": 4.3056855367020136e-05, + "loss": 0.0207, + "step": 265400 + }, + { + "epoch": 1.71, + "learning_rate": 4.304717401266321e-05, + "loss": 0.0212, + "step": 265410 + }, + { + "epoch": 1.71, + "learning_rate": 4.3037492658306276e-05, + "loss": 0.0251, + "step": 265420 + }, + { + "epoch": 1.71, + "learning_rate": 4.302781130394935e-05, + "loss": 0.0241, + "step": 265430 + }, + { + "epoch": 1.71, + "learning_rate": 4.3018129949592415e-05, + "loss": 0.0238, + "step": 265440 + }, + { + "epoch": 1.71, + "learning_rate": 4.3008448595235474e-05, + "loss": 0.0271, + "step": 265450 + }, + { + "epoch": 1.71, + "learning_rate": 4.299876724087855e-05, + "loss": 0.0235, + "step": 265460 + }, + { + "epoch": 1.71, + "learning_rate": 4.2989085886521614e-05, + "loss": 0.027, + "step": 265470 + }, + { + "epoch": 1.71, + "learning_rate": 4.2979404532164687e-05, + "loss": 0.0228, + "step": 265480 + }, + { + "epoch": 1.71, + "learning_rate": 4.296972317780775e-05, + "loss": 0.0252, + "step": 265490 + }, + { + "epoch": 1.71, + "learning_rate": 4.296004182345082e-05, + "loss": 0.0174, + "step": 265500 + }, + { + "epoch": 1.71, + "learning_rate": 4.2950360469093885e-05, + "loss": 0.0243, + "step": 265510 + }, + { + "epoch": 1.71, + "learning_rate": 4.294067911473695e-05, + "loss": 0.026, + "step": 265520 + }, + { + "epoch": 1.71, + "learning_rate": 4.2930997760380024e-05, + "loss": 0.0272, + "step": 265530 + }, + { + "epoch": 1.71, + "learning_rate": 4.292131640602309e-05, + "loss": 0.0251, + "step": 265540 + }, + { + "epoch": 1.71, + "learning_rate": 4.291163505166616e-05, + "loss": 0.0284, + "step": 265550 + }, + { + "epoch": 1.71, + "learning_rate": 4.290195369730922e-05, + "loss": 0.0254, + "step": 265560 + }, + { + "epoch": 1.71, + "learning_rate": 4.2892272342952296e-05, + "loss": 0.0261, + "step": 265570 + }, + { + "epoch": 1.71, + "learning_rate": 4.288259098859536e-05, + "loss": 0.0231, + "step": 265580 + }, + { + "epoch": 1.71, + "learning_rate": 4.287290963423843e-05, + "loss": 0.0232, + "step": 265590 + }, + { + "epoch": 1.71, + "learning_rate": 4.2863228279881495e-05, + "loss": 0.0235, + "step": 265600 + }, + { + "epoch": 1.71, + "learning_rate": 4.285354692552456e-05, + "loss": 0.0237, + "step": 265610 + }, + { + "epoch": 1.71, + "learning_rate": 4.2843865571167634e-05, + "loss": 0.0233, + "step": 265620 + }, + { + "epoch": 1.71, + "learning_rate": 4.28341842168107e-05, + "loss": 0.0207, + "step": 265630 + }, + { + "epoch": 1.71, + "learning_rate": 4.2824502862453773e-05, + "loss": 0.0247, + "step": 265640 + }, + { + "epoch": 1.71, + "learning_rate": 4.281482150809683e-05, + "loss": 0.0234, + "step": 265650 + }, + { + "epoch": 1.71, + "learning_rate": 4.28051401537399e-05, + "loss": 0.0273, + "step": 265660 + }, + { + "epoch": 1.71, + "learning_rate": 4.279545879938297e-05, + "loss": 0.0263, + "step": 265670 + }, + { + "epoch": 1.71, + "learning_rate": 4.278577744502604e-05, + "loss": 0.0248, + "step": 265680 + }, + { + "epoch": 1.71, + "learning_rate": 4.277609609066911e-05, + "loss": 0.0234, + "step": 265690 + }, + { + "epoch": 1.71, + "learning_rate": 4.276641473631217e-05, + "loss": 0.0238, + "step": 265700 + }, + { + "epoch": 1.71, + "learning_rate": 4.2756733381955244e-05, + "loss": 0.0286, + "step": 265710 + }, + { + "epoch": 1.72, + "learning_rate": 4.274705202759831e-05, + "loss": 0.0235, + "step": 265720 + }, + { + "epoch": 1.72, + "learning_rate": 4.2737370673241376e-05, + "loss": 0.0238, + "step": 265730 + }, + { + "epoch": 1.72, + "learning_rate": 4.272768931888445e-05, + "loss": 0.0257, + "step": 265740 + }, + { + "epoch": 1.72, + "learning_rate": 4.271800796452751e-05, + "loss": 0.0241, + "step": 265750 + }, + { + "epoch": 1.72, + "learning_rate": 4.270832661017058e-05, + "loss": 0.0276, + "step": 265760 + }, + { + "epoch": 1.72, + "learning_rate": 4.269864525581365e-05, + "loss": 0.0194, + "step": 265770 + }, + { + "epoch": 1.72, + "learning_rate": 4.268896390145672e-05, + "loss": 0.0268, + "step": 265780 + }, + { + "epoch": 1.72, + "learning_rate": 4.267928254709979e-05, + "loss": 0.0219, + "step": 265790 + }, + { + "epoch": 1.72, + "learning_rate": 4.266960119274285e-05, + "loss": 0.0293, + "step": 265800 + }, + { + "epoch": 1.72, + "learning_rate": 4.265991983838592e-05, + "loss": 0.0242, + "step": 265810 + }, + { + "epoch": 1.72, + "learning_rate": 4.2650238484028986e-05, + "loss": 0.0246, + "step": 265820 + }, + { + "epoch": 1.72, + "learning_rate": 4.264055712967206e-05, + "loss": 0.0275, + "step": 265830 + }, + { + "epoch": 1.72, + "learning_rate": 4.2630875775315125e-05, + "loss": 0.0199, + "step": 265840 + }, + { + "epoch": 1.72, + "learning_rate": 4.26211944209582e-05, + "loss": 0.0236, + "step": 265850 + }, + { + "epoch": 1.72, + "learning_rate": 4.261151306660126e-05, + "loss": 0.0238, + "step": 265860 + }, + { + "epoch": 1.72, + "learning_rate": 4.2601831712244324e-05, + "loss": 0.0273, + "step": 265870 + }, + { + "epoch": 1.72, + "learning_rate": 4.25921503578874e-05, + "loss": 0.0211, + "step": 265880 + }, + { + "epoch": 1.72, + "learning_rate": 4.258246900353046e-05, + "loss": 0.0241, + "step": 265890 + }, + { + "epoch": 1.72, + "learning_rate": 4.2572787649173536e-05, + "loss": 0.0206, + "step": 265900 + }, + { + "epoch": 1.72, + "learning_rate": 4.2563106294816596e-05, + "loss": 0.0206, + "step": 265910 + }, + { + "epoch": 1.72, + "learning_rate": 4.255342494045967e-05, + "loss": 0.0258, + "step": 265920 + }, + { + "epoch": 1.72, + "learning_rate": 4.2543743586102735e-05, + "loss": 0.025, + "step": 265930 + }, + { + "epoch": 1.72, + "learning_rate": 4.25340622317458e-05, + "loss": 0.0268, + "step": 265940 + }, + { + "epoch": 1.72, + "learning_rate": 4.2524380877388874e-05, + "loss": 0.0293, + "step": 265950 + }, + { + "epoch": 1.72, + "learning_rate": 4.2514699523031934e-05, + "loss": 0.0286, + "step": 265960 + }, + { + "epoch": 1.72, + "learning_rate": 4.250501816867501e-05, + "loss": 0.0275, + "step": 265970 + }, + { + "epoch": 1.72, + "learning_rate": 4.249533681431807e-05, + "loss": 0.0213, + "step": 265980 + }, + { + "epoch": 1.72, + "learning_rate": 4.248565545996114e-05, + "loss": 0.0307, + "step": 265990 + }, + { + "epoch": 1.72, + "learning_rate": 4.247597410560421e-05, + "loss": 0.0319, + "step": 266000 + }, + { + "epoch": 1.72, + "eval_cer": 0.9198671336572138, + "eval_loss": 0.01788017526268959, + "eval_runtime": 120.022, + "eval_samples_per_second": 16.664, + "eval_steps_per_second": 4.166, + "step": 266000 + }, + { + "epoch": 1.72, + "learning_rate": 4.246629275124727e-05, + "loss": 0.025, + "step": 266010 + }, + { + "epoch": 1.72, + "learning_rate": 4.2456611396890345e-05, + "loss": 0.0276, + "step": 266020 + }, + { + "epoch": 1.72, + "learning_rate": 4.244693004253341e-05, + "loss": 0.0299, + "step": 266030 + }, + { + "epoch": 1.72, + "learning_rate": 4.2437248688176484e-05, + "loss": 0.0197, + "step": 266040 + }, + { + "epoch": 1.72, + "learning_rate": 4.242756733381955e-05, + "loss": 0.0212, + "step": 266050 + }, + { + "epoch": 1.72, + "learning_rate": 4.241788597946261e-05, + "loss": 0.0202, + "step": 266060 + }, + { + "epoch": 1.72, + "learning_rate": 4.240820462510568e-05, + "loss": 0.0237, + "step": 266070 + }, + { + "epoch": 1.72, + "learning_rate": 4.239852327074875e-05, + "loss": 0.0237, + "step": 266080 + }, + { + "epoch": 1.72, + "learning_rate": 4.238884191639182e-05, + "loss": 0.0236, + "step": 266090 + }, + { + "epoch": 1.72, + "learning_rate": 4.237916056203489e-05, + "loss": 0.0239, + "step": 266100 + }, + { + "epoch": 1.72, + "learning_rate": 4.236947920767796e-05, + "loss": 0.0193, + "step": 266110 + }, + { + "epoch": 1.72, + "learning_rate": 4.235979785332102e-05, + "loss": 0.0256, + "step": 266120 + }, + { + "epoch": 1.72, + "learning_rate": 4.235011649896409e-05, + "loss": 0.0228, + "step": 266130 + }, + { + "epoch": 1.72, + "learning_rate": 4.234043514460716e-05, + "loss": 0.0202, + "step": 266140 + }, + { + "epoch": 1.72, + "learning_rate": 4.2330753790250226e-05, + "loss": 0.0293, + "step": 266150 + }, + { + "epoch": 1.72, + "learning_rate": 4.23210724358933e-05, + "loss": 0.0173, + "step": 266160 + }, + { + "epoch": 1.72, + "learning_rate": 4.231139108153636e-05, + "loss": 0.0216, + "step": 266170 + }, + { + "epoch": 1.72, + "learning_rate": 4.230170972717943e-05, + "loss": 0.0269, + "step": 266180 + }, + { + "epoch": 1.72, + "learning_rate": 4.22920283728225e-05, + "loss": 0.02, + "step": 266190 + }, + { + "epoch": 1.72, + "learning_rate": 4.2282347018465564e-05, + "loss": 0.0228, + "step": 266200 + }, + { + "epoch": 1.72, + "learning_rate": 4.227266566410864e-05, + "loss": 0.0227, + "step": 266210 + }, + { + "epoch": 1.72, + "learning_rate": 4.22629843097517e-05, + "loss": 0.0233, + "step": 266220 + }, + { + "epoch": 1.72, + "learning_rate": 4.225330295539477e-05, + "loss": 0.0232, + "step": 266230 + }, + { + "epoch": 1.72, + "learning_rate": 4.2243621601037836e-05, + "loss": 0.0295, + "step": 266240 + }, + { + "epoch": 1.72, + "learning_rate": 4.223394024668091e-05, + "loss": 0.0213, + "step": 266250 + }, + { + "epoch": 1.72, + "learning_rate": 4.2224258892323975e-05, + "loss": 0.0251, + "step": 266260 + }, + { + "epoch": 1.72, + "learning_rate": 4.2214577537967035e-05, + "loss": 0.0215, + "step": 266270 + }, + { + "epoch": 1.72, + "learning_rate": 4.220489618361011e-05, + "loss": 0.0239, + "step": 266280 + }, + { + "epoch": 1.72, + "learning_rate": 4.2195214829253174e-05, + "loss": 0.0237, + "step": 266290 + }, + { + "epoch": 1.72, + "learning_rate": 4.218553347489625e-05, + "loss": 0.0194, + "step": 266300 + }, + { + "epoch": 1.72, + "learning_rate": 4.217585212053931e-05, + "loss": 0.0237, + "step": 266310 + }, + { + "epoch": 1.72, + "learning_rate": 4.2166170766182386e-05, + "loss": 0.0213, + "step": 266320 + }, + { + "epoch": 1.72, + "learning_rate": 4.2156489411825446e-05, + "loss": 0.0227, + "step": 266330 + }, + { + "epoch": 1.72, + "learning_rate": 4.214680805746851e-05, + "loss": 0.0251, + "step": 266340 + }, + { + "epoch": 1.72, + "learning_rate": 4.2137126703111585e-05, + "loss": 0.0302, + "step": 266350 + }, + { + "epoch": 1.72, + "learning_rate": 4.212744534875465e-05, + "loss": 0.0219, + "step": 266360 + }, + { + "epoch": 1.72, + "learning_rate": 4.2117763994397724e-05, + "loss": 0.0209, + "step": 266370 + }, + { + "epoch": 1.72, + "learning_rate": 4.2108082640040784e-05, + "loss": 0.0273, + "step": 266380 + }, + { + "epoch": 1.72, + "learning_rate": 4.2098401285683857e-05, + "loss": 0.0282, + "step": 266390 + }, + { + "epoch": 1.72, + "learning_rate": 4.208871993132692e-05, + "loss": 0.027, + "step": 266400 + }, + { + "epoch": 1.72, + "learning_rate": 4.207903857696999e-05, + "loss": 0.0287, + "step": 266410 + }, + { + "epoch": 1.72, + "learning_rate": 4.206935722261306e-05, + "loss": 0.0242, + "step": 266420 + }, + { + "epoch": 1.72, + "learning_rate": 4.205967586825612e-05, + "loss": 0.0252, + "step": 266430 + }, + { + "epoch": 1.72, + "learning_rate": 4.2049994513899195e-05, + "loss": 0.0223, + "step": 266440 + }, + { + "epoch": 1.72, + "learning_rate": 4.204031315954226e-05, + "loss": 0.0261, + "step": 266450 + }, + { + "epoch": 1.72, + "learning_rate": 4.2030631805185334e-05, + "loss": 0.0336, + "step": 266460 + }, + { + "epoch": 1.72, + "learning_rate": 4.20209504508284e-05, + "loss": 0.0217, + "step": 266470 + }, + { + "epoch": 1.72, + "learning_rate": 4.201126909647146e-05, + "loss": 0.0231, + "step": 266480 + }, + { + "epoch": 1.72, + "learning_rate": 4.200158774211453e-05, + "loss": 0.0284, + "step": 266490 + }, + { + "epoch": 1.72, + "learning_rate": 4.19919063877576e-05, + "loss": 0.0275, + "step": 266500 + }, + { + "epoch": 1.72, + "learning_rate": 4.198222503340067e-05, + "loss": 0.0247, + "step": 266510 + }, + { + "epoch": 1.72, + "learning_rate": 4.197254367904374e-05, + "loss": 0.0232, + "step": 266520 + }, + { + "epoch": 1.72, + "learning_rate": 4.196286232468681e-05, + "loss": 0.024, + "step": 266530 + }, + { + "epoch": 1.72, + "learning_rate": 4.195318097032987e-05, + "loss": 0.0172, + "step": 266540 + }, + { + "epoch": 1.72, + "learning_rate": 4.194349961597294e-05, + "loss": 0.0231, + "step": 266550 + }, + { + "epoch": 1.72, + "learning_rate": 4.193381826161601e-05, + "loss": 0.0248, + "step": 266560 + }, + { + "epoch": 1.72, + "learning_rate": 4.1924136907259076e-05, + "loss": 0.0211, + "step": 266570 + }, + { + "epoch": 1.72, + "learning_rate": 4.191445555290215e-05, + "loss": 0.0278, + "step": 266580 + }, + { + "epoch": 1.72, + "learning_rate": 4.190477419854521e-05, + "loss": 0.0233, + "step": 266590 + }, + { + "epoch": 1.72, + "learning_rate": 4.189509284418828e-05, + "loss": 0.0205, + "step": 266600 + }, + { + "epoch": 1.72, + "learning_rate": 4.188541148983135e-05, + "loss": 0.0301, + "step": 266610 + }, + { + "epoch": 1.72, + "learning_rate": 4.1875730135474414e-05, + "loss": 0.0206, + "step": 266620 + }, + { + "epoch": 1.72, + "learning_rate": 4.186604878111749e-05, + "loss": 0.0202, + "step": 266630 + }, + { + "epoch": 1.72, + "learning_rate": 4.1856367426760546e-05, + "loss": 0.0224, + "step": 266640 + }, + { + "epoch": 1.72, + "learning_rate": 4.184668607240362e-05, + "loss": 0.0223, + "step": 266650 + }, + { + "epoch": 1.72, + "learning_rate": 4.1837004718046686e-05, + "loss": 0.0287, + "step": 266660 + }, + { + "epoch": 1.72, + "learning_rate": 4.182732336368976e-05, + "loss": 0.0269, + "step": 266670 + }, + { + "epoch": 1.72, + "learning_rate": 4.1817642009332825e-05, + "loss": 0.0261, + "step": 266680 + }, + { + "epoch": 1.72, + "learning_rate": 4.1807960654975884e-05, + "loss": 0.0226, + "step": 266690 + }, + { + "epoch": 1.72, + "learning_rate": 4.179827930061896e-05, + "loss": 0.021, + "step": 266700 + }, + { + "epoch": 1.72, + "learning_rate": 4.1788597946262024e-05, + "loss": 0.0254, + "step": 266710 + }, + { + "epoch": 1.72, + "learning_rate": 4.17789165919051e-05, + "loss": 0.023, + "step": 266720 + }, + { + "epoch": 1.72, + "learning_rate": 4.176923523754816e-05, + "loss": 0.021, + "step": 266730 + }, + { + "epoch": 1.72, + "learning_rate": 4.175955388319123e-05, + "loss": 0.0256, + "step": 266740 + }, + { + "epoch": 1.72, + "learning_rate": 4.1749872528834295e-05, + "loss": 0.0251, + "step": 266750 + }, + { + "epoch": 1.72, + "learning_rate": 4.174019117447736e-05, + "loss": 0.0216, + "step": 266760 + }, + { + "epoch": 1.72, + "learning_rate": 4.1730509820120435e-05, + "loss": 0.0228, + "step": 266770 + }, + { + "epoch": 1.72, + "learning_rate": 4.17208284657635e-05, + "loss": 0.0213, + "step": 266780 + }, + { + "epoch": 1.72, + "learning_rate": 4.171114711140657e-05, + "loss": 0.0241, + "step": 266790 + }, + { + "epoch": 1.72, + "learning_rate": 4.170146575704963e-05, + "loss": 0.022, + "step": 266800 + }, + { + "epoch": 1.72, + "learning_rate": 4.1691784402692706e-05, + "loss": 0.0253, + "step": 266810 + }, + { + "epoch": 1.72, + "learning_rate": 4.168210304833577e-05, + "loss": 0.0248, + "step": 266820 + }, + { + "epoch": 1.72, + "learning_rate": 4.167242169397884e-05, + "loss": 0.0224, + "step": 266830 + }, + { + "epoch": 1.72, + "learning_rate": 4.1662740339621905e-05, + "loss": 0.0266, + "step": 266840 + }, + { + "epoch": 1.72, + "learning_rate": 4.165305898526497e-05, + "loss": 0.0234, + "step": 266850 + }, + { + "epoch": 1.72, + "learning_rate": 4.1643377630908044e-05, + "loss": 0.0239, + "step": 266860 + }, + { + "epoch": 1.72, + "learning_rate": 4.163369627655111e-05, + "loss": 0.0282, + "step": 266870 + }, + { + "epoch": 1.72, + "learning_rate": 4.1624014922194184e-05, + "loss": 0.0231, + "step": 266880 + }, + { + "epoch": 1.72, + "learning_rate": 4.161433356783724e-05, + "loss": 0.0242, + "step": 266890 + }, + { + "epoch": 1.72, + "learning_rate": 4.160465221348031e-05, + "loss": 0.0276, + "step": 266900 + }, + { + "epoch": 1.72, + "learning_rate": 4.159497085912338e-05, + "loss": 0.0243, + "step": 266910 + }, + { + "epoch": 1.72, + "learning_rate": 4.158528950476645e-05, + "loss": 0.0203, + "step": 266920 + }, + { + "epoch": 1.72, + "learning_rate": 4.157560815040952e-05, + "loss": 0.0268, + "step": 266930 + }, + { + "epoch": 1.72, + "learning_rate": 4.156592679605258e-05, + "loss": 0.0276, + "step": 266940 + }, + { + "epoch": 1.72, + "learning_rate": 4.1556245441695654e-05, + "loss": 0.0227, + "step": 266950 + }, + { + "epoch": 1.72, + "learning_rate": 4.154656408733872e-05, + "loss": 0.0244, + "step": 266960 + }, + { + "epoch": 1.72, + "learning_rate": 4.1536882732981787e-05, + "loss": 0.0202, + "step": 266970 + }, + { + "epoch": 1.72, + "learning_rate": 4.152720137862486e-05, + "loss": 0.0267, + "step": 266980 + }, + { + "epoch": 1.72, + "learning_rate": 4.151752002426792e-05, + "loss": 0.0231, + "step": 266990 + }, + { + "epoch": 1.72, + "learning_rate": 4.150783866991099e-05, + "loss": 0.0236, + "step": 267000 + }, + { + "epoch": 1.72, + "eval_cer": 0.9198870184159982, + "eval_loss": 0.017837153747677803, + "eval_runtime": 119.9955, + "eval_samples_per_second": 16.667, + "eval_steps_per_second": 4.167, + "step": 267000 + }, + { + "epoch": 1.72, + "learning_rate": 4.149815731555406e-05, + "loss": 0.0231, + "step": 267010 + }, + { + "epoch": 1.72, + "learning_rate": 4.148847596119713e-05, + "loss": 0.0239, + "step": 267020 + }, + { + "epoch": 1.72, + "learning_rate": 4.14787946068402e-05, + "loss": 0.0227, + "step": 267030 + }, + { + "epoch": 1.72, + "learning_rate": 4.146911325248326e-05, + "loss": 0.0236, + "step": 267040 + }, + { + "epoch": 1.72, + "learning_rate": 4.145943189812633e-05, + "loss": 0.0262, + "step": 267050 + }, + { + "epoch": 1.72, + "learning_rate": 4.1449750543769396e-05, + "loss": 0.0224, + "step": 267060 + }, + { + "epoch": 1.72, + "learning_rate": 4.144006918941247e-05, + "loss": 0.0239, + "step": 267070 + }, + { + "epoch": 1.72, + "learning_rate": 4.1430387835055536e-05, + "loss": 0.0241, + "step": 267080 + }, + { + "epoch": 1.72, + "learning_rate": 4.142070648069861e-05, + "loss": 0.0261, + "step": 267090 + }, + { + "epoch": 1.72, + "learning_rate": 4.141102512634167e-05, + "loss": 0.0242, + "step": 267100 + }, + { + "epoch": 1.72, + "learning_rate": 4.1401343771984734e-05, + "loss": 0.0266, + "step": 267110 + }, + { + "epoch": 1.72, + "learning_rate": 4.139166241762781e-05, + "loss": 0.0275, + "step": 267120 + }, + { + "epoch": 1.72, + "learning_rate": 4.1381981063270873e-05, + "loss": 0.026, + "step": 267130 + }, + { + "epoch": 1.72, + "learning_rate": 4.1372299708913947e-05, + "loss": 0.0284, + "step": 267140 + }, + { + "epoch": 1.72, + "learning_rate": 4.1362618354557006e-05, + "loss": 0.0263, + "step": 267150 + }, + { + "epoch": 1.72, + "learning_rate": 4.135293700020008e-05, + "loss": 0.0234, + "step": 267160 + }, + { + "epoch": 1.72, + "learning_rate": 4.1343255645843145e-05, + "loss": 0.019, + "step": 267170 + }, + { + "epoch": 1.72, + "learning_rate": 4.133357429148621e-05, + "loss": 0.0302, + "step": 267180 + }, + { + "epoch": 1.72, + "learning_rate": 4.1323892937129284e-05, + "loss": 0.0226, + "step": 267190 + }, + { + "epoch": 1.72, + "learning_rate": 4.1314211582772344e-05, + "loss": 0.027, + "step": 267200 + }, + { + "epoch": 1.72, + "learning_rate": 4.130453022841542e-05, + "loss": 0.0305, + "step": 267210 + }, + { + "epoch": 1.72, + "learning_rate": 4.129484887405848e-05, + "loss": 0.0283, + "step": 267220 + }, + { + "epoch": 1.72, + "learning_rate": 4.1285167519701556e-05, + "loss": 0.024, + "step": 267230 + }, + { + "epoch": 1.72, + "learning_rate": 4.127548616534462e-05, + "loss": 0.0265, + "step": 267240 + }, + { + "epoch": 1.72, + "learning_rate": 4.126580481098768e-05, + "loss": 0.023, + "step": 267250 + }, + { + "epoch": 1.72, + "learning_rate": 4.1256123456630755e-05, + "loss": 0.0236, + "step": 267260 + }, + { + "epoch": 1.73, + "learning_rate": 4.124644210227382e-05, + "loss": 0.0217, + "step": 267270 + }, + { + "epoch": 1.73, + "learning_rate": 4.1236760747916894e-05, + "loss": 0.0217, + "step": 267280 + }, + { + "epoch": 1.73, + "learning_rate": 4.122707939355996e-05, + "loss": 0.0264, + "step": 267290 + }, + { + "epoch": 1.73, + "learning_rate": 4.1217398039203033e-05, + "loss": 0.027, + "step": 267300 + }, + { + "epoch": 1.73, + "learning_rate": 4.120771668484609e-05, + "loss": 0.0212, + "step": 267310 + }, + { + "epoch": 1.73, + "learning_rate": 4.119803533048916e-05, + "loss": 0.0228, + "step": 267320 + }, + { + "epoch": 1.73, + "learning_rate": 4.118835397613223e-05, + "loss": 0.0216, + "step": 267330 + }, + { + "epoch": 1.73, + "learning_rate": 4.11786726217753e-05, + "loss": 0.0277, + "step": 267340 + }, + { + "epoch": 1.73, + "learning_rate": 4.116899126741837e-05, + "loss": 0.0259, + "step": 267350 + }, + { + "epoch": 1.73, + "learning_rate": 4.115930991306143e-05, + "loss": 0.0193, + "step": 267360 + }, + { + "epoch": 1.73, + "learning_rate": 4.1149628558704504e-05, + "loss": 0.0271, + "step": 267370 + }, + { + "epoch": 1.73, + "learning_rate": 4.113994720434757e-05, + "loss": 0.0256, + "step": 267380 + }, + { + "epoch": 1.73, + "learning_rate": 4.1130265849990636e-05, + "loss": 0.0258, + "step": 267390 + }, + { + "epoch": 1.73, + "learning_rate": 4.112058449563371e-05, + "loss": 0.026, + "step": 267400 + }, + { + "epoch": 1.73, + "learning_rate": 4.111090314127677e-05, + "loss": 0.0187, + "step": 267410 + }, + { + "epoch": 1.73, + "learning_rate": 4.110122178691984e-05, + "loss": 0.0199, + "step": 267420 + }, + { + "epoch": 1.73, + "learning_rate": 4.109154043256291e-05, + "loss": 0.0257, + "step": 267430 + }, + { + "epoch": 1.73, + "learning_rate": 4.108185907820598e-05, + "loss": 0.0267, + "step": 267440 + }, + { + "epoch": 1.73, + "learning_rate": 4.107217772384905e-05, + "loss": 0.0237, + "step": 267450 + }, + { + "epoch": 1.73, + "learning_rate": 4.106249636949211e-05, + "loss": 0.0235, + "step": 267460 + }, + { + "epoch": 1.73, + "learning_rate": 4.105281501513518e-05, + "loss": 0.026, + "step": 267470 + }, + { + "epoch": 1.73, + "learning_rate": 4.1043133660778246e-05, + "loss": 0.0247, + "step": 267480 + }, + { + "epoch": 1.73, + "learning_rate": 4.103345230642132e-05, + "loss": 0.0266, + "step": 267490 + }, + { + "epoch": 1.73, + "learning_rate": 4.1023770952064385e-05, + "loss": 0.0225, + "step": 267500 + }, + { + "epoch": 1.73, + "learning_rate": 4.101408959770746e-05, + "loss": 0.0245, + "step": 267510 + }, + { + "epoch": 1.73, + "learning_rate": 4.100440824335052e-05, + "loss": 0.0309, + "step": 267520 + }, + { + "epoch": 1.73, + "learning_rate": 4.0994726888993584e-05, + "loss": 0.0262, + "step": 267530 + }, + { + "epoch": 1.73, + "learning_rate": 4.098504553463666e-05, + "loss": 0.0251, + "step": 267540 + }, + { + "epoch": 1.73, + "learning_rate": 4.097536418027972e-05, + "loss": 0.0266, + "step": 267550 + }, + { + "epoch": 1.73, + "learning_rate": 4.0965682825922796e-05, + "loss": 0.0196, + "step": 267560 + }, + { + "epoch": 1.73, + "learning_rate": 4.0956001471565856e-05, + "loss": 0.0224, + "step": 267570 + }, + { + "epoch": 1.73, + "learning_rate": 4.094632011720893e-05, + "loss": 0.0208, + "step": 267580 + }, + { + "epoch": 1.73, + "learning_rate": 4.0936638762851995e-05, + "loss": 0.0217, + "step": 267590 + }, + { + "epoch": 1.73, + "learning_rate": 4.092695740849506e-05, + "loss": 0.0254, + "step": 267600 + }, + { + "epoch": 1.73, + "learning_rate": 4.0917276054138134e-05, + "loss": 0.0263, + "step": 267610 + }, + { + "epoch": 1.73, + "learning_rate": 4.0907594699781194e-05, + "loss": 0.0221, + "step": 267620 + }, + { + "epoch": 1.73, + "learning_rate": 4.089791334542427e-05, + "loss": 0.0213, + "step": 267630 + }, + { + "epoch": 1.73, + "learning_rate": 4.088823199106733e-05, + "loss": 0.0251, + "step": 267640 + }, + { + "epoch": 1.73, + "learning_rate": 4.0878550636710406e-05, + "loss": 0.0261, + "step": 267650 + }, + { + "epoch": 1.73, + "learning_rate": 4.086886928235347e-05, + "loss": 0.0199, + "step": 267660 + }, + { + "epoch": 1.73, + "learning_rate": 4.085918792799653e-05, + "loss": 0.024, + "step": 267670 + }, + { + "epoch": 1.73, + "learning_rate": 4.0849506573639605e-05, + "loss": 0.025, + "step": 267680 + }, + { + "epoch": 1.73, + "learning_rate": 4.083982521928267e-05, + "loss": 0.0248, + "step": 267690 + }, + { + "epoch": 1.73, + "learning_rate": 4.0830143864925744e-05, + "loss": 0.0283, + "step": 267700 + }, + { + "epoch": 1.73, + "learning_rate": 4.082046251056881e-05, + "loss": 0.0302, + "step": 267710 + }, + { + "epoch": 1.73, + "learning_rate": 4.081078115621187e-05, + "loss": 0.0232, + "step": 267720 + }, + { + "epoch": 1.73, + "learning_rate": 4.080109980185494e-05, + "loss": 0.0251, + "step": 267730 + }, + { + "epoch": 1.73, + "learning_rate": 4.079141844749801e-05, + "loss": 0.0263, + "step": 267740 + }, + { + "epoch": 1.73, + "learning_rate": 4.078173709314108e-05, + "loss": 0.0265, + "step": 267750 + }, + { + "epoch": 1.73, + "learning_rate": 4.077205573878415e-05, + "loss": 0.0196, + "step": 267760 + }, + { + "epoch": 1.73, + "learning_rate": 4.076237438442722e-05, + "loss": 0.0241, + "step": 267770 + }, + { + "epoch": 1.73, + "learning_rate": 4.075269303007028e-05, + "loss": 0.0282, + "step": 267780 + }, + { + "epoch": 1.73, + "learning_rate": 4.074301167571335e-05, + "loss": 0.0262, + "step": 267790 + }, + { + "epoch": 1.73, + "learning_rate": 4.073333032135642e-05, + "loss": 0.0225, + "step": 267800 + }, + { + "epoch": 1.73, + "learning_rate": 4.0723648966999486e-05, + "loss": 0.0287, + "step": 267810 + }, + { + "epoch": 1.73, + "learning_rate": 4.071396761264256e-05, + "loss": 0.0251, + "step": 267820 + }, + { + "epoch": 1.73, + "learning_rate": 4.070428625828562e-05, + "loss": 0.022, + "step": 267830 + }, + { + "epoch": 1.73, + "learning_rate": 4.069460490392869e-05, + "loss": 0.0236, + "step": 267840 + }, + { + "epoch": 1.73, + "learning_rate": 4.068492354957176e-05, + "loss": 0.0251, + "step": 267850 + }, + { + "epoch": 1.73, + "learning_rate": 4.0675242195214824e-05, + "loss": 0.0192, + "step": 267860 + }, + { + "epoch": 1.73, + "learning_rate": 4.06655608408579e-05, + "loss": 0.0204, + "step": 267870 + }, + { + "epoch": 1.73, + "learning_rate": 4.065587948650096e-05, + "loss": 0.0279, + "step": 267880 + }, + { + "epoch": 1.73, + "learning_rate": 4.064619813214403e-05, + "loss": 0.0224, + "step": 267890 + }, + { + "epoch": 1.73, + "learning_rate": 4.0636516777787096e-05, + "loss": 0.0268, + "step": 267900 + }, + { + "epoch": 1.73, + "learning_rate": 4.062683542343017e-05, + "loss": 0.0284, + "step": 267910 + }, + { + "epoch": 1.73, + "learning_rate": 4.0617154069073235e-05, + "loss": 0.0219, + "step": 267920 + }, + { + "epoch": 1.73, + "learning_rate": 4.0607472714716295e-05, + "loss": 0.0287, + "step": 267930 + }, + { + "epoch": 1.73, + "learning_rate": 4.059779136035937e-05, + "loss": 0.0318, + "step": 267940 + }, + { + "epoch": 1.73, + "learning_rate": 4.0588110006002434e-05, + "loss": 0.0248, + "step": 267950 + }, + { + "epoch": 1.73, + "learning_rate": 4.057842865164551e-05, + "loss": 0.0201, + "step": 267960 + }, + { + "epoch": 1.73, + "learning_rate": 4.056874729728857e-05, + "loss": 0.0236, + "step": 267970 + }, + { + "epoch": 1.73, + "learning_rate": 4.0559065942931646e-05, + "loss": 0.0307, + "step": 267980 + }, + { + "epoch": 1.73, + "learning_rate": 4.0549384588574706e-05, + "loss": 0.026, + "step": 267990 + }, + { + "epoch": 1.73, + "learning_rate": 4.053970323421777e-05, + "loss": 0.029, + "step": 268000 + }, + { + "epoch": 1.73, + "eval_cer": 0.919813806349565, + "eval_loss": 0.017884543165564537, + "eval_runtime": 120.1776, + "eval_samples_per_second": 16.642, + "eval_steps_per_second": 4.161, + "step": 268000 + }, + { + "epoch": 1.73, + "learning_rate": 4.0530021879860845e-05, + "loss": 0.0274, + "step": 268010 + }, + { + "epoch": 1.73, + "learning_rate": 4.052034052550391e-05, + "loss": 0.0215, + "step": 268020 + }, + { + "epoch": 1.73, + "learning_rate": 4.0510659171146984e-05, + "loss": 0.0225, + "step": 268030 + }, + { + "epoch": 1.73, + "learning_rate": 4.0500977816790044e-05, + "loss": 0.0263, + "step": 268040 + }, + { + "epoch": 1.73, + "learning_rate": 4.0491296462433117e-05, + "loss": 0.0252, + "step": 268050 + }, + { + "epoch": 1.73, + "learning_rate": 4.048161510807618e-05, + "loss": 0.0221, + "step": 268060 + }, + { + "epoch": 1.73, + "learning_rate": 4.047193375371925e-05, + "loss": 0.0223, + "step": 268070 + }, + { + "epoch": 1.73, + "learning_rate": 4.046225239936232e-05, + "loss": 0.0227, + "step": 268080 + }, + { + "epoch": 1.73, + "learning_rate": 4.045257104500538e-05, + "loss": 0.0238, + "step": 268090 + }, + { + "epoch": 1.73, + "learning_rate": 4.0442889690648455e-05, + "loss": 0.0252, + "step": 268100 + }, + { + "epoch": 1.73, + "learning_rate": 4.043320833629152e-05, + "loss": 0.0345, + "step": 268110 + }, + { + "epoch": 1.73, + "learning_rate": 4.0423526981934594e-05, + "loss": 0.0238, + "step": 268120 + }, + { + "epoch": 1.73, + "learning_rate": 4.041384562757766e-05, + "loss": 0.0238, + "step": 268130 + }, + { + "epoch": 1.73, + "learning_rate": 4.040416427322072e-05, + "loss": 0.0256, + "step": 268140 + }, + { + "epoch": 1.73, + "learning_rate": 4.039448291886379e-05, + "loss": 0.023, + "step": 268150 + }, + { + "epoch": 1.73, + "learning_rate": 4.038480156450686e-05, + "loss": 0.022, + "step": 268160 + }, + { + "epoch": 1.73, + "learning_rate": 4.037512021014993e-05, + "loss": 0.0236, + "step": 268170 + }, + { + "epoch": 1.73, + "learning_rate": 4.0365438855793e-05, + "loss": 0.0247, + "step": 268180 + }, + { + "epoch": 1.73, + "learning_rate": 4.0355757501436064e-05, + "loss": 0.0318, + "step": 268190 + }, + { + "epoch": 1.73, + "learning_rate": 4.034607614707913e-05, + "loss": 0.0311, + "step": 268200 + }, + { + "epoch": 1.73, + "learning_rate": 4.03363947927222e-05, + "loss": 0.0202, + "step": 268210 + }, + { + "epoch": 1.73, + "learning_rate": 4.032671343836527e-05, + "loss": 0.0216, + "step": 268220 + }, + { + "epoch": 1.73, + "learning_rate": 4.0317032084008336e-05, + "loss": 0.0217, + "step": 268230 + }, + { + "epoch": 1.73, + "learning_rate": 4.03073507296514e-05, + "loss": 0.0239, + "step": 268240 + }, + { + "epoch": 1.73, + "learning_rate": 4.029766937529447e-05, + "loss": 0.0242, + "step": 268250 + }, + { + "epoch": 1.73, + "learning_rate": 4.028798802093754e-05, + "loss": 0.0208, + "step": 268260 + }, + { + "epoch": 1.73, + "learning_rate": 4.027830666658061e-05, + "loss": 0.0297, + "step": 268270 + }, + { + "epoch": 1.73, + "learning_rate": 4.0268625312223674e-05, + "loss": 0.0218, + "step": 268280 + }, + { + "epoch": 1.73, + "learning_rate": 4.025894395786674e-05, + "loss": 0.021, + "step": 268290 + }, + { + "epoch": 1.73, + "learning_rate": 4.0249262603509806e-05, + "loss": 0.0227, + "step": 268300 + }, + { + "epoch": 1.73, + "learning_rate": 4.023958124915288e-05, + "loss": 0.0231, + "step": 268310 + }, + { + "epoch": 1.73, + "learning_rate": 4.0229899894795946e-05, + "loss": 0.0236, + "step": 268320 + }, + { + "epoch": 1.73, + "learning_rate": 4.022021854043902e-05, + "loss": 0.0242, + "step": 268330 + }, + { + "epoch": 1.73, + "learning_rate": 4.021053718608208e-05, + "loss": 0.0234, + "step": 268340 + }, + { + "epoch": 1.73, + "learning_rate": 4.0200855831725144e-05, + "loss": 0.0271, + "step": 268350 + }, + { + "epoch": 1.73, + "learning_rate": 4.019117447736822e-05, + "loss": 0.0284, + "step": 268360 + }, + { + "epoch": 1.73, + "learning_rate": 4.0181493123011284e-05, + "loss": 0.0252, + "step": 268370 + }, + { + "epoch": 1.73, + "learning_rate": 4.017181176865436e-05, + "loss": 0.0246, + "step": 268380 + }, + { + "epoch": 1.73, + "learning_rate": 4.0162130414297416e-05, + "loss": 0.0234, + "step": 268390 + }, + { + "epoch": 1.73, + "learning_rate": 4.015244905994049e-05, + "loss": 0.0202, + "step": 268400 + }, + { + "epoch": 1.73, + "learning_rate": 4.0142767705583555e-05, + "loss": 0.03, + "step": 268410 + }, + { + "epoch": 1.73, + "learning_rate": 4.013308635122662e-05, + "loss": 0.0247, + "step": 268420 + }, + { + "epoch": 1.73, + "learning_rate": 4.0123404996869695e-05, + "loss": 0.0234, + "step": 268430 + }, + { + "epoch": 1.73, + "learning_rate": 4.0113723642512754e-05, + "loss": 0.0232, + "step": 268440 + }, + { + "epoch": 1.73, + "learning_rate": 4.010404228815583e-05, + "loss": 0.0302, + "step": 268450 + }, + { + "epoch": 1.73, + "learning_rate": 4.009436093379889e-05, + "loss": 0.0263, + "step": 268460 + }, + { + "epoch": 1.73, + "learning_rate": 4.0084679579441966e-05, + "loss": 0.0241, + "step": 268470 + }, + { + "epoch": 1.73, + "learning_rate": 4.007499822508503e-05, + "loss": 0.0236, + "step": 268480 + }, + { + "epoch": 1.73, + "learning_rate": 4.006531687072809e-05, + "loss": 0.0315, + "step": 268490 + }, + { + "epoch": 1.73, + "learning_rate": 4.0055635516371165e-05, + "loss": 0.0242, + "step": 268500 + }, + { + "epoch": 1.73, + "learning_rate": 4.004595416201423e-05, + "loss": 0.0266, + "step": 268510 + }, + { + "epoch": 1.73, + "learning_rate": 4.0036272807657304e-05, + "loss": 0.0331, + "step": 268520 + }, + { + "epoch": 1.73, + "learning_rate": 4.002659145330037e-05, + "loss": 0.023, + "step": 268530 + }, + { + "epoch": 1.73, + "learning_rate": 4.0016910098943444e-05, + "loss": 0.0228, + "step": 268540 + }, + { + "epoch": 1.73, + "learning_rate": 4.00072287445865e-05, + "loss": 0.0253, + "step": 268550 + }, + { + "epoch": 1.73, + "learning_rate": 3.999754739022957e-05, + "loss": 0.0243, + "step": 268560 + }, + { + "epoch": 1.73, + "learning_rate": 3.998786603587264e-05, + "loss": 0.0236, + "step": 268570 + }, + { + "epoch": 1.73, + "learning_rate": 3.997818468151571e-05, + "loss": 0.0223, + "step": 268580 + }, + { + "epoch": 1.73, + "learning_rate": 3.996850332715878e-05, + "loss": 0.0266, + "step": 268590 + }, + { + "epoch": 1.73, + "learning_rate": 3.995882197280184e-05, + "loss": 0.018, + "step": 268600 + }, + { + "epoch": 1.73, + "learning_rate": 3.9949140618444914e-05, + "loss": 0.0243, + "step": 268610 + }, + { + "epoch": 1.73, + "learning_rate": 3.993945926408798e-05, + "loss": 0.0214, + "step": 268620 + }, + { + "epoch": 1.73, + "learning_rate": 3.9929777909731047e-05, + "loss": 0.024, + "step": 268630 + }, + { + "epoch": 1.73, + "learning_rate": 3.992009655537412e-05, + "loss": 0.0241, + "step": 268640 + }, + { + "epoch": 1.73, + "learning_rate": 3.991041520101718e-05, + "loss": 0.0233, + "step": 268650 + }, + { + "epoch": 1.73, + "learning_rate": 3.990073384666025e-05, + "loss": 0.0249, + "step": 268660 + }, + { + "epoch": 1.73, + "learning_rate": 3.989105249230332e-05, + "loss": 0.0327, + "step": 268670 + }, + { + "epoch": 1.73, + "learning_rate": 3.988137113794639e-05, + "loss": 0.0226, + "step": 268680 + }, + { + "epoch": 1.73, + "learning_rate": 3.987168978358946e-05, + "loss": 0.0252, + "step": 268690 + }, + { + "epoch": 1.73, + "learning_rate": 3.986200842923252e-05, + "loss": 0.0259, + "step": 268700 + }, + { + "epoch": 1.73, + "learning_rate": 3.985232707487559e-05, + "loss": 0.0251, + "step": 268710 + }, + { + "epoch": 1.73, + "learning_rate": 3.9842645720518656e-05, + "loss": 0.0314, + "step": 268720 + }, + { + "epoch": 1.73, + "learning_rate": 3.983296436616173e-05, + "loss": 0.0251, + "step": 268730 + }, + { + "epoch": 1.73, + "learning_rate": 3.9823283011804795e-05, + "loss": 0.0253, + "step": 268740 + }, + { + "epoch": 1.73, + "learning_rate": 3.981360165744787e-05, + "loss": 0.0234, + "step": 268750 + }, + { + "epoch": 1.73, + "learning_rate": 3.980392030309093e-05, + "loss": 0.0217, + "step": 268760 + }, + { + "epoch": 1.73, + "learning_rate": 3.9794238948733994e-05, + "loss": 0.0201, + "step": 268770 + }, + { + "epoch": 1.73, + "learning_rate": 3.978455759437707e-05, + "loss": 0.0266, + "step": 268780 + }, + { + "epoch": 1.73, + "learning_rate": 3.9774876240020133e-05, + "loss": 0.023, + "step": 268790 + }, + { + "epoch": 1.73, + "learning_rate": 3.9765194885663206e-05, + "loss": 0.0225, + "step": 268800 + }, + { + "epoch": 1.73, + "learning_rate": 3.9755513531306266e-05, + "loss": 0.0226, + "step": 268810 + }, + { + "epoch": 1.74, + "learning_rate": 3.974583217694934e-05, + "loss": 0.0252, + "step": 268820 + }, + { + "epoch": 1.74, + "learning_rate": 3.9736150822592405e-05, + "loss": 0.0216, + "step": 268830 + }, + { + "epoch": 1.74, + "learning_rate": 3.972646946823547e-05, + "loss": 0.0202, + "step": 268840 + }, + { + "epoch": 1.74, + "learning_rate": 3.9716788113878544e-05, + "loss": 0.0196, + "step": 268850 + }, + { + "epoch": 1.74, + "learning_rate": 3.9707106759521604e-05, + "loss": 0.0222, + "step": 268860 + }, + { + "epoch": 1.74, + "learning_rate": 3.969742540516468e-05, + "loss": 0.0224, + "step": 268870 + }, + { + "epoch": 1.74, + "learning_rate": 3.968774405080774e-05, + "loss": 0.026, + "step": 268880 + }, + { + "epoch": 1.74, + "learning_rate": 3.9678062696450816e-05, + "loss": 0.0258, + "step": 268890 + }, + { + "epoch": 1.74, + "learning_rate": 3.966838134209388e-05, + "loss": 0.0238, + "step": 268900 + }, + { + "epoch": 1.74, + "learning_rate": 3.965869998773694e-05, + "loss": 0.0217, + "step": 268910 + }, + { + "epoch": 1.74, + "learning_rate": 3.9649018633380015e-05, + "loss": 0.0195, + "step": 268920 + }, + { + "epoch": 1.74, + "learning_rate": 3.963933727902308e-05, + "loss": 0.0263, + "step": 268930 + }, + { + "epoch": 1.74, + "learning_rate": 3.9629655924666154e-05, + "loss": 0.0272, + "step": 268940 + }, + { + "epoch": 1.74, + "learning_rate": 3.961997457030922e-05, + "loss": 0.0232, + "step": 268950 + }, + { + "epoch": 1.74, + "learning_rate": 3.9610293215952293e-05, + "loss": 0.0239, + "step": 268960 + }, + { + "epoch": 1.74, + "learning_rate": 3.960061186159535e-05, + "loss": 0.0218, + "step": 268970 + }, + { + "epoch": 1.74, + "learning_rate": 3.959093050723842e-05, + "loss": 0.025, + "step": 268980 + }, + { + "epoch": 1.74, + "learning_rate": 3.958124915288149e-05, + "loss": 0.0251, + "step": 268990 + }, + { + "epoch": 1.74, + "learning_rate": 3.957156779852456e-05, + "loss": 0.0233, + "step": 269000 + }, + { + "epoch": 1.74, + "eval_cer": 0.9198192294655971, + "eval_loss": 0.0177915096282959, + "eval_runtime": 119.9978, + "eval_samples_per_second": 16.667, + "eval_steps_per_second": 4.167, + "step": 269000 + }, + { + "epoch": 1.74, + "learning_rate": 3.956188644416763e-05, + "loss": 0.0222, + "step": 269010 + }, + { + "epoch": 1.74, + "learning_rate": 3.955220508981069e-05, + "loss": 0.0226, + "step": 269020 + }, + { + "epoch": 1.74, + "learning_rate": 3.9542523735453764e-05, + "loss": 0.0222, + "step": 269030 + }, + { + "epoch": 1.74, + "learning_rate": 3.953284238109683e-05, + "loss": 0.0211, + "step": 269040 + }, + { + "epoch": 1.74, + "learning_rate": 3.9523161026739896e-05, + "loss": 0.0246, + "step": 269050 + }, + { + "epoch": 1.74, + "learning_rate": 3.951347967238297e-05, + "loss": 0.0195, + "step": 269060 + }, + { + "epoch": 1.74, + "learning_rate": 3.950379831802603e-05, + "loss": 0.0295, + "step": 269070 + }, + { + "epoch": 1.74, + "learning_rate": 3.94941169636691e-05, + "loss": 0.024, + "step": 269080 + }, + { + "epoch": 1.74, + "learning_rate": 3.948443560931217e-05, + "loss": 0.0244, + "step": 269090 + }, + { + "epoch": 1.74, + "learning_rate": 3.947475425495524e-05, + "loss": 0.0203, + "step": 269100 + }, + { + "epoch": 1.74, + "learning_rate": 3.946507290059831e-05, + "loss": 0.024, + "step": 269110 + }, + { + "epoch": 1.74, + "learning_rate": 3.945539154624137e-05, + "loss": 0.0238, + "step": 269120 + }, + { + "epoch": 1.74, + "learning_rate": 3.944571019188444e-05, + "loss": 0.0237, + "step": 269130 + }, + { + "epoch": 1.74, + "learning_rate": 3.9436028837527506e-05, + "loss": 0.0264, + "step": 269140 + }, + { + "epoch": 1.74, + "learning_rate": 3.942634748317058e-05, + "loss": 0.0219, + "step": 269150 + }, + { + "epoch": 1.74, + "learning_rate": 3.9416666128813645e-05, + "loss": 0.0224, + "step": 269160 + }, + { + "epoch": 1.74, + "learning_rate": 3.940698477445672e-05, + "loss": 0.0231, + "step": 269170 + }, + { + "epoch": 1.74, + "learning_rate": 3.939730342009978e-05, + "loss": 0.0242, + "step": 269180 + }, + { + "epoch": 1.74, + "learning_rate": 3.9387622065742844e-05, + "loss": 0.0216, + "step": 269190 + }, + { + "epoch": 1.74, + "learning_rate": 3.937794071138592e-05, + "loss": 0.0242, + "step": 269200 + }, + { + "epoch": 1.74, + "learning_rate": 3.936825935702898e-05, + "loss": 0.0245, + "step": 269210 + }, + { + "epoch": 1.74, + "learning_rate": 3.9358578002672056e-05, + "loss": 0.0212, + "step": 269220 + }, + { + "epoch": 1.74, + "learning_rate": 3.9348896648315116e-05, + "loss": 0.0231, + "step": 269230 + }, + { + "epoch": 1.74, + "learning_rate": 3.933921529395819e-05, + "loss": 0.0217, + "step": 269240 + }, + { + "epoch": 1.74, + "learning_rate": 3.9329533939601255e-05, + "loss": 0.0251, + "step": 269250 + }, + { + "epoch": 1.74, + "learning_rate": 3.931985258524432e-05, + "loss": 0.022, + "step": 269260 + }, + { + "epoch": 1.74, + "learning_rate": 3.9310171230887394e-05, + "loss": 0.0283, + "step": 269270 + }, + { + "epoch": 1.74, + "learning_rate": 3.9300489876530454e-05, + "loss": 0.0228, + "step": 269280 + }, + { + "epoch": 1.74, + "learning_rate": 3.929080852217353e-05, + "loss": 0.0207, + "step": 269290 + }, + { + "epoch": 1.74, + "learning_rate": 3.928112716781659e-05, + "loss": 0.0276, + "step": 269300 + }, + { + "epoch": 1.74, + "learning_rate": 3.9271445813459666e-05, + "loss": 0.0279, + "step": 269310 + }, + { + "epoch": 1.74, + "learning_rate": 3.926176445910273e-05, + "loss": 0.0215, + "step": 269320 + }, + { + "epoch": 1.74, + "learning_rate": 3.925208310474579e-05, + "loss": 0.0267, + "step": 269330 + }, + { + "epoch": 1.74, + "learning_rate": 3.9242401750388865e-05, + "loss": 0.023, + "step": 269340 + }, + { + "epoch": 1.74, + "learning_rate": 3.923272039603193e-05, + "loss": 0.0226, + "step": 269350 + }, + { + "epoch": 1.74, + "learning_rate": 3.9223039041675004e-05, + "loss": 0.0255, + "step": 269360 + }, + { + "epoch": 1.74, + "learning_rate": 3.921335768731807e-05, + "loss": 0.0233, + "step": 269370 + }, + { + "epoch": 1.74, + "learning_rate": 3.9203676332961136e-05, + "loss": 0.0268, + "step": 269380 + }, + { + "epoch": 1.74, + "learning_rate": 3.91939949786042e-05, + "loss": 0.0216, + "step": 269390 + }, + { + "epoch": 1.74, + "learning_rate": 3.918431362424727e-05, + "loss": 0.0267, + "step": 269400 + }, + { + "epoch": 1.74, + "learning_rate": 3.917463226989034e-05, + "loss": 0.0251, + "step": 269410 + }, + { + "epoch": 1.74, + "learning_rate": 3.916495091553341e-05, + "loss": 0.0245, + "step": 269420 + }, + { + "epoch": 1.74, + "learning_rate": 3.9155269561176474e-05, + "loss": 0.021, + "step": 269430 + }, + { + "epoch": 1.74, + "learning_rate": 3.914558820681954e-05, + "loss": 0.0212, + "step": 269440 + }, + { + "epoch": 1.74, + "learning_rate": 3.913590685246261e-05, + "loss": 0.0249, + "step": 269450 + }, + { + "epoch": 1.74, + "learning_rate": 3.912622549810568e-05, + "loss": 0.0236, + "step": 269460 + }, + { + "epoch": 1.74, + "learning_rate": 3.9116544143748746e-05, + "loss": 0.024, + "step": 269470 + }, + { + "epoch": 1.74, + "learning_rate": 3.910686278939181e-05, + "loss": 0.0251, + "step": 269480 + }, + { + "epoch": 1.74, + "learning_rate": 3.909718143503488e-05, + "loss": 0.0261, + "step": 269490 + }, + { + "epoch": 1.74, + "learning_rate": 3.908750008067795e-05, + "loss": 0.0229, + "step": 269500 + }, + { + "epoch": 1.74, + "learning_rate": 3.907781872632102e-05, + "loss": 0.0225, + "step": 269510 + }, + { + "epoch": 1.74, + "learning_rate": 3.9068137371964084e-05, + "loss": 0.0242, + "step": 269520 + }, + { + "epoch": 1.74, + "learning_rate": 3.905845601760715e-05, + "loss": 0.0291, + "step": 269530 + }, + { + "epoch": 1.74, + "learning_rate": 3.9048774663250217e-05, + "loss": 0.0229, + "step": 269540 + }, + { + "epoch": 1.74, + "learning_rate": 3.903909330889329e-05, + "loss": 0.0248, + "step": 269550 + }, + { + "epoch": 1.74, + "learning_rate": 3.9029411954536356e-05, + "loss": 0.0248, + "step": 269560 + }, + { + "epoch": 1.74, + "learning_rate": 3.901973060017943e-05, + "loss": 0.028, + "step": 269570 + }, + { + "epoch": 1.74, + "learning_rate": 3.901004924582249e-05, + "loss": 0.0272, + "step": 269580 + }, + { + "epoch": 1.74, + "learning_rate": 3.9000367891465555e-05, + "loss": 0.0225, + "step": 269590 + }, + { + "epoch": 1.74, + "learning_rate": 3.899068653710863e-05, + "loss": 0.0228, + "step": 269600 + }, + { + "epoch": 1.74, + "learning_rate": 3.8981005182751694e-05, + "loss": 0.0257, + "step": 269610 + }, + { + "epoch": 1.74, + "learning_rate": 3.897132382839477e-05, + "loss": 0.0314, + "step": 269620 + }, + { + "epoch": 1.74, + "learning_rate": 3.8961642474037826e-05, + "loss": 0.0231, + "step": 269630 + }, + { + "epoch": 1.74, + "learning_rate": 3.89519611196809e-05, + "loss": 0.0281, + "step": 269640 + }, + { + "epoch": 1.74, + "learning_rate": 3.8942279765323966e-05, + "loss": 0.0235, + "step": 269650 + }, + { + "epoch": 1.74, + "learning_rate": 3.893259841096703e-05, + "loss": 0.0268, + "step": 269660 + }, + { + "epoch": 1.74, + "learning_rate": 3.8922917056610105e-05, + "loss": 0.0265, + "step": 269670 + }, + { + "epoch": 1.74, + "learning_rate": 3.891323570225317e-05, + "loss": 0.0237, + "step": 269680 + }, + { + "epoch": 1.74, + "learning_rate": 3.890355434789624e-05, + "loss": 0.0238, + "step": 269690 + }, + { + "epoch": 1.74, + "learning_rate": 3.8893872993539304e-05, + "loss": 0.0273, + "step": 269700 + }, + { + "epoch": 1.74, + "learning_rate": 3.8884191639182377e-05, + "loss": 0.0233, + "step": 269710 + }, + { + "epoch": 1.74, + "learning_rate": 3.887451028482544e-05, + "loss": 0.028, + "step": 269720 + }, + { + "epoch": 1.74, + "learning_rate": 3.886482893046851e-05, + "loss": 0.0226, + "step": 269730 + }, + { + "epoch": 1.74, + "learning_rate": 3.8855147576111575e-05, + "loss": 0.0212, + "step": 269740 + }, + { + "epoch": 1.74, + "learning_rate": 3.884546622175464e-05, + "loss": 0.0247, + "step": 269750 + }, + { + "epoch": 1.74, + "learning_rate": 3.8835784867397715e-05, + "loss": 0.0227, + "step": 269760 + }, + { + "epoch": 1.74, + "learning_rate": 3.882610351304078e-05, + "loss": 0.0266, + "step": 269770 + }, + { + "epoch": 1.74, + "learning_rate": 3.8816422158683854e-05, + "loss": 0.0256, + "step": 269780 + }, + { + "epoch": 1.74, + "learning_rate": 3.880674080432691e-05, + "loss": 0.0244, + "step": 269790 + }, + { + "epoch": 1.74, + "learning_rate": 3.879705944996998e-05, + "loss": 0.0228, + "step": 269800 + }, + { + "epoch": 1.74, + "learning_rate": 3.878737809561305e-05, + "loss": 0.0197, + "step": 269810 + }, + { + "epoch": 1.74, + "learning_rate": 3.877769674125612e-05, + "loss": 0.024, + "step": 269820 + }, + { + "epoch": 1.74, + "learning_rate": 3.876801538689919e-05, + "loss": 0.0236, + "step": 269830 + }, + { + "epoch": 1.74, + "learning_rate": 3.875833403254225e-05, + "loss": 0.0251, + "step": 269840 + }, + { + "epoch": 1.74, + "learning_rate": 3.8748652678185324e-05, + "loss": 0.0228, + "step": 269850 + }, + { + "epoch": 1.74, + "learning_rate": 3.873897132382839e-05, + "loss": 0.0245, + "step": 269860 + }, + { + "epoch": 1.74, + "learning_rate": 3.872928996947146e-05, + "loss": 0.0198, + "step": 269870 + }, + { + "epoch": 1.74, + "learning_rate": 3.871960861511453e-05, + "loss": 0.0199, + "step": 269880 + }, + { + "epoch": 1.74, + "learning_rate": 3.870992726075759e-05, + "loss": 0.0195, + "step": 269890 + }, + { + "epoch": 1.74, + "learning_rate": 3.870024590640066e-05, + "loss": 0.0255, + "step": 269900 + }, + { + "epoch": 1.74, + "learning_rate": 3.869056455204373e-05, + "loss": 0.0237, + "step": 269910 + }, + { + "epoch": 1.74, + "learning_rate": 3.86808831976868e-05, + "loss": 0.0234, + "step": 269920 + }, + { + "epoch": 1.74, + "learning_rate": 3.867120184332987e-05, + "loss": 0.0275, + "step": 269930 + }, + { + "epoch": 1.74, + "learning_rate": 3.866152048897293e-05, + "loss": 0.0268, + "step": 269940 + }, + { + "epoch": 1.74, + "learning_rate": 3.8651839134616e-05, + "loss": 0.0286, + "step": 269950 + }, + { + "epoch": 1.74, + "learning_rate": 3.8642157780259066e-05, + "loss": 0.0232, + "step": 269960 + }, + { + "epoch": 1.74, + "learning_rate": 3.863247642590214e-05, + "loss": 0.0245, + "step": 269970 + }, + { + "epoch": 1.74, + "learning_rate": 3.8622795071545206e-05, + "loss": 0.0237, + "step": 269980 + }, + { + "epoch": 1.74, + "learning_rate": 3.861311371718828e-05, + "loss": 0.0197, + "step": 269990 + }, + { + "epoch": 1.74, + "learning_rate": 3.860343236283134e-05, + "loss": 0.0248, + "step": 270000 + }, + { + "epoch": 1.74, + "eval_cer": 0.9198463450457576, + "eval_loss": 0.01764541305601597, + "eval_runtime": 119.9301, + "eval_samples_per_second": 16.676, + "eval_steps_per_second": 4.169, + "step": 270000 + }, + { + "epoch": 1.74, + "learning_rate": 3.8593751008474404e-05, + "loss": 0.0227, + "step": 270010 + }, + { + "epoch": 1.74, + "learning_rate": 3.858406965411748e-05, + "loss": 0.0236, + "step": 270020 + }, + { + "epoch": 1.74, + "learning_rate": 3.8574388299760544e-05, + "loss": 0.0244, + "step": 270030 + }, + { + "epoch": 1.74, + "learning_rate": 3.856470694540362e-05, + "loss": 0.0252, + "step": 270040 + }, + { + "epoch": 1.74, + "learning_rate": 3.8555025591046676e-05, + "loss": 0.0235, + "step": 270050 + }, + { + "epoch": 1.74, + "learning_rate": 3.854534423668975e-05, + "loss": 0.0209, + "step": 270060 + }, + { + "epoch": 1.74, + "learning_rate": 3.8535662882332815e-05, + "loss": 0.0219, + "step": 270070 + }, + { + "epoch": 1.74, + "learning_rate": 3.852598152797588e-05, + "loss": 0.027, + "step": 270080 + }, + { + "epoch": 1.74, + "learning_rate": 3.8516300173618955e-05, + "loss": 0.0211, + "step": 270090 + }, + { + "epoch": 1.74, + "learning_rate": 3.8506618819262014e-05, + "loss": 0.0242, + "step": 270100 + }, + { + "epoch": 1.74, + "learning_rate": 3.849693746490509e-05, + "loss": 0.0254, + "step": 270110 + }, + { + "epoch": 1.74, + "learning_rate": 3.848725611054815e-05, + "loss": 0.0271, + "step": 270120 + }, + { + "epoch": 1.74, + "learning_rate": 3.8477574756191226e-05, + "loss": 0.0242, + "step": 270130 + }, + { + "epoch": 1.74, + "learning_rate": 3.846789340183429e-05, + "loss": 0.0222, + "step": 270140 + }, + { + "epoch": 1.74, + "learning_rate": 3.845821204747735e-05, + "loss": 0.0251, + "step": 270150 + }, + { + "epoch": 1.74, + "learning_rate": 3.8448530693120425e-05, + "loss": 0.0207, + "step": 270160 + }, + { + "epoch": 1.74, + "learning_rate": 3.843884933876349e-05, + "loss": 0.0311, + "step": 270170 + }, + { + "epoch": 1.74, + "learning_rate": 3.8429167984406564e-05, + "loss": 0.0266, + "step": 270180 + }, + { + "epoch": 1.74, + "learning_rate": 3.841948663004963e-05, + "loss": 0.0246, + "step": 270190 + }, + { + "epoch": 1.74, + "learning_rate": 3.8409805275692704e-05, + "loss": 0.0215, + "step": 270200 + }, + { + "epoch": 1.74, + "learning_rate": 3.840012392133576e-05, + "loss": 0.0269, + "step": 270210 + }, + { + "epoch": 1.74, + "learning_rate": 3.839044256697883e-05, + "loss": 0.0209, + "step": 270220 + }, + { + "epoch": 1.74, + "learning_rate": 3.83807612126219e-05, + "loss": 0.024, + "step": 270230 + }, + { + "epoch": 1.74, + "learning_rate": 3.837107985826497e-05, + "loss": 0.0229, + "step": 270240 + }, + { + "epoch": 1.74, + "learning_rate": 3.836139850390804e-05, + "loss": 0.0226, + "step": 270250 + }, + { + "epoch": 1.74, + "learning_rate": 3.83517171495511e-05, + "loss": 0.0222, + "step": 270260 + }, + { + "epoch": 1.74, + "learning_rate": 3.8342035795194174e-05, + "loss": 0.0245, + "step": 270270 + }, + { + "epoch": 1.74, + "learning_rate": 3.833235444083724e-05, + "loss": 0.024, + "step": 270280 + }, + { + "epoch": 1.74, + "learning_rate": 3.8322673086480307e-05, + "loss": 0.0206, + "step": 270290 + }, + { + "epoch": 1.74, + "learning_rate": 3.831299173212338e-05, + "loss": 0.0209, + "step": 270300 + }, + { + "epoch": 1.74, + "learning_rate": 3.830331037776644e-05, + "loss": 0.025, + "step": 270310 + }, + { + "epoch": 1.74, + "learning_rate": 3.829362902340951e-05, + "loss": 0.0237, + "step": 270320 + }, + { + "epoch": 1.74, + "learning_rate": 3.828394766905258e-05, + "loss": 0.0242, + "step": 270330 + }, + { + "epoch": 1.74, + "learning_rate": 3.827426631469565e-05, + "loss": 0.0232, + "step": 270340 + }, + { + "epoch": 1.74, + "learning_rate": 3.826458496033872e-05, + "loss": 0.0232, + "step": 270350 + }, + { + "epoch": 1.74, + "learning_rate": 3.825490360598178e-05, + "loss": 0.0267, + "step": 270360 + }, + { + "epoch": 1.75, + "learning_rate": 3.824522225162485e-05, + "loss": 0.0221, + "step": 270370 + }, + { + "epoch": 1.75, + "learning_rate": 3.8235540897267916e-05, + "loss": 0.0205, + "step": 270380 + }, + { + "epoch": 1.75, + "learning_rate": 3.822585954291099e-05, + "loss": 0.0209, + "step": 270390 + }, + { + "epoch": 1.75, + "learning_rate": 3.8216178188554055e-05, + "loss": 0.0232, + "step": 270400 + }, + { + "epoch": 1.75, + "learning_rate": 3.820649683419713e-05, + "loss": 0.0252, + "step": 270410 + }, + { + "epoch": 1.75, + "learning_rate": 3.819681547984019e-05, + "loss": 0.022, + "step": 270420 + }, + { + "epoch": 1.75, + "learning_rate": 3.8187134125483254e-05, + "loss": 0.0227, + "step": 270430 + }, + { + "epoch": 1.75, + "learning_rate": 3.817745277112633e-05, + "loss": 0.0213, + "step": 270440 + }, + { + "epoch": 1.75, + "learning_rate": 3.8167771416769393e-05, + "loss": 0.0215, + "step": 270450 + }, + { + "epoch": 1.75, + "learning_rate": 3.8158090062412466e-05, + "loss": 0.025, + "step": 270460 + }, + { + "epoch": 1.75, + "learning_rate": 3.8148408708055526e-05, + "loss": 0.0259, + "step": 270470 + }, + { + "epoch": 1.75, + "learning_rate": 3.81387273536986e-05, + "loss": 0.0212, + "step": 270480 + }, + { + "epoch": 1.75, + "learning_rate": 3.8129045999341665e-05, + "loss": 0.0267, + "step": 270490 + }, + { + "epoch": 1.75, + "learning_rate": 3.811936464498473e-05, + "loss": 0.0328, + "step": 270500 + }, + { + "epoch": 1.75, + "learning_rate": 3.8109683290627804e-05, + "loss": 0.0188, + "step": 270510 + }, + { + "epoch": 1.75, + "learning_rate": 3.8100001936270864e-05, + "loss": 0.0263, + "step": 270520 + }, + { + "epoch": 1.75, + "learning_rate": 3.809032058191394e-05, + "loss": 0.0211, + "step": 270530 + }, + { + "epoch": 1.75, + "learning_rate": 3.8080639227557e-05, + "loss": 0.0285, + "step": 270540 + }, + { + "epoch": 1.75, + "learning_rate": 3.8070957873200076e-05, + "loss": 0.0242, + "step": 270550 + }, + { + "epoch": 1.75, + "learning_rate": 3.806127651884314e-05, + "loss": 0.019, + "step": 270560 + }, + { + "epoch": 1.75, + "learning_rate": 3.80515951644862e-05, + "loss": 0.0219, + "step": 270570 + }, + { + "epoch": 1.75, + "learning_rate": 3.8041913810129275e-05, + "loss": 0.0249, + "step": 270580 + }, + { + "epoch": 1.75, + "learning_rate": 3.803223245577234e-05, + "loss": 0.0272, + "step": 270590 + }, + { + "epoch": 1.75, + "learning_rate": 3.8022551101415414e-05, + "loss": 0.0252, + "step": 270600 + }, + { + "epoch": 1.75, + "learning_rate": 3.801286974705848e-05, + "loss": 0.0211, + "step": 270610 + }, + { + "epoch": 1.75, + "learning_rate": 3.800318839270155e-05, + "loss": 0.0213, + "step": 270620 + }, + { + "epoch": 1.75, + "learning_rate": 3.799350703834461e-05, + "loss": 0.0245, + "step": 270630 + }, + { + "epoch": 1.75, + "learning_rate": 3.798382568398768e-05, + "loss": 0.0265, + "step": 270640 + }, + { + "epoch": 1.75, + "learning_rate": 3.797414432963075e-05, + "loss": 0.0236, + "step": 270650 + }, + { + "epoch": 1.75, + "learning_rate": 3.796446297527382e-05, + "loss": 0.0227, + "step": 270660 + }, + { + "epoch": 1.75, + "learning_rate": 3.795478162091689e-05, + "loss": 0.0274, + "step": 270670 + }, + { + "epoch": 1.75, + "learning_rate": 3.794510026655995e-05, + "loss": 0.0196, + "step": 270680 + }, + { + "epoch": 1.75, + "learning_rate": 3.7935418912203024e-05, + "loss": 0.024, + "step": 270690 + }, + { + "epoch": 1.75, + "learning_rate": 3.792573755784609e-05, + "loss": 0.0263, + "step": 270700 + }, + { + "epoch": 1.75, + "learning_rate": 3.7916056203489156e-05, + "loss": 0.0239, + "step": 270710 + }, + { + "epoch": 1.75, + "learning_rate": 3.790637484913223e-05, + "loss": 0.0279, + "step": 270720 + }, + { + "epoch": 1.75, + "learning_rate": 3.789669349477529e-05, + "loss": 0.0217, + "step": 270730 + }, + { + "epoch": 1.75, + "learning_rate": 3.788701214041836e-05, + "loss": 0.0219, + "step": 270740 + }, + { + "epoch": 1.75, + "learning_rate": 3.787733078606143e-05, + "loss": 0.0222, + "step": 270750 + }, + { + "epoch": 1.75, + "learning_rate": 3.78676494317045e-05, + "loss": 0.0255, + "step": 270760 + }, + { + "epoch": 1.75, + "learning_rate": 3.785796807734757e-05, + "loss": 0.0252, + "step": 270770 + }, + { + "epoch": 1.75, + "learning_rate": 3.784828672299063e-05, + "loss": 0.025, + "step": 270780 + }, + { + "epoch": 1.75, + "learning_rate": 3.78386053686337e-05, + "loss": 0.0208, + "step": 270790 + }, + { + "epoch": 1.75, + "learning_rate": 3.7828924014276766e-05, + "loss": 0.0221, + "step": 270800 + }, + { + "epoch": 1.75, + "learning_rate": 3.781924265991984e-05, + "loss": 0.0252, + "step": 270810 + }, + { + "epoch": 1.75, + "learning_rate": 3.7809561305562905e-05, + "loss": 0.0242, + "step": 270820 + }, + { + "epoch": 1.75, + "learning_rate": 3.779987995120597e-05, + "loss": 0.0258, + "step": 270830 + }, + { + "epoch": 1.75, + "learning_rate": 3.779019859684904e-05, + "loss": 0.0263, + "step": 270840 + }, + { + "epoch": 1.75, + "learning_rate": 3.7780517242492104e-05, + "loss": 0.021, + "step": 270850 + }, + { + "epoch": 1.75, + "learning_rate": 3.777083588813518e-05, + "loss": 0.022, + "step": 270860 + }, + { + "epoch": 1.75, + "learning_rate": 3.776115453377824e-05, + "loss": 0.0241, + "step": 270870 + }, + { + "epoch": 1.75, + "learning_rate": 3.775147317942131e-05, + "loss": 0.0198, + "step": 270880 + }, + { + "epoch": 1.75, + "learning_rate": 3.7741791825064376e-05, + "loss": 0.0263, + "step": 270890 + }, + { + "epoch": 1.75, + "learning_rate": 3.773211047070745e-05, + "loss": 0.0269, + "step": 270900 + }, + { + "epoch": 1.75, + "learning_rate": 3.7722429116350515e-05, + "loss": 0.0207, + "step": 270910 + }, + { + "epoch": 1.75, + "learning_rate": 3.771274776199358e-05, + "loss": 0.0235, + "step": 270920 + }, + { + "epoch": 1.75, + "learning_rate": 3.770306640763665e-05, + "loss": 0.024, + "step": 270930 + }, + { + "epoch": 1.75, + "learning_rate": 3.7693385053279714e-05, + "loss": 0.017, + "step": 270940 + }, + { + "epoch": 1.75, + "learning_rate": 3.768370369892279e-05, + "loss": 0.019, + "step": 270950 + }, + { + "epoch": 1.75, + "learning_rate": 3.767402234456585e-05, + "loss": 0.0271, + "step": 270960 + }, + { + "epoch": 1.75, + "learning_rate": 3.7664340990208926e-05, + "loss": 0.0256, + "step": 270970 + }, + { + "epoch": 1.75, + "learning_rate": 3.7654659635851985e-05, + "loss": 0.0243, + "step": 270980 + }, + { + "epoch": 1.75, + "learning_rate": 3.764497828149505e-05, + "loss": 0.0229, + "step": 270990 + }, + { + "epoch": 1.75, + "learning_rate": 3.7635296927138125e-05, + "loss": 0.0211, + "step": 271000 + }, + { + "epoch": 1.75, + "eval_cer": 0.9198490566037736, + "eval_loss": 0.01767873205244541, + "eval_runtime": 119.9595, + "eval_samples_per_second": 16.672, + "eval_steps_per_second": 4.168, + "step": 271000 + }, + { + "epoch": 1.75, + "learning_rate": 3.762561557278119e-05, + "loss": 0.0239, + "step": 271010 + }, + { + "epoch": 1.75, + "learning_rate": 3.7615934218424264e-05, + "loss": 0.0231, + "step": 271020 + }, + { + "epoch": 1.75, + "learning_rate": 3.7606252864067323e-05, + "loss": 0.0234, + "step": 271030 + }, + { + "epoch": 1.75, + "learning_rate": 3.7596571509710396e-05, + "loss": 0.0222, + "step": 271040 + }, + { + "epoch": 1.75, + "learning_rate": 3.758689015535346e-05, + "loss": 0.0239, + "step": 271050 + }, + { + "epoch": 1.75, + "learning_rate": 3.757720880099653e-05, + "loss": 0.0275, + "step": 271060 + }, + { + "epoch": 1.75, + "learning_rate": 3.75675274466396e-05, + "loss": 0.03, + "step": 271070 + }, + { + "epoch": 1.75, + "learning_rate": 3.755784609228266e-05, + "loss": 0.0233, + "step": 271080 + }, + { + "epoch": 1.75, + "learning_rate": 3.7548164737925734e-05, + "loss": 0.0258, + "step": 271090 + }, + { + "epoch": 1.75, + "learning_rate": 3.75384833835688e-05, + "loss": 0.021, + "step": 271100 + }, + { + "epoch": 1.75, + "learning_rate": 3.7528802029211874e-05, + "loss": 0.0265, + "step": 271110 + }, + { + "epoch": 1.75, + "learning_rate": 3.751912067485494e-05, + "loss": 0.0223, + "step": 271120 + }, + { + "epoch": 1.75, + "learning_rate": 3.7509439320498e-05, + "loss": 0.0242, + "step": 271130 + }, + { + "epoch": 1.75, + "learning_rate": 3.749975796614107e-05, + "loss": 0.0274, + "step": 271140 + }, + { + "epoch": 1.75, + "learning_rate": 3.749007661178414e-05, + "loss": 0.0292, + "step": 271150 + }, + { + "epoch": 1.75, + "learning_rate": 3.7480395257427205e-05, + "loss": 0.0203, + "step": 271160 + }, + { + "epoch": 1.75, + "learning_rate": 3.747071390307028e-05, + "loss": 0.0284, + "step": 271170 + }, + { + "epoch": 1.75, + "learning_rate": 3.7461032548713344e-05, + "loss": 0.0285, + "step": 271180 + }, + { + "epoch": 1.75, + "learning_rate": 3.745135119435641e-05, + "loss": 0.0247, + "step": 271190 + }, + { + "epoch": 1.75, + "learning_rate": 3.744166983999948e-05, + "loss": 0.0247, + "step": 271200 + }, + { + "epoch": 1.75, + "learning_rate": 3.743198848564255e-05, + "loss": 0.0234, + "step": 271210 + }, + { + "epoch": 1.75, + "learning_rate": 3.7422307131285616e-05, + "loss": 0.0258, + "step": 271220 + }, + { + "epoch": 1.75, + "learning_rate": 3.741262577692868e-05, + "loss": 0.0233, + "step": 271230 + }, + { + "epoch": 1.75, + "learning_rate": 3.740294442257175e-05, + "loss": 0.0269, + "step": 271240 + }, + { + "epoch": 1.75, + "learning_rate": 3.739326306821482e-05, + "loss": 0.0254, + "step": 271250 + }, + { + "epoch": 1.75, + "learning_rate": 3.738358171385789e-05, + "loss": 0.025, + "step": 271260 + }, + { + "epoch": 1.75, + "learning_rate": 3.7373900359500954e-05, + "loss": 0.0222, + "step": 271270 + }, + { + "epoch": 1.75, + "learning_rate": 3.736421900514403e-05, + "loss": 0.0276, + "step": 271280 + }, + { + "epoch": 1.75, + "learning_rate": 3.7354537650787086e-05, + "loss": 0.0246, + "step": 271290 + }, + { + "epoch": 1.75, + "learning_rate": 3.734485629643016e-05, + "loss": 0.0209, + "step": 271300 + }, + { + "epoch": 1.75, + "learning_rate": 3.7335174942073226e-05, + "loss": 0.0242, + "step": 271310 + }, + { + "epoch": 1.75, + "learning_rate": 3.732549358771629e-05, + "loss": 0.0195, + "step": 271320 + }, + { + "epoch": 1.75, + "learning_rate": 3.7315812233359365e-05, + "loss": 0.0253, + "step": 271330 + }, + { + "epoch": 1.75, + "learning_rate": 3.730613087900243e-05, + "loss": 0.0286, + "step": 271340 + }, + { + "epoch": 1.75, + "learning_rate": 3.72964495246455e-05, + "loss": 0.0271, + "step": 271350 + }, + { + "epoch": 1.75, + "learning_rate": 3.7286768170288563e-05, + "loss": 0.0229, + "step": 271360 + }, + { + "epoch": 1.75, + "learning_rate": 3.727708681593163e-05, + "loss": 0.0291, + "step": 271370 + }, + { + "epoch": 1.75, + "learning_rate": 3.72674054615747e-05, + "loss": 0.0246, + "step": 271380 + }, + { + "epoch": 1.75, + "learning_rate": 3.725772410721777e-05, + "loss": 0.0228, + "step": 271390 + }, + { + "epoch": 1.75, + "learning_rate": 3.7248042752860835e-05, + "loss": 0.0276, + "step": 271400 + }, + { + "epoch": 1.75, + "learning_rate": 3.723836139850391e-05, + "loss": 0.0295, + "step": 271410 + }, + { + "epoch": 1.75, + "learning_rate": 3.7228680044146974e-05, + "loss": 0.0225, + "step": 271420 + }, + { + "epoch": 1.75, + "learning_rate": 3.721899868979004e-05, + "loss": 0.0275, + "step": 271430 + }, + { + "epoch": 1.75, + "learning_rate": 3.720931733543311e-05, + "loss": 0.0242, + "step": 271440 + }, + { + "epoch": 1.75, + "learning_rate": 3.719963598107617e-05, + "loss": 0.0217, + "step": 271450 + }, + { + "epoch": 1.75, + "learning_rate": 3.7189954626719246e-05, + "loss": 0.0248, + "step": 271460 + }, + { + "epoch": 1.75, + "learning_rate": 3.718027327236231e-05, + "loss": 0.0237, + "step": 271470 + }, + { + "epoch": 1.75, + "learning_rate": 3.717059191800538e-05, + "loss": 0.0268, + "step": 271480 + }, + { + "epoch": 1.75, + "learning_rate": 3.716091056364845e-05, + "loss": 0.023, + "step": 271490 + }, + { + "epoch": 1.75, + "learning_rate": 3.715122920929151e-05, + "loss": 0.0232, + "step": 271500 + }, + { + "epoch": 1.75, + "learning_rate": 3.7141547854934584e-05, + "loss": 0.0198, + "step": 271510 + }, + { + "epoch": 1.75, + "learning_rate": 3.713186650057765e-05, + "loss": 0.0287, + "step": 271520 + }, + { + "epoch": 1.75, + "learning_rate": 3.712218514622072e-05, + "loss": 0.0327, + "step": 271530 + }, + { + "epoch": 1.75, + "learning_rate": 3.711250379186379e-05, + "loss": 0.0238, + "step": 271540 + }, + { + "epoch": 1.75, + "learning_rate": 3.7102822437506856e-05, + "loss": 0.0208, + "step": 271550 + }, + { + "epoch": 1.75, + "learning_rate": 3.709314108314992e-05, + "loss": 0.0235, + "step": 271560 + }, + { + "epoch": 1.75, + "learning_rate": 3.708345972879299e-05, + "loss": 0.0288, + "step": 271570 + }, + { + "epoch": 1.75, + "learning_rate": 3.7073778374436055e-05, + "loss": 0.0273, + "step": 271580 + }, + { + "epoch": 1.75, + "learning_rate": 3.706409702007913e-05, + "loss": 0.0264, + "step": 271590 + }, + { + "epoch": 1.75, + "learning_rate": 3.7054415665722194e-05, + "loss": 0.0261, + "step": 271600 + }, + { + "epoch": 1.75, + "learning_rate": 3.704473431136526e-05, + "loss": 0.0264, + "step": 271610 + }, + { + "epoch": 1.75, + "learning_rate": 3.703505295700833e-05, + "loss": 0.0201, + "step": 271620 + }, + { + "epoch": 1.75, + "learning_rate": 3.702537160265139e-05, + "loss": 0.0253, + "step": 271630 + }, + { + "epoch": 1.75, + "learning_rate": 3.7015690248294466e-05, + "loss": 0.0249, + "step": 271640 + }, + { + "epoch": 1.75, + "learning_rate": 3.700600889393753e-05, + "loss": 0.0237, + "step": 271650 + }, + { + "epoch": 1.75, + "learning_rate": 3.69963275395806e-05, + "loss": 0.0191, + "step": 271660 + }, + { + "epoch": 1.75, + "learning_rate": 3.698664618522367e-05, + "loss": 0.0237, + "step": 271670 + }, + { + "epoch": 1.75, + "learning_rate": 3.697696483086674e-05, + "loss": 0.0248, + "step": 271680 + }, + { + "epoch": 1.75, + "learning_rate": 3.6967283476509804e-05, + "loss": 0.0247, + "step": 271690 + }, + { + "epoch": 1.75, + "learning_rate": 3.695760212215287e-05, + "loss": 0.0252, + "step": 271700 + }, + { + "epoch": 1.75, + "learning_rate": 3.6947920767795936e-05, + "loss": 0.0208, + "step": 271710 + }, + { + "epoch": 1.75, + "learning_rate": 3.693823941343901e-05, + "loss": 0.0227, + "step": 271720 + }, + { + "epoch": 1.75, + "learning_rate": 3.6928558059082075e-05, + "loss": 0.029, + "step": 271730 + }, + { + "epoch": 1.75, + "learning_rate": 3.691887670472514e-05, + "loss": 0.0261, + "step": 271740 + }, + { + "epoch": 1.75, + "learning_rate": 3.6909195350368215e-05, + "loss": 0.0204, + "step": 271750 + }, + { + "epoch": 1.75, + "learning_rate": 3.689951399601128e-05, + "loss": 0.022, + "step": 271760 + }, + { + "epoch": 1.75, + "learning_rate": 3.688983264165435e-05, + "loss": 0.0188, + "step": 271770 + }, + { + "epoch": 1.75, + "learning_rate": 3.688015128729741e-05, + "loss": 0.0266, + "step": 271780 + }, + { + "epoch": 1.75, + "learning_rate": 3.687046993294048e-05, + "loss": 0.0204, + "step": 271790 + }, + { + "epoch": 1.75, + "learning_rate": 3.686078857858355e-05, + "loss": 0.0261, + "step": 271800 + }, + { + "epoch": 1.75, + "learning_rate": 3.685110722422662e-05, + "loss": 0.0194, + "step": 271810 + }, + { + "epoch": 1.75, + "learning_rate": 3.6841425869869685e-05, + "loss": 0.02, + "step": 271820 + }, + { + "epoch": 1.75, + "learning_rate": 3.683174451551276e-05, + "loss": 0.0253, + "step": 271830 + }, + { + "epoch": 1.75, + "learning_rate": 3.682206316115582e-05, + "loss": 0.0247, + "step": 271840 + }, + { + "epoch": 1.75, + "learning_rate": 3.681238180679889e-05, + "loss": 0.0268, + "step": 271850 + }, + { + "epoch": 1.75, + "learning_rate": 3.680270045244196e-05, + "loss": 0.0213, + "step": 271860 + }, + { + "epoch": 1.75, + "learning_rate": 3.679301909808502e-05, + "loss": 0.0233, + "step": 271870 + }, + { + "epoch": 1.75, + "learning_rate": 3.6783337743728096e-05, + "loss": 0.0261, + "step": 271880 + }, + { + "epoch": 1.75, + "learning_rate": 3.677365638937116e-05, + "loss": 0.0212, + "step": 271890 + }, + { + "epoch": 1.75, + "learning_rate": 3.676397503501423e-05, + "loss": 0.0259, + "step": 271900 + }, + { + "epoch": 1.75, + "learning_rate": 3.6754293680657295e-05, + "loss": 0.0233, + "step": 271910 + }, + { + "epoch": 1.76, + "learning_rate": 3.674461232630036e-05, + "loss": 0.021, + "step": 271920 + }, + { + "epoch": 1.76, + "learning_rate": 3.6734930971943434e-05, + "loss": 0.0281, + "step": 271930 + }, + { + "epoch": 1.76, + "learning_rate": 3.67252496175865e-05, + "loss": 0.0283, + "step": 271940 + }, + { + "epoch": 1.76, + "learning_rate": 3.6715568263229566e-05, + "loss": 0.0243, + "step": 271950 + }, + { + "epoch": 1.76, + "learning_rate": 3.670588690887264e-05, + "loss": 0.0229, + "step": 271960 + }, + { + "epoch": 1.76, + "learning_rate": 3.6696205554515706e-05, + "loss": 0.0257, + "step": 271970 + }, + { + "epoch": 1.76, + "learning_rate": 3.668652420015877e-05, + "loss": 0.0262, + "step": 271980 + }, + { + "epoch": 1.76, + "learning_rate": 3.667684284580184e-05, + "loss": 0.0235, + "step": 271990 + }, + { + "epoch": 1.76, + "learning_rate": 3.6667161491444904e-05, + "loss": 0.0257, + "step": 272000 + }, + { + "epoch": 1.76, + "eval_cer": 0.9197975370014687, + "eval_loss": 0.01773538440465927, + "eval_runtime": 119.9524, + "eval_samples_per_second": 16.673, + "eval_steps_per_second": 4.168, + "step": 272000 + }, + { + "epoch": 1.76, + "learning_rate": 3.665748013708798e-05, + "loss": 0.0232, + "step": 272010 + }, + { + "epoch": 1.76, + "learning_rate": 3.6647798782731044e-05, + "loss": 0.0271, + "step": 272020 + }, + { + "epoch": 1.76, + "learning_rate": 3.663811742837411e-05, + "loss": 0.0254, + "step": 272030 + }, + { + "epoch": 1.76, + "learning_rate": 3.662843607401718e-05, + "loss": 0.0233, + "step": 272040 + }, + { + "epoch": 1.76, + "learning_rate": 3.661875471966024e-05, + "loss": 0.0213, + "step": 272050 + }, + { + "epoch": 1.76, + "learning_rate": 3.6609073365303315e-05, + "loss": 0.0234, + "step": 272060 + }, + { + "epoch": 1.76, + "learning_rate": 3.659939201094638e-05, + "loss": 0.0229, + "step": 272070 + }, + { + "epoch": 1.76, + "learning_rate": 3.658971065658945e-05, + "loss": 0.0236, + "step": 272080 + }, + { + "epoch": 1.76, + "learning_rate": 3.658002930223252e-05, + "loss": 0.0272, + "step": 272090 + }, + { + "epoch": 1.76, + "learning_rate": 3.657034794787559e-05, + "loss": 0.0222, + "step": 272100 + }, + { + "epoch": 1.76, + "learning_rate": 3.6560666593518653e-05, + "loss": 0.0203, + "step": 272110 + }, + { + "epoch": 1.76, + "learning_rate": 3.655098523916172e-05, + "loss": 0.028, + "step": 272120 + }, + { + "epoch": 1.76, + "learning_rate": 3.6541303884804786e-05, + "loss": 0.0247, + "step": 272130 + }, + { + "epoch": 1.76, + "learning_rate": 3.653162253044786e-05, + "loss": 0.0196, + "step": 272140 + }, + { + "epoch": 1.76, + "learning_rate": 3.6521941176090925e-05, + "loss": 0.0251, + "step": 272150 + }, + { + "epoch": 1.76, + "learning_rate": 3.651225982173399e-05, + "loss": 0.0228, + "step": 272160 + }, + { + "epoch": 1.76, + "learning_rate": 3.6502578467377064e-05, + "loss": 0.0235, + "step": 272170 + }, + { + "epoch": 1.76, + "learning_rate": 3.649289711302013e-05, + "loss": 0.023, + "step": 272180 + }, + { + "epoch": 1.76, + "learning_rate": 3.64832157586632e-05, + "loss": 0.0222, + "step": 272190 + }, + { + "epoch": 1.76, + "learning_rate": 3.647353440430626e-05, + "loss": 0.024, + "step": 272200 + }, + { + "epoch": 1.76, + "learning_rate": 3.646385304994933e-05, + "loss": 0.0217, + "step": 272210 + }, + { + "epoch": 1.76, + "learning_rate": 3.64541716955924e-05, + "loss": 0.0258, + "step": 272220 + }, + { + "epoch": 1.76, + "learning_rate": 3.644449034123547e-05, + "loss": 0.0213, + "step": 272230 + }, + { + "epoch": 1.76, + "learning_rate": 3.6434808986878535e-05, + "loss": 0.019, + "step": 272240 + }, + { + "epoch": 1.76, + "learning_rate": 3.64251276325216e-05, + "loss": 0.0217, + "step": 272250 + }, + { + "epoch": 1.76, + "learning_rate": 3.641544627816467e-05, + "loss": 0.0263, + "step": 272260 + }, + { + "epoch": 1.76, + "learning_rate": 3.640576492380774e-05, + "loss": 0.0248, + "step": 272270 + }, + { + "epoch": 1.76, + "learning_rate": 3.6396083569450807e-05, + "loss": 0.0208, + "step": 272280 + }, + { + "epoch": 1.76, + "learning_rate": 3.638640221509387e-05, + "loss": 0.0262, + "step": 272290 + }, + { + "epoch": 1.76, + "learning_rate": 3.637672086073694e-05, + "loss": 0.0263, + "step": 272300 + }, + { + "epoch": 1.76, + "learning_rate": 3.636703950638001e-05, + "loss": 0.0231, + "step": 272310 + }, + { + "epoch": 1.76, + "learning_rate": 3.635735815202308e-05, + "loss": 0.0251, + "step": 272320 + }, + { + "epoch": 1.76, + "learning_rate": 3.6347676797666145e-05, + "loss": 0.0237, + "step": 272330 + }, + { + "epoch": 1.76, + "learning_rate": 3.633799544330921e-05, + "loss": 0.0208, + "step": 272340 + }, + { + "epoch": 1.76, + "learning_rate": 3.632831408895228e-05, + "loss": 0.0211, + "step": 272350 + }, + { + "epoch": 1.76, + "learning_rate": 3.631863273459535e-05, + "loss": 0.0234, + "step": 272360 + }, + { + "epoch": 1.76, + "learning_rate": 3.6308951380238416e-05, + "loss": 0.0228, + "step": 272370 + }, + { + "epoch": 1.76, + "learning_rate": 3.629927002588148e-05, + "loss": 0.0224, + "step": 272380 + }, + { + "epoch": 1.76, + "learning_rate": 3.6289588671524556e-05, + "loss": 0.0237, + "step": 272390 + }, + { + "epoch": 1.76, + "learning_rate": 3.6279907317167615e-05, + "loss": 0.0244, + "step": 272400 + }, + { + "epoch": 1.76, + "learning_rate": 3.627022596281069e-05, + "loss": 0.0244, + "step": 272410 + }, + { + "epoch": 1.76, + "learning_rate": 3.6260544608453754e-05, + "loss": 0.0242, + "step": 272420 + }, + { + "epoch": 1.76, + "learning_rate": 3.625086325409682e-05, + "loss": 0.021, + "step": 272430 + }, + { + "epoch": 1.76, + "learning_rate": 3.6241181899739894e-05, + "loss": 0.0254, + "step": 272440 + }, + { + "epoch": 1.76, + "learning_rate": 3.623150054538296e-05, + "loss": 0.0237, + "step": 272450 + }, + { + "epoch": 1.76, + "learning_rate": 3.6221819191026026e-05, + "loss": 0.0203, + "step": 272460 + }, + { + "epoch": 1.76, + "learning_rate": 3.621213783666909e-05, + "loss": 0.0253, + "step": 272470 + }, + { + "epoch": 1.76, + "learning_rate": 3.620245648231216e-05, + "loss": 0.0245, + "step": 272480 + }, + { + "epoch": 1.76, + "learning_rate": 3.619277512795523e-05, + "loss": 0.019, + "step": 272490 + }, + { + "epoch": 1.76, + "learning_rate": 3.61830937735983e-05, + "loss": 0.0197, + "step": 272500 + }, + { + "epoch": 1.76, + "learning_rate": 3.6173412419241364e-05, + "loss": 0.0213, + "step": 272510 + }, + { + "epoch": 1.76, + "learning_rate": 3.616373106488444e-05, + "loss": 0.0254, + "step": 272520 + }, + { + "epoch": 1.76, + "learning_rate": 3.6154049710527496e-05, + "loss": 0.0267, + "step": 272530 + }, + { + "epoch": 1.76, + "learning_rate": 3.614436835617057e-05, + "loss": 0.0251, + "step": 272540 + }, + { + "epoch": 1.76, + "learning_rate": 3.6134687001813636e-05, + "loss": 0.0281, + "step": 272550 + }, + { + "epoch": 1.76, + "learning_rate": 3.61250056474567e-05, + "loss": 0.0224, + "step": 272560 + }, + { + "epoch": 1.76, + "learning_rate": 3.6115324293099775e-05, + "loss": 0.0301, + "step": 272570 + }, + { + "epoch": 1.76, + "learning_rate": 3.610564293874284e-05, + "loss": 0.0278, + "step": 272580 + }, + { + "epoch": 1.76, + "learning_rate": 3.609596158438591e-05, + "loss": 0.0234, + "step": 272590 + }, + { + "epoch": 1.76, + "learning_rate": 3.6086280230028974e-05, + "loss": 0.0232, + "step": 272600 + }, + { + "epoch": 1.76, + "learning_rate": 3.607659887567204e-05, + "loss": 0.0195, + "step": 272610 + }, + { + "epoch": 1.76, + "learning_rate": 3.606691752131511e-05, + "loss": 0.0243, + "step": 272620 + }, + { + "epoch": 1.76, + "learning_rate": 3.605723616695818e-05, + "loss": 0.0192, + "step": 272630 + }, + { + "epoch": 1.76, + "learning_rate": 3.6047554812601245e-05, + "loss": 0.0225, + "step": 272640 + }, + { + "epoch": 1.76, + "learning_rate": 3.603787345824432e-05, + "loss": 0.0193, + "step": 272650 + }, + { + "epoch": 1.76, + "learning_rate": 3.6028192103887385e-05, + "loss": 0.025, + "step": 272660 + }, + { + "epoch": 1.76, + "learning_rate": 3.601851074953045e-05, + "loss": 0.0233, + "step": 272670 + }, + { + "epoch": 1.76, + "learning_rate": 3.600882939517352e-05, + "loss": 0.0267, + "step": 272680 + }, + { + "epoch": 1.76, + "learning_rate": 3.599914804081658e-05, + "loss": 0.0228, + "step": 272690 + }, + { + "epoch": 1.76, + "learning_rate": 3.5989466686459656e-05, + "loss": 0.0203, + "step": 272700 + }, + { + "epoch": 1.76, + "learning_rate": 3.597978533210272e-05, + "loss": 0.0247, + "step": 272710 + }, + { + "epoch": 1.76, + "learning_rate": 3.597010397774579e-05, + "loss": 0.0227, + "step": 272720 + }, + { + "epoch": 1.76, + "learning_rate": 3.596042262338886e-05, + "loss": 0.027, + "step": 272730 + }, + { + "epoch": 1.76, + "learning_rate": 3.595074126903192e-05, + "loss": 0.0196, + "step": 272740 + }, + { + "epoch": 1.76, + "learning_rate": 3.5941059914674994e-05, + "loss": 0.0209, + "step": 272750 + }, + { + "epoch": 1.76, + "learning_rate": 3.593137856031806e-05, + "loss": 0.0285, + "step": 272760 + }, + { + "epoch": 1.76, + "learning_rate": 3.592169720596113e-05, + "loss": 0.0268, + "step": 272770 + }, + { + "epoch": 1.76, + "learning_rate": 3.59120158516042e-05, + "loss": 0.0316, + "step": 272780 + }, + { + "epoch": 1.76, + "learning_rate": 3.5902334497247266e-05, + "loss": 0.0204, + "step": 272790 + }, + { + "epoch": 1.76, + "learning_rate": 3.589265314289033e-05, + "loss": 0.0267, + "step": 272800 + }, + { + "epoch": 1.76, + "learning_rate": 3.58829717885334e-05, + "loss": 0.0265, + "step": 272810 + }, + { + "epoch": 1.76, + "learning_rate": 3.5873290434176465e-05, + "loss": 0.0263, + "step": 272820 + }, + { + "epoch": 1.76, + "learning_rate": 3.586360907981954e-05, + "loss": 0.0236, + "step": 272830 + }, + { + "epoch": 1.76, + "learning_rate": 3.5853927725462604e-05, + "loss": 0.0252, + "step": 272840 + }, + { + "epoch": 1.76, + "learning_rate": 3.584424637110567e-05, + "loss": 0.0224, + "step": 272850 + }, + { + "epoch": 1.76, + "learning_rate": 3.583456501674874e-05, + "loss": 0.0254, + "step": 272860 + }, + { + "epoch": 1.76, + "learning_rate": 3.582488366239181e-05, + "loss": 0.023, + "step": 272870 + }, + { + "epoch": 1.76, + "learning_rate": 3.5815202308034876e-05, + "loss": 0.0211, + "step": 272880 + }, + { + "epoch": 1.76, + "learning_rate": 3.580552095367794e-05, + "loss": 0.0245, + "step": 272890 + }, + { + "epoch": 1.76, + "learning_rate": 3.579583959932101e-05, + "loss": 0.0207, + "step": 272900 + }, + { + "epoch": 1.76, + "learning_rate": 3.578615824496408e-05, + "loss": 0.026, + "step": 272910 + }, + { + "epoch": 1.76, + "learning_rate": 3.577647689060715e-05, + "loss": 0.0215, + "step": 272920 + }, + { + "epoch": 1.76, + "learning_rate": 3.5766795536250214e-05, + "loss": 0.024, + "step": 272930 + }, + { + "epoch": 1.76, + "learning_rate": 3.575711418189329e-05, + "loss": 0.0196, + "step": 272940 + }, + { + "epoch": 1.76, + "learning_rate": 3.5747432827536346e-05, + "loss": 0.0223, + "step": 272950 + }, + { + "epoch": 1.76, + "learning_rate": 3.573775147317942e-05, + "loss": 0.0237, + "step": 272960 + }, + { + "epoch": 1.76, + "learning_rate": 3.5728070118822485e-05, + "loss": 0.0233, + "step": 272970 + }, + { + "epoch": 1.76, + "learning_rate": 3.571838876446555e-05, + "loss": 0.0255, + "step": 272980 + }, + { + "epoch": 1.76, + "learning_rate": 3.5708707410108625e-05, + "loss": 0.0219, + "step": 272990 + }, + { + "epoch": 1.76, + "learning_rate": 3.569902605575169e-05, + "loss": 0.0247, + "step": 273000 + }, + { + "epoch": 1.76, + "eval_cer": 0.9198716529205739, + "eval_loss": 0.017535319551825523, + "eval_runtime": 119.9947, + "eval_samples_per_second": 16.667, + "eval_steps_per_second": 4.167, + "step": 273000 + }, + { + "epoch": 1.76, + "learning_rate": 3.568934470139476e-05, + "loss": 0.0234, + "step": 273010 + }, + { + "epoch": 1.76, + "learning_rate": 3.5679663347037823e-05, + "loss": 0.026, + "step": 273020 + }, + { + "epoch": 1.76, + "learning_rate": 3.566998199268089e-05, + "loss": 0.0242, + "step": 273030 + }, + { + "epoch": 1.76, + "learning_rate": 3.566030063832396e-05, + "loss": 0.0275, + "step": 273040 + }, + { + "epoch": 1.76, + "learning_rate": 3.565061928396703e-05, + "loss": 0.0208, + "step": 273050 + }, + { + "epoch": 1.76, + "learning_rate": 3.5640937929610095e-05, + "loss": 0.021, + "step": 273060 + }, + { + "epoch": 1.76, + "learning_rate": 3.563125657525317e-05, + "loss": 0.023, + "step": 273070 + }, + { + "epoch": 1.76, + "learning_rate": 3.5621575220896234e-05, + "loss": 0.0286, + "step": 273080 + }, + { + "epoch": 1.76, + "learning_rate": 3.56118938665393e-05, + "loss": 0.0237, + "step": 273090 + }, + { + "epoch": 1.76, + "learning_rate": 3.560221251218237e-05, + "loss": 0.0286, + "step": 273100 + }, + { + "epoch": 1.76, + "learning_rate": 3.559253115782543e-05, + "loss": 0.0224, + "step": 273110 + }, + { + "epoch": 1.76, + "learning_rate": 3.5582849803468506e-05, + "loss": 0.0251, + "step": 273120 + }, + { + "epoch": 1.76, + "learning_rate": 3.557316844911157e-05, + "loss": 0.0227, + "step": 273130 + }, + { + "epoch": 1.76, + "learning_rate": 3.556348709475464e-05, + "loss": 0.0251, + "step": 273140 + }, + { + "epoch": 1.76, + "learning_rate": 3.555380574039771e-05, + "loss": 0.0242, + "step": 273150 + }, + { + "epoch": 1.76, + "learning_rate": 3.554412438604077e-05, + "loss": 0.0219, + "step": 273160 + }, + { + "epoch": 1.76, + "learning_rate": 3.5534443031683844e-05, + "loss": 0.0261, + "step": 273170 + }, + { + "epoch": 1.76, + "learning_rate": 3.552476167732691e-05, + "loss": 0.0254, + "step": 273180 + }, + { + "epoch": 1.76, + "learning_rate": 3.551508032296998e-05, + "loss": 0.02, + "step": 273190 + }, + { + "epoch": 1.76, + "learning_rate": 3.550539896861305e-05, + "loss": 0.0203, + "step": 273200 + }, + { + "epoch": 1.76, + "learning_rate": 3.5495717614256116e-05, + "loss": 0.0249, + "step": 273210 + }, + { + "epoch": 1.76, + "learning_rate": 3.548603625989918e-05, + "loss": 0.023, + "step": 273220 + }, + { + "epoch": 1.76, + "learning_rate": 3.547635490554225e-05, + "loss": 0.0241, + "step": 273230 + }, + { + "epoch": 1.76, + "learning_rate": 3.5466673551185315e-05, + "loss": 0.0225, + "step": 273240 + }, + { + "epoch": 1.76, + "learning_rate": 3.545699219682839e-05, + "loss": 0.0258, + "step": 273250 + }, + { + "epoch": 1.76, + "learning_rate": 3.5447310842471454e-05, + "loss": 0.0203, + "step": 273260 + }, + { + "epoch": 1.76, + "learning_rate": 3.543762948811452e-05, + "loss": 0.0224, + "step": 273270 + }, + { + "epoch": 1.76, + "learning_rate": 3.542794813375759e-05, + "loss": 0.0226, + "step": 273280 + }, + { + "epoch": 1.76, + "learning_rate": 3.541826677940066e-05, + "loss": 0.0301, + "step": 273290 + }, + { + "epoch": 1.76, + "learning_rate": 3.5408585425043726e-05, + "loss": 0.0198, + "step": 273300 + }, + { + "epoch": 1.76, + "learning_rate": 3.539890407068679e-05, + "loss": 0.0267, + "step": 273310 + }, + { + "epoch": 1.76, + "learning_rate": 3.538922271632986e-05, + "loss": 0.0256, + "step": 273320 + }, + { + "epoch": 1.76, + "learning_rate": 3.537954136197293e-05, + "loss": 0.0282, + "step": 273330 + }, + { + "epoch": 1.76, + "learning_rate": 3.5369860007616e-05, + "loss": 0.0225, + "step": 273340 + }, + { + "epoch": 1.76, + "learning_rate": 3.5360178653259064e-05, + "loss": 0.02, + "step": 273350 + }, + { + "epoch": 1.76, + "learning_rate": 3.535049729890213e-05, + "loss": 0.0251, + "step": 273360 + }, + { + "epoch": 1.76, + "learning_rate": 3.5340815944545196e-05, + "loss": 0.0218, + "step": 273370 + }, + { + "epoch": 1.76, + "learning_rate": 3.533113459018827e-05, + "loss": 0.0193, + "step": 273380 + }, + { + "epoch": 1.76, + "learning_rate": 3.5321453235831335e-05, + "loss": 0.018, + "step": 273390 + }, + { + "epoch": 1.76, + "learning_rate": 3.53117718814744e-05, + "loss": 0.0248, + "step": 273400 + }, + { + "epoch": 1.76, + "learning_rate": 3.5302090527117475e-05, + "loss": 0.0211, + "step": 273410 + }, + { + "epoch": 1.76, + "learning_rate": 3.529240917276054e-05, + "loss": 0.0226, + "step": 273420 + }, + { + "epoch": 1.76, + "learning_rate": 3.528272781840361e-05, + "loss": 0.0213, + "step": 273430 + }, + { + "epoch": 1.76, + "learning_rate": 3.527304646404667e-05, + "loss": 0.0238, + "step": 273440 + }, + { + "epoch": 1.76, + "learning_rate": 3.526336510968974e-05, + "loss": 0.0224, + "step": 273450 + }, + { + "epoch": 1.76, + "learning_rate": 3.525368375533281e-05, + "loss": 0.0246, + "step": 273460 + }, + { + "epoch": 1.77, + "learning_rate": 3.524400240097588e-05, + "loss": 0.0258, + "step": 273470 + }, + { + "epoch": 1.77, + "learning_rate": 3.5234321046618945e-05, + "loss": 0.0259, + "step": 273480 + }, + { + "epoch": 1.77, + "learning_rate": 3.522463969226202e-05, + "loss": 0.0241, + "step": 273490 + }, + { + "epoch": 1.77, + "learning_rate": 3.521495833790508e-05, + "loss": 0.0241, + "step": 273500 + }, + { + "epoch": 1.77, + "learning_rate": 3.520527698354815e-05, + "loss": 0.0247, + "step": 273510 + }, + { + "epoch": 1.77, + "learning_rate": 3.519559562919122e-05, + "loss": 0.0206, + "step": 273520 + }, + { + "epoch": 1.77, + "learning_rate": 3.518591427483428e-05, + "loss": 0.0237, + "step": 273530 + }, + { + "epoch": 1.77, + "learning_rate": 3.5176232920477356e-05, + "loss": 0.0222, + "step": 273540 + }, + { + "epoch": 1.77, + "learning_rate": 3.516655156612042e-05, + "loss": 0.0259, + "step": 273550 + }, + { + "epoch": 1.77, + "learning_rate": 3.515687021176349e-05, + "loss": 0.0234, + "step": 273560 + }, + { + "epoch": 1.77, + "learning_rate": 3.5147188857406555e-05, + "loss": 0.0259, + "step": 273570 + }, + { + "epoch": 1.77, + "learning_rate": 3.513750750304962e-05, + "loss": 0.0173, + "step": 273580 + }, + { + "epoch": 1.77, + "learning_rate": 3.5127826148692694e-05, + "loss": 0.0249, + "step": 273590 + }, + { + "epoch": 1.77, + "learning_rate": 3.511814479433576e-05, + "loss": 0.0222, + "step": 273600 + }, + { + "epoch": 1.77, + "learning_rate": 3.5108463439978826e-05, + "loss": 0.0275, + "step": 273610 + }, + { + "epoch": 1.77, + "learning_rate": 3.509878208562189e-05, + "loss": 0.0205, + "step": 273620 + }, + { + "epoch": 1.77, + "learning_rate": 3.5089100731264966e-05, + "loss": 0.0233, + "step": 273630 + }, + { + "epoch": 1.77, + "learning_rate": 3.507941937690803e-05, + "loss": 0.0237, + "step": 273640 + }, + { + "epoch": 1.77, + "learning_rate": 3.50697380225511e-05, + "loss": 0.023, + "step": 273650 + }, + { + "epoch": 1.77, + "learning_rate": 3.5060056668194164e-05, + "loss": 0.0249, + "step": 273660 + }, + { + "epoch": 1.77, + "learning_rate": 3.505037531383723e-05, + "loss": 0.0234, + "step": 273670 + }, + { + "epoch": 1.77, + "learning_rate": 3.5040693959480304e-05, + "loss": 0.0323, + "step": 273680 + }, + { + "epoch": 1.77, + "learning_rate": 3.503101260512337e-05, + "loss": 0.0225, + "step": 273690 + }, + { + "epoch": 1.77, + "learning_rate": 3.5021331250766436e-05, + "loss": 0.0228, + "step": 273700 + }, + { + "epoch": 1.77, + "learning_rate": 3.50116498964095e-05, + "loss": 0.0241, + "step": 273710 + }, + { + "epoch": 1.77, + "learning_rate": 3.500196854205257e-05, + "loss": 0.0228, + "step": 273720 + }, + { + "epoch": 1.77, + "learning_rate": 3.499228718769564e-05, + "loss": 0.0234, + "step": 273730 + }, + { + "epoch": 1.77, + "learning_rate": 3.498260583333871e-05, + "loss": 0.0219, + "step": 273740 + }, + { + "epoch": 1.77, + "learning_rate": 3.4972924478981774e-05, + "loss": 0.0248, + "step": 273750 + }, + { + "epoch": 1.77, + "learning_rate": 3.496324312462485e-05, + "loss": 0.0234, + "step": 273760 + }, + { + "epoch": 1.77, + "learning_rate": 3.495356177026791e-05, + "loss": 0.0276, + "step": 273770 + }, + { + "epoch": 1.77, + "learning_rate": 3.494388041591098e-05, + "loss": 0.023, + "step": 273780 + }, + { + "epoch": 1.77, + "learning_rate": 3.4934199061554046e-05, + "loss": 0.0253, + "step": 273790 + }, + { + "epoch": 1.77, + "learning_rate": 3.492451770719711e-05, + "loss": 0.0204, + "step": 273800 + }, + { + "epoch": 1.77, + "learning_rate": 3.4914836352840185e-05, + "loss": 0.0232, + "step": 273810 + }, + { + "epoch": 1.77, + "learning_rate": 3.490515499848325e-05, + "loss": 0.0187, + "step": 273820 + }, + { + "epoch": 1.77, + "learning_rate": 3.489547364412632e-05, + "loss": 0.024, + "step": 273830 + }, + { + "epoch": 1.77, + "learning_rate": 3.488579228976939e-05, + "loss": 0.0226, + "step": 273840 + }, + { + "epoch": 1.77, + "learning_rate": 3.487611093541245e-05, + "loss": 0.0226, + "step": 273850 + }, + { + "epoch": 1.77, + "learning_rate": 3.486642958105552e-05, + "loss": 0.0292, + "step": 273860 + }, + { + "epoch": 1.77, + "learning_rate": 3.485674822669859e-05, + "loss": 0.023, + "step": 273870 + }, + { + "epoch": 1.77, + "learning_rate": 3.4847066872341656e-05, + "loss": 0.019, + "step": 273880 + }, + { + "epoch": 1.77, + "learning_rate": 3.483738551798473e-05, + "loss": 0.022, + "step": 273890 + }, + { + "epoch": 1.77, + "learning_rate": 3.4827704163627795e-05, + "loss": 0.0236, + "step": 273900 + }, + { + "epoch": 1.77, + "learning_rate": 3.481802280927086e-05, + "loss": 0.0243, + "step": 273910 + }, + { + "epoch": 1.77, + "learning_rate": 3.480834145491393e-05, + "loss": 0.0224, + "step": 273920 + }, + { + "epoch": 1.77, + "learning_rate": 3.4798660100556994e-05, + "loss": 0.0286, + "step": 273930 + }, + { + "epoch": 1.77, + "learning_rate": 3.4788978746200067e-05, + "loss": 0.0249, + "step": 273940 + }, + { + "epoch": 1.77, + "learning_rate": 3.477929739184313e-05, + "loss": 0.0216, + "step": 273950 + }, + { + "epoch": 1.77, + "learning_rate": 3.47696160374862e-05, + "loss": 0.0212, + "step": 273960 + }, + { + "epoch": 1.77, + "learning_rate": 3.475993468312927e-05, + "loss": 0.0264, + "step": 273970 + }, + { + "epoch": 1.77, + "learning_rate": 3.475025332877234e-05, + "loss": 0.0223, + "step": 273980 + }, + { + "epoch": 1.77, + "learning_rate": 3.4740571974415405e-05, + "loss": 0.0199, + "step": 273990 + }, + { + "epoch": 1.77, + "learning_rate": 3.473089062005847e-05, + "loss": 0.0323, + "step": 274000 + }, + { + "epoch": 1.77, + "eval_cer": 0.9198553835724776, + "eval_loss": 0.017592335119843483, + "eval_runtime": 119.8118, + "eval_samples_per_second": 16.693, + "eval_steps_per_second": 4.173, + "step": 274000 + }, + { + "epoch": 1.77, + "learning_rate": 3.472120926570154e-05, + "loss": 0.0225, + "step": 274010 + }, + { + "epoch": 1.77, + "learning_rate": 3.471152791134461e-05, + "loss": 0.0205, + "step": 274020 + }, + { + "epoch": 1.77, + "learning_rate": 3.4701846556987676e-05, + "loss": 0.0267, + "step": 274030 + }, + { + "epoch": 1.77, + "learning_rate": 3.469216520263074e-05, + "loss": 0.0236, + "step": 274040 + }, + { + "epoch": 1.77, + "learning_rate": 3.4682483848273816e-05, + "loss": 0.0201, + "step": 274050 + }, + { + "epoch": 1.77, + "learning_rate": 3.4672802493916875e-05, + "loss": 0.0257, + "step": 274060 + }, + { + "epoch": 1.77, + "learning_rate": 3.466312113955995e-05, + "loss": 0.0254, + "step": 274070 + }, + { + "epoch": 1.77, + "learning_rate": 3.4653439785203014e-05, + "loss": 0.0265, + "step": 274080 + }, + { + "epoch": 1.77, + "learning_rate": 3.464375843084608e-05, + "loss": 0.024, + "step": 274090 + }, + { + "epoch": 1.77, + "learning_rate": 3.4634077076489153e-05, + "loss": 0.0233, + "step": 274100 + }, + { + "epoch": 1.77, + "learning_rate": 3.462439572213222e-05, + "loss": 0.0219, + "step": 274110 + }, + { + "epoch": 1.77, + "learning_rate": 3.4614714367775286e-05, + "loss": 0.0245, + "step": 274120 + }, + { + "epoch": 1.77, + "learning_rate": 3.460503301341835e-05, + "loss": 0.0253, + "step": 274130 + }, + { + "epoch": 1.77, + "learning_rate": 3.459535165906142e-05, + "loss": 0.0248, + "step": 274140 + }, + { + "epoch": 1.77, + "learning_rate": 3.458567030470449e-05, + "loss": 0.0244, + "step": 274150 + }, + { + "epoch": 1.77, + "learning_rate": 3.457598895034756e-05, + "loss": 0.0274, + "step": 274160 + }, + { + "epoch": 1.77, + "learning_rate": 3.4566307595990624e-05, + "loss": 0.0226, + "step": 274170 + }, + { + "epoch": 1.77, + "learning_rate": 3.45566262416337e-05, + "loss": 0.0218, + "step": 274180 + }, + { + "epoch": 1.77, + "learning_rate": 3.4546944887276756e-05, + "loss": 0.0297, + "step": 274190 + }, + { + "epoch": 1.77, + "learning_rate": 3.453726353291983e-05, + "loss": 0.028, + "step": 274200 + }, + { + "epoch": 1.77, + "learning_rate": 3.4527582178562896e-05, + "loss": 0.0209, + "step": 274210 + }, + { + "epoch": 1.77, + "learning_rate": 3.451790082420596e-05, + "loss": 0.0235, + "step": 274220 + }, + { + "epoch": 1.77, + "learning_rate": 3.4508219469849035e-05, + "loss": 0.0261, + "step": 274230 + }, + { + "epoch": 1.77, + "learning_rate": 3.44985381154921e-05, + "loss": 0.0238, + "step": 274240 + }, + { + "epoch": 1.77, + "learning_rate": 3.448885676113517e-05, + "loss": 0.0259, + "step": 274250 + }, + { + "epoch": 1.77, + "learning_rate": 3.4479175406778234e-05, + "loss": 0.0248, + "step": 274260 + }, + { + "epoch": 1.77, + "learning_rate": 3.44694940524213e-05, + "loss": 0.0269, + "step": 274270 + }, + { + "epoch": 1.77, + "learning_rate": 3.445981269806437e-05, + "loss": 0.028, + "step": 274280 + }, + { + "epoch": 1.77, + "learning_rate": 3.445013134370744e-05, + "loss": 0.0215, + "step": 274290 + }, + { + "epoch": 1.77, + "learning_rate": 3.4440449989350505e-05, + "loss": 0.0212, + "step": 274300 + }, + { + "epoch": 1.77, + "learning_rate": 3.443076863499358e-05, + "loss": 0.0218, + "step": 274310 + }, + { + "epoch": 1.77, + "learning_rate": 3.4421087280636645e-05, + "loss": 0.0265, + "step": 274320 + }, + { + "epoch": 1.77, + "learning_rate": 3.441140592627971e-05, + "loss": 0.0255, + "step": 274330 + }, + { + "epoch": 1.77, + "learning_rate": 3.440172457192278e-05, + "loss": 0.0258, + "step": 274340 + }, + { + "epoch": 1.77, + "learning_rate": 3.439204321756584e-05, + "loss": 0.0207, + "step": 274350 + }, + { + "epoch": 1.77, + "learning_rate": 3.4382361863208916e-05, + "loss": 0.025, + "step": 274360 + }, + { + "epoch": 1.77, + "learning_rate": 3.437268050885198e-05, + "loss": 0.0246, + "step": 274370 + }, + { + "epoch": 1.77, + "learning_rate": 3.436299915449505e-05, + "loss": 0.0293, + "step": 274380 + }, + { + "epoch": 1.77, + "learning_rate": 3.435331780013812e-05, + "loss": 0.0268, + "step": 274390 + }, + { + "epoch": 1.77, + "learning_rate": 3.434363644578118e-05, + "loss": 0.0227, + "step": 274400 + }, + { + "epoch": 1.77, + "learning_rate": 3.4333955091424254e-05, + "loss": 0.0229, + "step": 274410 + }, + { + "epoch": 1.77, + "learning_rate": 3.432427373706732e-05, + "loss": 0.0227, + "step": 274420 + }, + { + "epoch": 1.77, + "learning_rate": 3.431459238271039e-05, + "loss": 0.0245, + "step": 274430 + }, + { + "epoch": 1.77, + "learning_rate": 3.430491102835346e-05, + "loss": 0.0248, + "step": 274440 + }, + { + "epoch": 1.77, + "learning_rate": 3.4295229673996526e-05, + "loss": 0.0247, + "step": 274450 + }, + { + "epoch": 1.77, + "learning_rate": 3.428554831963959e-05, + "loss": 0.0218, + "step": 274460 + }, + { + "epoch": 1.77, + "learning_rate": 3.427586696528266e-05, + "loss": 0.0241, + "step": 274470 + }, + { + "epoch": 1.77, + "learning_rate": 3.4266185610925725e-05, + "loss": 0.0232, + "step": 274480 + }, + { + "epoch": 1.77, + "learning_rate": 3.42565042565688e-05, + "loss": 0.0229, + "step": 274490 + }, + { + "epoch": 1.77, + "learning_rate": 3.4246822902211864e-05, + "loss": 0.0274, + "step": 274500 + }, + { + "epoch": 1.77, + "learning_rate": 3.423714154785493e-05, + "loss": 0.0247, + "step": 274510 + }, + { + "epoch": 1.77, + "learning_rate": 3.4227460193498e-05, + "loss": 0.0216, + "step": 274520 + }, + { + "epoch": 1.77, + "learning_rate": 3.421777883914107e-05, + "loss": 0.0231, + "step": 274530 + }, + { + "epoch": 1.77, + "learning_rate": 3.4208097484784136e-05, + "loss": 0.0217, + "step": 274540 + }, + { + "epoch": 1.77, + "learning_rate": 3.41984161304272e-05, + "loss": 0.0215, + "step": 274550 + }, + { + "epoch": 1.77, + "learning_rate": 3.418873477607027e-05, + "loss": 0.0202, + "step": 274560 + }, + { + "epoch": 1.77, + "learning_rate": 3.417905342171334e-05, + "loss": 0.0264, + "step": 274570 + }, + { + "epoch": 1.77, + "learning_rate": 3.416937206735641e-05, + "loss": 0.0252, + "step": 274580 + }, + { + "epoch": 1.77, + "learning_rate": 3.4159690712999474e-05, + "loss": 0.0227, + "step": 274590 + }, + { + "epoch": 1.77, + "learning_rate": 3.415000935864255e-05, + "loss": 0.0256, + "step": 274600 + }, + { + "epoch": 1.77, + "learning_rate": 3.4140328004285606e-05, + "loss": 0.0238, + "step": 274610 + }, + { + "epoch": 1.77, + "learning_rate": 3.413064664992868e-05, + "loss": 0.021, + "step": 274620 + }, + { + "epoch": 1.77, + "learning_rate": 3.4120965295571745e-05, + "loss": 0.0219, + "step": 274630 + }, + { + "epoch": 1.77, + "learning_rate": 3.411128394121481e-05, + "loss": 0.0209, + "step": 274640 + }, + { + "epoch": 1.77, + "learning_rate": 3.4101602586857885e-05, + "loss": 0.0223, + "step": 274650 + }, + { + "epoch": 1.77, + "learning_rate": 3.409192123250095e-05, + "loss": 0.0273, + "step": 274660 + }, + { + "epoch": 1.77, + "learning_rate": 3.408223987814402e-05, + "loss": 0.0226, + "step": 274670 + }, + { + "epoch": 1.77, + "learning_rate": 3.4072558523787083e-05, + "loss": 0.0241, + "step": 274680 + }, + { + "epoch": 1.77, + "learning_rate": 3.406287716943015e-05, + "loss": 0.0185, + "step": 274690 + }, + { + "epoch": 1.77, + "learning_rate": 3.405319581507322e-05, + "loss": 0.0213, + "step": 274700 + }, + { + "epoch": 1.77, + "learning_rate": 3.404351446071629e-05, + "loss": 0.022, + "step": 274710 + }, + { + "epoch": 1.77, + "learning_rate": 3.4033833106359355e-05, + "loss": 0.0211, + "step": 274720 + }, + { + "epoch": 1.77, + "learning_rate": 3.402415175200243e-05, + "loss": 0.026, + "step": 274730 + }, + { + "epoch": 1.77, + "learning_rate": 3.4014470397645494e-05, + "loss": 0.0259, + "step": 274740 + }, + { + "epoch": 1.77, + "learning_rate": 3.400478904328856e-05, + "loss": 0.0208, + "step": 274750 + }, + { + "epoch": 1.77, + "learning_rate": 3.399510768893163e-05, + "loss": 0.0225, + "step": 274760 + }, + { + "epoch": 1.77, + "learning_rate": 3.398542633457469e-05, + "loss": 0.0238, + "step": 274770 + }, + { + "epoch": 1.77, + "learning_rate": 3.3975744980217766e-05, + "loss": 0.0206, + "step": 274780 + }, + { + "epoch": 1.77, + "learning_rate": 3.396606362586083e-05, + "loss": 0.0238, + "step": 274790 + }, + { + "epoch": 1.77, + "learning_rate": 3.39563822715039e-05, + "loss": 0.0207, + "step": 274800 + }, + { + "epoch": 1.77, + "learning_rate": 3.394670091714697e-05, + "loss": 0.0255, + "step": 274810 + }, + { + "epoch": 1.77, + "learning_rate": 3.393701956279003e-05, + "loss": 0.0248, + "step": 274820 + }, + { + "epoch": 1.77, + "learning_rate": 3.3927338208433104e-05, + "loss": 0.0252, + "step": 274830 + }, + { + "epoch": 1.77, + "learning_rate": 3.391765685407617e-05, + "loss": 0.0234, + "step": 274840 + }, + { + "epoch": 1.77, + "learning_rate": 3.390797549971924e-05, + "loss": 0.0237, + "step": 274850 + }, + { + "epoch": 1.77, + "learning_rate": 3.389829414536231e-05, + "loss": 0.0267, + "step": 274860 + }, + { + "epoch": 1.77, + "learning_rate": 3.3888612791005376e-05, + "loss": 0.0198, + "step": 274870 + }, + { + "epoch": 1.77, + "learning_rate": 3.387893143664844e-05, + "loss": 0.0215, + "step": 274880 + }, + { + "epoch": 1.77, + "learning_rate": 3.386925008229151e-05, + "loss": 0.0209, + "step": 274890 + }, + { + "epoch": 1.77, + "learning_rate": 3.3859568727934575e-05, + "loss": 0.0191, + "step": 274900 + }, + { + "epoch": 1.77, + "learning_rate": 3.384988737357765e-05, + "loss": 0.0236, + "step": 274910 + }, + { + "epoch": 1.77, + "learning_rate": 3.3840206019220714e-05, + "loss": 0.0267, + "step": 274920 + }, + { + "epoch": 1.77, + "learning_rate": 3.383052466486378e-05, + "loss": 0.0192, + "step": 274930 + }, + { + "epoch": 1.77, + "learning_rate": 3.3820843310506846e-05, + "loss": 0.0226, + "step": 274940 + }, + { + "epoch": 1.77, + "learning_rate": 3.381116195614992e-05, + "loss": 0.0294, + "step": 274950 + }, + { + "epoch": 1.77, + "learning_rate": 3.3801480601792986e-05, + "loss": 0.0241, + "step": 274960 + }, + { + "epoch": 1.77, + "learning_rate": 3.379179924743605e-05, + "loss": 0.024, + "step": 274970 + }, + { + "epoch": 1.77, + "learning_rate": 3.378211789307912e-05, + "loss": 0.0212, + "step": 274980 + }, + { + "epoch": 1.77, + "learning_rate": 3.3772436538722184e-05, + "loss": 0.024, + "step": 274990 + }, + { + "epoch": 1.77, + "learning_rate": 3.376275518436526e-05, + "loss": 0.0236, + "step": 275000 + }, + { + "epoch": 1.77, + "eval_cer": 0.9198418257823975, + "eval_loss": 0.017496764659881592, + "eval_runtime": 119.762, + "eval_samples_per_second": 16.7, + "eval_steps_per_second": 4.175, + "step": 275000 + }, + { + "epoch": 1.77, + "learning_rate": 3.3753073830008324e-05, + "loss": 0.0252, + "step": 275010 + }, + { + "epoch": 1.78, + "learning_rate": 3.374339247565139e-05, + "loss": 0.0238, + "step": 275020 + }, + { + "epoch": 1.78, + "learning_rate": 3.3733711121294456e-05, + "loss": 0.0222, + "step": 275030 + }, + { + "epoch": 1.78, + "learning_rate": 3.372402976693752e-05, + "loss": 0.0225, + "step": 275040 + }, + { + "epoch": 1.78, + "learning_rate": 3.3714348412580595e-05, + "loss": 0.025, + "step": 275050 + }, + { + "epoch": 1.78, + "learning_rate": 3.370466705822366e-05, + "loss": 0.0213, + "step": 275060 + }, + { + "epoch": 1.78, + "learning_rate": 3.369498570386673e-05, + "loss": 0.0199, + "step": 275070 + }, + { + "epoch": 1.78, + "learning_rate": 3.36853043495098e-05, + "loss": 0.0211, + "step": 275080 + }, + { + "epoch": 1.78, + "learning_rate": 3.367562299515286e-05, + "loss": 0.023, + "step": 275090 + }, + { + "epoch": 1.78, + "learning_rate": 3.366594164079593e-05, + "loss": 0.0233, + "step": 275100 + }, + { + "epoch": 1.78, + "learning_rate": 3.3656260286439e-05, + "loss": 0.0209, + "step": 275110 + }, + { + "epoch": 1.78, + "learning_rate": 3.3646578932082066e-05, + "loss": 0.0227, + "step": 275120 + }, + { + "epoch": 1.78, + "learning_rate": 3.363689757772514e-05, + "loss": 0.0212, + "step": 275130 + }, + { + "epoch": 1.78, + "learning_rate": 3.3627216223368205e-05, + "loss": 0.0245, + "step": 275140 + }, + { + "epoch": 1.78, + "learning_rate": 3.361753486901127e-05, + "loss": 0.0208, + "step": 275150 + }, + { + "epoch": 1.78, + "learning_rate": 3.360785351465434e-05, + "loss": 0.0233, + "step": 275160 + }, + { + "epoch": 1.78, + "learning_rate": 3.3598172160297404e-05, + "loss": 0.023, + "step": 275170 + }, + { + "epoch": 1.78, + "learning_rate": 3.358849080594048e-05, + "loss": 0.0215, + "step": 275180 + }, + { + "epoch": 1.78, + "learning_rate": 3.357880945158354e-05, + "loss": 0.0226, + "step": 275190 + }, + { + "epoch": 1.78, + "learning_rate": 3.356912809722661e-05, + "loss": 0.0221, + "step": 275200 + }, + { + "epoch": 1.78, + "learning_rate": 3.355944674286968e-05, + "loss": 0.0303, + "step": 275210 + }, + { + "epoch": 1.78, + "learning_rate": 3.354976538851275e-05, + "loss": 0.0233, + "step": 275220 + }, + { + "epoch": 1.78, + "learning_rate": 3.3540084034155815e-05, + "loss": 0.0208, + "step": 275230 + }, + { + "epoch": 1.78, + "learning_rate": 3.353040267979888e-05, + "loss": 0.0227, + "step": 275240 + }, + { + "epoch": 1.78, + "learning_rate": 3.352072132544195e-05, + "loss": 0.0234, + "step": 275250 + }, + { + "epoch": 1.78, + "learning_rate": 3.351103997108502e-05, + "loss": 0.0195, + "step": 275260 + }, + { + "epoch": 1.78, + "learning_rate": 3.3501358616728086e-05, + "loss": 0.0233, + "step": 275270 + }, + { + "epoch": 1.78, + "learning_rate": 3.349167726237115e-05, + "loss": 0.0227, + "step": 275280 + }, + { + "epoch": 1.78, + "learning_rate": 3.3481995908014226e-05, + "loss": 0.0244, + "step": 275290 + }, + { + "epoch": 1.78, + "learning_rate": 3.3472314553657285e-05, + "loss": 0.0293, + "step": 275300 + }, + { + "epoch": 1.78, + "learning_rate": 3.346263319930036e-05, + "loss": 0.0291, + "step": 275310 + }, + { + "epoch": 1.78, + "learning_rate": 3.3452951844943424e-05, + "loss": 0.0231, + "step": 275320 + }, + { + "epoch": 1.78, + "learning_rate": 3.344327049058649e-05, + "loss": 0.029, + "step": 275330 + }, + { + "epoch": 1.78, + "learning_rate": 3.3433589136229564e-05, + "loss": 0.0208, + "step": 275340 + }, + { + "epoch": 1.78, + "learning_rate": 3.342390778187263e-05, + "loss": 0.0222, + "step": 275350 + }, + { + "epoch": 1.78, + "learning_rate": 3.3414226427515696e-05, + "loss": 0.0224, + "step": 275360 + }, + { + "epoch": 1.78, + "learning_rate": 3.340454507315876e-05, + "loss": 0.0232, + "step": 275370 + }, + { + "epoch": 1.78, + "learning_rate": 3.339486371880183e-05, + "loss": 0.0207, + "step": 275380 + }, + { + "epoch": 1.78, + "learning_rate": 3.33851823644449e-05, + "loss": 0.0251, + "step": 275390 + }, + { + "epoch": 1.78, + "learning_rate": 3.337550101008797e-05, + "loss": 0.0241, + "step": 275400 + }, + { + "epoch": 1.78, + "learning_rate": 3.3365819655731034e-05, + "loss": 0.025, + "step": 275410 + }, + { + "epoch": 1.78, + "learning_rate": 3.335613830137411e-05, + "loss": 0.0248, + "step": 275420 + }, + { + "epoch": 1.78, + "learning_rate": 3.334645694701717e-05, + "loss": 0.0201, + "step": 275430 + }, + { + "epoch": 1.78, + "learning_rate": 3.333677559266024e-05, + "loss": 0.0198, + "step": 275440 + }, + { + "epoch": 1.78, + "learning_rate": 3.3327094238303306e-05, + "loss": 0.03, + "step": 275450 + }, + { + "epoch": 1.78, + "learning_rate": 3.331741288394637e-05, + "loss": 0.0229, + "step": 275460 + }, + { + "epoch": 1.78, + "learning_rate": 3.3307731529589445e-05, + "loss": 0.0236, + "step": 275470 + }, + { + "epoch": 1.78, + "learning_rate": 3.329805017523251e-05, + "loss": 0.0273, + "step": 275480 + }, + { + "epoch": 1.78, + "learning_rate": 3.328836882087558e-05, + "loss": 0.0237, + "step": 275490 + }, + { + "epoch": 1.78, + "learning_rate": 3.327868746651865e-05, + "loss": 0.0257, + "step": 275500 + }, + { + "epoch": 1.78, + "learning_rate": 3.326900611216171e-05, + "loss": 0.0225, + "step": 275510 + }, + { + "epoch": 1.78, + "learning_rate": 3.325932475780478e-05, + "loss": 0.0293, + "step": 275520 + }, + { + "epoch": 1.78, + "learning_rate": 3.324964340344785e-05, + "loss": 0.0223, + "step": 275530 + }, + { + "epoch": 1.78, + "learning_rate": 3.3239962049090916e-05, + "loss": 0.0209, + "step": 275540 + }, + { + "epoch": 1.78, + "learning_rate": 3.323028069473399e-05, + "loss": 0.0243, + "step": 275550 + }, + { + "epoch": 1.78, + "learning_rate": 3.3220599340377055e-05, + "loss": 0.0255, + "step": 275560 + }, + { + "epoch": 1.78, + "learning_rate": 3.321091798602012e-05, + "loss": 0.0251, + "step": 275570 + }, + { + "epoch": 1.78, + "learning_rate": 3.320123663166319e-05, + "loss": 0.0298, + "step": 275580 + }, + { + "epoch": 1.78, + "learning_rate": 3.3191555277306254e-05, + "loss": 0.0241, + "step": 275590 + }, + { + "epoch": 1.78, + "learning_rate": 3.3181873922949327e-05, + "loss": 0.0241, + "step": 275600 + }, + { + "epoch": 1.78, + "learning_rate": 3.317219256859239e-05, + "loss": 0.0248, + "step": 275610 + }, + { + "epoch": 1.78, + "learning_rate": 3.316251121423546e-05, + "loss": 0.0238, + "step": 275620 + }, + { + "epoch": 1.78, + "learning_rate": 3.315282985987853e-05, + "loss": 0.0207, + "step": 275630 + }, + { + "epoch": 1.78, + "learning_rate": 3.31431485055216e-05, + "loss": 0.0234, + "step": 275640 + }, + { + "epoch": 1.78, + "learning_rate": 3.3133467151164664e-05, + "loss": 0.0299, + "step": 275650 + }, + { + "epoch": 1.78, + "learning_rate": 3.312378579680773e-05, + "loss": 0.023, + "step": 275660 + }, + { + "epoch": 1.78, + "learning_rate": 3.31141044424508e-05, + "loss": 0.0224, + "step": 275670 + }, + { + "epoch": 1.78, + "learning_rate": 3.310442308809387e-05, + "loss": 0.0251, + "step": 275680 + }, + { + "epoch": 1.78, + "learning_rate": 3.3094741733736936e-05, + "loss": 0.0236, + "step": 275690 + }, + { + "epoch": 1.78, + "learning_rate": 3.308506037938e-05, + "loss": 0.0221, + "step": 275700 + }, + { + "epoch": 1.78, + "learning_rate": 3.3075379025023075e-05, + "loss": 0.0289, + "step": 275710 + }, + { + "epoch": 1.78, + "learning_rate": 3.3065697670666135e-05, + "loss": 0.0232, + "step": 275720 + }, + { + "epoch": 1.78, + "learning_rate": 3.305601631630921e-05, + "loss": 0.0264, + "step": 275730 + }, + { + "epoch": 1.78, + "learning_rate": 3.3046334961952274e-05, + "loss": 0.0243, + "step": 275740 + }, + { + "epoch": 1.78, + "learning_rate": 3.303665360759534e-05, + "loss": 0.0206, + "step": 275750 + }, + { + "epoch": 1.78, + "learning_rate": 3.3026972253238413e-05, + "loss": 0.0228, + "step": 275760 + }, + { + "epoch": 1.78, + "learning_rate": 3.301729089888148e-05, + "loss": 0.0233, + "step": 275770 + }, + { + "epoch": 1.78, + "learning_rate": 3.3007609544524546e-05, + "loss": 0.022, + "step": 275780 + }, + { + "epoch": 1.78, + "learning_rate": 3.299792819016761e-05, + "loss": 0.0233, + "step": 275790 + }, + { + "epoch": 1.78, + "learning_rate": 3.298824683581068e-05, + "loss": 0.0262, + "step": 275800 + }, + { + "epoch": 1.78, + "learning_rate": 3.297856548145375e-05, + "loss": 0.0207, + "step": 275810 + }, + { + "epoch": 1.78, + "learning_rate": 3.296888412709682e-05, + "loss": 0.0222, + "step": 275820 + }, + { + "epoch": 1.78, + "learning_rate": 3.2959202772739884e-05, + "loss": 0.0214, + "step": 275830 + }, + { + "epoch": 1.78, + "learning_rate": 3.294952141838296e-05, + "loss": 0.0204, + "step": 275840 + }, + { + "epoch": 1.78, + "learning_rate": 3.293984006402602e-05, + "loss": 0.0252, + "step": 275850 + }, + { + "epoch": 1.78, + "learning_rate": 3.293015870966909e-05, + "loss": 0.0268, + "step": 275860 + }, + { + "epoch": 1.78, + "learning_rate": 3.2920477355312156e-05, + "loss": 0.0249, + "step": 275870 + }, + { + "epoch": 1.78, + "learning_rate": 3.291079600095522e-05, + "loss": 0.0244, + "step": 275880 + }, + { + "epoch": 1.78, + "learning_rate": 3.2901114646598295e-05, + "loss": 0.023, + "step": 275890 + }, + { + "epoch": 1.78, + "learning_rate": 3.289143329224136e-05, + "loss": 0.0191, + "step": 275900 + }, + { + "epoch": 1.78, + "learning_rate": 3.288175193788443e-05, + "loss": 0.0235, + "step": 275910 + }, + { + "epoch": 1.78, + "learning_rate": 3.2872070583527494e-05, + "loss": 0.0266, + "step": 275920 + }, + { + "epoch": 1.78, + "learning_rate": 3.286238922917056e-05, + "loss": 0.0267, + "step": 275930 + }, + { + "epoch": 1.78, + "learning_rate": 3.285270787481363e-05, + "loss": 0.0238, + "step": 275940 + }, + { + "epoch": 1.78, + "learning_rate": 3.28430265204567e-05, + "loss": 0.0255, + "step": 275950 + }, + { + "epoch": 1.78, + "learning_rate": 3.2833345166099765e-05, + "loss": 0.0221, + "step": 275960 + }, + { + "epoch": 1.78, + "learning_rate": 3.282366381174284e-05, + "loss": 0.0244, + "step": 275970 + }, + { + "epoch": 1.78, + "learning_rate": 3.2813982457385905e-05, + "loss": 0.0278, + "step": 275980 + }, + { + "epoch": 1.78, + "learning_rate": 3.280430110302897e-05, + "loss": 0.0245, + "step": 275990 + }, + { + "epoch": 1.78, + "learning_rate": 3.279461974867204e-05, + "loss": 0.0202, + "step": 276000 + }, + { + "epoch": 1.78, + "eval_cer": 0.9197794599480285, + "eval_loss": 0.017633169889450073, + "eval_runtime": 120.0188, + "eval_samples_per_second": 16.664, + "eval_steps_per_second": 4.166, + "step": 276000 + }, + { + "epoch": 1.78, + "learning_rate": 3.27849383943151e-05, + "loss": 0.0197, + "step": 276010 + }, + { + "epoch": 1.78, + "learning_rate": 3.2775257039958176e-05, + "loss": 0.0227, + "step": 276020 + }, + { + "epoch": 1.78, + "learning_rate": 3.276557568560124e-05, + "loss": 0.026, + "step": 276030 + }, + { + "epoch": 1.78, + "learning_rate": 3.275589433124431e-05, + "loss": 0.0253, + "step": 276040 + }, + { + "epoch": 1.78, + "learning_rate": 3.274621297688738e-05, + "loss": 0.0258, + "step": 276050 + }, + { + "epoch": 1.78, + "learning_rate": 3.273653162253044e-05, + "loss": 0.0235, + "step": 276060 + }, + { + "epoch": 1.78, + "learning_rate": 3.2726850268173514e-05, + "loss": 0.0358, + "step": 276070 + }, + { + "epoch": 1.78, + "learning_rate": 3.271716891381658e-05, + "loss": 0.0219, + "step": 276080 + }, + { + "epoch": 1.78, + "learning_rate": 3.270748755945965e-05, + "loss": 0.0241, + "step": 276090 + }, + { + "epoch": 1.78, + "learning_rate": 3.269780620510272e-05, + "loss": 0.0193, + "step": 276100 + }, + { + "epoch": 1.78, + "learning_rate": 3.2688124850745786e-05, + "loss": 0.0227, + "step": 276110 + }, + { + "epoch": 1.78, + "learning_rate": 3.267844349638885e-05, + "loss": 0.024, + "step": 276120 + }, + { + "epoch": 1.78, + "learning_rate": 3.266876214203192e-05, + "loss": 0.0212, + "step": 276130 + }, + { + "epoch": 1.78, + "learning_rate": 3.2659080787674985e-05, + "loss": 0.0241, + "step": 276140 + }, + { + "epoch": 1.78, + "learning_rate": 3.264939943331806e-05, + "loss": 0.0215, + "step": 276150 + }, + { + "epoch": 1.78, + "learning_rate": 3.2639718078961124e-05, + "loss": 0.0226, + "step": 276160 + }, + { + "epoch": 1.78, + "learning_rate": 3.263003672460419e-05, + "loss": 0.0211, + "step": 276170 + }, + { + "epoch": 1.78, + "learning_rate": 3.262035537024726e-05, + "loss": 0.0254, + "step": 276180 + }, + { + "epoch": 1.78, + "learning_rate": 3.261067401589033e-05, + "loss": 0.0228, + "step": 276190 + }, + { + "epoch": 1.78, + "learning_rate": 3.2600992661533396e-05, + "loss": 0.0217, + "step": 276200 + }, + { + "epoch": 1.78, + "learning_rate": 3.259131130717646e-05, + "loss": 0.0242, + "step": 276210 + }, + { + "epoch": 1.78, + "learning_rate": 3.258162995281953e-05, + "loss": 0.0203, + "step": 276220 + }, + { + "epoch": 1.78, + "learning_rate": 3.25719485984626e-05, + "loss": 0.0217, + "step": 276230 + }, + { + "epoch": 1.78, + "learning_rate": 3.256226724410567e-05, + "loss": 0.0216, + "step": 276240 + }, + { + "epoch": 1.78, + "learning_rate": 3.2552585889748734e-05, + "loss": 0.0176, + "step": 276250 + }, + { + "epoch": 1.78, + "learning_rate": 3.25429045353918e-05, + "loss": 0.0233, + "step": 276260 + }, + { + "epoch": 1.78, + "learning_rate": 3.2533223181034866e-05, + "loss": 0.0241, + "step": 276270 + }, + { + "epoch": 1.78, + "learning_rate": 3.252354182667794e-05, + "loss": 0.0239, + "step": 276280 + }, + { + "epoch": 1.78, + "learning_rate": 3.2513860472321005e-05, + "loss": 0.0216, + "step": 276290 + }, + { + "epoch": 1.78, + "learning_rate": 3.250417911796407e-05, + "loss": 0.023, + "step": 276300 + }, + { + "epoch": 1.78, + "learning_rate": 3.249449776360714e-05, + "loss": 0.0213, + "step": 276310 + }, + { + "epoch": 1.78, + "learning_rate": 3.248481640925021e-05, + "loss": 0.0251, + "step": 276320 + }, + { + "epoch": 1.78, + "learning_rate": 3.247513505489328e-05, + "loss": 0.0221, + "step": 276330 + }, + { + "epoch": 1.78, + "learning_rate": 3.2465453700536343e-05, + "loss": 0.0209, + "step": 276340 + }, + { + "epoch": 1.78, + "learning_rate": 3.245577234617941e-05, + "loss": 0.023, + "step": 276350 + }, + { + "epoch": 1.78, + "learning_rate": 3.244609099182248e-05, + "loss": 0.0181, + "step": 276360 + }, + { + "epoch": 1.78, + "learning_rate": 3.243640963746555e-05, + "loss": 0.0235, + "step": 276370 + }, + { + "epoch": 1.78, + "learning_rate": 3.2426728283108615e-05, + "loss": 0.026, + "step": 276380 + }, + { + "epoch": 1.78, + "learning_rate": 3.241704692875168e-05, + "loss": 0.0244, + "step": 276390 + }, + { + "epoch": 1.78, + "learning_rate": 3.2407365574394754e-05, + "loss": 0.0208, + "step": 276400 + }, + { + "epoch": 1.78, + "learning_rate": 3.239768422003782e-05, + "loss": 0.0265, + "step": 276410 + }, + { + "epoch": 1.78, + "learning_rate": 3.238800286568089e-05, + "loss": 0.0205, + "step": 276420 + }, + { + "epoch": 1.78, + "learning_rate": 3.237832151132395e-05, + "loss": 0.0342, + "step": 276430 + }, + { + "epoch": 1.78, + "learning_rate": 3.236864015696702e-05, + "loss": 0.0247, + "step": 276440 + }, + { + "epoch": 1.78, + "learning_rate": 3.235895880261009e-05, + "loss": 0.0229, + "step": 276450 + }, + { + "epoch": 1.78, + "learning_rate": 3.234927744825316e-05, + "loss": 0.0222, + "step": 276460 + }, + { + "epoch": 1.78, + "learning_rate": 3.2339596093896225e-05, + "loss": 0.0227, + "step": 276470 + }, + { + "epoch": 1.78, + "learning_rate": 3.232991473953929e-05, + "loss": 0.0215, + "step": 276480 + }, + { + "epoch": 1.78, + "learning_rate": 3.232023338518236e-05, + "loss": 0.025, + "step": 276490 + }, + { + "epoch": 1.78, + "learning_rate": 3.231055203082543e-05, + "loss": 0.0252, + "step": 276500 + }, + { + "epoch": 1.78, + "learning_rate": 3.2300870676468497e-05, + "loss": 0.0232, + "step": 276510 + }, + { + "epoch": 1.78, + "learning_rate": 3.229118932211156e-05, + "loss": 0.0248, + "step": 276520 + }, + { + "epoch": 1.78, + "learning_rate": 3.2281507967754636e-05, + "loss": 0.0302, + "step": 276530 + }, + { + "epoch": 1.78, + "learning_rate": 3.22718266133977e-05, + "loss": 0.03, + "step": 276540 + }, + { + "epoch": 1.78, + "learning_rate": 3.226214525904077e-05, + "loss": 0.0215, + "step": 276550 + }, + { + "epoch": 1.78, + "learning_rate": 3.2252463904683835e-05, + "loss": 0.0258, + "step": 276560 + }, + { + "epoch": 1.79, + "learning_rate": 3.22427825503269e-05, + "loss": 0.0174, + "step": 276570 + }, + { + "epoch": 1.79, + "learning_rate": 3.2233101195969974e-05, + "loss": 0.024, + "step": 276580 + }, + { + "epoch": 1.79, + "learning_rate": 3.222341984161304e-05, + "loss": 0.0257, + "step": 276590 + }, + { + "epoch": 1.79, + "learning_rate": 3.2213738487256106e-05, + "loss": 0.0241, + "step": 276600 + }, + { + "epoch": 1.79, + "learning_rate": 3.220405713289918e-05, + "loss": 0.0196, + "step": 276610 + }, + { + "epoch": 1.79, + "learning_rate": 3.219437577854224e-05, + "loss": 0.0185, + "step": 276620 + }, + { + "epoch": 1.79, + "learning_rate": 3.218469442418531e-05, + "loss": 0.0233, + "step": 276630 + }, + { + "epoch": 1.79, + "learning_rate": 3.217501306982838e-05, + "loss": 0.0316, + "step": 276640 + }, + { + "epoch": 1.79, + "learning_rate": 3.2165331715471444e-05, + "loss": 0.02, + "step": 276650 + }, + { + "epoch": 1.79, + "learning_rate": 3.215565036111452e-05, + "loss": 0.0236, + "step": 276660 + }, + { + "epoch": 1.79, + "learning_rate": 3.2145969006757584e-05, + "loss": 0.0244, + "step": 276670 + }, + { + "epoch": 1.79, + "learning_rate": 3.213628765240065e-05, + "loss": 0.0216, + "step": 276680 + }, + { + "epoch": 1.79, + "learning_rate": 3.2126606298043716e-05, + "loss": 0.0204, + "step": 276690 + }, + { + "epoch": 1.79, + "learning_rate": 3.211692494368678e-05, + "loss": 0.0281, + "step": 276700 + }, + { + "epoch": 1.79, + "learning_rate": 3.2107243589329855e-05, + "loss": 0.0205, + "step": 276710 + }, + { + "epoch": 1.79, + "learning_rate": 3.209756223497292e-05, + "loss": 0.0292, + "step": 276720 + }, + { + "epoch": 1.79, + "learning_rate": 3.208788088061599e-05, + "loss": 0.0235, + "step": 276730 + }, + { + "epoch": 1.79, + "learning_rate": 3.207819952625906e-05, + "loss": 0.0272, + "step": 276740 + }, + { + "epoch": 1.79, + "learning_rate": 3.206851817190212e-05, + "loss": 0.0216, + "step": 276750 + }, + { + "epoch": 1.79, + "learning_rate": 3.205883681754519e-05, + "loss": 0.0217, + "step": 276760 + }, + { + "epoch": 1.79, + "learning_rate": 3.204915546318826e-05, + "loss": 0.0223, + "step": 276770 + }, + { + "epoch": 1.79, + "learning_rate": 3.2039474108831326e-05, + "loss": 0.0249, + "step": 276780 + }, + { + "epoch": 1.79, + "learning_rate": 3.20297927544744e-05, + "loss": 0.0253, + "step": 276790 + }, + { + "epoch": 1.79, + "learning_rate": 3.2020111400117465e-05, + "loss": 0.0217, + "step": 276800 + }, + { + "epoch": 1.79, + "learning_rate": 3.201043004576053e-05, + "loss": 0.0261, + "step": 276810 + }, + { + "epoch": 1.79, + "learning_rate": 3.20007486914036e-05, + "loss": 0.0197, + "step": 276820 + }, + { + "epoch": 1.79, + "learning_rate": 3.1991067337046664e-05, + "loss": 0.0267, + "step": 276830 + }, + { + "epoch": 1.79, + "learning_rate": 3.198138598268974e-05, + "loss": 0.0213, + "step": 276840 + }, + { + "epoch": 1.79, + "learning_rate": 3.19717046283328e-05, + "loss": 0.0236, + "step": 276850 + }, + { + "epoch": 1.79, + "learning_rate": 3.196202327397587e-05, + "loss": 0.0207, + "step": 276860 + }, + { + "epoch": 1.79, + "learning_rate": 3.195234191961894e-05, + "loss": 0.0269, + "step": 276870 + }, + { + "epoch": 1.79, + "learning_rate": 3.194266056526201e-05, + "loss": 0.027, + "step": 276880 + }, + { + "epoch": 1.79, + "learning_rate": 3.1932979210905075e-05, + "loss": 0.0219, + "step": 276890 + }, + { + "epoch": 1.79, + "learning_rate": 3.192329785654814e-05, + "loss": 0.0246, + "step": 276900 + }, + { + "epoch": 1.79, + "learning_rate": 3.191361650219121e-05, + "loss": 0.021, + "step": 276910 + }, + { + "epoch": 1.79, + "learning_rate": 3.190393514783428e-05, + "loss": 0.0222, + "step": 276920 + }, + { + "epoch": 1.79, + "learning_rate": 3.1894253793477346e-05, + "loss": 0.0219, + "step": 276930 + }, + { + "epoch": 1.79, + "learning_rate": 3.188457243912041e-05, + "loss": 0.0229, + "step": 276940 + }, + { + "epoch": 1.79, + "learning_rate": 3.1874891084763486e-05, + "loss": 0.0263, + "step": 276950 + }, + { + "epoch": 1.79, + "learning_rate": 3.1865209730406545e-05, + "loss": 0.0253, + "step": 276960 + }, + { + "epoch": 1.79, + "learning_rate": 3.185552837604962e-05, + "loss": 0.0195, + "step": 276970 + }, + { + "epoch": 1.79, + "learning_rate": 3.1845847021692684e-05, + "loss": 0.0245, + "step": 276980 + }, + { + "epoch": 1.79, + "learning_rate": 3.183616566733575e-05, + "loss": 0.0246, + "step": 276990 + }, + { + "epoch": 1.79, + "learning_rate": 3.1826484312978824e-05, + "loss": 0.0318, + "step": 277000 + }, + { + "epoch": 1.79, + "eval_cer": 0.9198689413625579, + "eval_loss": 0.01742408238351345, + "eval_runtime": 119.8944, + "eval_samples_per_second": 16.681, + "eval_steps_per_second": 4.17, + "step": 277000 + }, + { + "epoch": 1.79, + "learning_rate": 3.181680295862189e-05, + "loss": 0.0255, + "step": 277010 + }, + { + "epoch": 1.79, + "learning_rate": 3.1807121604264956e-05, + "loss": 0.0216, + "step": 277020 + }, + { + "epoch": 1.79, + "learning_rate": 3.179744024990802e-05, + "loss": 0.0213, + "step": 277030 + }, + { + "epoch": 1.79, + "learning_rate": 3.178775889555109e-05, + "loss": 0.0249, + "step": 277040 + }, + { + "epoch": 1.79, + "learning_rate": 3.177807754119416e-05, + "loss": 0.0203, + "step": 277050 + }, + { + "epoch": 1.79, + "learning_rate": 3.176839618683723e-05, + "loss": 0.0262, + "step": 277060 + }, + { + "epoch": 1.79, + "learning_rate": 3.1758714832480294e-05, + "loss": 0.0298, + "step": 277070 + }, + { + "epoch": 1.79, + "learning_rate": 3.174903347812337e-05, + "loss": 0.0226, + "step": 277080 + }, + { + "epoch": 1.79, + "learning_rate": 3.173935212376643e-05, + "loss": 0.0245, + "step": 277090 + }, + { + "epoch": 1.79, + "learning_rate": 3.17296707694095e-05, + "loss": 0.0241, + "step": 277100 + }, + { + "epoch": 1.79, + "learning_rate": 3.1719989415052566e-05, + "loss": 0.0231, + "step": 277110 + }, + { + "epoch": 1.79, + "learning_rate": 3.171030806069563e-05, + "loss": 0.0195, + "step": 277120 + }, + { + "epoch": 1.79, + "learning_rate": 3.1700626706338705e-05, + "loss": 0.0208, + "step": 277130 + }, + { + "epoch": 1.79, + "learning_rate": 3.169094535198177e-05, + "loss": 0.0218, + "step": 277140 + }, + { + "epoch": 1.79, + "learning_rate": 3.168126399762484e-05, + "loss": 0.0261, + "step": 277150 + }, + { + "epoch": 1.79, + "learning_rate": 3.167158264326791e-05, + "loss": 0.0192, + "step": 277160 + }, + { + "epoch": 1.79, + "learning_rate": 3.166190128891097e-05, + "loss": 0.023, + "step": 277170 + }, + { + "epoch": 1.79, + "learning_rate": 3.165221993455404e-05, + "loss": 0.024, + "step": 277180 + }, + { + "epoch": 1.79, + "learning_rate": 3.164253858019711e-05, + "loss": 0.0266, + "step": 277190 + }, + { + "epoch": 1.79, + "learning_rate": 3.1632857225840176e-05, + "loss": 0.0279, + "step": 277200 + }, + { + "epoch": 1.79, + "learning_rate": 3.162317587148325e-05, + "loss": 0.0226, + "step": 277210 + }, + { + "epoch": 1.79, + "learning_rate": 3.1613494517126315e-05, + "loss": 0.0225, + "step": 277220 + }, + { + "epoch": 1.79, + "learning_rate": 3.160381316276938e-05, + "loss": 0.033, + "step": 277230 + }, + { + "epoch": 1.79, + "learning_rate": 3.159413180841245e-05, + "loss": 0.021, + "step": 277240 + }, + { + "epoch": 1.79, + "learning_rate": 3.1584450454055513e-05, + "loss": 0.0305, + "step": 277250 + }, + { + "epoch": 1.79, + "learning_rate": 3.1574769099698586e-05, + "loss": 0.024, + "step": 277260 + }, + { + "epoch": 1.79, + "learning_rate": 3.156508774534165e-05, + "loss": 0.0233, + "step": 277270 + }, + { + "epoch": 1.79, + "learning_rate": 3.155540639098472e-05, + "loss": 0.0242, + "step": 277280 + }, + { + "epoch": 1.79, + "learning_rate": 3.154572503662779e-05, + "loss": 0.0258, + "step": 277290 + }, + { + "epoch": 1.79, + "learning_rate": 3.153604368227086e-05, + "loss": 0.0286, + "step": 277300 + }, + { + "epoch": 1.79, + "learning_rate": 3.1526362327913924e-05, + "loss": 0.0214, + "step": 277310 + }, + { + "epoch": 1.79, + "learning_rate": 3.151668097355699e-05, + "loss": 0.021, + "step": 277320 + }, + { + "epoch": 1.79, + "learning_rate": 3.150699961920006e-05, + "loss": 0.0226, + "step": 277330 + }, + { + "epoch": 1.79, + "learning_rate": 3.149731826484313e-05, + "loss": 0.0199, + "step": 277340 + }, + { + "epoch": 1.79, + "learning_rate": 3.1487636910486196e-05, + "loss": 0.0222, + "step": 277350 + }, + { + "epoch": 1.79, + "learning_rate": 3.147795555612926e-05, + "loss": 0.0235, + "step": 277360 + }, + { + "epoch": 1.79, + "learning_rate": 3.1468274201772335e-05, + "loss": 0.0236, + "step": 277370 + }, + { + "epoch": 1.79, + "learning_rate": 3.1458592847415395e-05, + "loss": 0.0229, + "step": 277380 + }, + { + "epoch": 1.79, + "learning_rate": 3.144891149305847e-05, + "loss": 0.022, + "step": 277390 + }, + { + "epoch": 1.79, + "learning_rate": 3.1439230138701534e-05, + "loss": 0.0213, + "step": 277400 + }, + { + "epoch": 1.79, + "learning_rate": 3.14295487843446e-05, + "loss": 0.0238, + "step": 277410 + }, + { + "epoch": 1.79, + "learning_rate": 3.1419867429987673e-05, + "loss": 0.0248, + "step": 277420 + }, + { + "epoch": 1.79, + "learning_rate": 3.141018607563074e-05, + "loss": 0.0236, + "step": 277430 + }, + { + "epoch": 1.79, + "learning_rate": 3.1400504721273806e-05, + "loss": 0.0223, + "step": 277440 + }, + { + "epoch": 1.79, + "learning_rate": 3.139082336691687e-05, + "loss": 0.0232, + "step": 277450 + }, + { + "epoch": 1.79, + "learning_rate": 3.138114201255994e-05, + "loss": 0.0217, + "step": 277460 + }, + { + "epoch": 1.79, + "learning_rate": 3.137146065820301e-05, + "loss": 0.0221, + "step": 277470 + }, + { + "epoch": 1.79, + "learning_rate": 3.136177930384608e-05, + "loss": 0.0217, + "step": 277480 + }, + { + "epoch": 1.79, + "learning_rate": 3.1352097949489144e-05, + "loss": 0.0221, + "step": 277490 + }, + { + "epoch": 1.79, + "learning_rate": 3.134241659513222e-05, + "loss": 0.0209, + "step": 277500 + }, + { + "epoch": 1.79, + "learning_rate": 3.133273524077528e-05, + "loss": 0.0267, + "step": 277510 + }, + { + "epoch": 1.79, + "learning_rate": 3.132305388641835e-05, + "loss": 0.0236, + "step": 277520 + }, + { + "epoch": 1.79, + "learning_rate": 3.1313372532061416e-05, + "loss": 0.0261, + "step": 277530 + }, + { + "epoch": 1.79, + "learning_rate": 3.130369117770448e-05, + "loss": 0.022, + "step": 277540 + }, + { + "epoch": 1.79, + "learning_rate": 3.1294009823347555e-05, + "loss": 0.0221, + "step": 277550 + }, + { + "epoch": 1.79, + "learning_rate": 3.128432846899062e-05, + "loss": 0.0194, + "step": 277560 + }, + { + "epoch": 1.79, + "learning_rate": 3.127464711463369e-05, + "loss": 0.0248, + "step": 277570 + }, + { + "epoch": 1.79, + "learning_rate": 3.126496576027676e-05, + "loss": 0.0233, + "step": 277580 + }, + { + "epoch": 1.79, + "learning_rate": 3.125528440591982e-05, + "loss": 0.0255, + "step": 277590 + }, + { + "epoch": 1.79, + "learning_rate": 3.124560305156289e-05, + "loss": 0.0226, + "step": 277600 + }, + { + "epoch": 1.79, + "learning_rate": 3.123592169720596e-05, + "loss": 0.0233, + "step": 277610 + }, + { + "epoch": 1.79, + "learning_rate": 3.1226240342849025e-05, + "loss": 0.0223, + "step": 277620 + }, + { + "epoch": 1.79, + "learning_rate": 3.12165589884921e-05, + "loss": 0.0246, + "step": 277630 + }, + { + "epoch": 1.79, + "learning_rate": 3.1206877634135165e-05, + "loss": 0.0217, + "step": 277640 + }, + { + "epoch": 1.79, + "learning_rate": 3.119719627977823e-05, + "loss": 0.0197, + "step": 277650 + }, + { + "epoch": 1.79, + "learning_rate": 3.11875149254213e-05, + "loss": 0.0267, + "step": 277660 + }, + { + "epoch": 1.79, + "learning_rate": 3.117783357106436e-05, + "loss": 0.0246, + "step": 277670 + }, + { + "epoch": 1.79, + "learning_rate": 3.1168152216707436e-05, + "loss": 0.0264, + "step": 277680 + }, + { + "epoch": 1.79, + "learning_rate": 3.11584708623505e-05, + "loss": 0.0239, + "step": 277690 + }, + { + "epoch": 1.79, + "learning_rate": 3.114878950799357e-05, + "loss": 0.0266, + "step": 277700 + }, + { + "epoch": 1.79, + "learning_rate": 3.1139108153636635e-05, + "loss": 0.0278, + "step": 277710 + }, + { + "epoch": 1.79, + "learning_rate": 3.11294267992797e-05, + "loss": 0.0248, + "step": 277720 + }, + { + "epoch": 1.79, + "learning_rate": 3.1119745444922774e-05, + "loss": 0.0295, + "step": 277730 + }, + { + "epoch": 1.79, + "learning_rate": 3.111006409056584e-05, + "loss": 0.0196, + "step": 277740 + }, + { + "epoch": 1.79, + "learning_rate": 3.110038273620891e-05, + "loss": 0.0207, + "step": 277750 + }, + { + "epoch": 1.79, + "learning_rate": 3.109070138185197e-05, + "loss": 0.0249, + "step": 277760 + }, + { + "epoch": 1.79, + "learning_rate": 3.1081020027495046e-05, + "loss": 0.0233, + "step": 277770 + }, + { + "epoch": 1.79, + "learning_rate": 3.107133867313811e-05, + "loss": 0.0263, + "step": 277780 + }, + { + "epoch": 1.79, + "learning_rate": 3.106165731878118e-05, + "loss": 0.0244, + "step": 277790 + }, + { + "epoch": 1.79, + "learning_rate": 3.1051975964424245e-05, + "loss": 0.0272, + "step": 277800 + }, + { + "epoch": 1.79, + "learning_rate": 3.104229461006731e-05, + "loss": 0.0189, + "step": 277810 + }, + { + "epoch": 1.79, + "learning_rate": 3.1032613255710384e-05, + "loss": 0.0231, + "step": 277820 + }, + { + "epoch": 1.79, + "learning_rate": 3.102293190135345e-05, + "loss": 0.0203, + "step": 277830 + }, + { + "epoch": 1.79, + "learning_rate": 3.1013250546996516e-05, + "loss": 0.0186, + "step": 277840 + }, + { + "epoch": 1.79, + "learning_rate": 3.100356919263959e-05, + "loss": 0.0204, + "step": 277850 + }, + { + "epoch": 1.79, + "learning_rate": 3.099388783828265e-05, + "loss": 0.0259, + "step": 277860 + }, + { + "epoch": 1.79, + "learning_rate": 3.098420648392572e-05, + "loss": 0.0251, + "step": 277870 + }, + { + "epoch": 1.79, + "learning_rate": 3.097452512956879e-05, + "loss": 0.0231, + "step": 277880 + }, + { + "epoch": 1.79, + "learning_rate": 3.0964843775211854e-05, + "loss": 0.0205, + "step": 277890 + }, + { + "epoch": 1.79, + "learning_rate": 3.095516242085493e-05, + "loss": 0.0255, + "step": 277900 + }, + { + "epoch": 1.79, + "learning_rate": 3.0945481066497994e-05, + "loss": 0.0199, + "step": 277910 + }, + { + "epoch": 1.79, + "learning_rate": 3.093579971214106e-05, + "loss": 0.0229, + "step": 277920 + }, + { + "epoch": 1.79, + "learning_rate": 3.0926118357784126e-05, + "loss": 0.0226, + "step": 277930 + }, + { + "epoch": 1.79, + "learning_rate": 3.091643700342719e-05, + "loss": 0.0247, + "step": 277940 + }, + { + "epoch": 1.79, + "learning_rate": 3.0906755649070265e-05, + "loss": 0.0236, + "step": 277950 + }, + { + "epoch": 1.79, + "learning_rate": 3.089707429471333e-05, + "loss": 0.0205, + "step": 277960 + }, + { + "epoch": 1.79, + "learning_rate": 3.08873929403564e-05, + "loss": 0.0273, + "step": 277970 + }, + { + "epoch": 1.79, + "learning_rate": 3.087771158599947e-05, + "loss": 0.0213, + "step": 277980 + }, + { + "epoch": 1.79, + "learning_rate": 3.086803023164254e-05, + "loss": 0.027, + "step": 277990 + }, + { + "epoch": 1.79, + "learning_rate": 3.0858348877285603e-05, + "loss": 0.0206, + "step": 278000 + }, + { + "epoch": 1.79, + "eval_cer": 0.9198373065190374, + "eval_loss": 0.017471129074692726, + "eval_runtime": 119.7858, + "eval_samples_per_second": 16.696, + "eval_steps_per_second": 4.174, + "step": 278000 + }, + { + "epoch": 1.79, + "learning_rate": 3.084866752292867e-05, + "loss": 0.0219, + "step": 278010 + }, + { + "epoch": 1.79, + "learning_rate": 3.0838986168571736e-05, + "loss": 0.0278, + "step": 278020 + }, + { + "epoch": 1.79, + "learning_rate": 3.082930481421481e-05, + "loss": 0.0201, + "step": 278030 + }, + { + "epoch": 1.79, + "learning_rate": 3.0819623459857875e-05, + "loss": 0.0216, + "step": 278040 + }, + { + "epoch": 1.79, + "learning_rate": 3.080994210550094e-05, + "loss": 0.0242, + "step": 278050 + }, + { + "epoch": 1.79, + "learning_rate": 3.0800260751144014e-05, + "loss": 0.0262, + "step": 278060 + }, + { + "epoch": 1.79, + "learning_rate": 3.0790579396787074e-05, + "loss": 0.0192, + "step": 278070 + }, + { + "epoch": 1.79, + "learning_rate": 3.078089804243015e-05, + "loss": 0.0284, + "step": 278080 + }, + { + "epoch": 1.79, + "learning_rate": 3.077121668807321e-05, + "loss": 0.0202, + "step": 278090 + }, + { + "epoch": 1.79, + "learning_rate": 3.076153533371628e-05, + "loss": 0.0216, + "step": 278100 + }, + { + "epoch": 1.79, + "learning_rate": 3.075185397935935e-05, + "loss": 0.0251, + "step": 278110 + }, + { + "epoch": 1.8, + "learning_rate": 3.074217262500242e-05, + "loss": 0.0217, + "step": 278120 + }, + { + "epoch": 1.8, + "learning_rate": 3.0732491270645485e-05, + "loss": 0.0241, + "step": 278130 + }, + { + "epoch": 1.8, + "learning_rate": 3.072280991628855e-05, + "loss": 0.0207, + "step": 278140 + }, + { + "epoch": 1.8, + "learning_rate": 3.071312856193162e-05, + "loss": 0.0252, + "step": 278150 + }, + { + "epoch": 1.8, + "learning_rate": 3.070344720757469e-05, + "loss": 0.0224, + "step": 278160 + }, + { + "epoch": 1.8, + "learning_rate": 3.0693765853217757e-05, + "loss": 0.0254, + "step": 278170 + }, + { + "epoch": 1.8, + "learning_rate": 3.068408449886082e-05, + "loss": 0.0235, + "step": 278180 + }, + { + "epoch": 1.8, + "learning_rate": 3.0674403144503896e-05, + "loss": 0.0235, + "step": 278190 + }, + { + "epoch": 1.8, + "learning_rate": 3.066472179014696e-05, + "loss": 0.0259, + "step": 278200 + }, + { + "epoch": 1.8, + "learning_rate": 3.065504043579003e-05, + "loss": 0.019, + "step": 278210 + }, + { + "epoch": 1.8, + "learning_rate": 3.0645359081433095e-05, + "loss": 0.0214, + "step": 278220 + }, + { + "epoch": 1.8, + "learning_rate": 3.063567772707616e-05, + "loss": 0.0282, + "step": 278230 + }, + { + "epoch": 1.8, + "learning_rate": 3.0625996372719234e-05, + "loss": 0.0241, + "step": 278240 + }, + { + "epoch": 1.8, + "learning_rate": 3.06163150183623e-05, + "loss": 0.0227, + "step": 278250 + }, + { + "epoch": 1.8, + "learning_rate": 3.0606633664005366e-05, + "loss": 0.0258, + "step": 278260 + }, + { + "epoch": 1.8, + "learning_rate": 3.059695230964844e-05, + "loss": 0.0255, + "step": 278270 + }, + { + "epoch": 1.8, + "learning_rate": 3.05872709552915e-05, + "loss": 0.0203, + "step": 278280 + }, + { + "epoch": 1.8, + "learning_rate": 3.057758960093457e-05, + "loss": 0.0231, + "step": 278290 + }, + { + "epoch": 1.8, + "learning_rate": 3.056790824657764e-05, + "loss": 0.0251, + "step": 278300 + }, + { + "epoch": 1.8, + "learning_rate": 3.0558226892220704e-05, + "loss": 0.025, + "step": 278310 + }, + { + "epoch": 1.8, + "learning_rate": 3.054854553786378e-05, + "loss": 0.0226, + "step": 278320 + }, + { + "epoch": 1.8, + "learning_rate": 3.0538864183506843e-05, + "loss": 0.0286, + "step": 278330 + }, + { + "epoch": 1.8, + "learning_rate": 3.052918282914991e-05, + "loss": 0.0236, + "step": 278340 + }, + { + "epoch": 1.8, + "learning_rate": 3.0519501474792976e-05, + "loss": 0.0263, + "step": 278350 + }, + { + "epoch": 1.8, + "learning_rate": 3.0509820120436046e-05, + "loss": 0.0244, + "step": 278360 + }, + { + "epoch": 1.8, + "learning_rate": 3.0500138766079112e-05, + "loss": 0.0285, + "step": 278370 + }, + { + "epoch": 1.8, + "learning_rate": 3.049045741172218e-05, + "loss": 0.0205, + "step": 278380 + }, + { + "epoch": 1.8, + "learning_rate": 3.048077605736525e-05, + "loss": 0.0276, + "step": 278390 + }, + { + "epoch": 1.8, + "learning_rate": 3.0471094703008317e-05, + "loss": 0.0256, + "step": 278400 + }, + { + "epoch": 1.8, + "learning_rate": 3.0461413348651387e-05, + "loss": 0.0264, + "step": 278410 + }, + { + "epoch": 1.8, + "learning_rate": 3.045173199429445e-05, + "loss": 0.0215, + "step": 278420 + }, + { + "epoch": 1.8, + "learning_rate": 3.044205063993752e-05, + "loss": 0.0217, + "step": 278430 + }, + { + "epoch": 1.8, + "learning_rate": 3.043236928558059e-05, + "loss": 0.0261, + "step": 278440 + }, + { + "epoch": 1.8, + "learning_rate": 3.0422687931223655e-05, + "loss": 0.0246, + "step": 278450 + }, + { + "epoch": 1.8, + "learning_rate": 3.0413006576866725e-05, + "loss": 0.0257, + "step": 278460 + }, + { + "epoch": 1.8, + "learning_rate": 3.0403325222509795e-05, + "loss": 0.0284, + "step": 278470 + }, + { + "epoch": 1.8, + "learning_rate": 3.0393643868152857e-05, + "loss": 0.0247, + "step": 278480 + }, + { + "epoch": 1.8, + "learning_rate": 3.0383962513795927e-05, + "loss": 0.0193, + "step": 278490 + }, + { + "epoch": 1.8, + "learning_rate": 3.0374281159438993e-05, + "loss": 0.0243, + "step": 278500 + }, + { + "epoch": 1.8, + "learning_rate": 3.0364599805082063e-05, + "loss": 0.0249, + "step": 278510 + }, + { + "epoch": 1.8, + "learning_rate": 3.0354918450725133e-05, + "loss": 0.0204, + "step": 278520 + }, + { + "epoch": 1.8, + "learning_rate": 3.03452370963682e-05, + "loss": 0.0246, + "step": 278530 + }, + { + "epoch": 1.8, + "learning_rate": 3.033555574201127e-05, + "loss": 0.0279, + "step": 278540 + }, + { + "epoch": 1.8, + "learning_rate": 3.032587438765433e-05, + "loss": 0.0273, + "step": 278550 + }, + { + "epoch": 1.8, + "learning_rate": 3.03161930332974e-05, + "loss": 0.0208, + "step": 278560 + }, + { + "epoch": 1.8, + "learning_rate": 3.030651167894047e-05, + "loss": 0.0268, + "step": 278570 + }, + { + "epoch": 1.8, + "learning_rate": 3.0296830324583537e-05, + "loss": 0.0249, + "step": 278580 + }, + { + "epoch": 1.8, + "learning_rate": 3.0287148970226606e-05, + "loss": 0.0199, + "step": 278590 + }, + { + "epoch": 1.8, + "learning_rate": 3.0277467615869676e-05, + "loss": 0.0306, + "step": 278600 + }, + { + "epoch": 1.8, + "learning_rate": 3.0267786261512742e-05, + "loss": 0.02, + "step": 278610 + }, + { + "epoch": 1.8, + "learning_rate": 3.025810490715581e-05, + "loss": 0.0219, + "step": 278620 + }, + { + "epoch": 1.8, + "learning_rate": 3.0248423552798875e-05, + "loss": 0.0248, + "step": 278630 + }, + { + "epoch": 1.8, + "learning_rate": 3.0238742198441944e-05, + "loss": 0.02, + "step": 278640 + }, + { + "epoch": 1.8, + "learning_rate": 3.0229060844085014e-05, + "loss": 0.021, + "step": 278650 + }, + { + "epoch": 1.8, + "learning_rate": 3.021937948972808e-05, + "loss": 0.0208, + "step": 278660 + }, + { + "epoch": 1.8, + "learning_rate": 3.020969813537115e-05, + "loss": 0.0275, + "step": 278670 + }, + { + "epoch": 1.8, + "learning_rate": 3.0200016781014216e-05, + "loss": 0.028, + "step": 278680 + }, + { + "epoch": 1.8, + "learning_rate": 3.0190335426657282e-05, + "loss": 0.0268, + "step": 278690 + }, + { + "epoch": 1.8, + "learning_rate": 3.0180654072300352e-05, + "loss": 0.0223, + "step": 278700 + }, + { + "epoch": 1.8, + "learning_rate": 3.0170972717943418e-05, + "loss": 0.0251, + "step": 278710 + }, + { + "epoch": 1.8, + "learning_rate": 3.0161291363586488e-05, + "loss": 0.0232, + "step": 278720 + }, + { + "epoch": 1.8, + "learning_rate": 3.0151610009229554e-05, + "loss": 0.0204, + "step": 278730 + }, + { + "epoch": 1.8, + "learning_rate": 3.0141928654872624e-05, + "loss": 0.0241, + "step": 278740 + }, + { + "epoch": 1.8, + "learning_rate": 3.0132247300515693e-05, + "loss": 0.0247, + "step": 278750 + }, + { + "epoch": 1.8, + "learning_rate": 3.0122565946158756e-05, + "loss": 0.0237, + "step": 278760 + }, + { + "epoch": 1.8, + "learning_rate": 3.0112884591801826e-05, + "loss": 0.018, + "step": 278770 + }, + { + "epoch": 1.8, + "learning_rate": 3.0103203237444892e-05, + "loss": 0.0264, + "step": 278780 + }, + { + "epoch": 1.8, + "learning_rate": 3.009352188308796e-05, + "loss": 0.0199, + "step": 278790 + }, + { + "epoch": 1.8, + "learning_rate": 3.008384052873103e-05, + "loss": 0.0208, + "step": 278800 + }, + { + "epoch": 1.8, + "learning_rate": 3.0074159174374098e-05, + "loss": 0.0212, + "step": 278810 + }, + { + "epoch": 1.8, + "learning_rate": 3.0064477820017167e-05, + "loss": 0.0226, + "step": 278820 + }, + { + "epoch": 1.8, + "learning_rate": 3.005479646566023e-05, + "loss": 0.0235, + "step": 278830 + }, + { + "epoch": 1.8, + "learning_rate": 3.00451151113033e-05, + "loss": 0.0215, + "step": 278840 + }, + { + "epoch": 1.8, + "learning_rate": 3.003543375694637e-05, + "loss": 0.0245, + "step": 278850 + }, + { + "epoch": 1.8, + "learning_rate": 3.0025752402589435e-05, + "loss": 0.0226, + "step": 278860 + }, + { + "epoch": 1.8, + "learning_rate": 3.0016071048232505e-05, + "loss": 0.0199, + "step": 278870 + }, + { + "epoch": 1.8, + "learning_rate": 3.0006389693875575e-05, + "loss": 0.028, + "step": 278880 + }, + { + "epoch": 1.8, + "learning_rate": 2.999670833951864e-05, + "loss": 0.0207, + "step": 278890 + }, + { + "epoch": 1.8, + "learning_rate": 2.9987026985161707e-05, + "loss": 0.0261, + "step": 278900 + }, + { + "epoch": 1.8, + "learning_rate": 2.9977345630804773e-05, + "loss": 0.0261, + "step": 278910 + }, + { + "epoch": 1.8, + "learning_rate": 2.9967664276447843e-05, + "loss": 0.0254, + "step": 278920 + }, + { + "epoch": 1.8, + "learning_rate": 2.9957982922090913e-05, + "loss": 0.0281, + "step": 278930 + }, + { + "epoch": 1.8, + "learning_rate": 2.994830156773398e-05, + "loss": 0.0242, + "step": 278940 + }, + { + "epoch": 1.8, + "learning_rate": 2.993862021337705e-05, + "loss": 0.0199, + "step": 278950 + }, + { + "epoch": 1.8, + "learning_rate": 2.9928938859020118e-05, + "loss": 0.0281, + "step": 278960 + }, + { + "epoch": 1.8, + "learning_rate": 2.991925750466318e-05, + "loss": 0.0212, + "step": 278970 + }, + { + "epoch": 1.8, + "learning_rate": 2.990957615030625e-05, + "loss": 0.0198, + "step": 278980 + }, + { + "epoch": 1.8, + "learning_rate": 2.9899894795949317e-05, + "loss": 0.0217, + "step": 278990 + }, + { + "epoch": 1.8, + "learning_rate": 2.9890213441592387e-05, + "loss": 0.0245, + "step": 279000 + }, + { + "epoch": 1.8, + "eval_cer": 0.9198770760366061, + "eval_loss": 0.01735873706638813, + "eval_runtime": 119.7924, + "eval_samples_per_second": 16.696, + "eval_steps_per_second": 4.174, + "step": 279000 + }, + { + "epoch": 1.8, + "learning_rate": 2.9880532087235456e-05, + "loss": 0.0239, + "step": 279010 + }, + { + "epoch": 1.8, + "learning_rate": 2.9870850732878522e-05, + "loss": 0.025, + "step": 279020 + }, + { + "epoch": 1.8, + "learning_rate": 2.9861169378521592e-05, + "loss": 0.0181, + "step": 279030 + }, + { + "epoch": 1.8, + "learning_rate": 2.9851488024164655e-05, + "loss": 0.0233, + "step": 279040 + }, + { + "epoch": 1.8, + "learning_rate": 2.9841806669807725e-05, + "loss": 0.0239, + "step": 279050 + }, + { + "epoch": 1.8, + "learning_rate": 2.9832125315450794e-05, + "loss": 0.0252, + "step": 279060 + }, + { + "epoch": 1.8, + "learning_rate": 2.982244396109386e-05, + "loss": 0.0211, + "step": 279070 + }, + { + "epoch": 1.8, + "learning_rate": 2.981276260673693e-05, + "loss": 0.0202, + "step": 279080 + }, + { + "epoch": 1.8, + "learning_rate": 2.980308125238e-05, + "loss": 0.0246, + "step": 279090 + }, + { + "epoch": 1.8, + "learning_rate": 2.9793399898023066e-05, + "loss": 0.0255, + "step": 279100 + }, + { + "epoch": 1.8, + "learning_rate": 2.9783718543666132e-05, + "loss": 0.0199, + "step": 279110 + }, + { + "epoch": 1.8, + "learning_rate": 2.97740371893092e-05, + "loss": 0.0249, + "step": 279120 + }, + { + "epoch": 1.8, + "learning_rate": 2.9764355834952268e-05, + "loss": 0.0222, + "step": 279130 + }, + { + "epoch": 1.8, + "learning_rate": 2.9754674480595338e-05, + "loss": 0.0282, + "step": 279140 + }, + { + "epoch": 1.8, + "learning_rate": 2.9744993126238404e-05, + "loss": 0.025, + "step": 279150 + }, + { + "epoch": 1.8, + "learning_rate": 2.9735311771881473e-05, + "loss": 0.0211, + "step": 279160 + }, + { + "epoch": 1.8, + "learning_rate": 2.9725630417524543e-05, + "loss": 0.02, + "step": 279170 + }, + { + "epoch": 1.8, + "learning_rate": 2.9715949063167606e-05, + "loss": 0.0219, + "step": 279180 + }, + { + "epoch": 1.8, + "learning_rate": 2.9706267708810676e-05, + "loss": 0.0245, + "step": 279190 + }, + { + "epoch": 1.8, + "learning_rate": 2.9696586354453742e-05, + "loss": 0.0262, + "step": 279200 + }, + { + "epoch": 1.8, + "learning_rate": 2.968690500009681e-05, + "loss": 0.0267, + "step": 279210 + }, + { + "epoch": 1.8, + "learning_rate": 2.967722364573988e-05, + "loss": 0.0233, + "step": 279220 + }, + { + "epoch": 1.8, + "learning_rate": 2.9667542291382947e-05, + "loss": 0.0289, + "step": 279230 + }, + { + "epoch": 1.8, + "learning_rate": 2.9657860937026017e-05, + "loss": 0.0233, + "step": 279240 + }, + { + "epoch": 1.8, + "learning_rate": 2.964817958266908e-05, + "loss": 0.022, + "step": 279250 + }, + { + "epoch": 1.8, + "learning_rate": 2.963849822831215e-05, + "loss": 0.0246, + "step": 279260 + }, + { + "epoch": 1.8, + "learning_rate": 2.962881687395522e-05, + "loss": 0.0227, + "step": 279270 + }, + { + "epoch": 1.8, + "learning_rate": 2.9619135519598285e-05, + "loss": 0.025, + "step": 279280 + }, + { + "epoch": 1.8, + "learning_rate": 2.9609454165241355e-05, + "loss": 0.0215, + "step": 279290 + }, + { + "epoch": 1.8, + "learning_rate": 2.9599772810884425e-05, + "loss": 0.0175, + "step": 279300 + }, + { + "epoch": 1.8, + "learning_rate": 2.959009145652749e-05, + "loss": 0.0234, + "step": 279310 + }, + { + "epoch": 1.8, + "learning_rate": 2.9580410102170557e-05, + "loss": 0.0264, + "step": 279320 + }, + { + "epoch": 1.8, + "learning_rate": 2.9570728747813623e-05, + "loss": 0.0245, + "step": 279330 + }, + { + "epoch": 1.8, + "learning_rate": 2.9561047393456693e-05, + "loss": 0.026, + "step": 279340 + }, + { + "epoch": 1.8, + "learning_rate": 2.9551366039099763e-05, + "loss": 0.0297, + "step": 279350 + }, + { + "epoch": 1.8, + "learning_rate": 2.954168468474283e-05, + "loss": 0.025, + "step": 279360 + }, + { + "epoch": 1.8, + "learning_rate": 2.95320033303859e-05, + "loss": 0.0239, + "step": 279370 + }, + { + "epoch": 1.8, + "learning_rate": 2.952232197602896e-05, + "loss": 0.0215, + "step": 279380 + }, + { + "epoch": 1.8, + "learning_rate": 2.951264062167203e-05, + "loss": 0.0197, + "step": 279390 + }, + { + "epoch": 1.8, + "learning_rate": 2.95029592673151e-05, + "loss": 0.0211, + "step": 279400 + }, + { + "epoch": 1.8, + "learning_rate": 2.9493277912958167e-05, + "loss": 0.0216, + "step": 279410 + }, + { + "epoch": 1.8, + "learning_rate": 2.9483596558601236e-05, + "loss": 0.0234, + "step": 279420 + }, + { + "epoch": 1.8, + "learning_rate": 2.9473915204244303e-05, + "loss": 0.0221, + "step": 279430 + }, + { + "epoch": 1.8, + "learning_rate": 2.9464233849887372e-05, + "loss": 0.0256, + "step": 279440 + }, + { + "epoch": 1.8, + "learning_rate": 2.945455249553044e-05, + "loss": 0.0202, + "step": 279450 + }, + { + "epoch": 1.8, + "learning_rate": 2.9444871141173505e-05, + "loss": 0.0219, + "step": 279460 + }, + { + "epoch": 1.8, + "learning_rate": 2.9435189786816574e-05, + "loss": 0.0224, + "step": 279470 + }, + { + "epoch": 1.8, + "learning_rate": 2.942550843245964e-05, + "loss": 0.0263, + "step": 279480 + }, + { + "epoch": 1.8, + "learning_rate": 2.941582707810271e-05, + "loss": 0.0273, + "step": 279490 + }, + { + "epoch": 1.8, + "learning_rate": 2.940614572374578e-05, + "loss": 0.0256, + "step": 279500 + }, + { + "epoch": 1.8, + "learning_rate": 2.9396464369388846e-05, + "loss": 0.0337, + "step": 279510 + }, + { + "epoch": 1.8, + "learning_rate": 2.9386783015031912e-05, + "loss": 0.0238, + "step": 279520 + }, + { + "epoch": 1.8, + "learning_rate": 2.937710166067498e-05, + "loss": 0.0226, + "step": 279530 + }, + { + "epoch": 1.8, + "learning_rate": 2.9367420306318048e-05, + "loss": 0.0232, + "step": 279540 + }, + { + "epoch": 1.8, + "learning_rate": 2.9357738951961118e-05, + "loss": 0.0192, + "step": 279550 + }, + { + "epoch": 1.8, + "learning_rate": 2.9348057597604184e-05, + "loss": 0.0226, + "step": 279560 + }, + { + "epoch": 1.8, + "learning_rate": 2.9338376243247254e-05, + "loss": 0.0261, + "step": 279570 + }, + { + "epoch": 1.8, + "learning_rate": 2.9328694888890323e-05, + "loss": 0.0253, + "step": 279580 + }, + { + "epoch": 1.8, + "learning_rate": 2.9319013534533386e-05, + "loss": 0.0266, + "step": 279590 + }, + { + "epoch": 1.8, + "learning_rate": 2.9309332180176456e-05, + "loss": 0.0227, + "step": 279600 + }, + { + "epoch": 1.8, + "learning_rate": 2.9299650825819522e-05, + "loss": 0.025, + "step": 279610 + }, + { + "epoch": 1.8, + "learning_rate": 2.928996947146259e-05, + "loss": 0.022, + "step": 279620 + }, + { + "epoch": 1.8, + "learning_rate": 2.928028811710566e-05, + "loss": 0.0203, + "step": 279630 + }, + { + "epoch": 1.8, + "learning_rate": 2.9270606762748727e-05, + "loss": 0.022, + "step": 279640 + }, + { + "epoch": 1.8, + "learning_rate": 2.9260925408391797e-05, + "loss": 0.022, + "step": 279650 + }, + { + "epoch": 1.8, + "learning_rate": 2.925124405403486e-05, + "loss": 0.0231, + "step": 279660 + }, + { + "epoch": 1.81, + "learning_rate": 2.924156269967793e-05, + "loss": 0.0201, + "step": 279670 + }, + { + "epoch": 1.81, + "learning_rate": 2.9231881345321e-05, + "loss": 0.026, + "step": 279680 + }, + { + "epoch": 1.81, + "learning_rate": 2.9222199990964065e-05, + "loss": 0.0235, + "step": 279690 + }, + { + "epoch": 1.81, + "learning_rate": 2.9212518636607135e-05, + "loss": 0.0224, + "step": 279700 + }, + { + "epoch": 1.81, + "learning_rate": 2.9202837282250205e-05, + "loss": 0.0277, + "step": 279710 + }, + { + "epoch": 1.81, + "learning_rate": 2.919315592789327e-05, + "loss": 0.021, + "step": 279720 + }, + { + "epoch": 1.81, + "learning_rate": 2.9183474573536337e-05, + "loss": 0.0208, + "step": 279730 + }, + { + "epoch": 1.81, + "learning_rate": 2.9173793219179403e-05, + "loss": 0.0205, + "step": 279740 + }, + { + "epoch": 1.81, + "learning_rate": 2.9164111864822473e-05, + "loss": 0.0179, + "step": 279750 + }, + { + "epoch": 1.81, + "learning_rate": 2.9154430510465543e-05, + "loss": 0.024, + "step": 279760 + }, + { + "epoch": 1.81, + "learning_rate": 2.914474915610861e-05, + "loss": 0.0264, + "step": 279770 + }, + { + "epoch": 1.81, + "learning_rate": 2.913506780175168e-05, + "loss": 0.0254, + "step": 279780 + }, + { + "epoch": 1.81, + "learning_rate": 2.9125386447394748e-05, + "loss": 0.0221, + "step": 279790 + }, + { + "epoch": 1.81, + "learning_rate": 2.911570509303781e-05, + "loss": 0.0237, + "step": 279800 + }, + { + "epoch": 1.81, + "learning_rate": 2.910602373868088e-05, + "loss": 0.0241, + "step": 279810 + }, + { + "epoch": 1.81, + "learning_rate": 2.9096342384323947e-05, + "loss": 0.0283, + "step": 279820 + }, + { + "epoch": 1.81, + "learning_rate": 2.9086661029967017e-05, + "loss": 0.0176, + "step": 279830 + }, + { + "epoch": 1.81, + "learning_rate": 2.9076979675610086e-05, + "loss": 0.0253, + "step": 279840 + }, + { + "epoch": 1.81, + "learning_rate": 2.9067298321253152e-05, + "loss": 0.0209, + "step": 279850 + }, + { + "epoch": 1.81, + "learning_rate": 2.9057616966896222e-05, + "loss": 0.0247, + "step": 279860 + }, + { + "epoch": 1.81, + "learning_rate": 2.9047935612539285e-05, + "loss": 0.0205, + "step": 279870 + }, + { + "epoch": 1.81, + "learning_rate": 2.9038254258182355e-05, + "loss": 0.0252, + "step": 279880 + }, + { + "epoch": 1.81, + "learning_rate": 2.9028572903825424e-05, + "loss": 0.0224, + "step": 279890 + }, + { + "epoch": 1.81, + "learning_rate": 2.901889154946849e-05, + "loss": 0.0235, + "step": 279900 + }, + { + "epoch": 1.81, + "learning_rate": 2.900921019511156e-05, + "loss": 0.0267, + "step": 279910 + }, + { + "epoch": 1.81, + "learning_rate": 2.899952884075463e-05, + "loss": 0.0242, + "step": 279920 + }, + { + "epoch": 1.81, + "learning_rate": 2.8989847486397696e-05, + "loss": 0.0193, + "step": 279930 + }, + { + "epoch": 1.81, + "learning_rate": 2.8980166132040762e-05, + "loss": 0.0204, + "step": 279940 + }, + { + "epoch": 1.81, + "learning_rate": 2.897048477768383e-05, + "loss": 0.0238, + "step": 279950 + }, + { + "epoch": 1.81, + "learning_rate": 2.8960803423326898e-05, + "loss": 0.0209, + "step": 279960 + }, + { + "epoch": 1.81, + "learning_rate": 2.8951122068969968e-05, + "loss": 0.0212, + "step": 279970 + }, + { + "epoch": 1.81, + "learning_rate": 2.8941440714613034e-05, + "loss": 0.0236, + "step": 279980 + }, + { + "epoch": 1.81, + "learning_rate": 2.8931759360256103e-05, + "loss": 0.0203, + "step": 279990 + }, + { + "epoch": 1.81, + "learning_rate": 2.892207800589917e-05, + "loss": 0.0177, + "step": 280000 + }, + { + "epoch": 1.81, + "eval_cer": 0.9198617105411818, + "eval_loss": 0.017406921833753586, + "eval_runtime": 119.8646, + "eval_samples_per_second": 16.685, + "eval_steps_per_second": 4.171, + "step": 280000 + }, + { + "epoch": 1.81, + "learning_rate": 2.8912396651542236e-05, + "loss": 0.02, + "step": 280010 + }, + { + "epoch": 1.81, + "learning_rate": 2.8902715297185306e-05, + "loss": 0.0184, + "step": 280020 + }, + { + "epoch": 1.81, + "learning_rate": 2.8893033942828372e-05, + "loss": 0.0206, + "step": 280030 + }, + { + "epoch": 1.81, + "learning_rate": 2.888335258847144e-05, + "loss": 0.0251, + "step": 280040 + }, + { + "epoch": 1.81, + "learning_rate": 2.8873671234114508e-05, + "loss": 0.0217, + "step": 280050 + }, + { + "epoch": 1.81, + "learning_rate": 2.8863989879757577e-05, + "loss": 0.0223, + "step": 280060 + }, + { + "epoch": 1.81, + "learning_rate": 2.8854308525400647e-05, + "loss": 0.0206, + "step": 280070 + }, + { + "epoch": 1.81, + "learning_rate": 2.884462717104371e-05, + "loss": 0.0217, + "step": 280080 + }, + { + "epoch": 1.81, + "learning_rate": 2.883494581668678e-05, + "loss": 0.0278, + "step": 280090 + }, + { + "epoch": 1.81, + "learning_rate": 2.8825264462329846e-05, + "loss": 0.0252, + "step": 280100 + }, + { + "epoch": 1.81, + "learning_rate": 2.8815583107972915e-05, + "loss": 0.0191, + "step": 280110 + }, + { + "epoch": 1.81, + "learning_rate": 2.8805901753615985e-05, + "loss": 0.0217, + "step": 280120 + }, + { + "epoch": 1.81, + "learning_rate": 2.879622039925905e-05, + "loss": 0.026, + "step": 280130 + }, + { + "epoch": 1.81, + "learning_rate": 2.878653904490212e-05, + "loss": 0.0252, + "step": 280140 + }, + { + "epoch": 1.81, + "learning_rate": 2.8776857690545184e-05, + "loss": 0.0188, + "step": 280150 + }, + { + "epoch": 1.81, + "learning_rate": 2.8767176336188253e-05, + "loss": 0.0245, + "step": 280160 + }, + { + "epoch": 1.81, + "learning_rate": 2.8757494981831323e-05, + "loss": 0.0215, + "step": 280170 + }, + { + "epoch": 1.81, + "learning_rate": 2.874781362747439e-05, + "loss": 0.0269, + "step": 280180 + }, + { + "epoch": 1.81, + "learning_rate": 2.873813227311746e-05, + "loss": 0.0181, + "step": 280190 + }, + { + "epoch": 1.81, + "learning_rate": 2.872845091876053e-05, + "loss": 0.0231, + "step": 280200 + }, + { + "epoch": 1.81, + "learning_rate": 2.871876956440359e-05, + "loss": 0.0262, + "step": 280210 + }, + { + "epoch": 1.81, + "learning_rate": 2.870908821004666e-05, + "loss": 0.0231, + "step": 280220 + }, + { + "epoch": 1.81, + "learning_rate": 2.8699406855689727e-05, + "loss": 0.02, + "step": 280230 + }, + { + "epoch": 1.81, + "learning_rate": 2.8689725501332797e-05, + "loss": 0.02, + "step": 280240 + }, + { + "epoch": 1.81, + "learning_rate": 2.8680044146975866e-05, + "loss": 0.025, + "step": 280250 + }, + { + "epoch": 1.81, + "learning_rate": 2.8670362792618933e-05, + "loss": 0.0247, + "step": 280260 + }, + { + "epoch": 1.81, + "learning_rate": 2.8660681438262002e-05, + "loss": 0.0253, + "step": 280270 + }, + { + "epoch": 1.81, + "learning_rate": 2.8651000083905065e-05, + "loss": 0.0233, + "step": 280280 + }, + { + "epoch": 1.81, + "learning_rate": 2.8641318729548135e-05, + "loss": 0.0242, + "step": 280290 + }, + { + "epoch": 1.81, + "learning_rate": 2.8631637375191204e-05, + "loss": 0.0206, + "step": 280300 + }, + { + "epoch": 1.81, + "learning_rate": 2.862195602083427e-05, + "loss": 0.0257, + "step": 280310 + }, + { + "epoch": 1.81, + "learning_rate": 2.861227466647734e-05, + "loss": 0.0238, + "step": 280320 + }, + { + "epoch": 1.81, + "learning_rate": 2.860259331212041e-05, + "loss": 0.0218, + "step": 280330 + }, + { + "epoch": 1.81, + "learning_rate": 2.8592911957763476e-05, + "loss": 0.022, + "step": 280340 + }, + { + "epoch": 1.81, + "learning_rate": 2.8583230603406542e-05, + "loss": 0.0228, + "step": 280350 + }, + { + "epoch": 1.81, + "learning_rate": 2.857354924904961e-05, + "loss": 0.021, + "step": 280360 + }, + { + "epoch": 1.81, + "learning_rate": 2.8563867894692678e-05, + "loss": 0.0231, + "step": 280370 + }, + { + "epoch": 1.81, + "learning_rate": 2.8554186540335748e-05, + "loss": 0.0217, + "step": 280380 + }, + { + "epoch": 1.81, + "learning_rate": 2.8544505185978814e-05, + "loss": 0.0188, + "step": 280390 + }, + { + "epoch": 1.81, + "learning_rate": 2.8534823831621884e-05, + "loss": 0.0272, + "step": 280400 + }, + { + "epoch": 1.81, + "learning_rate": 2.8525142477264953e-05, + "loss": 0.0218, + "step": 280410 + }, + { + "epoch": 1.81, + "learning_rate": 2.8515461122908016e-05, + "loss": 0.0223, + "step": 280420 + }, + { + "epoch": 1.81, + "learning_rate": 2.8505779768551086e-05, + "loss": 0.0235, + "step": 280430 + }, + { + "epoch": 1.81, + "learning_rate": 2.8496098414194152e-05, + "loss": 0.0235, + "step": 280440 + }, + { + "epoch": 1.81, + "learning_rate": 2.848641705983722e-05, + "loss": 0.0226, + "step": 280450 + }, + { + "epoch": 1.81, + "learning_rate": 2.847673570548029e-05, + "loss": 0.0245, + "step": 280460 + }, + { + "epoch": 1.81, + "learning_rate": 2.8467054351123357e-05, + "loss": 0.0223, + "step": 280470 + }, + { + "epoch": 1.81, + "learning_rate": 2.8457372996766427e-05, + "loss": 0.0253, + "step": 280480 + }, + { + "epoch": 1.81, + "learning_rate": 2.844769164240949e-05, + "loss": 0.0242, + "step": 280490 + }, + { + "epoch": 1.81, + "learning_rate": 2.843801028805256e-05, + "loss": 0.0195, + "step": 280500 + }, + { + "epoch": 1.81, + "learning_rate": 2.842832893369563e-05, + "loss": 0.0228, + "step": 280510 + }, + { + "epoch": 1.81, + "learning_rate": 2.8418647579338695e-05, + "loss": 0.0263, + "step": 280520 + }, + { + "epoch": 1.81, + "learning_rate": 2.8408966224981765e-05, + "loss": 0.021, + "step": 280530 + }, + { + "epoch": 1.81, + "learning_rate": 2.8399284870624835e-05, + "loss": 0.0196, + "step": 280540 + }, + { + "epoch": 1.81, + "learning_rate": 2.83896035162679e-05, + "loss": 0.0297, + "step": 280550 + }, + { + "epoch": 1.81, + "learning_rate": 2.8379922161910967e-05, + "loss": 0.0243, + "step": 280560 + }, + { + "epoch": 1.81, + "learning_rate": 2.8370240807554033e-05, + "loss": 0.0249, + "step": 280570 + }, + { + "epoch": 1.81, + "learning_rate": 2.8360559453197103e-05, + "loss": 0.027, + "step": 280580 + }, + { + "epoch": 1.81, + "learning_rate": 2.8350878098840173e-05, + "loss": 0.0265, + "step": 280590 + }, + { + "epoch": 1.81, + "learning_rate": 2.834119674448324e-05, + "loss": 0.0252, + "step": 280600 + }, + { + "epoch": 1.81, + "learning_rate": 2.833151539012631e-05, + "loss": 0.027, + "step": 280610 + }, + { + "epoch": 1.81, + "learning_rate": 2.8321834035769378e-05, + "loss": 0.0222, + "step": 280620 + }, + { + "epoch": 1.81, + "learning_rate": 2.831215268141244e-05, + "loss": 0.021, + "step": 280630 + }, + { + "epoch": 1.81, + "learning_rate": 2.830247132705551e-05, + "loss": 0.0229, + "step": 280640 + }, + { + "epoch": 1.81, + "learning_rate": 2.8292789972698577e-05, + "loss": 0.0247, + "step": 280650 + }, + { + "epoch": 1.81, + "learning_rate": 2.8283108618341647e-05, + "loss": 0.0262, + "step": 280660 + }, + { + "epoch": 1.81, + "learning_rate": 2.8273427263984716e-05, + "loss": 0.0258, + "step": 280670 + }, + { + "epoch": 1.81, + "learning_rate": 2.8263745909627782e-05, + "loss": 0.0217, + "step": 280680 + }, + { + "epoch": 1.81, + "learning_rate": 2.8254064555270852e-05, + "loss": 0.0223, + "step": 280690 + }, + { + "epoch": 1.81, + "learning_rate": 2.8244383200913915e-05, + "loss": 0.0224, + "step": 280700 + }, + { + "epoch": 1.81, + "learning_rate": 2.8234701846556984e-05, + "loss": 0.0209, + "step": 280710 + }, + { + "epoch": 1.81, + "learning_rate": 2.8225020492200054e-05, + "loss": 0.0192, + "step": 280720 + }, + { + "epoch": 1.81, + "learning_rate": 2.821533913784312e-05, + "loss": 0.0278, + "step": 280730 + }, + { + "epoch": 1.81, + "learning_rate": 2.820565778348619e-05, + "loss": 0.0214, + "step": 280740 + }, + { + "epoch": 1.81, + "learning_rate": 2.8195976429129256e-05, + "loss": 0.0247, + "step": 280750 + }, + { + "epoch": 1.81, + "learning_rate": 2.8186295074772326e-05, + "loss": 0.0188, + "step": 280760 + }, + { + "epoch": 1.81, + "learning_rate": 2.8176613720415392e-05, + "loss": 0.0223, + "step": 280770 + }, + { + "epoch": 1.81, + "learning_rate": 2.816693236605846e-05, + "loss": 0.0217, + "step": 280780 + }, + { + "epoch": 1.81, + "learning_rate": 2.8157251011701528e-05, + "loss": 0.0203, + "step": 280790 + }, + { + "epoch": 1.81, + "learning_rate": 2.8147569657344594e-05, + "loss": 0.0231, + "step": 280800 + }, + { + "epoch": 1.81, + "learning_rate": 2.8137888302987664e-05, + "loss": 0.0235, + "step": 280810 + }, + { + "epoch": 1.81, + "learning_rate": 2.8128206948630733e-05, + "loss": 0.0225, + "step": 280820 + }, + { + "epoch": 1.81, + "learning_rate": 2.81185255942738e-05, + "loss": 0.026, + "step": 280830 + }, + { + "epoch": 1.81, + "learning_rate": 2.8108844239916866e-05, + "loss": 0.0224, + "step": 280840 + }, + { + "epoch": 1.81, + "learning_rate": 2.8099162885559932e-05, + "loss": 0.0259, + "step": 280850 + }, + { + "epoch": 1.81, + "learning_rate": 2.8089481531203002e-05, + "loss": 0.0224, + "step": 280860 + }, + { + "epoch": 1.81, + "learning_rate": 2.807980017684607e-05, + "loss": 0.028, + "step": 280870 + }, + { + "epoch": 1.81, + "learning_rate": 2.8070118822489138e-05, + "loss": 0.0256, + "step": 280880 + }, + { + "epoch": 1.81, + "learning_rate": 2.8060437468132207e-05, + "loss": 0.0284, + "step": 280890 + }, + { + "epoch": 1.81, + "learning_rate": 2.8050756113775277e-05, + "loss": 0.0204, + "step": 280900 + }, + { + "epoch": 1.81, + "learning_rate": 2.804107475941834e-05, + "loss": 0.0225, + "step": 280910 + }, + { + "epoch": 1.81, + "learning_rate": 2.803139340506141e-05, + "loss": 0.0251, + "step": 280920 + }, + { + "epoch": 1.81, + "learning_rate": 2.8021712050704476e-05, + "loss": 0.0224, + "step": 280930 + }, + { + "epoch": 1.81, + "learning_rate": 2.8012030696347545e-05, + "loss": 0.0282, + "step": 280940 + }, + { + "epoch": 1.81, + "learning_rate": 2.8002349341990615e-05, + "loss": 0.0259, + "step": 280950 + }, + { + "epoch": 1.81, + "learning_rate": 2.799266798763368e-05, + "loss": 0.0223, + "step": 280960 + }, + { + "epoch": 1.81, + "learning_rate": 2.798298663327675e-05, + "loss": 0.0223, + "step": 280970 + }, + { + "epoch": 1.81, + "learning_rate": 2.7973305278919814e-05, + "loss": 0.0232, + "step": 280980 + }, + { + "epoch": 1.81, + "learning_rate": 2.7963623924562883e-05, + "loss": 0.0224, + "step": 280990 + }, + { + "epoch": 1.81, + "learning_rate": 2.7953942570205953e-05, + "loss": 0.0268, + "step": 281000 + }, + { + "epoch": 1.81, + "eval_cer": 0.9198617105411818, + "eval_loss": 0.017409605905413628, + "eval_runtime": 119.8225, + "eval_samples_per_second": 16.691, + "eval_steps_per_second": 4.173, + "step": 281000 + }, + { + "epoch": 1.81, + "learning_rate": 2.794426121584902e-05, + "loss": 0.0201, + "step": 281010 + }, + { + "epoch": 1.81, + "learning_rate": 2.793457986149209e-05, + "loss": 0.0216, + "step": 281020 + }, + { + "epoch": 1.81, + "learning_rate": 2.792489850713516e-05, + "loss": 0.0205, + "step": 281030 + }, + { + "epoch": 1.81, + "learning_rate": 2.791521715277822e-05, + "loss": 0.0269, + "step": 281040 + }, + { + "epoch": 1.81, + "learning_rate": 2.790553579842129e-05, + "loss": 0.0194, + "step": 281050 + }, + { + "epoch": 1.81, + "learning_rate": 2.7895854444064357e-05, + "loss": 0.0205, + "step": 281060 + }, + { + "epoch": 1.81, + "learning_rate": 2.7886173089707427e-05, + "loss": 0.0236, + "step": 281070 + }, + { + "epoch": 1.81, + "learning_rate": 2.7876491735350496e-05, + "loss": 0.0217, + "step": 281080 + }, + { + "epoch": 1.81, + "learning_rate": 2.7866810380993563e-05, + "loss": 0.0265, + "step": 281090 + }, + { + "epoch": 1.81, + "learning_rate": 2.7857129026636632e-05, + "loss": 0.0225, + "step": 281100 + }, + { + "epoch": 1.81, + "learning_rate": 2.7847447672279695e-05, + "loss": 0.0246, + "step": 281110 + }, + { + "epoch": 1.81, + "learning_rate": 2.7837766317922765e-05, + "loss": 0.0209, + "step": 281120 + }, + { + "epoch": 1.81, + "learning_rate": 2.7828084963565834e-05, + "loss": 0.0189, + "step": 281130 + }, + { + "epoch": 1.81, + "learning_rate": 2.78184036092089e-05, + "loss": 0.0222, + "step": 281140 + }, + { + "epoch": 1.81, + "learning_rate": 2.780872225485197e-05, + "loss": 0.0252, + "step": 281150 + }, + { + "epoch": 1.81, + "learning_rate": 2.779904090049504e-05, + "loss": 0.0287, + "step": 281160 + }, + { + "epoch": 1.81, + "learning_rate": 2.7789359546138106e-05, + "loss": 0.0212, + "step": 281170 + }, + { + "epoch": 1.81, + "learning_rate": 2.7779678191781172e-05, + "loss": 0.0233, + "step": 281180 + }, + { + "epoch": 1.81, + "learning_rate": 2.776999683742424e-05, + "loss": 0.0238, + "step": 281190 + }, + { + "epoch": 1.81, + "learning_rate": 2.7760315483067308e-05, + "loss": 0.0228, + "step": 281200 + }, + { + "epoch": 1.81, + "learning_rate": 2.7750634128710378e-05, + "loss": 0.0215, + "step": 281210 + }, + { + "epoch": 1.82, + "learning_rate": 2.7740952774353444e-05, + "loss": 0.0227, + "step": 281220 + }, + { + "epoch": 1.82, + "learning_rate": 2.7731271419996514e-05, + "loss": 0.0236, + "step": 281230 + }, + { + "epoch": 1.82, + "learning_rate": 2.7721590065639583e-05, + "loss": 0.0221, + "step": 281240 + }, + { + "epoch": 1.82, + "learning_rate": 2.7711908711282646e-05, + "loss": 0.0234, + "step": 281250 + }, + { + "epoch": 1.82, + "learning_rate": 2.7702227356925716e-05, + "loss": 0.0256, + "step": 281260 + }, + { + "epoch": 1.82, + "learning_rate": 2.7692546002568782e-05, + "loss": 0.0194, + "step": 281270 + }, + { + "epoch": 1.82, + "learning_rate": 2.768286464821185e-05, + "loss": 0.0226, + "step": 281280 + }, + { + "epoch": 1.82, + "learning_rate": 2.767318329385492e-05, + "loss": 0.0227, + "step": 281290 + }, + { + "epoch": 1.82, + "learning_rate": 2.7663501939497987e-05, + "loss": 0.0232, + "step": 281300 + }, + { + "epoch": 1.82, + "learning_rate": 2.7653820585141057e-05, + "loss": 0.0224, + "step": 281310 + }, + { + "epoch": 1.82, + "learning_rate": 2.764413923078412e-05, + "loss": 0.0266, + "step": 281320 + }, + { + "epoch": 1.82, + "learning_rate": 2.763445787642719e-05, + "loss": 0.0206, + "step": 281330 + }, + { + "epoch": 1.82, + "learning_rate": 2.762477652207026e-05, + "loss": 0.023, + "step": 281340 + }, + { + "epoch": 1.82, + "learning_rate": 2.7615095167713325e-05, + "loss": 0.0211, + "step": 281350 + }, + { + "epoch": 1.82, + "learning_rate": 2.7605413813356395e-05, + "loss": 0.0223, + "step": 281360 + }, + { + "epoch": 1.82, + "learning_rate": 2.759573245899946e-05, + "loss": 0.0217, + "step": 281370 + }, + { + "epoch": 1.82, + "learning_rate": 2.758605110464253e-05, + "loss": 0.0198, + "step": 281380 + }, + { + "epoch": 1.82, + "learning_rate": 2.7576369750285597e-05, + "loss": 0.0265, + "step": 281390 + }, + { + "epoch": 1.82, + "learning_rate": 2.7566688395928663e-05, + "loss": 0.0279, + "step": 281400 + }, + { + "epoch": 1.82, + "learning_rate": 2.7557007041571733e-05, + "loss": 0.0221, + "step": 281410 + }, + { + "epoch": 1.82, + "learning_rate": 2.7547325687214803e-05, + "loss": 0.0226, + "step": 281420 + }, + { + "epoch": 1.82, + "learning_rate": 2.753764433285787e-05, + "loss": 0.0286, + "step": 281430 + }, + { + "epoch": 1.82, + "learning_rate": 2.752796297850094e-05, + "loss": 0.0243, + "step": 281440 + }, + { + "epoch": 1.82, + "learning_rate": 2.7518281624144005e-05, + "loss": 0.0255, + "step": 281450 + }, + { + "epoch": 1.82, + "learning_rate": 2.750860026978707e-05, + "loss": 0.0224, + "step": 281460 + }, + { + "epoch": 1.82, + "learning_rate": 2.749891891543014e-05, + "loss": 0.0188, + "step": 281470 + }, + { + "epoch": 1.82, + "learning_rate": 2.7489237561073207e-05, + "loss": 0.0211, + "step": 281480 + }, + { + "epoch": 1.82, + "learning_rate": 2.7479556206716277e-05, + "loss": 0.023, + "step": 281490 + }, + { + "epoch": 1.82, + "learning_rate": 2.7469874852359343e-05, + "loss": 0.0219, + "step": 281500 + }, + { + "epoch": 1.82, + "learning_rate": 2.7460193498002412e-05, + "loss": 0.023, + "step": 281510 + }, + { + "epoch": 1.82, + "learning_rate": 2.7450512143645482e-05, + "loss": 0.0272, + "step": 281520 + }, + { + "epoch": 1.82, + "learning_rate": 2.7440830789288545e-05, + "loss": 0.0234, + "step": 281530 + }, + { + "epoch": 1.82, + "learning_rate": 2.7431149434931614e-05, + "loss": 0.0221, + "step": 281540 + }, + { + "epoch": 1.82, + "learning_rate": 2.742146808057468e-05, + "loss": 0.0219, + "step": 281550 + }, + { + "epoch": 1.82, + "learning_rate": 2.741178672621775e-05, + "loss": 0.0195, + "step": 281560 + }, + { + "epoch": 1.82, + "learning_rate": 2.740210537186082e-05, + "loss": 0.0195, + "step": 281570 + }, + { + "epoch": 1.82, + "learning_rate": 2.7392424017503886e-05, + "loss": 0.0186, + "step": 281580 + }, + { + "epoch": 1.82, + "learning_rate": 2.7382742663146956e-05, + "loss": 0.0218, + "step": 281590 + }, + { + "epoch": 1.82, + "learning_rate": 2.737306130879002e-05, + "loss": 0.0218, + "step": 281600 + }, + { + "epoch": 1.82, + "learning_rate": 2.736337995443309e-05, + "loss": 0.0206, + "step": 281610 + }, + { + "epoch": 1.82, + "learning_rate": 2.7353698600076158e-05, + "loss": 0.017, + "step": 281620 + }, + { + "epoch": 1.82, + "learning_rate": 2.7344017245719224e-05, + "loss": 0.0207, + "step": 281630 + }, + { + "epoch": 1.82, + "learning_rate": 2.7334335891362294e-05, + "loss": 0.0191, + "step": 281640 + }, + { + "epoch": 1.82, + "learning_rate": 2.7324654537005363e-05, + "loss": 0.0218, + "step": 281650 + }, + { + "epoch": 1.82, + "learning_rate": 2.731497318264843e-05, + "loss": 0.0326, + "step": 281660 + }, + { + "epoch": 1.82, + "learning_rate": 2.7305291828291496e-05, + "loss": 0.0253, + "step": 281670 + }, + { + "epoch": 1.82, + "learning_rate": 2.7295610473934562e-05, + "loss": 0.0255, + "step": 281680 + }, + { + "epoch": 1.82, + "learning_rate": 2.7285929119577632e-05, + "loss": 0.028, + "step": 281690 + }, + { + "epoch": 1.82, + "learning_rate": 2.72762477652207e-05, + "loss": 0.0194, + "step": 281700 + }, + { + "epoch": 1.82, + "learning_rate": 2.7266566410863768e-05, + "loss": 0.0231, + "step": 281710 + }, + { + "epoch": 1.82, + "learning_rate": 2.7256885056506837e-05, + "loss": 0.0233, + "step": 281720 + }, + { + "epoch": 1.82, + "learning_rate": 2.7247203702149907e-05, + "loss": 0.0202, + "step": 281730 + }, + { + "epoch": 1.82, + "learning_rate": 2.723752234779297e-05, + "loss": 0.0222, + "step": 281740 + }, + { + "epoch": 1.82, + "learning_rate": 2.722784099343604e-05, + "loss": 0.0244, + "step": 281750 + }, + { + "epoch": 1.82, + "learning_rate": 2.7218159639079106e-05, + "loss": 0.0202, + "step": 281760 + }, + { + "epoch": 1.82, + "learning_rate": 2.7208478284722175e-05, + "loss": 0.0233, + "step": 281770 + }, + { + "epoch": 1.82, + "learning_rate": 2.7198796930365245e-05, + "loss": 0.0234, + "step": 281780 + }, + { + "epoch": 1.82, + "learning_rate": 2.718911557600831e-05, + "loss": 0.0211, + "step": 281790 + }, + { + "epoch": 1.82, + "learning_rate": 2.717943422165138e-05, + "loss": 0.0229, + "step": 281800 + }, + { + "epoch": 1.82, + "learning_rate": 2.7169752867294444e-05, + "loss": 0.029, + "step": 281810 + }, + { + "epoch": 1.82, + "learning_rate": 2.7160071512937513e-05, + "loss": 0.0206, + "step": 281820 + }, + { + "epoch": 1.82, + "learning_rate": 2.7150390158580583e-05, + "loss": 0.0257, + "step": 281830 + }, + { + "epoch": 1.82, + "learning_rate": 2.714070880422365e-05, + "loss": 0.0251, + "step": 281840 + }, + { + "epoch": 1.82, + "learning_rate": 2.713102744986672e-05, + "loss": 0.0218, + "step": 281850 + }, + { + "epoch": 1.82, + "learning_rate": 2.712134609550979e-05, + "loss": 0.0252, + "step": 281860 + }, + { + "epoch": 1.82, + "learning_rate": 2.7111664741152855e-05, + "loss": 0.0187, + "step": 281870 + }, + { + "epoch": 1.82, + "learning_rate": 2.710198338679592e-05, + "loss": 0.0217, + "step": 281880 + }, + { + "epoch": 1.82, + "learning_rate": 2.7092302032438987e-05, + "loss": 0.0233, + "step": 281890 + }, + { + "epoch": 1.82, + "learning_rate": 2.7082620678082057e-05, + "loss": 0.0203, + "step": 281900 + }, + { + "epoch": 1.82, + "learning_rate": 2.7072939323725126e-05, + "loss": 0.0251, + "step": 281910 + }, + { + "epoch": 1.82, + "learning_rate": 2.7063257969368193e-05, + "loss": 0.0266, + "step": 281920 + }, + { + "epoch": 1.82, + "learning_rate": 2.7053576615011262e-05, + "loss": 0.0241, + "step": 281930 + }, + { + "epoch": 1.82, + "learning_rate": 2.7043895260654325e-05, + "loss": 0.0267, + "step": 281940 + }, + { + "epoch": 1.82, + "learning_rate": 2.7034213906297395e-05, + "loss": 0.0224, + "step": 281950 + }, + { + "epoch": 1.82, + "learning_rate": 2.7024532551940464e-05, + "loss": 0.0207, + "step": 281960 + }, + { + "epoch": 1.82, + "learning_rate": 2.701485119758353e-05, + "loss": 0.0219, + "step": 281970 + }, + { + "epoch": 1.82, + "learning_rate": 2.70051698432266e-05, + "loss": 0.0209, + "step": 281980 + }, + { + "epoch": 1.82, + "learning_rate": 2.699548848886967e-05, + "loss": 0.0236, + "step": 281990 + }, + { + "epoch": 1.82, + "learning_rate": 2.6985807134512736e-05, + "loss": 0.0209, + "step": 282000 + }, + { + "epoch": 1.82, + "eval_cer": 0.9198553835724776, + "eval_loss": 0.017225535586476326, + "eval_runtime": 119.8192, + "eval_samples_per_second": 16.692, + "eval_steps_per_second": 4.173, + "step": 282000 + }, + { + "epoch": 1.82, + "learning_rate": 2.6976125780155802e-05, + "loss": 0.0249, + "step": 282010 + }, + { + "epoch": 1.82, + "learning_rate": 2.696644442579887e-05, + "loss": 0.0264, + "step": 282020 + }, + { + "epoch": 1.82, + "learning_rate": 2.6956763071441938e-05, + "loss": 0.0206, + "step": 282030 + }, + { + "epoch": 1.82, + "learning_rate": 2.6947081717085008e-05, + "loss": 0.0203, + "step": 282040 + }, + { + "epoch": 1.82, + "learning_rate": 2.6937400362728074e-05, + "loss": 0.0226, + "step": 282050 + }, + { + "epoch": 1.82, + "learning_rate": 2.6927719008371144e-05, + "loss": 0.0262, + "step": 282060 + }, + { + "epoch": 1.82, + "learning_rate": 2.691803765401421e-05, + "loss": 0.0241, + "step": 282070 + }, + { + "epoch": 1.82, + "learning_rate": 2.6908356299657276e-05, + "loss": 0.0209, + "step": 282080 + }, + { + "epoch": 1.82, + "learning_rate": 2.6898674945300346e-05, + "loss": 0.0208, + "step": 282090 + }, + { + "epoch": 1.82, + "learning_rate": 2.6888993590943412e-05, + "loss": 0.0225, + "step": 282100 + }, + { + "epoch": 1.82, + "learning_rate": 2.687931223658648e-05, + "loss": 0.0228, + "step": 282110 + }, + { + "epoch": 1.82, + "learning_rate": 2.6869630882229548e-05, + "loss": 0.0242, + "step": 282120 + }, + { + "epoch": 1.82, + "learning_rate": 2.6859949527872617e-05, + "loss": 0.0204, + "step": 282130 + }, + { + "epoch": 1.82, + "learning_rate": 2.6850268173515687e-05, + "loss": 0.0234, + "step": 282140 + }, + { + "epoch": 1.82, + "learning_rate": 2.684058681915875e-05, + "loss": 0.03, + "step": 282150 + }, + { + "epoch": 1.82, + "learning_rate": 2.683090546480182e-05, + "loss": 0.0253, + "step": 282160 + }, + { + "epoch": 1.82, + "learning_rate": 2.6821224110444886e-05, + "loss": 0.022, + "step": 282170 + }, + { + "epoch": 1.82, + "learning_rate": 2.6811542756087955e-05, + "loss": 0.0195, + "step": 282180 + }, + { + "epoch": 1.82, + "learning_rate": 2.6801861401731025e-05, + "loss": 0.0262, + "step": 282190 + }, + { + "epoch": 1.82, + "learning_rate": 2.679218004737409e-05, + "loss": 0.0258, + "step": 282200 + }, + { + "epoch": 1.82, + "learning_rate": 2.678249869301716e-05, + "loss": 0.0225, + "step": 282210 + }, + { + "epoch": 1.82, + "learning_rate": 2.6772817338660224e-05, + "loss": 0.021, + "step": 282220 + }, + { + "epoch": 1.82, + "learning_rate": 2.6763135984303293e-05, + "loss": 0.0205, + "step": 282230 + }, + { + "epoch": 1.82, + "learning_rate": 2.6753454629946363e-05, + "loss": 0.019, + "step": 282240 + }, + { + "epoch": 1.82, + "learning_rate": 2.674377327558943e-05, + "loss": 0.0261, + "step": 282250 + }, + { + "epoch": 1.82, + "learning_rate": 2.67340919212325e-05, + "loss": 0.0203, + "step": 282260 + }, + { + "epoch": 1.82, + "learning_rate": 2.672441056687557e-05, + "loss": 0.0235, + "step": 282270 + }, + { + "epoch": 1.82, + "learning_rate": 2.6714729212518635e-05, + "loss": 0.0226, + "step": 282280 + }, + { + "epoch": 1.82, + "learning_rate": 2.67050478581617e-05, + "loss": 0.0189, + "step": 282290 + }, + { + "epoch": 1.82, + "learning_rate": 2.6695366503804767e-05, + "loss": 0.0186, + "step": 282300 + }, + { + "epoch": 1.82, + "learning_rate": 2.6685685149447837e-05, + "loss": 0.0224, + "step": 282310 + }, + { + "epoch": 1.82, + "learning_rate": 2.6676003795090906e-05, + "loss": 0.0191, + "step": 282320 + }, + { + "epoch": 1.82, + "learning_rate": 2.6666322440733973e-05, + "loss": 0.0235, + "step": 282330 + }, + { + "epoch": 1.82, + "learning_rate": 2.6656641086377042e-05, + "loss": 0.0264, + "step": 282340 + }, + { + "epoch": 1.82, + "learning_rate": 2.6646959732020112e-05, + "loss": 0.0219, + "step": 282350 + }, + { + "epoch": 1.82, + "learning_rate": 2.6637278377663175e-05, + "loss": 0.0216, + "step": 282360 + }, + { + "epoch": 1.82, + "learning_rate": 2.6627597023306244e-05, + "loss": 0.0212, + "step": 282370 + }, + { + "epoch": 1.82, + "learning_rate": 2.661791566894931e-05, + "loss": 0.0213, + "step": 282380 + }, + { + "epoch": 1.82, + "learning_rate": 2.660823431459238e-05, + "loss": 0.021, + "step": 282390 + }, + { + "epoch": 1.82, + "learning_rate": 2.659855296023545e-05, + "loss": 0.0247, + "step": 282400 + }, + { + "epoch": 1.82, + "learning_rate": 2.6588871605878516e-05, + "loss": 0.0222, + "step": 282410 + }, + { + "epoch": 1.82, + "learning_rate": 2.6579190251521586e-05, + "loss": 0.0244, + "step": 282420 + }, + { + "epoch": 1.82, + "learning_rate": 2.656950889716465e-05, + "loss": 0.0222, + "step": 282430 + }, + { + "epoch": 1.82, + "learning_rate": 2.655982754280772e-05, + "loss": 0.0226, + "step": 282440 + }, + { + "epoch": 1.82, + "learning_rate": 2.6550146188450788e-05, + "loss": 0.0255, + "step": 282450 + }, + { + "epoch": 1.82, + "learning_rate": 2.6540464834093854e-05, + "loss": 0.0268, + "step": 282460 + }, + { + "epoch": 1.82, + "learning_rate": 2.6530783479736924e-05, + "loss": 0.0226, + "step": 282470 + }, + { + "epoch": 1.82, + "learning_rate": 2.6521102125379993e-05, + "loss": 0.0301, + "step": 282480 + }, + { + "epoch": 1.82, + "learning_rate": 2.651142077102306e-05, + "loss": 0.021, + "step": 282490 + }, + { + "epoch": 1.82, + "learning_rate": 2.6501739416666126e-05, + "loss": 0.0268, + "step": 282500 + }, + { + "epoch": 1.82, + "learning_rate": 2.6492058062309192e-05, + "loss": 0.022, + "step": 282510 + }, + { + "epoch": 1.82, + "learning_rate": 2.6482376707952262e-05, + "loss": 0.0235, + "step": 282520 + }, + { + "epoch": 1.82, + "learning_rate": 2.647269535359533e-05, + "loss": 0.0223, + "step": 282530 + }, + { + "epoch": 1.82, + "learning_rate": 2.6463013999238398e-05, + "loss": 0.0223, + "step": 282540 + }, + { + "epoch": 1.82, + "learning_rate": 2.6453332644881467e-05, + "loss": 0.0227, + "step": 282550 + }, + { + "epoch": 1.82, + "learning_rate": 2.6443651290524537e-05, + "loss": 0.0188, + "step": 282560 + }, + { + "epoch": 1.82, + "learning_rate": 2.64339699361676e-05, + "loss": 0.0208, + "step": 282570 + }, + { + "epoch": 1.82, + "learning_rate": 2.642428858181067e-05, + "loss": 0.0258, + "step": 282580 + }, + { + "epoch": 1.82, + "learning_rate": 2.6414607227453736e-05, + "loss": 0.0215, + "step": 282590 + }, + { + "epoch": 1.82, + "learning_rate": 2.6404925873096805e-05, + "loss": 0.0274, + "step": 282600 + }, + { + "epoch": 1.82, + "learning_rate": 2.6395244518739875e-05, + "loss": 0.0229, + "step": 282610 + }, + { + "epoch": 1.82, + "learning_rate": 2.638556316438294e-05, + "loss": 0.0232, + "step": 282620 + }, + { + "epoch": 1.82, + "learning_rate": 2.637588181002601e-05, + "loss": 0.0276, + "step": 282630 + }, + { + "epoch": 1.82, + "learning_rate": 2.6366200455669074e-05, + "loss": 0.0215, + "step": 282640 + }, + { + "epoch": 1.82, + "learning_rate": 2.6356519101312143e-05, + "loss": 0.0227, + "step": 282650 + }, + { + "epoch": 1.82, + "learning_rate": 2.6346837746955213e-05, + "loss": 0.0224, + "step": 282660 + }, + { + "epoch": 1.82, + "learning_rate": 2.633715639259828e-05, + "loss": 0.0258, + "step": 282670 + }, + { + "epoch": 1.82, + "learning_rate": 2.632747503824135e-05, + "loss": 0.0234, + "step": 282680 + }, + { + "epoch": 1.82, + "learning_rate": 2.631779368388442e-05, + "loss": 0.0285, + "step": 282690 + }, + { + "epoch": 1.82, + "learning_rate": 2.6308112329527485e-05, + "loss": 0.0202, + "step": 282700 + }, + { + "epoch": 1.82, + "learning_rate": 2.629843097517055e-05, + "loss": 0.0201, + "step": 282710 + }, + { + "epoch": 1.82, + "learning_rate": 2.6288749620813617e-05, + "loss": 0.0222, + "step": 282720 + }, + { + "epoch": 1.82, + "learning_rate": 2.6279068266456687e-05, + "loss": 0.0231, + "step": 282730 + }, + { + "epoch": 1.82, + "learning_rate": 2.6269386912099756e-05, + "loss": 0.0249, + "step": 282740 + }, + { + "epoch": 1.82, + "learning_rate": 2.6259705557742823e-05, + "loss": 0.0209, + "step": 282750 + }, + { + "epoch": 1.82, + "learning_rate": 2.6250024203385892e-05, + "loss": 0.0248, + "step": 282760 + }, + { + "epoch": 1.83, + "learning_rate": 2.6240342849028955e-05, + "loss": 0.0212, + "step": 282770 + }, + { + "epoch": 1.83, + "learning_rate": 2.6230661494672025e-05, + "loss": 0.0192, + "step": 282780 + }, + { + "epoch": 1.83, + "learning_rate": 2.6220980140315094e-05, + "loss": 0.0221, + "step": 282790 + }, + { + "epoch": 1.83, + "learning_rate": 2.621129878595816e-05, + "loss": 0.0252, + "step": 282800 + }, + { + "epoch": 1.83, + "learning_rate": 2.620161743160123e-05, + "loss": 0.0214, + "step": 282810 + }, + { + "epoch": 1.83, + "learning_rate": 2.6191936077244296e-05, + "loss": 0.0255, + "step": 282820 + }, + { + "epoch": 1.83, + "learning_rate": 2.6182254722887366e-05, + "loss": 0.0199, + "step": 282830 + }, + { + "epoch": 1.83, + "learning_rate": 2.6172573368530432e-05, + "loss": 0.0227, + "step": 282840 + }, + { + "epoch": 1.83, + "learning_rate": 2.61628920141735e-05, + "loss": 0.0322, + "step": 282850 + }, + { + "epoch": 1.83, + "learning_rate": 2.6153210659816568e-05, + "loss": 0.0236, + "step": 282860 + }, + { + "epoch": 1.83, + "learning_rate": 2.6143529305459634e-05, + "loss": 0.0194, + "step": 282870 + }, + { + "epoch": 1.83, + "learning_rate": 2.6133847951102704e-05, + "loss": 0.0207, + "step": 282880 + }, + { + "epoch": 1.83, + "learning_rate": 2.6124166596745774e-05, + "loss": 0.0229, + "step": 282890 + }, + { + "epoch": 1.83, + "learning_rate": 2.611448524238884e-05, + "loss": 0.0244, + "step": 282900 + }, + { + "epoch": 1.83, + "learning_rate": 2.6104803888031906e-05, + "loss": 0.0218, + "step": 282910 + }, + { + "epoch": 1.83, + "learning_rate": 2.6095122533674972e-05, + "loss": 0.0271, + "step": 282920 + }, + { + "epoch": 1.83, + "learning_rate": 2.6085441179318042e-05, + "loss": 0.0209, + "step": 282930 + }, + { + "epoch": 1.83, + "learning_rate": 2.607575982496111e-05, + "loss": 0.0266, + "step": 282940 + }, + { + "epoch": 1.83, + "learning_rate": 2.6066078470604178e-05, + "loss": 0.0286, + "step": 282950 + }, + { + "epoch": 1.83, + "learning_rate": 2.6056397116247247e-05, + "loss": 0.0234, + "step": 282960 + }, + { + "epoch": 1.83, + "learning_rate": 2.6046715761890317e-05, + "loss": 0.0267, + "step": 282970 + }, + { + "epoch": 1.83, + "learning_rate": 2.603703440753338e-05, + "loss": 0.0196, + "step": 282980 + }, + { + "epoch": 1.83, + "learning_rate": 2.602735305317645e-05, + "loss": 0.0252, + "step": 282990 + }, + { + "epoch": 1.83, + "learning_rate": 2.6017671698819516e-05, + "loss": 0.0248, + "step": 283000 + }, + { + "epoch": 1.83, + "eval_cer": 0.9198300756976613, + "eval_loss": 0.0171258095651865, + "eval_runtime": 119.8965, + "eval_samples_per_second": 16.681, + "eval_steps_per_second": 4.17, + "step": 283000 + }, + { + "epoch": 1.83, + "learning_rate": 2.6007990344462585e-05, + "loss": 0.0225, + "step": 283010 + }, + { + "epoch": 1.83, + "learning_rate": 2.5998308990105655e-05, + "loss": 0.0224, + "step": 283020 + }, + { + "epoch": 1.83, + "learning_rate": 2.598862763574872e-05, + "loss": 0.0191, + "step": 283030 + }, + { + "epoch": 1.83, + "learning_rate": 2.597894628139179e-05, + "loss": 0.0192, + "step": 283040 + }, + { + "epoch": 1.83, + "learning_rate": 2.5969264927034854e-05, + "loss": 0.0231, + "step": 283050 + }, + { + "epoch": 1.83, + "learning_rate": 2.5959583572677923e-05, + "loss": 0.0194, + "step": 283060 + }, + { + "epoch": 1.83, + "learning_rate": 2.5949902218320993e-05, + "loss": 0.029, + "step": 283070 + }, + { + "epoch": 1.83, + "learning_rate": 2.594022086396406e-05, + "loss": 0.0293, + "step": 283080 + }, + { + "epoch": 1.83, + "learning_rate": 2.593053950960713e-05, + "loss": 0.0197, + "step": 283090 + }, + { + "epoch": 1.83, + "learning_rate": 2.59208581552502e-05, + "loss": 0.0222, + "step": 283100 + }, + { + "epoch": 1.83, + "learning_rate": 2.5911176800893265e-05, + "loss": 0.023, + "step": 283110 + }, + { + "epoch": 1.83, + "learning_rate": 2.590149544653633e-05, + "loss": 0.027, + "step": 283120 + }, + { + "epoch": 1.83, + "learning_rate": 2.5891814092179397e-05, + "loss": 0.0266, + "step": 283130 + }, + { + "epoch": 1.83, + "learning_rate": 2.5882132737822467e-05, + "loss": 0.028, + "step": 283140 + }, + { + "epoch": 1.83, + "learning_rate": 2.5872451383465536e-05, + "loss": 0.023, + "step": 283150 + }, + { + "epoch": 1.83, + "learning_rate": 2.5862770029108603e-05, + "loss": 0.0231, + "step": 283160 + }, + { + "epoch": 1.83, + "learning_rate": 2.5853088674751672e-05, + "loss": 0.0249, + "step": 283170 + }, + { + "epoch": 1.83, + "learning_rate": 2.5843407320394742e-05, + "loss": 0.0281, + "step": 283180 + }, + { + "epoch": 1.83, + "learning_rate": 2.5833725966037805e-05, + "loss": 0.0224, + "step": 283190 + }, + { + "epoch": 1.83, + "learning_rate": 2.5824044611680874e-05, + "loss": 0.0258, + "step": 283200 + }, + { + "epoch": 1.83, + "learning_rate": 2.581436325732394e-05, + "loss": 0.0304, + "step": 283210 + }, + { + "epoch": 1.83, + "learning_rate": 2.580468190296701e-05, + "loss": 0.0235, + "step": 283220 + }, + { + "epoch": 1.83, + "learning_rate": 2.579500054861008e-05, + "loss": 0.0215, + "step": 283230 + }, + { + "epoch": 1.83, + "learning_rate": 2.5785319194253146e-05, + "loss": 0.0251, + "step": 283240 + }, + { + "epoch": 1.83, + "learning_rate": 2.5775637839896216e-05, + "loss": 0.0268, + "step": 283250 + }, + { + "epoch": 1.83, + "learning_rate": 2.576595648553928e-05, + "loss": 0.0244, + "step": 283260 + }, + { + "epoch": 1.83, + "learning_rate": 2.5756275131182348e-05, + "loss": 0.019, + "step": 283270 + }, + { + "epoch": 1.83, + "learning_rate": 2.5746593776825418e-05, + "loss": 0.0188, + "step": 283280 + }, + { + "epoch": 1.83, + "learning_rate": 2.5736912422468484e-05, + "loss": 0.0272, + "step": 283290 + }, + { + "epoch": 1.83, + "learning_rate": 2.5727231068111554e-05, + "loss": 0.0232, + "step": 283300 + }, + { + "epoch": 1.83, + "learning_rate": 2.5717549713754623e-05, + "loss": 0.025, + "step": 283310 + }, + { + "epoch": 1.83, + "learning_rate": 2.570786835939769e-05, + "loss": 0.0297, + "step": 283320 + }, + { + "epoch": 1.83, + "learning_rate": 2.5698187005040756e-05, + "loss": 0.0209, + "step": 283330 + }, + { + "epoch": 1.83, + "learning_rate": 2.5688505650683822e-05, + "loss": 0.0234, + "step": 283340 + }, + { + "epoch": 1.83, + "learning_rate": 2.5678824296326892e-05, + "loss": 0.0234, + "step": 283350 + }, + { + "epoch": 1.83, + "learning_rate": 2.566914294196996e-05, + "loss": 0.0192, + "step": 283360 + }, + { + "epoch": 1.83, + "learning_rate": 2.5659461587613028e-05, + "loss": 0.0233, + "step": 283370 + }, + { + "epoch": 1.83, + "learning_rate": 2.5649780233256097e-05, + "loss": 0.0232, + "step": 283380 + }, + { + "epoch": 1.83, + "learning_rate": 2.5640098878899163e-05, + "loss": 0.0227, + "step": 283390 + }, + { + "epoch": 1.83, + "learning_rate": 2.563041752454223e-05, + "loss": 0.019, + "step": 283400 + }, + { + "epoch": 1.83, + "learning_rate": 2.56207361701853e-05, + "loss": 0.0247, + "step": 283410 + }, + { + "epoch": 1.83, + "learning_rate": 2.5611054815828366e-05, + "loss": 0.0212, + "step": 283420 + }, + { + "epoch": 1.83, + "learning_rate": 2.5601373461471435e-05, + "loss": 0.0259, + "step": 283430 + }, + { + "epoch": 1.83, + "learning_rate": 2.55916921071145e-05, + "loss": 0.0223, + "step": 283440 + }, + { + "epoch": 1.83, + "learning_rate": 2.558201075275757e-05, + "loss": 0.0219, + "step": 283450 + }, + { + "epoch": 1.83, + "learning_rate": 2.557232939840064e-05, + "loss": 0.022, + "step": 283460 + }, + { + "epoch": 1.83, + "learning_rate": 2.5562648044043704e-05, + "loss": 0.0174, + "step": 283470 + }, + { + "epoch": 1.83, + "learning_rate": 2.5552966689686773e-05, + "loss": 0.0196, + "step": 283480 + }, + { + "epoch": 1.83, + "learning_rate": 2.554328533532984e-05, + "loss": 0.0218, + "step": 283490 + }, + { + "epoch": 1.83, + "learning_rate": 2.553360398097291e-05, + "loss": 0.023, + "step": 283500 + }, + { + "epoch": 1.83, + "learning_rate": 2.552392262661598e-05, + "loss": 0.0219, + "step": 283510 + }, + { + "epoch": 1.83, + "learning_rate": 2.5514241272259045e-05, + "loss": 0.0244, + "step": 283520 + }, + { + "epoch": 1.83, + "learning_rate": 2.5504559917902115e-05, + "loss": 0.0213, + "step": 283530 + }, + { + "epoch": 1.83, + "learning_rate": 2.549487856354518e-05, + "loss": 0.0284, + "step": 283540 + }, + { + "epoch": 1.83, + "learning_rate": 2.5485197209188247e-05, + "loss": 0.0247, + "step": 283550 + }, + { + "epoch": 1.83, + "learning_rate": 2.5475515854831317e-05, + "loss": 0.0269, + "step": 283560 + }, + { + "epoch": 1.83, + "learning_rate": 2.5465834500474383e-05, + "loss": 0.0223, + "step": 283570 + }, + { + "epoch": 1.83, + "learning_rate": 2.5456153146117453e-05, + "loss": 0.0328, + "step": 283580 + }, + { + "epoch": 1.83, + "learning_rate": 2.5446471791760522e-05, + "loss": 0.0224, + "step": 283590 + }, + { + "epoch": 1.83, + "learning_rate": 2.543679043740359e-05, + "loss": 0.0231, + "step": 283600 + }, + { + "epoch": 1.83, + "learning_rate": 2.5427109083046655e-05, + "loss": 0.0204, + "step": 283610 + }, + { + "epoch": 1.83, + "learning_rate": 2.541742772868972e-05, + "loss": 0.0202, + "step": 283620 + }, + { + "epoch": 1.83, + "learning_rate": 2.540774637433279e-05, + "loss": 0.0219, + "step": 283630 + }, + { + "epoch": 1.83, + "learning_rate": 2.539806501997586e-05, + "loss": 0.0224, + "step": 283640 + }, + { + "epoch": 1.83, + "learning_rate": 2.5388383665618926e-05, + "loss": 0.0196, + "step": 283650 + }, + { + "epoch": 1.83, + "learning_rate": 2.5378702311261996e-05, + "loss": 0.024, + "step": 283660 + }, + { + "epoch": 1.83, + "learning_rate": 2.536902095690506e-05, + "loss": 0.0232, + "step": 283670 + }, + { + "epoch": 1.83, + "learning_rate": 2.535933960254813e-05, + "loss": 0.0261, + "step": 283680 + }, + { + "epoch": 1.83, + "learning_rate": 2.5349658248191198e-05, + "loss": 0.0191, + "step": 283690 + }, + { + "epoch": 1.83, + "learning_rate": 2.5339976893834264e-05, + "loss": 0.0197, + "step": 283700 + }, + { + "epoch": 1.83, + "learning_rate": 2.5330295539477334e-05, + "loss": 0.0247, + "step": 283710 + }, + { + "epoch": 1.83, + "learning_rate": 2.5320614185120404e-05, + "loss": 0.0262, + "step": 283720 + }, + { + "epoch": 1.83, + "learning_rate": 2.531093283076347e-05, + "loss": 0.0212, + "step": 283730 + }, + { + "epoch": 1.83, + "learning_rate": 2.5301251476406536e-05, + "loss": 0.0268, + "step": 283740 + }, + { + "epoch": 1.83, + "learning_rate": 2.5291570122049602e-05, + "loss": 0.0209, + "step": 283750 + }, + { + "epoch": 1.83, + "learning_rate": 2.5281888767692672e-05, + "loss": 0.0201, + "step": 283760 + }, + { + "epoch": 1.83, + "learning_rate": 2.527220741333574e-05, + "loss": 0.0222, + "step": 283770 + }, + { + "epoch": 1.83, + "learning_rate": 2.5262526058978808e-05, + "loss": 0.024, + "step": 283780 + }, + { + "epoch": 1.83, + "learning_rate": 2.5252844704621877e-05, + "loss": 0.0216, + "step": 283790 + }, + { + "epoch": 1.83, + "learning_rate": 2.5243163350264947e-05, + "loss": 0.0315, + "step": 283800 + }, + { + "epoch": 1.83, + "learning_rate": 2.523348199590801e-05, + "loss": 0.0222, + "step": 283810 + }, + { + "epoch": 1.83, + "learning_rate": 2.522380064155108e-05, + "loss": 0.0206, + "step": 283820 + }, + { + "epoch": 1.83, + "learning_rate": 2.5214119287194146e-05, + "loss": 0.0235, + "step": 283830 + }, + { + "epoch": 1.83, + "learning_rate": 2.5204437932837215e-05, + "loss": 0.0251, + "step": 283840 + }, + { + "epoch": 1.83, + "learning_rate": 2.5194756578480285e-05, + "loss": 0.0261, + "step": 283850 + }, + { + "epoch": 1.83, + "learning_rate": 2.518507522412335e-05, + "loss": 0.0281, + "step": 283860 + }, + { + "epoch": 1.83, + "learning_rate": 2.517539386976642e-05, + "loss": 0.0244, + "step": 283870 + }, + { + "epoch": 1.83, + "learning_rate": 2.5165712515409484e-05, + "loss": 0.0219, + "step": 283880 + }, + { + "epoch": 1.83, + "learning_rate": 2.5156031161052553e-05, + "loss": 0.0232, + "step": 283890 + }, + { + "epoch": 1.83, + "learning_rate": 2.5146349806695623e-05, + "loss": 0.0266, + "step": 283900 + }, + { + "epoch": 1.83, + "learning_rate": 2.513666845233869e-05, + "loss": 0.024, + "step": 283910 + }, + { + "epoch": 1.83, + "learning_rate": 2.512698709798176e-05, + "loss": 0.0243, + "step": 283920 + }, + { + "epoch": 1.83, + "learning_rate": 2.511730574362483e-05, + "loss": 0.0222, + "step": 283930 + }, + { + "epoch": 1.83, + "learning_rate": 2.5107624389267895e-05, + "loss": 0.0232, + "step": 283940 + }, + { + "epoch": 1.83, + "learning_rate": 2.509794303491096e-05, + "loss": 0.0271, + "step": 283950 + }, + { + "epoch": 1.83, + "learning_rate": 2.5088261680554027e-05, + "loss": 0.0207, + "step": 283960 + }, + { + "epoch": 1.83, + "learning_rate": 2.5078580326197097e-05, + "loss": 0.0238, + "step": 283970 + }, + { + "epoch": 1.83, + "learning_rate": 2.5068898971840166e-05, + "loss": 0.0185, + "step": 283980 + }, + { + "epoch": 1.83, + "learning_rate": 2.5059217617483233e-05, + "loss": 0.0257, + "step": 283990 + }, + { + "epoch": 1.83, + "learning_rate": 2.5049536263126302e-05, + "loss": 0.0205, + "step": 284000 + }, + { + "epoch": 1.83, + "eval_cer": 0.919813806349565, + "eval_loss": 0.01731204241514206, + "eval_runtime": 119.8623, + "eval_samples_per_second": 16.686, + "eval_steps_per_second": 4.171, + "step": 284000 + }, + { + "epoch": 1.83, + "learning_rate": 2.5039854908769372e-05, + "loss": 0.0279, + "step": 284010 + }, + { + "epoch": 1.83, + "learning_rate": 2.5030173554412435e-05, + "loss": 0.024, + "step": 284020 + }, + { + "epoch": 1.83, + "learning_rate": 2.5020492200055504e-05, + "loss": 0.0262, + "step": 284030 + }, + { + "epoch": 1.83, + "learning_rate": 2.501081084569857e-05, + "loss": 0.021, + "step": 284040 + }, + { + "epoch": 1.83, + "learning_rate": 2.500112949134164e-05, + "loss": 0.0226, + "step": 284050 + }, + { + "epoch": 1.83, + "learning_rate": 2.499144813698471e-05, + "loss": 0.0215, + "step": 284060 + }, + { + "epoch": 1.83, + "learning_rate": 2.4981766782627776e-05, + "loss": 0.0256, + "step": 284070 + }, + { + "epoch": 1.83, + "learning_rate": 2.4972085428270846e-05, + "loss": 0.0201, + "step": 284080 + }, + { + "epoch": 1.83, + "learning_rate": 2.496240407391391e-05, + "loss": 0.0221, + "step": 284090 + }, + { + "epoch": 1.83, + "learning_rate": 2.4952722719556978e-05, + "loss": 0.0228, + "step": 284100 + }, + { + "epoch": 1.83, + "learning_rate": 2.4943041365200048e-05, + "loss": 0.0243, + "step": 284110 + }, + { + "epoch": 1.83, + "learning_rate": 2.4933360010843114e-05, + "loss": 0.0218, + "step": 284120 + }, + { + "epoch": 1.83, + "learning_rate": 2.4923678656486184e-05, + "loss": 0.0214, + "step": 284130 + }, + { + "epoch": 1.83, + "learning_rate": 2.491399730212925e-05, + "loss": 0.023, + "step": 284140 + }, + { + "epoch": 1.83, + "learning_rate": 2.490431594777232e-05, + "loss": 0.0267, + "step": 284150 + }, + { + "epoch": 1.83, + "learning_rate": 2.4894634593415386e-05, + "loss": 0.0212, + "step": 284160 + }, + { + "epoch": 1.83, + "learning_rate": 2.4884953239058452e-05, + "loss": 0.0182, + "step": 284170 + }, + { + "epoch": 1.83, + "learning_rate": 2.4875271884701522e-05, + "loss": 0.0231, + "step": 284180 + }, + { + "epoch": 1.83, + "learning_rate": 2.4865590530344588e-05, + "loss": 0.022, + "step": 284190 + }, + { + "epoch": 1.83, + "learning_rate": 2.4855909175987658e-05, + "loss": 0.0217, + "step": 284200 + }, + { + "epoch": 1.83, + "learning_rate": 2.4846227821630727e-05, + "loss": 0.0257, + "step": 284210 + }, + { + "epoch": 1.83, + "learning_rate": 2.4836546467273793e-05, + "loss": 0.0212, + "step": 284220 + }, + { + "epoch": 1.83, + "learning_rate": 2.482686511291686e-05, + "loss": 0.0251, + "step": 284230 + }, + { + "epoch": 1.83, + "learning_rate": 2.4817183758559926e-05, + "loss": 0.021, + "step": 284240 + }, + { + "epoch": 1.83, + "learning_rate": 2.4807502404202996e-05, + "loss": 0.0212, + "step": 284250 + }, + { + "epoch": 1.83, + "learning_rate": 2.4797821049846065e-05, + "loss": 0.023, + "step": 284260 + }, + { + "epoch": 1.83, + "learning_rate": 2.478813969548913e-05, + "loss": 0.0272, + "step": 284270 + }, + { + "epoch": 1.83, + "learning_rate": 2.47784583411322e-05, + "loss": 0.0256, + "step": 284280 + }, + { + "epoch": 1.83, + "learning_rate": 2.476877698677527e-05, + "loss": 0.0234, + "step": 284290 + }, + { + "epoch": 1.83, + "learning_rate": 2.4759095632418334e-05, + "loss": 0.0224, + "step": 284300 + }, + { + "epoch": 1.83, + "learning_rate": 2.4749414278061403e-05, + "loss": 0.0241, + "step": 284310 + }, + { + "epoch": 1.84, + "learning_rate": 2.473973292370447e-05, + "loss": 0.0197, + "step": 284320 + }, + { + "epoch": 1.84, + "learning_rate": 2.473005156934754e-05, + "loss": 0.0187, + "step": 284330 + }, + { + "epoch": 1.84, + "learning_rate": 2.472037021499061e-05, + "loss": 0.0233, + "step": 284340 + }, + { + "epoch": 1.84, + "learning_rate": 2.4710688860633675e-05, + "loss": 0.0205, + "step": 284350 + }, + { + "epoch": 1.84, + "learning_rate": 2.4701007506276745e-05, + "loss": 0.0241, + "step": 284360 + }, + { + "epoch": 1.84, + "learning_rate": 2.4691326151919807e-05, + "loss": 0.02, + "step": 284370 + }, + { + "epoch": 1.84, + "learning_rate": 2.4681644797562877e-05, + "loss": 0.0231, + "step": 284380 + }, + { + "epoch": 1.84, + "learning_rate": 2.4671963443205947e-05, + "loss": 0.0209, + "step": 284390 + }, + { + "epoch": 1.84, + "learning_rate": 2.4662282088849013e-05, + "loss": 0.0245, + "step": 284400 + }, + { + "epoch": 1.84, + "learning_rate": 2.4652600734492083e-05, + "loss": 0.0183, + "step": 284410 + }, + { + "epoch": 1.84, + "learning_rate": 2.4642919380135152e-05, + "loss": 0.029, + "step": 284420 + }, + { + "epoch": 1.84, + "learning_rate": 2.463323802577822e-05, + "loss": 0.0267, + "step": 284430 + }, + { + "epoch": 1.84, + "learning_rate": 2.4623556671421285e-05, + "loss": 0.0241, + "step": 284440 + }, + { + "epoch": 1.84, + "learning_rate": 2.461387531706435e-05, + "loss": 0.0226, + "step": 284450 + }, + { + "epoch": 1.84, + "learning_rate": 2.460419396270742e-05, + "loss": 0.023, + "step": 284460 + }, + { + "epoch": 1.84, + "learning_rate": 2.459451260835049e-05, + "loss": 0.0266, + "step": 284470 + }, + { + "epoch": 1.84, + "learning_rate": 2.4584831253993556e-05, + "loss": 0.0241, + "step": 284480 + }, + { + "epoch": 1.84, + "learning_rate": 2.4575149899636626e-05, + "loss": 0.0242, + "step": 284490 + }, + { + "epoch": 1.84, + "learning_rate": 2.456546854527969e-05, + "loss": 0.0181, + "step": 284500 + }, + { + "epoch": 1.84, + "learning_rate": 2.455578719092276e-05, + "loss": 0.0229, + "step": 284510 + }, + { + "epoch": 1.84, + "learning_rate": 2.4546105836565828e-05, + "loss": 0.0208, + "step": 284520 + }, + { + "epoch": 1.84, + "learning_rate": 2.4536424482208894e-05, + "loss": 0.0217, + "step": 284530 + }, + { + "epoch": 1.84, + "learning_rate": 2.4526743127851964e-05, + "loss": 0.0309, + "step": 284540 + }, + { + "epoch": 1.84, + "learning_rate": 2.4517061773495034e-05, + "loss": 0.023, + "step": 284550 + }, + { + "epoch": 1.84, + "learning_rate": 2.45073804191381e-05, + "loss": 0.0225, + "step": 284560 + }, + { + "epoch": 1.84, + "learning_rate": 2.4497699064781166e-05, + "loss": 0.0211, + "step": 284570 + }, + { + "epoch": 1.84, + "learning_rate": 2.4488017710424232e-05, + "loss": 0.0216, + "step": 284580 + }, + { + "epoch": 1.84, + "learning_rate": 2.4478336356067302e-05, + "loss": 0.0187, + "step": 284590 + }, + { + "epoch": 1.84, + "learning_rate": 2.446865500171037e-05, + "loss": 0.022, + "step": 284600 + }, + { + "epoch": 1.84, + "learning_rate": 2.4458973647353438e-05, + "loss": 0.0212, + "step": 284610 + }, + { + "epoch": 1.84, + "learning_rate": 2.4449292292996507e-05, + "loss": 0.0192, + "step": 284620 + }, + { + "epoch": 1.84, + "learning_rate": 2.4439610938639577e-05, + "loss": 0.0273, + "step": 284630 + }, + { + "epoch": 1.84, + "learning_rate": 2.442992958428264e-05, + "loss": 0.0267, + "step": 284640 + }, + { + "epoch": 1.84, + "learning_rate": 2.442024822992571e-05, + "loss": 0.0247, + "step": 284650 + }, + { + "epoch": 1.84, + "learning_rate": 2.4410566875568776e-05, + "loss": 0.0249, + "step": 284660 + }, + { + "epoch": 1.84, + "learning_rate": 2.4400885521211845e-05, + "loss": 0.0189, + "step": 284670 + }, + { + "epoch": 1.84, + "learning_rate": 2.4391204166854915e-05, + "loss": 0.0226, + "step": 284680 + }, + { + "epoch": 1.84, + "learning_rate": 2.438152281249798e-05, + "loss": 0.0198, + "step": 284690 + }, + { + "epoch": 1.84, + "learning_rate": 2.437184145814105e-05, + "loss": 0.0213, + "step": 284700 + }, + { + "epoch": 1.84, + "learning_rate": 2.4362160103784114e-05, + "loss": 0.0244, + "step": 284710 + }, + { + "epoch": 1.84, + "learning_rate": 2.4352478749427183e-05, + "loss": 0.0239, + "step": 284720 + }, + { + "epoch": 1.84, + "learning_rate": 2.4342797395070253e-05, + "loss": 0.025, + "step": 284730 + }, + { + "epoch": 1.84, + "learning_rate": 2.433311604071332e-05, + "loss": 0.0235, + "step": 284740 + }, + { + "epoch": 1.84, + "learning_rate": 2.432343468635639e-05, + "loss": 0.0213, + "step": 284750 + }, + { + "epoch": 1.84, + "learning_rate": 2.431375333199946e-05, + "loss": 0.0235, + "step": 284760 + }, + { + "epoch": 1.84, + "learning_rate": 2.4304071977642525e-05, + "loss": 0.0217, + "step": 284770 + }, + { + "epoch": 1.84, + "learning_rate": 2.429439062328559e-05, + "loss": 0.0232, + "step": 284780 + }, + { + "epoch": 1.84, + "learning_rate": 2.4284709268928657e-05, + "loss": 0.019, + "step": 284790 + }, + { + "epoch": 1.84, + "learning_rate": 2.4275027914571727e-05, + "loss": 0.0267, + "step": 284800 + }, + { + "epoch": 1.84, + "learning_rate": 2.4265346560214796e-05, + "loss": 0.0208, + "step": 284810 + }, + { + "epoch": 1.84, + "learning_rate": 2.4255665205857863e-05, + "loss": 0.0203, + "step": 284820 + }, + { + "epoch": 1.84, + "learning_rate": 2.4245983851500932e-05, + "loss": 0.0278, + "step": 284830 + }, + { + "epoch": 1.84, + "learning_rate": 2.4236302497144e-05, + "loss": 0.021, + "step": 284840 + }, + { + "epoch": 1.84, + "learning_rate": 2.4226621142787065e-05, + "loss": 0.0266, + "step": 284850 + }, + { + "epoch": 1.84, + "learning_rate": 2.4216939788430134e-05, + "loss": 0.0203, + "step": 284860 + }, + { + "epoch": 1.84, + "learning_rate": 2.42072584340732e-05, + "loss": 0.0269, + "step": 284870 + }, + { + "epoch": 1.84, + "learning_rate": 2.419757707971627e-05, + "loss": 0.0234, + "step": 284880 + }, + { + "epoch": 1.84, + "learning_rate": 2.4187895725359337e-05, + "loss": 0.0251, + "step": 284890 + }, + { + "epoch": 1.84, + "learning_rate": 2.4178214371002406e-05, + "loss": 0.0258, + "step": 284900 + }, + { + "epoch": 1.84, + "learning_rate": 2.4168533016645476e-05, + "loss": 0.0289, + "step": 284910 + }, + { + "epoch": 1.84, + "learning_rate": 2.415885166228854e-05, + "loss": 0.0223, + "step": 284920 + }, + { + "epoch": 1.84, + "learning_rate": 2.4149170307931608e-05, + "loss": 0.0209, + "step": 284930 + }, + { + "epoch": 1.84, + "learning_rate": 2.4139488953574675e-05, + "loss": 0.0217, + "step": 284940 + }, + { + "epoch": 1.84, + "learning_rate": 2.4129807599217744e-05, + "loss": 0.0192, + "step": 284950 + }, + { + "epoch": 1.84, + "learning_rate": 2.4120126244860814e-05, + "loss": 0.0227, + "step": 284960 + }, + { + "epoch": 1.84, + "learning_rate": 2.411044489050388e-05, + "loss": 0.0213, + "step": 284970 + }, + { + "epoch": 1.84, + "learning_rate": 2.410076353614695e-05, + "loss": 0.0219, + "step": 284980 + }, + { + "epoch": 1.84, + "learning_rate": 2.4091082181790012e-05, + "loss": 0.0234, + "step": 284990 + }, + { + "epoch": 1.84, + "learning_rate": 2.4081400827433082e-05, + "loss": 0.0231, + "step": 285000 + }, + { + "epoch": 1.84, + "eval_cer": 0.9198599028358377, + "eval_loss": 0.01720038801431656, + "eval_runtime": 120.0459, + "eval_samples_per_second": 16.66, + "eval_steps_per_second": 4.165, + "step": 285000 + }, + { + "epoch": 1.84, + "learning_rate": 2.4071719473076152e-05, + "loss": 0.0181, + "step": 285010 + }, + { + "epoch": 1.84, + "learning_rate": 2.4062038118719218e-05, + "loss": 0.0266, + "step": 285020 + }, + { + "epoch": 1.84, + "learning_rate": 2.4052356764362288e-05, + "loss": 0.0198, + "step": 285030 + }, + { + "epoch": 1.84, + "learning_rate": 2.4042675410005357e-05, + "loss": 0.0249, + "step": 285040 + }, + { + "epoch": 1.84, + "learning_rate": 2.4032994055648423e-05, + "loss": 0.0213, + "step": 285050 + }, + { + "epoch": 1.84, + "learning_rate": 2.402331270129149e-05, + "loss": 0.0286, + "step": 285060 + }, + { + "epoch": 1.84, + "learning_rate": 2.4013631346934556e-05, + "loss": 0.0241, + "step": 285070 + }, + { + "epoch": 1.84, + "learning_rate": 2.4003949992577626e-05, + "loss": 0.0222, + "step": 285080 + }, + { + "epoch": 1.84, + "learning_rate": 2.3994268638220695e-05, + "loss": 0.0228, + "step": 285090 + }, + { + "epoch": 1.84, + "learning_rate": 2.398458728386376e-05, + "loss": 0.0257, + "step": 285100 + }, + { + "epoch": 1.84, + "learning_rate": 2.397490592950683e-05, + "loss": 0.0248, + "step": 285110 + }, + { + "epoch": 1.84, + "learning_rate": 2.39652245751499e-05, + "loss": 0.0248, + "step": 285120 + }, + { + "epoch": 1.84, + "learning_rate": 2.3955543220792964e-05, + "loss": 0.0262, + "step": 285130 + }, + { + "epoch": 1.84, + "learning_rate": 2.3945861866436033e-05, + "loss": 0.0238, + "step": 285140 + }, + { + "epoch": 1.84, + "learning_rate": 2.39361805120791e-05, + "loss": 0.0173, + "step": 285150 + }, + { + "epoch": 1.84, + "learning_rate": 2.392649915772217e-05, + "loss": 0.028, + "step": 285160 + }, + { + "epoch": 1.84, + "learning_rate": 2.391681780336524e-05, + "loss": 0.0259, + "step": 285170 + }, + { + "epoch": 1.84, + "learning_rate": 2.3907136449008305e-05, + "loss": 0.0202, + "step": 285180 + }, + { + "epoch": 1.84, + "learning_rate": 2.3897455094651375e-05, + "loss": 0.0212, + "step": 285190 + }, + { + "epoch": 1.84, + "learning_rate": 2.3887773740294437e-05, + "loss": 0.018, + "step": 285200 + }, + { + "epoch": 1.84, + "learning_rate": 2.3878092385937507e-05, + "loss": 0.02, + "step": 285210 + }, + { + "epoch": 1.84, + "learning_rate": 2.3868411031580577e-05, + "loss": 0.0225, + "step": 285220 + }, + { + "epoch": 1.84, + "learning_rate": 2.3858729677223643e-05, + "loss": 0.0286, + "step": 285230 + }, + { + "epoch": 1.84, + "learning_rate": 2.3849048322866713e-05, + "loss": 0.0209, + "step": 285240 + }, + { + "epoch": 1.84, + "learning_rate": 2.3839366968509782e-05, + "loss": 0.0192, + "step": 285250 + }, + { + "epoch": 1.84, + "learning_rate": 2.382968561415285e-05, + "loss": 0.0258, + "step": 285260 + }, + { + "epoch": 1.84, + "learning_rate": 2.3820004259795915e-05, + "loss": 0.0237, + "step": 285270 + }, + { + "epoch": 1.84, + "learning_rate": 2.381032290543898e-05, + "loss": 0.0244, + "step": 285280 + }, + { + "epoch": 1.84, + "learning_rate": 2.380064155108205e-05, + "loss": 0.0239, + "step": 285290 + }, + { + "epoch": 1.84, + "learning_rate": 2.379096019672512e-05, + "loss": 0.0178, + "step": 285300 + }, + { + "epoch": 1.84, + "learning_rate": 2.3781278842368186e-05, + "loss": 0.0237, + "step": 285310 + }, + { + "epoch": 1.84, + "learning_rate": 2.3771597488011256e-05, + "loss": 0.0208, + "step": 285320 + }, + { + "epoch": 1.84, + "learning_rate": 2.3761916133654326e-05, + "loss": 0.0243, + "step": 285330 + }, + { + "epoch": 1.84, + "learning_rate": 2.375223477929739e-05, + "loss": 0.0253, + "step": 285340 + }, + { + "epoch": 1.84, + "learning_rate": 2.3742553424940458e-05, + "loss": 0.0238, + "step": 285350 + }, + { + "epoch": 1.84, + "learning_rate": 2.3732872070583524e-05, + "loss": 0.0246, + "step": 285360 + }, + { + "epoch": 1.84, + "learning_rate": 2.3723190716226594e-05, + "loss": 0.0231, + "step": 285370 + }, + { + "epoch": 1.84, + "learning_rate": 2.3713509361869664e-05, + "loss": 0.0183, + "step": 285380 + }, + { + "epoch": 1.84, + "learning_rate": 2.370382800751273e-05, + "loss": 0.0239, + "step": 285390 + }, + { + "epoch": 1.84, + "learning_rate": 2.3694146653155796e-05, + "loss": 0.0206, + "step": 285400 + }, + { + "epoch": 1.84, + "learning_rate": 2.3684465298798862e-05, + "loss": 0.0226, + "step": 285410 + }, + { + "epoch": 1.84, + "learning_rate": 2.3674783944441932e-05, + "loss": 0.0256, + "step": 285420 + }, + { + "epoch": 1.84, + "learning_rate": 2.3665102590085e-05, + "loss": 0.0219, + "step": 285430 + }, + { + "epoch": 1.84, + "learning_rate": 2.3655421235728068e-05, + "loss": 0.0223, + "step": 285440 + }, + { + "epoch": 1.84, + "learning_rate": 2.3645739881371137e-05, + "loss": 0.022, + "step": 285450 + }, + { + "epoch": 1.84, + "learning_rate": 2.3636058527014204e-05, + "loss": 0.0198, + "step": 285460 + }, + { + "epoch": 1.84, + "learning_rate": 2.362637717265727e-05, + "loss": 0.0206, + "step": 285470 + }, + { + "epoch": 1.84, + "learning_rate": 2.361669581830034e-05, + "loss": 0.0232, + "step": 285480 + }, + { + "epoch": 1.84, + "learning_rate": 2.3607014463943406e-05, + "loss": 0.0235, + "step": 285490 + }, + { + "epoch": 1.84, + "learning_rate": 2.3597333109586475e-05, + "loss": 0.0221, + "step": 285500 + }, + { + "epoch": 1.84, + "learning_rate": 2.358765175522954e-05, + "loss": 0.0212, + "step": 285510 + }, + { + "epoch": 1.84, + "learning_rate": 2.357797040087261e-05, + "loss": 0.0275, + "step": 285520 + }, + { + "epoch": 1.84, + "learning_rate": 2.356828904651568e-05, + "loss": 0.0235, + "step": 285530 + }, + { + "epoch": 1.84, + "learning_rate": 2.3558607692158744e-05, + "loss": 0.0191, + "step": 285540 + }, + { + "epoch": 1.84, + "learning_rate": 2.3548926337801813e-05, + "loss": 0.0261, + "step": 285550 + }, + { + "epoch": 1.84, + "learning_rate": 2.353924498344488e-05, + "loss": 0.0216, + "step": 285560 + }, + { + "epoch": 1.84, + "learning_rate": 2.352956362908795e-05, + "loss": 0.0216, + "step": 285570 + }, + { + "epoch": 1.84, + "learning_rate": 2.351988227473102e-05, + "loss": 0.0235, + "step": 285580 + }, + { + "epoch": 1.84, + "learning_rate": 2.3510200920374085e-05, + "loss": 0.0275, + "step": 285590 + }, + { + "epoch": 1.84, + "learning_rate": 2.3500519566017155e-05, + "loss": 0.0261, + "step": 285600 + }, + { + "epoch": 1.84, + "learning_rate": 2.3490838211660218e-05, + "loss": 0.0257, + "step": 285610 + }, + { + "epoch": 1.84, + "learning_rate": 2.3481156857303287e-05, + "loss": 0.0277, + "step": 285620 + }, + { + "epoch": 1.84, + "learning_rate": 2.3471475502946357e-05, + "loss": 0.0217, + "step": 285630 + }, + { + "epoch": 1.84, + "learning_rate": 2.3461794148589423e-05, + "loss": 0.0244, + "step": 285640 + }, + { + "epoch": 1.84, + "learning_rate": 2.3452112794232493e-05, + "loss": 0.0255, + "step": 285650 + }, + { + "epoch": 1.84, + "learning_rate": 2.3442431439875562e-05, + "loss": 0.0211, + "step": 285660 + }, + { + "epoch": 1.84, + "learning_rate": 2.343275008551863e-05, + "loss": 0.0285, + "step": 285670 + }, + { + "epoch": 1.84, + "learning_rate": 2.3423068731161695e-05, + "loss": 0.0213, + "step": 285680 + }, + { + "epoch": 1.84, + "learning_rate": 2.341338737680476e-05, + "loss": 0.0233, + "step": 285690 + }, + { + "epoch": 1.84, + "learning_rate": 2.340370602244783e-05, + "loss": 0.0228, + "step": 285700 + }, + { + "epoch": 1.84, + "learning_rate": 2.33940246680909e-05, + "loss": 0.0206, + "step": 285710 + }, + { + "epoch": 1.84, + "learning_rate": 2.3384343313733967e-05, + "loss": 0.0231, + "step": 285720 + }, + { + "epoch": 1.84, + "learning_rate": 2.3374661959377036e-05, + "loss": 0.0346, + "step": 285730 + }, + { + "epoch": 1.84, + "learning_rate": 2.3364980605020106e-05, + "loss": 0.0195, + "step": 285740 + }, + { + "epoch": 1.84, + "learning_rate": 2.335529925066317e-05, + "loss": 0.026, + "step": 285750 + }, + { + "epoch": 1.84, + "learning_rate": 2.3345617896306238e-05, + "loss": 0.0221, + "step": 285760 + }, + { + "epoch": 1.84, + "learning_rate": 2.3335936541949304e-05, + "loss": 0.0265, + "step": 285770 + }, + { + "epoch": 1.84, + "learning_rate": 2.3326255187592374e-05, + "loss": 0.0222, + "step": 285780 + }, + { + "epoch": 1.84, + "learning_rate": 2.3316573833235444e-05, + "loss": 0.0226, + "step": 285790 + }, + { + "epoch": 1.84, + "learning_rate": 2.330689247887851e-05, + "loss": 0.0226, + "step": 285800 + }, + { + "epoch": 1.84, + "learning_rate": 2.329721112452158e-05, + "loss": 0.022, + "step": 285810 + }, + { + "epoch": 1.84, + "learning_rate": 2.3287529770164642e-05, + "loss": 0.024, + "step": 285820 + }, + { + "epoch": 1.84, + "learning_rate": 2.3277848415807712e-05, + "loss": 0.0228, + "step": 285830 + }, + { + "epoch": 1.84, + "learning_rate": 2.3268167061450782e-05, + "loss": 0.0246, + "step": 285840 + }, + { + "epoch": 1.84, + "learning_rate": 2.3258485707093848e-05, + "loss": 0.0247, + "step": 285850 + }, + { + "epoch": 1.85, + "learning_rate": 2.3248804352736918e-05, + "loss": 0.0224, + "step": 285860 + }, + { + "epoch": 1.85, + "learning_rate": 2.3239122998379987e-05, + "loss": 0.026, + "step": 285870 + }, + { + "epoch": 1.85, + "learning_rate": 2.3229441644023053e-05, + "loss": 0.0238, + "step": 285880 + }, + { + "epoch": 1.85, + "learning_rate": 2.321976028966612e-05, + "loss": 0.0265, + "step": 285890 + }, + { + "epoch": 1.85, + "learning_rate": 2.3210078935309186e-05, + "loss": 0.0216, + "step": 285900 + }, + { + "epoch": 1.85, + "learning_rate": 2.3200397580952256e-05, + "loss": 0.029, + "step": 285910 + }, + { + "epoch": 1.85, + "learning_rate": 2.3190716226595325e-05, + "loss": 0.0242, + "step": 285920 + }, + { + "epoch": 1.85, + "learning_rate": 2.318103487223839e-05, + "loss": 0.0222, + "step": 285930 + }, + { + "epoch": 1.85, + "learning_rate": 2.317135351788146e-05, + "loss": 0.0192, + "step": 285940 + }, + { + "epoch": 1.85, + "learning_rate": 2.316167216352453e-05, + "loss": 0.0223, + "step": 285950 + }, + { + "epoch": 1.85, + "learning_rate": 2.3151990809167594e-05, + "loss": 0.021, + "step": 285960 + }, + { + "epoch": 1.85, + "learning_rate": 2.3142309454810663e-05, + "loss": 0.0256, + "step": 285970 + }, + { + "epoch": 1.85, + "learning_rate": 2.313262810045373e-05, + "loss": 0.0212, + "step": 285980 + }, + { + "epoch": 1.85, + "learning_rate": 2.31229467460968e-05, + "loss": 0.0251, + "step": 285990 + }, + { + "epoch": 1.85, + "learning_rate": 2.311326539173987e-05, + "loss": 0.0278, + "step": 286000 + }, + { + "epoch": 1.85, + "eval_cer": 0.9198391142243815, + "eval_loss": 0.017069820314645767, + "eval_runtime": 120.131, + "eval_samples_per_second": 16.648, + "eval_steps_per_second": 4.162, + "step": 286000 + }, + { + "epoch": 1.85, + "learning_rate": 2.3103584037382935e-05, + "loss": 0.0253, + "step": 286010 + }, + { + "epoch": 1.85, + "learning_rate": 2.3093902683026005e-05, + "loss": 0.0194, + "step": 286020 + }, + { + "epoch": 1.85, + "learning_rate": 2.3084221328669067e-05, + "loss": 0.0229, + "step": 286030 + }, + { + "epoch": 1.85, + "learning_rate": 2.3074539974312137e-05, + "loss": 0.0207, + "step": 286040 + }, + { + "epoch": 1.85, + "learning_rate": 2.3064858619955207e-05, + "loss": 0.0254, + "step": 286050 + }, + { + "epoch": 1.85, + "learning_rate": 2.3055177265598273e-05, + "loss": 0.0226, + "step": 286060 + }, + { + "epoch": 1.85, + "learning_rate": 2.3045495911241342e-05, + "loss": 0.0318, + "step": 286070 + }, + { + "epoch": 1.85, + "learning_rate": 2.3035814556884412e-05, + "loss": 0.0185, + "step": 286080 + }, + { + "epoch": 1.85, + "learning_rate": 2.302613320252748e-05, + "loss": 0.0243, + "step": 286090 + }, + { + "epoch": 1.85, + "learning_rate": 2.3016451848170545e-05, + "loss": 0.0232, + "step": 286100 + }, + { + "epoch": 1.85, + "learning_rate": 2.300677049381361e-05, + "loss": 0.0262, + "step": 286110 + }, + { + "epoch": 1.85, + "learning_rate": 2.299708913945668e-05, + "loss": 0.0173, + "step": 286120 + }, + { + "epoch": 1.85, + "learning_rate": 2.298740778509975e-05, + "loss": 0.0198, + "step": 286130 + }, + { + "epoch": 1.85, + "learning_rate": 2.2977726430742816e-05, + "loss": 0.021, + "step": 286140 + }, + { + "epoch": 1.85, + "learning_rate": 2.2968045076385886e-05, + "loss": 0.0229, + "step": 286150 + }, + { + "epoch": 1.85, + "learning_rate": 2.2958363722028952e-05, + "loss": 0.0216, + "step": 286160 + }, + { + "epoch": 1.85, + "learning_rate": 2.294868236767202e-05, + "loss": 0.0224, + "step": 286170 + }, + { + "epoch": 1.85, + "learning_rate": 2.2939001013315088e-05, + "loss": 0.0228, + "step": 286180 + }, + { + "epoch": 1.85, + "learning_rate": 2.2929319658958154e-05, + "loss": 0.0205, + "step": 286190 + }, + { + "epoch": 1.85, + "learning_rate": 2.2919638304601224e-05, + "loss": 0.027, + "step": 286200 + }, + { + "epoch": 1.85, + "learning_rate": 2.290995695024429e-05, + "loss": 0.0244, + "step": 286210 + }, + { + "epoch": 1.85, + "learning_rate": 2.290027559588736e-05, + "loss": 0.03, + "step": 286220 + }, + { + "epoch": 1.85, + "learning_rate": 2.2890594241530426e-05, + "loss": 0.0197, + "step": 286230 + }, + { + "epoch": 1.85, + "learning_rate": 2.2880912887173492e-05, + "loss": 0.0194, + "step": 286240 + }, + { + "epoch": 1.85, + "learning_rate": 2.2871231532816562e-05, + "loss": 0.0268, + "step": 286250 + }, + { + "epoch": 1.85, + "learning_rate": 2.2861550178459628e-05, + "loss": 0.0195, + "step": 286260 + }, + { + "epoch": 1.85, + "learning_rate": 2.2851868824102698e-05, + "loss": 0.0228, + "step": 286270 + }, + { + "epoch": 1.85, + "learning_rate": 2.2842187469745767e-05, + "loss": 0.0223, + "step": 286280 + }, + { + "epoch": 1.85, + "learning_rate": 2.2832506115388834e-05, + "loss": 0.0197, + "step": 286290 + }, + { + "epoch": 1.85, + "learning_rate": 2.28228247610319e-05, + "loss": 0.0212, + "step": 286300 + }, + { + "epoch": 1.85, + "learning_rate": 2.2813143406674966e-05, + "loss": 0.0259, + "step": 286310 + }, + { + "epoch": 1.85, + "learning_rate": 2.2803462052318036e-05, + "loss": 0.0243, + "step": 286320 + }, + { + "epoch": 1.85, + "learning_rate": 2.2793780697961105e-05, + "loss": 0.0278, + "step": 286330 + }, + { + "epoch": 1.85, + "learning_rate": 2.278409934360417e-05, + "loss": 0.0226, + "step": 286340 + }, + { + "epoch": 1.85, + "learning_rate": 2.277441798924724e-05, + "loss": 0.0206, + "step": 286350 + }, + { + "epoch": 1.85, + "learning_rate": 2.276473663489031e-05, + "loss": 0.022, + "step": 286360 + }, + { + "epoch": 1.85, + "learning_rate": 2.2755055280533374e-05, + "loss": 0.0227, + "step": 286370 + }, + { + "epoch": 1.85, + "learning_rate": 2.2745373926176443e-05, + "loss": 0.0235, + "step": 286380 + }, + { + "epoch": 1.85, + "learning_rate": 2.273569257181951e-05, + "loss": 0.0279, + "step": 286390 + }, + { + "epoch": 1.85, + "learning_rate": 2.272601121746258e-05, + "loss": 0.0195, + "step": 286400 + }, + { + "epoch": 1.85, + "learning_rate": 2.271632986310565e-05, + "loss": 0.0237, + "step": 286410 + }, + { + "epoch": 1.85, + "learning_rate": 2.2706648508748715e-05, + "loss": 0.0205, + "step": 286420 + }, + { + "epoch": 1.85, + "learning_rate": 2.2696967154391785e-05, + "loss": 0.0188, + "step": 286430 + }, + { + "epoch": 1.85, + "learning_rate": 2.2687285800034848e-05, + "loss": 0.0192, + "step": 286440 + }, + { + "epoch": 1.85, + "learning_rate": 2.2677604445677917e-05, + "loss": 0.0208, + "step": 286450 + }, + { + "epoch": 1.85, + "learning_rate": 2.2667923091320987e-05, + "loss": 0.0185, + "step": 286460 + }, + { + "epoch": 1.85, + "learning_rate": 2.2658241736964053e-05, + "loss": 0.0181, + "step": 286470 + }, + { + "epoch": 1.85, + "learning_rate": 2.2648560382607123e-05, + "loss": 0.0227, + "step": 286480 + }, + { + "epoch": 1.85, + "learning_rate": 2.2638879028250192e-05, + "loss": 0.0262, + "step": 286490 + }, + { + "epoch": 1.85, + "learning_rate": 2.262919767389326e-05, + "loss": 0.0224, + "step": 286500 + }, + { + "epoch": 1.85, + "learning_rate": 2.2619516319536325e-05, + "loss": 0.0187, + "step": 286510 + }, + { + "epoch": 1.85, + "learning_rate": 2.260983496517939e-05, + "loss": 0.0241, + "step": 286520 + }, + { + "epoch": 1.85, + "learning_rate": 2.260015361082246e-05, + "loss": 0.0178, + "step": 286530 + }, + { + "epoch": 1.85, + "learning_rate": 2.259047225646553e-05, + "loss": 0.0294, + "step": 286540 + }, + { + "epoch": 1.85, + "learning_rate": 2.2580790902108597e-05, + "loss": 0.0198, + "step": 286550 + }, + { + "epoch": 1.85, + "learning_rate": 2.2571109547751666e-05, + "loss": 0.0277, + "step": 286560 + }, + { + "epoch": 1.85, + "learning_rate": 2.2561428193394736e-05, + "loss": 0.0197, + "step": 286570 + }, + { + "epoch": 1.85, + "learning_rate": 2.25517468390378e-05, + "loss": 0.0304, + "step": 286580 + }, + { + "epoch": 1.85, + "learning_rate": 2.2542065484680868e-05, + "loss": 0.0245, + "step": 286590 + }, + { + "epoch": 1.85, + "learning_rate": 2.2532384130323934e-05, + "loss": 0.0269, + "step": 286600 + }, + { + "epoch": 1.85, + "learning_rate": 2.2522702775967004e-05, + "loss": 0.0233, + "step": 286610 + }, + { + "epoch": 1.85, + "learning_rate": 2.2513021421610074e-05, + "loss": 0.0243, + "step": 286620 + }, + { + "epoch": 1.85, + "learning_rate": 2.250334006725314e-05, + "loss": 0.0189, + "step": 286630 + }, + { + "epoch": 1.85, + "learning_rate": 2.249365871289621e-05, + "loss": 0.022, + "step": 286640 + }, + { + "epoch": 1.85, + "learning_rate": 2.2483977358539272e-05, + "loss": 0.0189, + "step": 286650 + }, + { + "epoch": 1.85, + "learning_rate": 2.2474296004182342e-05, + "loss": 0.0226, + "step": 286660 + }, + { + "epoch": 1.85, + "learning_rate": 2.2464614649825412e-05, + "loss": 0.0258, + "step": 286670 + }, + { + "epoch": 1.85, + "learning_rate": 2.2454933295468478e-05, + "loss": 0.0248, + "step": 286680 + }, + { + "epoch": 1.85, + "learning_rate": 2.2445251941111548e-05, + "loss": 0.0238, + "step": 286690 + }, + { + "epoch": 1.85, + "learning_rate": 2.2435570586754617e-05, + "loss": 0.0222, + "step": 286700 + }, + { + "epoch": 1.85, + "learning_rate": 2.2425889232397683e-05, + "loss": 0.0272, + "step": 286710 + }, + { + "epoch": 1.85, + "learning_rate": 2.241620787804075e-05, + "loss": 0.0222, + "step": 286720 + }, + { + "epoch": 1.85, + "learning_rate": 2.2406526523683816e-05, + "loss": 0.0197, + "step": 286730 + }, + { + "epoch": 1.85, + "learning_rate": 2.2396845169326886e-05, + "loss": 0.0239, + "step": 286740 + }, + { + "epoch": 1.85, + "learning_rate": 2.2387163814969955e-05, + "loss": 0.0207, + "step": 286750 + }, + { + "epoch": 1.85, + "learning_rate": 2.237748246061302e-05, + "loss": 0.0204, + "step": 286760 + }, + { + "epoch": 1.85, + "learning_rate": 2.236780110625609e-05, + "loss": 0.0221, + "step": 286770 + }, + { + "epoch": 1.85, + "learning_rate": 2.2358119751899157e-05, + "loss": 0.0208, + "step": 286780 + }, + { + "epoch": 1.85, + "learning_rate": 2.2348438397542224e-05, + "loss": 0.0306, + "step": 286790 + }, + { + "epoch": 1.85, + "learning_rate": 2.2338757043185293e-05, + "loss": 0.0256, + "step": 286800 + }, + { + "epoch": 1.85, + "learning_rate": 2.232907568882836e-05, + "loss": 0.021, + "step": 286810 + }, + { + "epoch": 1.85, + "learning_rate": 2.231939433447143e-05, + "loss": 0.0223, + "step": 286820 + }, + { + "epoch": 1.85, + "learning_rate": 2.2309712980114495e-05, + "loss": 0.0205, + "step": 286830 + }, + { + "epoch": 1.85, + "learning_rate": 2.2300031625757565e-05, + "loss": 0.0213, + "step": 286840 + }, + { + "epoch": 1.85, + "learning_rate": 2.2290350271400635e-05, + "loss": 0.0217, + "step": 286850 + }, + { + "epoch": 1.85, + "learning_rate": 2.2280668917043697e-05, + "loss": 0.0254, + "step": 286860 + }, + { + "epoch": 1.85, + "learning_rate": 2.2270987562686767e-05, + "loss": 0.0222, + "step": 286870 + }, + { + "epoch": 1.85, + "learning_rate": 2.2261306208329833e-05, + "loss": 0.0222, + "step": 286880 + }, + { + "epoch": 1.85, + "learning_rate": 2.2251624853972903e-05, + "loss": 0.023, + "step": 286890 + }, + { + "epoch": 1.85, + "learning_rate": 2.2241943499615972e-05, + "loss": 0.0213, + "step": 286900 + }, + { + "epoch": 1.85, + "learning_rate": 2.223226214525904e-05, + "loss": 0.0228, + "step": 286910 + }, + { + "epoch": 1.85, + "learning_rate": 2.222258079090211e-05, + "loss": 0.0245, + "step": 286920 + }, + { + "epoch": 1.85, + "learning_rate": 2.2212899436545175e-05, + "loss": 0.0227, + "step": 286930 + }, + { + "epoch": 1.85, + "learning_rate": 2.220321808218824e-05, + "loss": 0.0232, + "step": 286940 + }, + { + "epoch": 1.85, + "learning_rate": 2.219353672783131e-05, + "loss": 0.0256, + "step": 286950 + }, + { + "epoch": 1.85, + "learning_rate": 2.2183855373474377e-05, + "loss": 0.0223, + "step": 286960 + }, + { + "epoch": 1.85, + "learning_rate": 2.2174174019117446e-05, + "loss": 0.0259, + "step": 286970 + }, + { + "epoch": 1.85, + "learning_rate": 2.2164492664760516e-05, + "loss": 0.0225, + "step": 286980 + }, + { + "epoch": 1.85, + "learning_rate": 2.2154811310403582e-05, + "loss": 0.0199, + "step": 286990 + }, + { + "epoch": 1.85, + "learning_rate": 2.214512995604665e-05, + "loss": 0.0244, + "step": 287000 + }, + { + "epoch": 1.85, + "eval_cer": 0.9198436334877415, + "eval_loss": 0.017086287960410118, + "eval_runtime": 119.8872, + "eval_samples_per_second": 16.682, + "eval_steps_per_second": 4.171, + "step": 287000 + }, + { + "epoch": 1.85, + "learning_rate": 2.2135448601689715e-05, + "loss": 0.0207, + "step": 287010 + }, + { + "epoch": 1.85, + "learning_rate": 2.2125767247332784e-05, + "loss": 0.0265, + "step": 287020 + }, + { + "epoch": 1.85, + "learning_rate": 2.2116085892975854e-05, + "loss": 0.0233, + "step": 287030 + }, + { + "epoch": 1.85, + "learning_rate": 2.210640453861892e-05, + "loss": 0.023, + "step": 287040 + }, + { + "epoch": 1.85, + "learning_rate": 2.209672318426199e-05, + "loss": 0.0213, + "step": 287050 + }, + { + "epoch": 1.85, + "learning_rate": 2.208704182990506e-05, + "loss": 0.0221, + "step": 287060 + }, + { + "epoch": 1.85, + "learning_rate": 2.2077360475548122e-05, + "loss": 0.0221, + "step": 287070 + }, + { + "epoch": 1.85, + "learning_rate": 2.2067679121191192e-05, + "loss": 0.0203, + "step": 287080 + }, + { + "epoch": 1.85, + "learning_rate": 2.2057997766834258e-05, + "loss": 0.018, + "step": 287090 + }, + { + "epoch": 1.85, + "learning_rate": 2.2048316412477328e-05, + "loss": 0.0229, + "step": 287100 + }, + { + "epoch": 1.85, + "learning_rate": 2.2038635058120397e-05, + "loss": 0.0192, + "step": 287110 + }, + { + "epoch": 1.85, + "learning_rate": 2.2028953703763464e-05, + "loss": 0.0214, + "step": 287120 + }, + { + "epoch": 1.85, + "learning_rate": 2.201927234940653e-05, + "loss": 0.0192, + "step": 287130 + }, + { + "epoch": 1.85, + "learning_rate": 2.2009590995049596e-05, + "loss": 0.0237, + "step": 287140 + }, + { + "epoch": 1.85, + "learning_rate": 2.1999909640692666e-05, + "loss": 0.0257, + "step": 287150 + }, + { + "epoch": 1.85, + "learning_rate": 2.1990228286335735e-05, + "loss": 0.0214, + "step": 287160 + }, + { + "epoch": 1.85, + "learning_rate": 2.19805469319788e-05, + "loss": 0.0225, + "step": 287170 + }, + { + "epoch": 1.85, + "learning_rate": 2.197086557762187e-05, + "loss": 0.0265, + "step": 287180 + }, + { + "epoch": 1.85, + "learning_rate": 2.196118422326494e-05, + "loss": 0.0183, + "step": 287190 + }, + { + "epoch": 1.85, + "learning_rate": 2.1951502868908004e-05, + "loss": 0.0209, + "step": 287200 + }, + { + "epoch": 1.85, + "learning_rate": 2.1941821514551073e-05, + "loss": 0.0182, + "step": 287210 + }, + { + "epoch": 1.85, + "learning_rate": 2.193214016019414e-05, + "loss": 0.0234, + "step": 287220 + }, + { + "epoch": 1.85, + "learning_rate": 2.192245880583721e-05, + "loss": 0.0237, + "step": 287230 + }, + { + "epoch": 1.85, + "learning_rate": 2.191277745148028e-05, + "loss": 0.0217, + "step": 287240 + }, + { + "epoch": 1.85, + "learning_rate": 2.1903096097123345e-05, + "loss": 0.0223, + "step": 287250 + }, + { + "epoch": 1.85, + "learning_rate": 2.1893414742766415e-05, + "loss": 0.0188, + "step": 287260 + }, + { + "epoch": 1.85, + "learning_rate": 2.1883733388409478e-05, + "loss": 0.0208, + "step": 287270 + }, + { + "epoch": 1.85, + "learning_rate": 2.1874052034052547e-05, + "loss": 0.0191, + "step": 287280 + }, + { + "epoch": 1.85, + "learning_rate": 2.1864370679695617e-05, + "loss": 0.0209, + "step": 287290 + }, + { + "epoch": 1.85, + "learning_rate": 2.1854689325338683e-05, + "loss": 0.0185, + "step": 287300 + }, + { + "epoch": 1.85, + "learning_rate": 2.1845007970981753e-05, + "loss": 0.0255, + "step": 287310 + }, + { + "epoch": 1.85, + "learning_rate": 2.1835326616624822e-05, + "loss": 0.021, + "step": 287320 + }, + { + "epoch": 1.85, + "learning_rate": 2.182564526226789e-05, + "loss": 0.0232, + "step": 287330 + }, + { + "epoch": 1.85, + "learning_rate": 2.1815963907910955e-05, + "loss": 0.029, + "step": 287340 + }, + { + "epoch": 1.85, + "learning_rate": 2.180628255355402e-05, + "loss": 0.0194, + "step": 287350 + }, + { + "epoch": 1.85, + "learning_rate": 2.179660119919709e-05, + "loss": 0.022, + "step": 287360 + }, + { + "epoch": 1.85, + "learning_rate": 2.178691984484016e-05, + "loss": 0.0242, + "step": 287370 + }, + { + "epoch": 1.85, + "learning_rate": 2.1777238490483226e-05, + "loss": 0.0208, + "step": 287380 + }, + { + "epoch": 1.85, + "learning_rate": 2.1767557136126296e-05, + "loss": 0.0263, + "step": 287390 + }, + { + "epoch": 1.85, + "learning_rate": 2.1757875781769366e-05, + "loss": 0.0207, + "step": 287400 + }, + { + "epoch": 1.86, + "learning_rate": 2.174819442741243e-05, + "loss": 0.0241, + "step": 287410 + }, + { + "epoch": 1.86, + "learning_rate": 2.1738513073055498e-05, + "loss": 0.0259, + "step": 287420 + }, + { + "epoch": 1.86, + "learning_rate": 2.1728831718698564e-05, + "loss": 0.0247, + "step": 287430 + }, + { + "epoch": 1.86, + "learning_rate": 2.1719150364341634e-05, + "loss": 0.0222, + "step": 287440 + }, + { + "epoch": 1.86, + "learning_rate": 2.1709469009984704e-05, + "loss": 0.0344, + "step": 287450 + }, + { + "epoch": 1.86, + "learning_rate": 2.169978765562777e-05, + "loss": 0.0215, + "step": 287460 + }, + { + "epoch": 1.86, + "learning_rate": 2.169010630127084e-05, + "loss": 0.0187, + "step": 287470 + }, + { + "epoch": 1.86, + "learning_rate": 2.1680424946913902e-05, + "loss": 0.0217, + "step": 287480 + }, + { + "epoch": 1.86, + "learning_rate": 2.1670743592556972e-05, + "loss": 0.0225, + "step": 287490 + }, + { + "epoch": 1.86, + "learning_rate": 2.166106223820004e-05, + "loss": 0.0189, + "step": 287500 + }, + { + "epoch": 1.86, + "learning_rate": 2.1651380883843108e-05, + "loss": 0.0209, + "step": 287510 + }, + { + "epoch": 1.86, + "learning_rate": 2.1641699529486178e-05, + "loss": 0.0255, + "step": 287520 + }, + { + "epoch": 1.86, + "learning_rate": 2.1632018175129244e-05, + "loss": 0.0215, + "step": 287530 + }, + { + "epoch": 1.86, + "learning_rate": 2.1622336820772313e-05, + "loss": 0.0225, + "step": 287540 + }, + { + "epoch": 1.86, + "learning_rate": 2.161265546641538e-05, + "loss": 0.0241, + "step": 287550 + }, + { + "epoch": 1.86, + "learning_rate": 2.1602974112058446e-05, + "loss": 0.0262, + "step": 287560 + }, + { + "epoch": 1.86, + "learning_rate": 2.1593292757701516e-05, + "loss": 0.0231, + "step": 287570 + }, + { + "epoch": 1.86, + "learning_rate": 2.1583611403344582e-05, + "loss": 0.019, + "step": 287580 + }, + { + "epoch": 1.86, + "learning_rate": 2.157393004898765e-05, + "loss": 0.019, + "step": 287590 + }, + { + "epoch": 1.86, + "learning_rate": 2.156424869463072e-05, + "loss": 0.0241, + "step": 287600 + }, + { + "epoch": 1.86, + "learning_rate": 2.1554567340273787e-05, + "loss": 0.0202, + "step": 287610 + }, + { + "epoch": 1.86, + "learning_rate": 2.1544885985916854e-05, + "loss": 0.0285, + "step": 287620 + }, + { + "epoch": 1.86, + "learning_rate": 2.153520463155992e-05, + "loss": 0.0207, + "step": 287630 + }, + { + "epoch": 1.86, + "learning_rate": 2.152552327720299e-05, + "loss": 0.0204, + "step": 287640 + }, + { + "epoch": 1.86, + "learning_rate": 2.151584192284606e-05, + "loss": 0.0251, + "step": 287650 + }, + { + "epoch": 1.86, + "learning_rate": 2.1506160568489125e-05, + "loss": 0.0212, + "step": 287660 + }, + { + "epoch": 1.86, + "learning_rate": 2.1496479214132195e-05, + "loss": 0.0196, + "step": 287670 + }, + { + "epoch": 1.86, + "learning_rate": 2.1486797859775264e-05, + "loss": 0.0184, + "step": 287680 + }, + { + "epoch": 1.86, + "learning_rate": 2.1477116505418327e-05, + "loss": 0.0205, + "step": 287690 + }, + { + "epoch": 1.86, + "learning_rate": 2.1467435151061397e-05, + "loss": 0.0217, + "step": 287700 + }, + { + "epoch": 1.86, + "learning_rate": 2.1457753796704463e-05, + "loss": 0.0225, + "step": 287710 + }, + { + "epoch": 1.86, + "learning_rate": 2.1448072442347533e-05, + "loss": 0.0229, + "step": 287720 + }, + { + "epoch": 1.86, + "learning_rate": 2.1438391087990602e-05, + "loss": 0.0215, + "step": 287730 + }, + { + "epoch": 1.86, + "learning_rate": 2.142870973363367e-05, + "loss": 0.0237, + "step": 287740 + }, + { + "epoch": 1.86, + "learning_rate": 2.141902837927674e-05, + "loss": 0.0273, + "step": 287750 + }, + { + "epoch": 1.86, + "learning_rate": 2.14093470249198e-05, + "loss": 0.0264, + "step": 287760 + }, + { + "epoch": 1.86, + "learning_rate": 2.139966567056287e-05, + "loss": 0.0275, + "step": 287770 + }, + { + "epoch": 1.86, + "learning_rate": 2.138998431620594e-05, + "loss": 0.0215, + "step": 287780 + }, + { + "epoch": 1.86, + "learning_rate": 2.1380302961849007e-05, + "loss": 0.0211, + "step": 287790 + }, + { + "epoch": 1.86, + "learning_rate": 2.1370621607492076e-05, + "loss": 0.0228, + "step": 287800 + }, + { + "epoch": 1.86, + "learning_rate": 2.1360940253135146e-05, + "loss": 0.0276, + "step": 287810 + }, + { + "epoch": 1.86, + "learning_rate": 2.1351258898778212e-05, + "loss": 0.0221, + "step": 287820 + }, + { + "epoch": 1.86, + "learning_rate": 2.134157754442128e-05, + "loss": 0.0227, + "step": 287830 + }, + { + "epoch": 1.86, + "learning_rate": 2.1331896190064345e-05, + "loss": 0.0244, + "step": 287840 + }, + { + "epoch": 1.86, + "learning_rate": 2.1322214835707414e-05, + "loss": 0.0268, + "step": 287850 + }, + { + "epoch": 1.86, + "learning_rate": 2.1312533481350484e-05, + "loss": 0.0249, + "step": 287860 + }, + { + "epoch": 1.86, + "learning_rate": 2.130285212699355e-05, + "loss": 0.0271, + "step": 287870 + }, + { + "epoch": 1.86, + "learning_rate": 2.129317077263662e-05, + "loss": 0.0221, + "step": 287880 + }, + { + "epoch": 1.86, + "learning_rate": 2.128348941827969e-05, + "loss": 0.0217, + "step": 287890 + }, + { + "epoch": 1.86, + "learning_rate": 2.1273808063922752e-05, + "loss": 0.0246, + "step": 287900 + }, + { + "epoch": 1.86, + "learning_rate": 2.1264126709565822e-05, + "loss": 0.026, + "step": 287910 + }, + { + "epoch": 1.86, + "learning_rate": 2.1254445355208888e-05, + "loss": 0.0267, + "step": 287920 + }, + { + "epoch": 1.86, + "learning_rate": 2.1244764000851958e-05, + "loss": 0.0246, + "step": 287930 + }, + { + "epoch": 1.86, + "learning_rate": 2.1235082646495027e-05, + "loss": 0.0205, + "step": 287940 + }, + { + "epoch": 1.86, + "learning_rate": 2.1225401292138094e-05, + "loss": 0.0197, + "step": 287950 + }, + { + "epoch": 1.86, + "learning_rate": 2.121571993778116e-05, + "loss": 0.022, + "step": 287960 + }, + { + "epoch": 1.86, + "learning_rate": 2.1206038583424226e-05, + "loss": 0.0237, + "step": 287970 + }, + { + "epoch": 1.86, + "learning_rate": 2.1196357229067296e-05, + "loss": 0.022, + "step": 287980 + }, + { + "epoch": 1.86, + "learning_rate": 2.1186675874710365e-05, + "loss": 0.0299, + "step": 287990 + }, + { + "epoch": 1.86, + "learning_rate": 2.117699452035343e-05, + "loss": 0.0223, + "step": 288000 + }, + { + "epoch": 1.86, + "eval_cer": 0.9198327872556773, + "eval_loss": 0.016944361850619316, + "eval_runtime": 120.4246, + "eval_samples_per_second": 16.608, + "eval_steps_per_second": 4.152, + "step": 288000 + }, + { + "epoch": 1.86, + "learning_rate": 2.11673131659965e-05, + "loss": 0.025, + "step": 288010 + }, + { + "epoch": 1.86, + "learning_rate": 2.115763181163957e-05, + "loss": 0.0272, + "step": 288020 + }, + { + "epoch": 1.86, + "learning_rate": 2.1147950457282634e-05, + "loss": 0.028, + "step": 288030 + }, + { + "epoch": 1.86, + "learning_rate": 2.1138269102925703e-05, + "loss": 0.0282, + "step": 288040 + }, + { + "epoch": 1.86, + "learning_rate": 2.112858774856877e-05, + "loss": 0.0293, + "step": 288050 + }, + { + "epoch": 1.86, + "learning_rate": 2.111890639421184e-05, + "loss": 0.0233, + "step": 288060 + }, + { + "epoch": 1.86, + "learning_rate": 2.110922503985491e-05, + "loss": 0.0248, + "step": 288070 + }, + { + "epoch": 1.86, + "learning_rate": 2.1099543685497975e-05, + "loss": 0.0184, + "step": 288080 + }, + { + "epoch": 1.86, + "learning_rate": 2.1089862331141045e-05, + "loss": 0.0227, + "step": 288090 + }, + { + "epoch": 1.86, + "learning_rate": 2.1080180976784108e-05, + "loss": 0.0218, + "step": 288100 + }, + { + "epoch": 1.86, + "learning_rate": 2.1070499622427177e-05, + "loss": 0.02, + "step": 288110 + }, + { + "epoch": 1.86, + "learning_rate": 2.1060818268070247e-05, + "loss": 0.0231, + "step": 288120 + }, + { + "epoch": 1.86, + "learning_rate": 2.1051136913713313e-05, + "loss": 0.0227, + "step": 288130 + }, + { + "epoch": 1.86, + "learning_rate": 2.1041455559356383e-05, + "loss": 0.0224, + "step": 288140 + }, + { + "epoch": 1.86, + "learning_rate": 2.1031774204999452e-05, + "loss": 0.0211, + "step": 288150 + }, + { + "epoch": 1.86, + "learning_rate": 2.102209285064252e-05, + "loss": 0.0257, + "step": 288160 + }, + { + "epoch": 1.86, + "learning_rate": 2.1012411496285585e-05, + "loss": 0.0225, + "step": 288170 + }, + { + "epoch": 1.86, + "learning_rate": 2.100273014192865e-05, + "loss": 0.0189, + "step": 288180 + }, + { + "epoch": 1.86, + "learning_rate": 2.099304878757172e-05, + "loss": 0.0247, + "step": 288190 + }, + { + "epoch": 1.86, + "learning_rate": 2.098336743321479e-05, + "loss": 0.0207, + "step": 288200 + }, + { + "epoch": 1.86, + "learning_rate": 2.0973686078857856e-05, + "loss": 0.0244, + "step": 288210 + }, + { + "epoch": 1.86, + "learning_rate": 2.0964004724500926e-05, + "loss": 0.0244, + "step": 288220 + }, + { + "epoch": 1.86, + "learning_rate": 2.0954323370143992e-05, + "loss": 0.0222, + "step": 288230 + }, + { + "epoch": 1.86, + "learning_rate": 2.094464201578706e-05, + "loss": 0.0219, + "step": 288240 + }, + { + "epoch": 1.86, + "learning_rate": 2.0934960661430128e-05, + "loss": 0.0243, + "step": 288250 + }, + { + "epoch": 1.86, + "learning_rate": 2.0925279307073194e-05, + "loss": 0.0197, + "step": 288260 + }, + { + "epoch": 1.86, + "learning_rate": 2.0915597952716264e-05, + "loss": 0.025, + "step": 288270 + }, + { + "epoch": 1.86, + "learning_rate": 2.090591659835933e-05, + "loss": 0.0246, + "step": 288280 + }, + { + "epoch": 1.86, + "learning_rate": 2.08962352440024e-05, + "loss": 0.022, + "step": 288290 + }, + { + "epoch": 1.86, + "learning_rate": 2.088655388964547e-05, + "loss": 0.0222, + "step": 288300 + }, + { + "epoch": 1.86, + "learning_rate": 2.0876872535288532e-05, + "loss": 0.0271, + "step": 288310 + }, + { + "epoch": 1.86, + "learning_rate": 2.0867191180931602e-05, + "loss": 0.0207, + "step": 288320 + }, + { + "epoch": 1.86, + "learning_rate": 2.0857509826574668e-05, + "loss": 0.0178, + "step": 288330 + }, + { + "epoch": 1.86, + "learning_rate": 2.0847828472217738e-05, + "loss": 0.023, + "step": 288340 + }, + { + "epoch": 1.86, + "learning_rate": 2.0838147117860808e-05, + "loss": 0.0235, + "step": 288350 + }, + { + "epoch": 1.86, + "learning_rate": 2.0828465763503874e-05, + "loss": 0.0177, + "step": 288360 + }, + { + "epoch": 1.86, + "learning_rate": 2.0818784409146943e-05, + "loss": 0.0243, + "step": 288370 + }, + { + "epoch": 1.86, + "learning_rate": 2.0809103054790006e-05, + "loss": 0.0214, + "step": 288380 + }, + { + "epoch": 1.86, + "learning_rate": 2.0799421700433076e-05, + "loss": 0.0221, + "step": 288390 + }, + { + "epoch": 1.86, + "learning_rate": 2.0789740346076146e-05, + "loss": 0.0203, + "step": 288400 + }, + { + "epoch": 1.86, + "learning_rate": 2.0780058991719212e-05, + "loss": 0.0175, + "step": 288410 + }, + { + "epoch": 1.86, + "learning_rate": 2.077037763736228e-05, + "loss": 0.0201, + "step": 288420 + }, + { + "epoch": 1.86, + "learning_rate": 2.076069628300535e-05, + "loss": 0.025, + "step": 288430 + }, + { + "epoch": 1.86, + "learning_rate": 2.0751014928648417e-05, + "loss": 0.0187, + "step": 288440 + }, + { + "epoch": 1.86, + "learning_rate": 2.0741333574291483e-05, + "loss": 0.0225, + "step": 288450 + }, + { + "epoch": 1.86, + "learning_rate": 2.073165221993455e-05, + "loss": 0.0215, + "step": 288460 + }, + { + "epoch": 1.86, + "learning_rate": 2.072197086557762e-05, + "loss": 0.0233, + "step": 288470 + }, + { + "epoch": 1.86, + "learning_rate": 2.071228951122069e-05, + "loss": 0.0212, + "step": 288480 + }, + { + "epoch": 1.86, + "learning_rate": 2.0702608156863755e-05, + "loss": 0.0264, + "step": 288490 + }, + { + "epoch": 1.86, + "learning_rate": 2.0692926802506825e-05, + "loss": 0.0206, + "step": 288500 + }, + { + "epoch": 1.86, + "learning_rate": 2.0683245448149894e-05, + "loss": 0.0208, + "step": 288510 + }, + { + "epoch": 1.86, + "learning_rate": 2.0673564093792957e-05, + "loss": 0.0295, + "step": 288520 + }, + { + "epoch": 1.86, + "learning_rate": 2.0663882739436027e-05, + "loss": 0.0207, + "step": 288530 + }, + { + "epoch": 1.86, + "learning_rate": 2.0654201385079093e-05, + "loss": 0.0213, + "step": 288540 + }, + { + "epoch": 1.86, + "learning_rate": 2.0644520030722163e-05, + "loss": 0.0183, + "step": 288550 + }, + { + "epoch": 1.86, + "learning_rate": 2.0634838676365232e-05, + "loss": 0.0213, + "step": 288560 + }, + { + "epoch": 1.86, + "learning_rate": 2.06251573220083e-05, + "loss": 0.0219, + "step": 288570 + }, + { + "epoch": 1.86, + "learning_rate": 2.061547596765137e-05, + "loss": 0.024, + "step": 288580 + }, + { + "epoch": 1.86, + "learning_rate": 2.060579461329443e-05, + "loss": 0.0185, + "step": 288590 + }, + { + "epoch": 1.86, + "learning_rate": 2.05961132589375e-05, + "loss": 0.0271, + "step": 288600 + }, + { + "epoch": 1.86, + "learning_rate": 2.058643190458057e-05, + "loss": 0.0255, + "step": 288610 + }, + { + "epoch": 1.86, + "learning_rate": 2.0576750550223637e-05, + "loss": 0.0278, + "step": 288620 + }, + { + "epoch": 1.86, + "learning_rate": 2.0567069195866706e-05, + "loss": 0.0206, + "step": 288630 + }, + { + "epoch": 1.86, + "learning_rate": 2.0557387841509776e-05, + "loss": 0.024, + "step": 288640 + }, + { + "epoch": 1.86, + "learning_rate": 2.0547706487152842e-05, + "loss": 0.021, + "step": 288650 + }, + { + "epoch": 1.86, + "learning_rate": 2.053802513279591e-05, + "loss": 0.0278, + "step": 288660 + }, + { + "epoch": 1.86, + "learning_rate": 2.0528343778438975e-05, + "loss": 0.0231, + "step": 288670 + }, + { + "epoch": 1.86, + "learning_rate": 2.0518662424082044e-05, + "loss": 0.0242, + "step": 288680 + }, + { + "epoch": 1.86, + "learning_rate": 2.0508981069725114e-05, + "loss": 0.019, + "step": 288690 + }, + { + "epoch": 1.86, + "learning_rate": 2.049929971536818e-05, + "loss": 0.0216, + "step": 288700 + }, + { + "epoch": 1.86, + "learning_rate": 2.048961836101125e-05, + "loss": 0.0221, + "step": 288710 + }, + { + "epoch": 1.86, + "learning_rate": 2.047993700665432e-05, + "loss": 0.0245, + "step": 288720 + }, + { + "epoch": 1.86, + "learning_rate": 2.0470255652297382e-05, + "loss": 0.0231, + "step": 288730 + }, + { + "epoch": 1.86, + "learning_rate": 2.0460574297940452e-05, + "loss": 0.0216, + "step": 288740 + }, + { + "epoch": 1.86, + "learning_rate": 2.0450892943583518e-05, + "loss": 0.0234, + "step": 288750 + }, + { + "epoch": 1.86, + "learning_rate": 2.0441211589226588e-05, + "loss": 0.0217, + "step": 288760 + }, + { + "epoch": 1.86, + "learning_rate": 2.0431530234869657e-05, + "loss": 0.0238, + "step": 288770 + }, + { + "epoch": 1.86, + "learning_rate": 2.0421848880512724e-05, + "loss": 0.0208, + "step": 288780 + }, + { + "epoch": 1.86, + "learning_rate": 2.041216752615579e-05, + "loss": 0.0252, + "step": 288790 + }, + { + "epoch": 1.86, + "learning_rate": 2.0402486171798856e-05, + "loss": 0.0195, + "step": 288800 + }, + { + "epoch": 1.86, + "learning_rate": 2.0392804817441926e-05, + "loss": 0.0242, + "step": 288810 + }, + { + "epoch": 1.86, + "learning_rate": 2.0383123463084995e-05, + "loss": 0.0252, + "step": 288820 + }, + { + "epoch": 1.86, + "learning_rate": 2.037344210872806e-05, + "loss": 0.025, + "step": 288830 + }, + { + "epoch": 1.86, + "learning_rate": 2.036376075437113e-05, + "loss": 0.0286, + "step": 288840 + }, + { + "epoch": 1.86, + "learning_rate": 2.0354079400014197e-05, + "loss": 0.0181, + "step": 288850 + }, + { + "epoch": 1.86, + "learning_rate": 2.0344398045657264e-05, + "loss": 0.0233, + "step": 288860 + }, + { + "epoch": 1.86, + "learning_rate": 2.0334716691300333e-05, + "loss": 0.0216, + "step": 288870 + }, + { + "epoch": 1.86, + "learning_rate": 2.03250353369434e-05, + "loss": 0.0275, + "step": 288880 + }, + { + "epoch": 1.86, + "learning_rate": 2.031535398258647e-05, + "loss": 0.0263, + "step": 288890 + }, + { + "epoch": 1.86, + "learning_rate": 2.0305672628229535e-05, + "loss": 0.0256, + "step": 288900 + }, + { + "epoch": 1.86, + "learning_rate": 2.0295991273872605e-05, + "loss": 0.0202, + "step": 288910 + }, + { + "epoch": 1.86, + "learning_rate": 2.0286309919515675e-05, + "loss": 0.0258, + "step": 288920 + }, + { + "epoch": 1.86, + "learning_rate": 2.0276628565158738e-05, + "loss": 0.0202, + "step": 288930 + }, + { + "epoch": 1.86, + "learning_rate": 2.0266947210801807e-05, + "loss": 0.0221, + "step": 288940 + }, + { + "epoch": 1.86, + "learning_rate": 2.0257265856444873e-05, + "loss": 0.0227, + "step": 288950 + }, + { + "epoch": 1.87, + "learning_rate": 2.0247584502087943e-05, + "loss": 0.0245, + "step": 288960 + }, + { + "epoch": 1.87, + "learning_rate": 2.0237903147731013e-05, + "loss": 0.0208, + "step": 288970 + }, + { + "epoch": 1.87, + "learning_rate": 2.022822179337408e-05, + "loss": 0.0341, + "step": 288980 + }, + { + "epoch": 1.87, + "learning_rate": 2.021854043901715e-05, + "loss": 0.0197, + "step": 288990 + }, + { + "epoch": 1.87, + "learning_rate": 2.020885908466021e-05, + "loss": 0.0285, + "step": 289000 + }, + { + "epoch": 1.87, + "eval_cer": 0.9198481527511015, + "eval_loss": 0.016835737973451614, + "eval_runtime": 119.8731, + "eval_samples_per_second": 16.684, + "eval_steps_per_second": 4.171, + "step": 289000 + }, + { + "epoch": 1.87, + "learning_rate": 2.019917773030328e-05, + "loss": 0.0222, + "step": 289010 + }, + { + "epoch": 1.87, + "learning_rate": 2.018949637594635e-05, + "loss": 0.0217, + "step": 289020 + }, + { + "epoch": 1.87, + "learning_rate": 2.0179815021589417e-05, + "loss": 0.0216, + "step": 289030 + }, + { + "epoch": 1.87, + "learning_rate": 2.0170133667232486e-05, + "loss": 0.0236, + "step": 289040 + }, + { + "epoch": 1.87, + "learning_rate": 2.0160452312875556e-05, + "loss": 0.0253, + "step": 289050 + }, + { + "epoch": 1.87, + "learning_rate": 2.0150770958518622e-05, + "loss": 0.021, + "step": 289060 + }, + { + "epoch": 1.87, + "learning_rate": 2.014108960416169e-05, + "loss": 0.0255, + "step": 289070 + }, + { + "epoch": 1.87, + "learning_rate": 2.0131408249804755e-05, + "loss": 0.0206, + "step": 289080 + }, + { + "epoch": 1.87, + "learning_rate": 2.0121726895447824e-05, + "loss": 0.0239, + "step": 289090 + }, + { + "epoch": 1.87, + "learning_rate": 2.0112045541090894e-05, + "loss": 0.0224, + "step": 289100 + }, + { + "epoch": 1.87, + "learning_rate": 2.010236418673396e-05, + "loss": 0.0174, + "step": 289110 + }, + { + "epoch": 1.87, + "learning_rate": 2.009268283237703e-05, + "loss": 0.0199, + "step": 289120 + }, + { + "epoch": 1.87, + "learning_rate": 2.00830014780201e-05, + "loss": 0.0259, + "step": 289130 + }, + { + "epoch": 1.87, + "learning_rate": 2.0073320123663162e-05, + "loss": 0.0218, + "step": 289140 + }, + { + "epoch": 1.87, + "learning_rate": 2.0063638769306232e-05, + "loss": 0.0208, + "step": 289150 + }, + { + "epoch": 1.87, + "learning_rate": 2.0053957414949298e-05, + "loss": 0.0254, + "step": 289160 + }, + { + "epoch": 1.87, + "learning_rate": 2.0044276060592368e-05, + "loss": 0.0212, + "step": 289170 + }, + { + "epoch": 1.87, + "learning_rate": 2.0034594706235438e-05, + "loss": 0.0288, + "step": 289180 + }, + { + "epoch": 1.87, + "learning_rate": 2.0024913351878504e-05, + "loss": 0.0245, + "step": 289190 + }, + { + "epoch": 1.87, + "learning_rate": 2.0015231997521573e-05, + "loss": 0.0237, + "step": 289200 + }, + { + "epoch": 1.87, + "learning_rate": 2.0005550643164636e-05, + "loss": 0.0228, + "step": 289210 + }, + { + "epoch": 1.87, + "learning_rate": 1.9995869288807706e-05, + "loss": 0.0226, + "step": 289220 + }, + { + "epoch": 1.87, + "learning_rate": 1.9986187934450776e-05, + "loss": 0.0171, + "step": 289230 + }, + { + "epoch": 1.87, + "learning_rate": 1.9976506580093842e-05, + "loss": 0.0223, + "step": 289240 + }, + { + "epoch": 1.87, + "learning_rate": 1.996682522573691e-05, + "loss": 0.0219, + "step": 289250 + }, + { + "epoch": 1.87, + "learning_rate": 1.995714387137998e-05, + "loss": 0.0206, + "step": 289260 + }, + { + "epoch": 1.87, + "learning_rate": 1.9947462517023047e-05, + "loss": 0.0234, + "step": 289270 + }, + { + "epoch": 1.87, + "learning_rate": 1.9937781162666113e-05, + "loss": 0.0208, + "step": 289280 + }, + { + "epoch": 1.87, + "learning_rate": 1.992809980830918e-05, + "loss": 0.0258, + "step": 289290 + }, + { + "epoch": 1.87, + "learning_rate": 1.991841845395225e-05, + "loss": 0.0287, + "step": 289300 + }, + { + "epoch": 1.87, + "learning_rate": 1.990873709959532e-05, + "loss": 0.0187, + "step": 289310 + }, + { + "epoch": 1.87, + "learning_rate": 1.9899055745238385e-05, + "loss": 0.0211, + "step": 289320 + }, + { + "epoch": 1.87, + "learning_rate": 1.9889374390881455e-05, + "loss": 0.019, + "step": 289330 + }, + { + "epoch": 1.87, + "learning_rate": 1.9879693036524524e-05, + "loss": 0.0247, + "step": 289340 + }, + { + "epoch": 1.87, + "learning_rate": 1.9870011682167587e-05, + "loss": 0.0205, + "step": 289350 + }, + { + "epoch": 1.87, + "learning_rate": 1.9860330327810657e-05, + "loss": 0.0213, + "step": 289360 + }, + { + "epoch": 1.87, + "learning_rate": 1.9850648973453723e-05, + "loss": 0.0196, + "step": 289370 + }, + { + "epoch": 1.87, + "learning_rate": 1.9840967619096793e-05, + "loss": 0.0182, + "step": 289380 + }, + { + "epoch": 1.87, + "learning_rate": 1.9831286264739862e-05, + "loss": 0.0208, + "step": 289390 + }, + { + "epoch": 1.87, + "learning_rate": 1.982160491038293e-05, + "loss": 0.0209, + "step": 289400 + }, + { + "epoch": 1.87, + "learning_rate": 1.9811923556025998e-05, + "loss": 0.024, + "step": 289410 + }, + { + "epoch": 1.87, + "learning_rate": 1.980224220166906e-05, + "loss": 0.0249, + "step": 289420 + }, + { + "epoch": 1.87, + "learning_rate": 1.979256084731213e-05, + "loss": 0.0209, + "step": 289430 + }, + { + "epoch": 1.87, + "learning_rate": 1.97828794929552e-05, + "loss": 0.021, + "step": 289440 + }, + { + "epoch": 1.87, + "learning_rate": 1.9773198138598267e-05, + "loss": 0.0209, + "step": 289450 + }, + { + "epoch": 1.87, + "learning_rate": 1.9763516784241336e-05, + "loss": 0.0207, + "step": 289460 + }, + { + "epoch": 1.87, + "learning_rate": 1.9753835429884406e-05, + "loss": 0.0233, + "step": 289470 + }, + { + "epoch": 1.87, + "learning_rate": 1.9744154075527472e-05, + "loss": 0.0332, + "step": 289480 + }, + { + "epoch": 1.87, + "learning_rate": 1.973447272117054e-05, + "loss": 0.0299, + "step": 289490 + }, + { + "epoch": 1.87, + "learning_rate": 1.9724791366813605e-05, + "loss": 0.0267, + "step": 289500 + }, + { + "epoch": 1.87, + "learning_rate": 1.9715110012456674e-05, + "loss": 0.0223, + "step": 289510 + }, + { + "epoch": 1.87, + "learning_rate": 1.9705428658099744e-05, + "loss": 0.0207, + "step": 289520 + }, + { + "epoch": 1.87, + "learning_rate": 1.969574730374281e-05, + "loss": 0.0207, + "step": 289530 + }, + { + "epoch": 1.87, + "learning_rate": 1.968606594938588e-05, + "loss": 0.0228, + "step": 289540 + }, + { + "epoch": 1.87, + "learning_rate": 1.9676384595028946e-05, + "loss": 0.0289, + "step": 289550 + }, + { + "epoch": 1.87, + "learning_rate": 1.9666703240672012e-05, + "loss": 0.0223, + "step": 289560 + }, + { + "epoch": 1.87, + "learning_rate": 1.9657021886315082e-05, + "loss": 0.0189, + "step": 289570 + }, + { + "epoch": 1.87, + "learning_rate": 1.9647340531958148e-05, + "loss": 0.0232, + "step": 289580 + }, + { + "epoch": 1.87, + "learning_rate": 1.9637659177601218e-05, + "loss": 0.0189, + "step": 289590 + }, + { + "epoch": 1.87, + "learning_rate": 1.9627977823244284e-05, + "loss": 0.023, + "step": 289600 + }, + { + "epoch": 1.87, + "learning_rate": 1.9618296468887354e-05, + "loss": 0.0194, + "step": 289610 + }, + { + "epoch": 1.87, + "learning_rate": 1.9608615114530423e-05, + "loss": 0.0218, + "step": 289620 + }, + { + "epoch": 1.87, + "learning_rate": 1.9598933760173486e-05, + "loss": 0.0251, + "step": 289630 + }, + { + "epoch": 1.87, + "learning_rate": 1.9589252405816556e-05, + "loss": 0.0193, + "step": 289640 + }, + { + "epoch": 1.87, + "learning_rate": 1.9579571051459622e-05, + "loss": 0.0186, + "step": 289650 + }, + { + "epoch": 1.87, + "learning_rate": 1.956988969710269e-05, + "loss": 0.0246, + "step": 289660 + }, + { + "epoch": 1.87, + "learning_rate": 1.956020834274576e-05, + "loss": 0.0194, + "step": 289670 + }, + { + "epoch": 1.87, + "learning_rate": 1.9550526988388827e-05, + "loss": 0.022, + "step": 289680 + }, + { + "epoch": 1.87, + "learning_rate": 1.9540845634031894e-05, + "loss": 0.031, + "step": 289690 + }, + { + "epoch": 1.87, + "learning_rate": 1.953116427967496e-05, + "loss": 0.0227, + "step": 289700 + }, + { + "epoch": 1.87, + "learning_rate": 1.952148292531803e-05, + "loss": 0.0257, + "step": 289710 + }, + { + "epoch": 1.87, + "learning_rate": 1.95118015709611e-05, + "loss": 0.0233, + "step": 289720 + }, + { + "epoch": 1.87, + "learning_rate": 1.9502120216604165e-05, + "loss": 0.0199, + "step": 289730 + }, + { + "epoch": 1.87, + "learning_rate": 1.9492438862247235e-05, + "loss": 0.0231, + "step": 289740 + }, + { + "epoch": 1.87, + "learning_rate": 1.9482757507890305e-05, + "loss": 0.022, + "step": 289750 + }, + { + "epoch": 1.87, + "learning_rate": 1.9473076153533367e-05, + "loss": 0.0244, + "step": 289760 + }, + { + "epoch": 1.87, + "learning_rate": 1.9463394799176437e-05, + "loss": 0.0311, + "step": 289770 + }, + { + "epoch": 1.87, + "learning_rate": 1.9453713444819503e-05, + "loss": 0.0241, + "step": 289780 + }, + { + "epoch": 1.87, + "learning_rate": 1.9444032090462573e-05, + "loss": 0.018, + "step": 289790 + }, + { + "epoch": 1.87, + "learning_rate": 1.9434350736105643e-05, + "loss": 0.0263, + "step": 289800 + }, + { + "epoch": 1.87, + "learning_rate": 1.942466938174871e-05, + "loss": 0.0224, + "step": 289810 + }, + { + "epoch": 1.87, + "learning_rate": 1.941498802739178e-05, + "loss": 0.0223, + "step": 289820 + }, + { + "epoch": 1.87, + "learning_rate": 1.940530667303484e-05, + "loss": 0.0227, + "step": 289830 + }, + { + "epoch": 1.87, + "learning_rate": 1.939562531867791e-05, + "loss": 0.0225, + "step": 289840 + }, + { + "epoch": 1.87, + "learning_rate": 1.938594396432098e-05, + "loss": 0.0198, + "step": 289850 + }, + { + "epoch": 1.87, + "learning_rate": 1.9376262609964047e-05, + "loss": 0.0203, + "step": 289860 + }, + { + "epoch": 1.87, + "learning_rate": 1.9366581255607116e-05, + "loss": 0.0211, + "step": 289870 + }, + { + "epoch": 1.87, + "learning_rate": 1.9356899901250186e-05, + "loss": 0.0211, + "step": 289880 + }, + { + "epoch": 1.87, + "learning_rate": 1.9347218546893252e-05, + "loss": 0.0212, + "step": 289890 + }, + { + "epoch": 1.87, + "learning_rate": 1.933753719253632e-05, + "loss": 0.0213, + "step": 289900 + }, + { + "epoch": 1.87, + "learning_rate": 1.9327855838179385e-05, + "loss": 0.02, + "step": 289910 + }, + { + "epoch": 1.87, + "learning_rate": 1.9318174483822454e-05, + "loss": 0.0233, + "step": 289920 + }, + { + "epoch": 1.87, + "learning_rate": 1.9308493129465524e-05, + "loss": 0.0196, + "step": 289930 + }, + { + "epoch": 1.87, + "learning_rate": 1.929881177510859e-05, + "loss": 0.0188, + "step": 289940 + }, + { + "epoch": 1.87, + "learning_rate": 1.928913042075166e-05, + "loss": 0.0233, + "step": 289950 + }, + { + "epoch": 1.87, + "learning_rate": 1.927944906639473e-05, + "loss": 0.0251, + "step": 289960 + }, + { + "epoch": 1.87, + "learning_rate": 1.9269767712037792e-05, + "loss": 0.0217, + "step": 289970 + }, + { + "epoch": 1.87, + "learning_rate": 1.9260086357680862e-05, + "loss": 0.0216, + "step": 289980 + }, + { + "epoch": 1.87, + "learning_rate": 1.9250405003323928e-05, + "loss": 0.0218, + "step": 289990 + }, + { + "epoch": 1.87, + "learning_rate": 1.9240723648966998e-05, + "loss": 0.0223, + "step": 290000 + }, + { + "epoch": 1.87, + "eval_cer": 0.9198074793808609, + "eval_loss": 0.016939295455813408, + "eval_runtime": 120.1344, + "eval_samples_per_second": 16.648, + "eval_steps_per_second": 4.162, + "step": 290000 + }, + { + "epoch": 1.87, + "learning_rate": 1.9231042294610068e-05, + "loss": 0.0252, + "step": 290010 + }, + { + "epoch": 1.87, + "learning_rate": 1.9221360940253134e-05, + "loss": 0.024, + "step": 290020 + }, + { + "epoch": 1.87, + "learning_rate": 1.9211679585896203e-05, + "loss": 0.0221, + "step": 290030 + }, + { + "epoch": 1.87, + "learning_rate": 1.9201998231539266e-05, + "loss": 0.0208, + "step": 290040 + }, + { + "epoch": 1.87, + "learning_rate": 1.9192316877182336e-05, + "loss": 0.0196, + "step": 290050 + }, + { + "epoch": 1.87, + "learning_rate": 1.9182635522825405e-05, + "loss": 0.0239, + "step": 290060 + }, + { + "epoch": 1.87, + "learning_rate": 1.9172954168468472e-05, + "loss": 0.0235, + "step": 290070 + }, + { + "epoch": 1.87, + "learning_rate": 1.916327281411154e-05, + "loss": 0.0207, + "step": 290080 + }, + { + "epoch": 1.87, + "learning_rate": 1.915359145975461e-05, + "loss": 0.0335, + "step": 290090 + }, + { + "epoch": 1.87, + "learning_rate": 1.9143910105397677e-05, + "loss": 0.0246, + "step": 290100 + }, + { + "epoch": 1.87, + "learning_rate": 1.9134228751040743e-05, + "loss": 0.02, + "step": 290110 + }, + { + "epoch": 1.87, + "learning_rate": 1.912454739668381e-05, + "loss": 0.0226, + "step": 290120 + }, + { + "epoch": 1.87, + "learning_rate": 1.911486604232688e-05, + "loss": 0.0214, + "step": 290130 + }, + { + "epoch": 1.87, + "learning_rate": 1.910518468796995e-05, + "loss": 0.0305, + "step": 290140 + }, + { + "epoch": 1.87, + "learning_rate": 1.9095503333613015e-05, + "loss": 0.0202, + "step": 290150 + }, + { + "epoch": 1.87, + "learning_rate": 1.9085821979256085e-05, + "loss": 0.0238, + "step": 290160 + }, + { + "epoch": 1.87, + "learning_rate": 1.907614062489915e-05, + "loss": 0.0206, + "step": 290170 + }, + { + "epoch": 1.87, + "learning_rate": 1.9066459270542217e-05, + "loss": 0.0218, + "step": 290180 + }, + { + "epoch": 1.87, + "learning_rate": 1.9056777916185287e-05, + "loss": 0.0204, + "step": 290190 + }, + { + "epoch": 1.87, + "learning_rate": 1.9047096561828353e-05, + "loss": 0.0218, + "step": 290200 + }, + { + "epoch": 1.87, + "learning_rate": 1.9037415207471423e-05, + "loss": 0.0287, + "step": 290210 + }, + { + "epoch": 1.87, + "learning_rate": 1.902773385311449e-05, + "loss": 0.0244, + "step": 290220 + }, + { + "epoch": 1.87, + "learning_rate": 1.901805249875756e-05, + "loss": 0.0221, + "step": 290230 + }, + { + "epoch": 1.87, + "learning_rate": 1.9008371144400628e-05, + "loss": 0.0212, + "step": 290240 + }, + { + "epoch": 1.87, + "learning_rate": 1.899868979004369e-05, + "loss": 0.0191, + "step": 290250 + }, + { + "epoch": 1.87, + "learning_rate": 1.898900843568676e-05, + "loss": 0.0241, + "step": 290260 + }, + { + "epoch": 1.87, + "learning_rate": 1.897932708132983e-05, + "loss": 0.0223, + "step": 290270 + }, + { + "epoch": 1.87, + "learning_rate": 1.8969645726972897e-05, + "loss": 0.0229, + "step": 290280 + }, + { + "epoch": 1.87, + "learning_rate": 1.8959964372615966e-05, + "loss": 0.0231, + "step": 290290 + }, + { + "epoch": 1.87, + "learning_rate": 1.8950283018259033e-05, + "loss": 0.0277, + "step": 290300 + }, + { + "epoch": 1.87, + "learning_rate": 1.8940601663902102e-05, + "loss": 0.0234, + "step": 290310 + }, + { + "epoch": 1.87, + "learning_rate": 1.893092030954517e-05, + "loss": 0.0236, + "step": 290320 + }, + { + "epoch": 1.87, + "learning_rate": 1.8921238955188235e-05, + "loss": 0.0228, + "step": 290330 + }, + { + "epoch": 1.87, + "learning_rate": 1.8911557600831304e-05, + "loss": 0.0208, + "step": 290340 + }, + { + "epoch": 1.87, + "learning_rate": 1.890187624647437e-05, + "loss": 0.0192, + "step": 290350 + }, + { + "epoch": 1.87, + "learning_rate": 1.889219489211744e-05, + "loss": 0.0226, + "step": 290360 + }, + { + "epoch": 1.87, + "learning_rate": 1.888251353776051e-05, + "loss": 0.0238, + "step": 290370 + }, + { + "epoch": 1.87, + "learning_rate": 1.8872832183403576e-05, + "loss": 0.0235, + "step": 290380 + }, + { + "epoch": 1.87, + "learning_rate": 1.8863150829046642e-05, + "loss": 0.0231, + "step": 290390 + }, + { + "epoch": 1.87, + "learning_rate": 1.885346947468971e-05, + "loss": 0.0202, + "step": 290400 + }, + { + "epoch": 1.87, + "learning_rate": 1.8843788120332778e-05, + "loss": 0.0176, + "step": 290410 + }, + { + "epoch": 1.87, + "learning_rate": 1.8834106765975848e-05, + "loss": 0.0234, + "step": 290420 + }, + { + "epoch": 1.87, + "learning_rate": 1.8824425411618914e-05, + "loss": 0.0215, + "step": 290430 + }, + { + "epoch": 1.87, + "learning_rate": 1.8814744057261984e-05, + "loss": 0.022, + "step": 290440 + }, + { + "epoch": 1.87, + "learning_rate": 1.8805062702905053e-05, + "loss": 0.0198, + "step": 290450 + }, + { + "epoch": 1.87, + "learning_rate": 1.8795381348548116e-05, + "loss": 0.0241, + "step": 290460 + }, + { + "epoch": 1.87, + "learning_rate": 1.8785699994191186e-05, + "loss": 0.0208, + "step": 290470 + }, + { + "epoch": 1.87, + "learning_rate": 1.8776018639834252e-05, + "loss": 0.0211, + "step": 290480 + }, + { + "epoch": 1.87, + "learning_rate": 1.876633728547732e-05, + "loss": 0.0229, + "step": 290490 + }, + { + "epoch": 1.87, + "learning_rate": 1.875665593112039e-05, + "loss": 0.019, + "step": 290500 + }, + { + "epoch": 1.88, + "learning_rate": 1.8746974576763457e-05, + "loss": 0.0204, + "step": 290510 + }, + { + "epoch": 1.88, + "learning_rate": 1.8737293222406524e-05, + "loss": 0.0239, + "step": 290520 + }, + { + "epoch": 1.88, + "learning_rate": 1.8727611868049593e-05, + "loss": 0.0236, + "step": 290530 + }, + { + "epoch": 1.88, + "learning_rate": 1.871793051369266e-05, + "loss": 0.0248, + "step": 290540 + }, + { + "epoch": 1.88, + "learning_rate": 1.870824915933573e-05, + "loss": 0.0235, + "step": 290550 + }, + { + "epoch": 1.88, + "learning_rate": 1.8698567804978795e-05, + "loss": 0.0177, + "step": 290560 + }, + { + "epoch": 1.88, + "learning_rate": 1.8688886450621865e-05, + "loss": 0.02, + "step": 290570 + }, + { + "epoch": 1.88, + "learning_rate": 1.867920509626493e-05, + "loss": 0.0182, + "step": 290580 + }, + { + "epoch": 1.88, + "learning_rate": 1.8669523741908e-05, + "loss": 0.0205, + "step": 290590 + }, + { + "epoch": 1.88, + "learning_rate": 1.8659842387551067e-05, + "loss": 0.0241, + "step": 290600 + }, + { + "epoch": 1.88, + "learning_rate": 1.8650161033194133e-05, + "loss": 0.0256, + "step": 290610 + }, + { + "epoch": 1.88, + "learning_rate": 1.8640479678837203e-05, + "loss": 0.022, + "step": 290620 + }, + { + "epoch": 1.88, + "learning_rate": 1.8630798324480273e-05, + "loss": 0.0277, + "step": 290630 + }, + { + "epoch": 1.88, + "learning_rate": 1.862111697012334e-05, + "loss": 0.0281, + "step": 290640 + }, + { + "epoch": 1.88, + "learning_rate": 1.8611435615766405e-05, + "loss": 0.0182, + "step": 290650 + }, + { + "epoch": 1.88, + "learning_rate": 1.8601754261409475e-05, + "loss": 0.0224, + "step": 290660 + }, + { + "epoch": 1.88, + "learning_rate": 1.8592072907052544e-05, + "loss": 0.0209, + "step": 290670 + }, + { + "epoch": 1.88, + "learning_rate": 1.858239155269561e-05, + "loss": 0.0231, + "step": 290680 + }, + { + "epoch": 1.88, + "learning_rate": 1.8572710198338677e-05, + "loss": 0.0255, + "step": 290690 + }, + { + "epoch": 1.88, + "learning_rate": 1.8563028843981746e-05, + "loss": 0.0228, + "step": 290700 + }, + { + "epoch": 1.88, + "learning_rate": 1.8553347489624816e-05, + "loss": 0.0197, + "step": 290710 + }, + { + "epoch": 1.88, + "learning_rate": 1.8543666135267882e-05, + "loss": 0.0217, + "step": 290720 + }, + { + "epoch": 1.88, + "learning_rate": 1.853398478091095e-05, + "loss": 0.0223, + "step": 290730 + }, + { + "epoch": 1.88, + "learning_rate": 1.8524303426554018e-05, + "loss": 0.0221, + "step": 290740 + }, + { + "epoch": 1.88, + "learning_rate": 1.8514622072197084e-05, + "loss": 0.02, + "step": 290750 + }, + { + "epoch": 1.88, + "learning_rate": 1.8504940717840154e-05, + "loss": 0.0182, + "step": 290760 + }, + { + "epoch": 1.88, + "learning_rate": 1.849525936348322e-05, + "loss": 0.0221, + "step": 290770 + }, + { + "epoch": 1.88, + "learning_rate": 1.8485578009126287e-05, + "loss": 0.0244, + "step": 290780 + }, + { + "epoch": 1.88, + "learning_rate": 1.8475896654769356e-05, + "loss": 0.022, + "step": 290790 + }, + { + "epoch": 1.88, + "learning_rate": 1.8466215300412426e-05, + "loss": 0.023, + "step": 290800 + }, + { + "epoch": 1.88, + "learning_rate": 1.8456533946055492e-05, + "loss": 0.0209, + "step": 290810 + }, + { + "epoch": 1.88, + "learning_rate": 1.8446852591698558e-05, + "loss": 0.0258, + "step": 290820 + }, + { + "epoch": 1.88, + "learning_rate": 1.8437171237341628e-05, + "loss": 0.0182, + "step": 290830 + }, + { + "epoch": 1.88, + "learning_rate": 1.8427489882984698e-05, + "loss": 0.0242, + "step": 290840 + }, + { + "epoch": 1.88, + "learning_rate": 1.8417808528627764e-05, + "loss": 0.0195, + "step": 290850 + }, + { + "epoch": 1.88, + "learning_rate": 1.840812717427083e-05, + "loss": 0.0216, + "step": 290860 + }, + { + "epoch": 1.88, + "learning_rate": 1.83984458199139e-05, + "loss": 0.0207, + "step": 290870 + }, + { + "epoch": 1.88, + "learning_rate": 1.838876446555697e-05, + "loss": 0.0204, + "step": 290880 + }, + { + "epoch": 1.88, + "learning_rate": 1.8379083111200035e-05, + "loss": 0.027, + "step": 290890 + }, + { + "epoch": 1.88, + "learning_rate": 1.8369401756843102e-05, + "loss": 0.0213, + "step": 290900 + }, + { + "epoch": 1.88, + "learning_rate": 1.835972040248617e-05, + "loss": 0.0235, + "step": 290910 + }, + { + "epoch": 1.88, + "learning_rate": 1.8350039048129238e-05, + "loss": 0.0258, + "step": 290920 + }, + { + "epoch": 1.88, + "learning_rate": 1.8340357693772307e-05, + "loss": 0.0177, + "step": 290930 + }, + { + "epoch": 1.88, + "learning_rate": 1.8330676339415373e-05, + "loss": 0.021, + "step": 290940 + }, + { + "epoch": 1.88, + "learning_rate": 1.8320994985058443e-05, + "loss": 0.0202, + "step": 290950 + }, + { + "epoch": 1.88, + "learning_rate": 1.831131363070151e-05, + "loss": 0.0232, + "step": 290960 + }, + { + "epoch": 1.88, + "learning_rate": 1.8301632276344576e-05, + "loss": 0.0236, + "step": 290970 + }, + { + "epoch": 1.88, + "learning_rate": 1.8291950921987645e-05, + "loss": 0.0258, + "step": 290980 + }, + { + "epoch": 1.88, + "learning_rate": 1.828226956763071e-05, + "loss": 0.021, + "step": 290990 + }, + { + "epoch": 1.88, + "learning_rate": 1.827258821327378e-05, + "loss": 0.0231, + "step": 291000 + }, + { + "epoch": 1.88, + "eval_cer": 0.9198291718449892, + "eval_loss": 0.016914011910557747, + "eval_runtime": 120.5766, + "eval_samples_per_second": 16.587, + "eval_steps_per_second": 4.147, + "step": 291000 + }, + { + "epoch": 1.88, + "learning_rate": 1.8262906858916847e-05, + "loss": 0.0221, + "step": 291010 + }, + { + "epoch": 1.88, + "learning_rate": 1.8253225504559917e-05, + "loss": 0.0218, + "step": 291020 + }, + { + "epoch": 1.88, + "learning_rate": 1.8243544150202983e-05, + "loss": 0.0275, + "step": 291030 + }, + { + "epoch": 1.88, + "learning_rate": 1.8233862795846053e-05, + "loss": 0.0208, + "step": 291040 + }, + { + "epoch": 1.88, + "learning_rate": 1.822418144148912e-05, + "loss": 0.0234, + "step": 291050 + }, + { + "epoch": 1.88, + "learning_rate": 1.8214500087132185e-05, + "loss": 0.0262, + "step": 291060 + }, + { + "epoch": 1.88, + "learning_rate": 1.8204818732775255e-05, + "loss": 0.0214, + "step": 291070 + }, + { + "epoch": 1.88, + "learning_rate": 1.8195137378418325e-05, + "loss": 0.0214, + "step": 291080 + }, + { + "epoch": 1.88, + "learning_rate": 1.818545602406139e-05, + "loss": 0.0212, + "step": 291090 + }, + { + "epoch": 1.88, + "learning_rate": 1.8175774669704457e-05, + "loss": 0.0226, + "step": 291100 + }, + { + "epoch": 1.88, + "learning_rate": 1.8166093315347527e-05, + "loss": 0.0231, + "step": 291110 + }, + { + "epoch": 1.88, + "learning_rate": 1.8156411960990596e-05, + "loss": 0.0205, + "step": 291120 + }, + { + "epoch": 1.88, + "learning_rate": 1.8146730606633662e-05, + "loss": 0.0175, + "step": 291130 + }, + { + "epoch": 1.88, + "learning_rate": 1.813704925227673e-05, + "loss": 0.0187, + "step": 291140 + }, + { + "epoch": 1.88, + "learning_rate": 1.81273678979198e-05, + "loss": 0.0214, + "step": 291150 + }, + { + "epoch": 1.88, + "learning_rate": 1.8117686543562865e-05, + "loss": 0.0301, + "step": 291160 + }, + { + "epoch": 1.88, + "learning_rate": 1.8108005189205934e-05, + "loss": 0.0205, + "step": 291170 + }, + { + "epoch": 1.88, + "learning_rate": 1.8098323834849e-05, + "loss": 0.0218, + "step": 291180 + }, + { + "epoch": 1.88, + "learning_rate": 1.808864248049207e-05, + "loss": 0.0232, + "step": 291190 + }, + { + "epoch": 1.88, + "learning_rate": 1.8078961126135136e-05, + "loss": 0.0231, + "step": 291200 + }, + { + "epoch": 1.88, + "learning_rate": 1.8069279771778206e-05, + "loss": 0.0223, + "step": 291210 + }, + { + "epoch": 1.88, + "learning_rate": 1.8059598417421272e-05, + "loss": 0.0192, + "step": 291220 + }, + { + "epoch": 1.88, + "learning_rate": 1.804991706306434e-05, + "loss": 0.0222, + "step": 291230 + }, + { + "epoch": 1.88, + "learning_rate": 1.8040235708707408e-05, + "loss": 0.0244, + "step": 291240 + }, + { + "epoch": 1.88, + "learning_rate": 1.8030554354350478e-05, + "loss": 0.0249, + "step": 291250 + }, + { + "epoch": 1.88, + "learning_rate": 1.8020872999993544e-05, + "loss": 0.025, + "step": 291260 + }, + { + "epoch": 1.88, + "learning_rate": 1.801119164563661e-05, + "loss": 0.0236, + "step": 291270 + }, + { + "epoch": 1.88, + "learning_rate": 1.800151029127968e-05, + "loss": 0.0252, + "step": 291280 + }, + { + "epoch": 1.88, + "learning_rate": 1.799182893692275e-05, + "loss": 0.0231, + "step": 291290 + }, + { + "epoch": 1.88, + "learning_rate": 1.7982147582565816e-05, + "loss": 0.0224, + "step": 291300 + }, + { + "epoch": 1.88, + "learning_rate": 1.7972466228208882e-05, + "loss": 0.02, + "step": 291310 + }, + { + "epoch": 1.88, + "learning_rate": 1.796278487385195e-05, + "loss": 0.0217, + "step": 291320 + }, + { + "epoch": 1.88, + "learning_rate": 1.795310351949502e-05, + "loss": 0.023, + "step": 291330 + }, + { + "epoch": 1.88, + "learning_rate": 1.7943422165138087e-05, + "loss": 0.0226, + "step": 291340 + }, + { + "epoch": 1.88, + "learning_rate": 1.7933740810781154e-05, + "loss": 0.0245, + "step": 291350 + }, + { + "epoch": 1.88, + "learning_rate": 1.7924059456424223e-05, + "loss": 0.0219, + "step": 291360 + }, + { + "epoch": 1.88, + "learning_rate": 1.791437810206729e-05, + "loss": 0.02, + "step": 291370 + }, + { + "epoch": 1.88, + "learning_rate": 1.790469674771036e-05, + "loss": 0.0229, + "step": 291380 + }, + { + "epoch": 1.88, + "learning_rate": 1.7895015393353425e-05, + "loss": 0.0232, + "step": 291390 + }, + { + "epoch": 1.88, + "learning_rate": 1.7885334038996495e-05, + "loss": 0.0195, + "step": 291400 + }, + { + "epoch": 1.88, + "learning_rate": 1.787565268463956e-05, + "loss": 0.0195, + "step": 291410 + }, + { + "epoch": 1.88, + "learning_rate": 1.786597133028263e-05, + "loss": 0.0249, + "step": 291420 + }, + { + "epoch": 1.88, + "learning_rate": 1.7856289975925697e-05, + "loss": 0.0205, + "step": 291430 + }, + { + "epoch": 1.88, + "learning_rate": 1.7846608621568763e-05, + "loss": 0.0301, + "step": 291440 + }, + { + "epoch": 1.88, + "learning_rate": 1.7836927267211833e-05, + "loss": 0.0204, + "step": 291450 + }, + { + "epoch": 1.88, + "learning_rate": 1.7827245912854903e-05, + "loss": 0.022, + "step": 291460 + }, + { + "epoch": 1.88, + "learning_rate": 1.781756455849797e-05, + "loss": 0.0185, + "step": 291470 + }, + { + "epoch": 1.88, + "learning_rate": 1.7807883204141035e-05, + "loss": 0.0218, + "step": 291480 + }, + { + "epoch": 1.88, + "learning_rate": 1.7798201849784105e-05, + "loss": 0.0242, + "step": 291490 + }, + { + "epoch": 1.88, + "learning_rate": 1.7788520495427174e-05, + "loss": 0.0188, + "step": 291500 + }, + { + "epoch": 1.88, + "learning_rate": 1.777883914107024e-05, + "loss": 0.0219, + "step": 291510 + }, + { + "epoch": 1.88, + "learning_rate": 1.7769157786713307e-05, + "loss": 0.0258, + "step": 291520 + }, + { + "epoch": 1.88, + "learning_rate": 1.7759476432356376e-05, + "loss": 0.0245, + "step": 291530 + }, + { + "epoch": 1.88, + "learning_rate": 1.7749795077999446e-05, + "loss": 0.0197, + "step": 291540 + }, + { + "epoch": 1.88, + "learning_rate": 1.7740113723642512e-05, + "loss": 0.0312, + "step": 291550 + }, + { + "epoch": 1.88, + "learning_rate": 1.773043236928558e-05, + "loss": 0.025, + "step": 291560 + }, + { + "epoch": 1.88, + "learning_rate": 1.7720751014928648e-05, + "loss": 0.0228, + "step": 291570 + }, + { + "epoch": 1.88, + "learning_rate": 1.7711069660571714e-05, + "loss": 0.0267, + "step": 291580 + }, + { + "epoch": 1.88, + "learning_rate": 1.7701388306214784e-05, + "loss": 0.0192, + "step": 291590 + }, + { + "epoch": 1.88, + "learning_rate": 1.769170695185785e-05, + "loss": 0.02, + "step": 291600 + }, + { + "epoch": 1.88, + "learning_rate": 1.7682025597500917e-05, + "loss": 0.0262, + "step": 291610 + }, + { + "epoch": 1.88, + "learning_rate": 1.7672344243143986e-05, + "loss": 0.0211, + "step": 291620 + }, + { + "epoch": 1.88, + "learning_rate": 1.7662662888787052e-05, + "loss": 0.0233, + "step": 291630 + }, + { + "epoch": 1.88, + "learning_rate": 1.7652981534430122e-05, + "loss": 0.022, + "step": 291640 + }, + { + "epoch": 1.88, + "learning_rate": 1.7643300180073188e-05, + "loss": 0.0266, + "step": 291650 + }, + { + "epoch": 1.88, + "learning_rate": 1.7633618825716258e-05, + "loss": 0.0226, + "step": 291660 + }, + { + "epoch": 1.88, + "learning_rate": 1.7623937471359324e-05, + "loss": 0.0204, + "step": 291670 + }, + { + "epoch": 1.88, + "learning_rate": 1.761425611700239e-05, + "loss": 0.0186, + "step": 291680 + }, + { + "epoch": 1.88, + "learning_rate": 1.760457476264546e-05, + "loss": 0.0196, + "step": 291690 + }, + { + "epoch": 1.88, + "learning_rate": 1.759489340828853e-05, + "loss": 0.0207, + "step": 291700 + }, + { + "epoch": 1.88, + "learning_rate": 1.7585212053931596e-05, + "loss": 0.0231, + "step": 291710 + }, + { + "epoch": 1.88, + "learning_rate": 1.7575530699574662e-05, + "loss": 0.0234, + "step": 291720 + }, + { + "epoch": 1.88, + "learning_rate": 1.7565849345217732e-05, + "loss": 0.0224, + "step": 291730 + }, + { + "epoch": 1.88, + "learning_rate": 1.75561679908608e-05, + "loss": 0.0222, + "step": 291740 + }, + { + "epoch": 1.88, + "learning_rate": 1.7546486636503868e-05, + "loss": 0.0217, + "step": 291750 + }, + { + "epoch": 1.88, + "learning_rate": 1.7536805282146934e-05, + "loss": 0.0236, + "step": 291760 + }, + { + "epoch": 1.88, + "learning_rate": 1.7527123927790003e-05, + "loss": 0.0234, + "step": 291770 + }, + { + "epoch": 1.88, + "learning_rate": 1.7517442573433073e-05, + "loss": 0.0246, + "step": 291780 + }, + { + "epoch": 1.88, + "learning_rate": 1.750776121907614e-05, + "loss": 0.0211, + "step": 291790 + }, + { + "epoch": 1.88, + "learning_rate": 1.7498079864719206e-05, + "loss": 0.0225, + "step": 291800 + }, + { + "epoch": 1.88, + "learning_rate": 1.7488398510362275e-05, + "loss": 0.0218, + "step": 291810 + }, + { + "epoch": 1.88, + "learning_rate": 1.747871715600534e-05, + "loss": 0.0218, + "step": 291820 + }, + { + "epoch": 1.88, + "learning_rate": 1.746903580164841e-05, + "loss": 0.0263, + "step": 291830 + }, + { + "epoch": 1.88, + "learning_rate": 1.7459354447291477e-05, + "loss": 0.0238, + "step": 291840 + }, + { + "epoch": 1.88, + "learning_rate": 1.7449673092934547e-05, + "loss": 0.0208, + "step": 291850 + }, + { + "epoch": 1.88, + "learning_rate": 1.7439991738577613e-05, + "loss": 0.0227, + "step": 291860 + }, + { + "epoch": 1.88, + "learning_rate": 1.7430310384220683e-05, + "loss": 0.0197, + "step": 291870 + }, + { + "epoch": 1.88, + "learning_rate": 1.742062902986375e-05, + "loss": 0.0226, + "step": 291880 + }, + { + "epoch": 1.88, + "learning_rate": 1.7410947675506815e-05, + "loss": 0.0227, + "step": 291890 + }, + { + "epoch": 1.88, + "learning_rate": 1.7401266321149885e-05, + "loss": 0.02, + "step": 291900 + }, + { + "epoch": 1.88, + "learning_rate": 1.7391584966792955e-05, + "loss": 0.0197, + "step": 291910 + }, + { + "epoch": 1.88, + "learning_rate": 1.738190361243602e-05, + "loss": 0.0228, + "step": 291920 + }, + { + "epoch": 1.88, + "learning_rate": 1.7372222258079087e-05, + "loss": 0.0196, + "step": 291930 + }, + { + "epoch": 1.88, + "learning_rate": 1.7362540903722157e-05, + "loss": 0.0305, + "step": 291940 + }, + { + "epoch": 1.88, + "learning_rate": 1.7352859549365226e-05, + "loss": 0.0226, + "step": 291950 + }, + { + "epoch": 1.88, + "learning_rate": 1.7343178195008292e-05, + "loss": 0.0262, + "step": 291960 + }, + { + "epoch": 1.88, + "learning_rate": 1.733349684065136e-05, + "loss": 0.0228, + "step": 291970 + }, + { + "epoch": 1.88, + "learning_rate": 1.732381548629443e-05, + "loss": 0.019, + "step": 291980 + }, + { + "epoch": 1.88, + "learning_rate": 1.7314134131937498e-05, + "loss": 0.0169, + "step": 291990 + }, + { + "epoch": 1.88, + "learning_rate": 1.7304452777580564e-05, + "loss": 0.0192, + "step": 292000 + }, + { + "epoch": 1.88, + "eval_cer": 0.9198345949610214, + "eval_loss": 0.01690409518778324, + "eval_runtime": 120.2396, + "eval_samples_per_second": 16.633, + "eval_steps_per_second": 4.158, + "step": 292000 + }, + { + "epoch": 1.88, + "learning_rate": 1.729477142322363e-05, + "loss": 0.0219, + "step": 292010 + }, + { + "epoch": 1.88, + "learning_rate": 1.72850900688667e-05, + "loss": 0.0224, + "step": 292020 + }, + { + "epoch": 1.88, + "learning_rate": 1.7275408714509766e-05, + "loss": 0.0229, + "step": 292030 + }, + { + "epoch": 1.88, + "learning_rate": 1.7265727360152836e-05, + "loss": 0.0231, + "step": 292040 + }, + { + "epoch": 1.88, + "learning_rate": 1.7256046005795902e-05, + "loss": 0.0235, + "step": 292050 + }, + { + "epoch": 1.89, + "learning_rate": 1.724636465143897e-05, + "loss": 0.0221, + "step": 292060 + }, + { + "epoch": 1.89, + "learning_rate": 1.7236683297082038e-05, + "loss": 0.0217, + "step": 292070 + }, + { + "epoch": 1.89, + "learning_rate": 1.7227001942725108e-05, + "loss": 0.0217, + "step": 292080 + }, + { + "epoch": 1.89, + "learning_rate": 1.7217320588368174e-05, + "loss": 0.0216, + "step": 292090 + }, + { + "epoch": 1.89, + "learning_rate": 1.720763923401124e-05, + "loss": 0.0216, + "step": 292100 + }, + { + "epoch": 1.89, + "learning_rate": 1.719795787965431e-05, + "loss": 0.0228, + "step": 292110 + }, + { + "epoch": 1.89, + "learning_rate": 1.718827652529738e-05, + "loss": 0.0252, + "step": 292120 + }, + { + "epoch": 1.89, + "learning_rate": 1.7178595170940446e-05, + "loss": 0.0258, + "step": 292130 + }, + { + "epoch": 1.89, + "learning_rate": 1.7168913816583512e-05, + "loss": 0.0255, + "step": 292140 + }, + { + "epoch": 1.89, + "learning_rate": 1.715923246222658e-05, + "loss": 0.0225, + "step": 292150 + }, + { + "epoch": 1.89, + "learning_rate": 1.714955110786965e-05, + "loss": 0.0255, + "step": 292160 + }, + { + "epoch": 1.89, + "learning_rate": 1.7139869753512717e-05, + "loss": 0.0241, + "step": 292170 + }, + { + "epoch": 1.89, + "learning_rate": 1.7130188399155784e-05, + "loss": 0.0283, + "step": 292180 + }, + { + "epoch": 1.89, + "learning_rate": 1.7120507044798853e-05, + "loss": 0.0222, + "step": 292190 + }, + { + "epoch": 1.89, + "learning_rate": 1.711082569044192e-05, + "loss": 0.0243, + "step": 292200 + }, + { + "epoch": 1.89, + "learning_rate": 1.710114433608499e-05, + "loss": 0.0226, + "step": 292210 + }, + { + "epoch": 1.89, + "learning_rate": 1.7091462981728055e-05, + "loss": 0.0197, + "step": 292220 + }, + { + "epoch": 1.89, + "learning_rate": 1.7081781627371125e-05, + "loss": 0.022, + "step": 292230 + }, + { + "epoch": 1.89, + "learning_rate": 1.707210027301419e-05, + "loss": 0.0167, + "step": 292240 + }, + { + "epoch": 1.89, + "learning_rate": 1.706241891865726e-05, + "loss": 0.0205, + "step": 292250 + }, + { + "epoch": 1.89, + "learning_rate": 1.7052737564300327e-05, + "loss": 0.0208, + "step": 292260 + }, + { + "epoch": 1.89, + "learning_rate": 1.7043056209943393e-05, + "loss": 0.019, + "step": 292270 + }, + { + "epoch": 1.89, + "learning_rate": 1.7033374855586463e-05, + "loss": 0.0225, + "step": 292280 + }, + { + "epoch": 1.89, + "learning_rate": 1.702369350122953e-05, + "loss": 0.0237, + "step": 292290 + }, + { + "epoch": 1.89, + "learning_rate": 1.70140121468726e-05, + "loss": 0.0204, + "step": 292300 + }, + { + "epoch": 1.89, + "learning_rate": 1.7004330792515665e-05, + "loss": 0.0222, + "step": 292310 + }, + { + "epoch": 1.89, + "learning_rate": 1.6994649438158735e-05, + "loss": 0.0252, + "step": 292320 + }, + { + "epoch": 1.89, + "learning_rate": 1.69849680838018e-05, + "loss": 0.0239, + "step": 292330 + }, + { + "epoch": 1.89, + "learning_rate": 1.6975286729444867e-05, + "loss": 0.0229, + "step": 292340 + }, + { + "epoch": 1.89, + "learning_rate": 1.6965605375087937e-05, + "loss": 0.021, + "step": 292350 + }, + { + "epoch": 1.89, + "learning_rate": 1.6955924020731006e-05, + "loss": 0.0234, + "step": 292360 + }, + { + "epoch": 1.89, + "learning_rate": 1.6946242666374073e-05, + "loss": 0.0185, + "step": 292370 + }, + { + "epoch": 1.89, + "learning_rate": 1.693656131201714e-05, + "loss": 0.023, + "step": 292380 + }, + { + "epoch": 1.89, + "learning_rate": 1.692687995766021e-05, + "loss": 0.0236, + "step": 292390 + }, + { + "epoch": 1.89, + "learning_rate": 1.6917198603303278e-05, + "loss": 0.0242, + "step": 292400 + }, + { + "epoch": 1.89, + "learning_rate": 1.6907517248946344e-05, + "loss": 0.0273, + "step": 292410 + }, + { + "epoch": 1.89, + "learning_rate": 1.689783589458941e-05, + "loss": 0.0243, + "step": 292420 + }, + { + "epoch": 1.89, + "learning_rate": 1.688815454023248e-05, + "loss": 0.0195, + "step": 292430 + }, + { + "epoch": 1.89, + "learning_rate": 1.687847318587555e-05, + "loss": 0.0225, + "step": 292440 + }, + { + "epoch": 1.89, + "learning_rate": 1.6868791831518616e-05, + "loss": 0.0189, + "step": 292450 + }, + { + "epoch": 1.89, + "learning_rate": 1.6859110477161682e-05, + "loss": 0.0217, + "step": 292460 + }, + { + "epoch": 1.89, + "learning_rate": 1.6849429122804752e-05, + "loss": 0.0281, + "step": 292470 + }, + { + "epoch": 1.89, + "learning_rate": 1.6839747768447818e-05, + "loss": 0.0225, + "step": 292480 + }, + { + "epoch": 1.89, + "learning_rate": 1.6830066414090888e-05, + "loss": 0.0193, + "step": 292490 + }, + { + "epoch": 1.89, + "learning_rate": 1.6820385059733954e-05, + "loss": 0.0259, + "step": 292500 + }, + { + "epoch": 1.89, + "learning_rate": 1.681070370537702e-05, + "loss": 0.0189, + "step": 292510 + }, + { + "epoch": 1.89, + "learning_rate": 1.680102235102009e-05, + "loss": 0.0206, + "step": 292520 + }, + { + "epoch": 1.89, + "learning_rate": 1.679134099666316e-05, + "loss": 0.0258, + "step": 292530 + }, + { + "epoch": 1.89, + "learning_rate": 1.6781659642306226e-05, + "loss": 0.0309, + "step": 292540 + }, + { + "epoch": 1.89, + "learning_rate": 1.6771978287949292e-05, + "loss": 0.0184, + "step": 292550 + }, + { + "epoch": 1.89, + "learning_rate": 1.676229693359236e-05, + "loss": 0.0247, + "step": 292560 + }, + { + "epoch": 1.89, + "learning_rate": 1.675261557923543e-05, + "loss": 0.0216, + "step": 292570 + }, + { + "epoch": 1.89, + "learning_rate": 1.6742934224878498e-05, + "loss": 0.0179, + "step": 292580 + }, + { + "epoch": 1.89, + "learning_rate": 1.6733252870521564e-05, + "loss": 0.0235, + "step": 292590 + }, + { + "epoch": 1.89, + "learning_rate": 1.6723571516164633e-05, + "loss": 0.0218, + "step": 292600 + }, + { + "epoch": 1.89, + "learning_rate": 1.6713890161807703e-05, + "loss": 0.0275, + "step": 292610 + }, + { + "epoch": 1.89, + "learning_rate": 1.670420880745077e-05, + "loss": 0.0226, + "step": 292620 + }, + { + "epoch": 1.89, + "learning_rate": 1.6694527453093836e-05, + "loss": 0.0291, + "step": 292630 + }, + { + "epoch": 1.89, + "learning_rate": 1.6684846098736905e-05, + "loss": 0.0243, + "step": 292640 + }, + { + "epoch": 1.89, + "learning_rate": 1.667516474437997e-05, + "loss": 0.0203, + "step": 292650 + }, + { + "epoch": 1.89, + "learning_rate": 1.666548339002304e-05, + "loss": 0.0216, + "step": 292660 + }, + { + "epoch": 1.89, + "learning_rate": 1.6655802035666107e-05, + "loss": 0.0224, + "step": 292670 + }, + { + "epoch": 1.89, + "learning_rate": 1.6646120681309177e-05, + "loss": 0.0223, + "step": 292680 + }, + { + "epoch": 1.89, + "learning_rate": 1.6636439326952243e-05, + "loss": 0.0197, + "step": 292690 + }, + { + "epoch": 1.89, + "learning_rate": 1.6626757972595313e-05, + "loss": 0.0218, + "step": 292700 + }, + { + "epoch": 1.89, + "learning_rate": 1.661707661823838e-05, + "loss": 0.0226, + "step": 292710 + }, + { + "epoch": 1.89, + "learning_rate": 1.6607395263881445e-05, + "loss": 0.0236, + "step": 292720 + }, + { + "epoch": 1.89, + "learning_rate": 1.6597713909524515e-05, + "loss": 0.0232, + "step": 292730 + }, + { + "epoch": 1.89, + "learning_rate": 1.6588032555167584e-05, + "loss": 0.0233, + "step": 292740 + }, + { + "epoch": 1.89, + "learning_rate": 1.657835120081065e-05, + "loss": 0.0216, + "step": 292750 + }, + { + "epoch": 1.89, + "learning_rate": 1.6568669846453717e-05, + "loss": 0.0201, + "step": 292760 + }, + { + "epoch": 1.89, + "learning_rate": 1.6558988492096787e-05, + "loss": 0.0237, + "step": 292770 + }, + { + "epoch": 1.89, + "learning_rate": 1.6549307137739856e-05, + "loss": 0.0207, + "step": 292780 + }, + { + "epoch": 1.89, + "learning_rate": 1.6539625783382922e-05, + "loss": 0.0222, + "step": 292790 + }, + { + "epoch": 1.89, + "learning_rate": 1.652994442902599e-05, + "loss": 0.0226, + "step": 292800 + }, + { + "epoch": 1.89, + "learning_rate": 1.652026307466906e-05, + "loss": 0.0219, + "step": 292810 + }, + { + "epoch": 1.89, + "learning_rate": 1.6510581720312128e-05, + "loss": 0.0214, + "step": 292820 + }, + { + "epoch": 1.89, + "learning_rate": 1.6500900365955194e-05, + "loss": 0.0205, + "step": 292830 + }, + { + "epoch": 1.89, + "learning_rate": 1.649121901159826e-05, + "loss": 0.0238, + "step": 292840 + }, + { + "epoch": 1.89, + "learning_rate": 1.648153765724133e-05, + "loss": 0.0241, + "step": 292850 + }, + { + "epoch": 1.89, + "learning_rate": 1.6471856302884396e-05, + "loss": 0.0263, + "step": 292860 + }, + { + "epoch": 1.89, + "learning_rate": 1.6462174948527466e-05, + "loss": 0.0307, + "step": 292870 + }, + { + "epoch": 1.89, + "learning_rate": 1.6452493594170532e-05, + "loss": 0.0255, + "step": 292880 + }, + { + "epoch": 1.89, + "learning_rate": 1.64428122398136e-05, + "loss": 0.0218, + "step": 292890 + }, + { + "epoch": 1.89, + "learning_rate": 1.6433130885456668e-05, + "loss": 0.0259, + "step": 292900 + }, + { + "epoch": 1.89, + "learning_rate": 1.6423449531099738e-05, + "loss": 0.025, + "step": 292910 + }, + { + "epoch": 1.89, + "learning_rate": 1.6413768176742804e-05, + "loss": 0.0252, + "step": 292920 + }, + { + "epoch": 1.89, + "learning_rate": 1.640408682238587e-05, + "loss": 0.0252, + "step": 292930 + }, + { + "epoch": 1.89, + "learning_rate": 1.639440546802894e-05, + "loss": 0.0204, + "step": 292940 + }, + { + "epoch": 1.89, + "learning_rate": 1.6384724113672006e-05, + "loss": 0.0245, + "step": 292950 + }, + { + "epoch": 1.89, + "learning_rate": 1.6375042759315076e-05, + "loss": 0.02, + "step": 292960 + }, + { + "epoch": 1.89, + "learning_rate": 1.6365361404958142e-05, + "loss": 0.0262, + "step": 292970 + }, + { + "epoch": 1.89, + "learning_rate": 1.635568005060121e-05, + "loss": 0.0235, + "step": 292980 + }, + { + "epoch": 1.89, + "learning_rate": 1.6345998696244278e-05, + "loss": 0.0216, + "step": 292990 + }, + { + "epoch": 1.89, + "learning_rate": 1.6336317341887347e-05, + "loss": 0.0234, + "step": 293000 + }, + { + "epoch": 1.89, + "eval_cer": 0.9198382103717094, + "eval_loss": 0.016830649226903915, + "eval_runtime": 120.2142, + "eval_samples_per_second": 16.637, + "eval_steps_per_second": 4.159, + "step": 293000 + }, + { + "epoch": 1.89, + "learning_rate": 1.6326635987530414e-05, + "loss": 0.0237, + "step": 293010 + }, + { + "epoch": 1.89, + "learning_rate": 1.6316954633173483e-05, + "loss": 0.0241, + "step": 293020 + }, + { + "epoch": 1.89, + "learning_rate": 1.630727327881655e-05, + "loss": 0.0203, + "step": 293030 + }, + { + "epoch": 1.89, + "learning_rate": 1.6297591924459616e-05, + "loss": 0.0252, + "step": 293040 + }, + { + "epoch": 1.89, + "learning_rate": 1.6287910570102685e-05, + "loss": 0.0223, + "step": 293050 + }, + { + "epoch": 1.89, + "learning_rate": 1.6278229215745755e-05, + "loss": 0.026, + "step": 293060 + }, + { + "epoch": 1.89, + "learning_rate": 1.626854786138882e-05, + "loss": 0.0253, + "step": 293070 + }, + { + "epoch": 1.89, + "learning_rate": 1.6258866507031887e-05, + "loss": 0.0222, + "step": 293080 + }, + { + "epoch": 1.89, + "learning_rate": 1.6249185152674957e-05, + "loss": 0.0234, + "step": 293090 + }, + { + "epoch": 1.89, + "learning_rate": 1.6239503798318023e-05, + "loss": 0.0179, + "step": 293100 + }, + { + "epoch": 1.89, + "learning_rate": 1.6229822443961093e-05, + "loss": 0.0227, + "step": 293110 + }, + { + "epoch": 1.89, + "learning_rate": 1.622014108960416e-05, + "loss": 0.0272, + "step": 293120 + }, + { + "epoch": 1.89, + "learning_rate": 1.621045973524723e-05, + "loss": 0.024, + "step": 293130 + }, + { + "epoch": 1.89, + "learning_rate": 1.6200778380890295e-05, + "loss": 0.0248, + "step": 293140 + }, + { + "epoch": 1.89, + "learning_rate": 1.6191097026533365e-05, + "loss": 0.0212, + "step": 293150 + }, + { + "epoch": 1.89, + "learning_rate": 1.618141567217643e-05, + "loss": 0.0258, + "step": 293160 + }, + { + "epoch": 1.89, + "learning_rate": 1.6171734317819497e-05, + "loss": 0.0189, + "step": 293170 + }, + { + "epoch": 1.89, + "learning_rate": 1.6162052963462567e-05, + "loss": 0.0211, + "step": 293180 + }, + { + "epoch": 1.89, + "learning_rate": 1.6152371609105636e-05, + "loss": 0.0191, + "step": 293190 + }, + { + "epoch": 1.89, + "learning_rate": 1.6142690254748703e-05, + "loss": 0.0212, + "step": 293200 + }, + { + "epoch": 1.89, + "learning_rate": 1.613300890039177e-05, + "loss": 0.0229, + "step": 293210 + }, + { + "epoch": 1.89, + "learning_rate": 1.612332754603484e-05, + "loss": 0.0219, + "step": 293220 + }, + { + "epoch": 1.89, + "learning_rate": 1.6113646191677908e-05, + "loss": 0.0245, + "step": 293230 + }, + { + "epoch": 1.89, + "learning_rate": 1.6103964837320974e-05, + "loss": 0.0209, + "step": 293240 + }, + { + "epoch": 1.89, + "learning_rate": 1.609428348296404e-05, + "loss": 0.0208, + "step": 293250 + }, + { + "epoch": 1.89, + "learning_rate": 1.608460212860711e-05, + "loss": 0.0193, + "step": 293260 + }, + { + "epoch": 1.89, + "learning_rate": 1.607492077425018e-05, + "loss": 0.0222, + "step": 293270 + }, + { + "epoch": 1.89, + "learning_rate": 1.6065239419893246e-05, + "loss": 0.0241, + "step": 293280 + }, + { + "epoch": 1.89, + "learning_rate": 1.6055558065536312e-05, + "loss": 0.0228, + "step": 293290 + }, + { + "epoch": 1.89, + "learning_rate": 1.6045876711179382e-05, + "loss": 0.0193, + "step": 293300 + }, + { + "epoch": 1.89, + "learning_rate": 1.6036195356822448e-05, + "loss": 0.0253, + "step": 293310 + }, + { + "epoch": 1.89, + "learning_rate": 1.6026514002465518e-05, + "loss": 0.0223, + "step": 293320 + }, + { + "epoch": 1.89, + "learning_rate": 1.6016832648108584e-05, + "loss": 0.0215, + "step": 293330 + }, + { + "epoch": 1.89, + "learning_rate": 1.600715129375165e-05, + "loss": 0.0196, + "step": 293340 + }, + { + "epoch": 1.89, + "learning_rate": 1.599746993939472e-05, + "loss": 0.0208, + "step": 293350 + }, + { + "epoch": 1.89, + "learning_rate": 1.598778858503779e-05, + "loss": 0.0238, + "step": 293360 + }, + { + "epoch": 1.89, + "learning_rate": 1.5978107230680856e-05, + "loss": 0.0196, + "step": 293370 + }, + { + "epoch": 1.89, + "learning_rate": 1.5968425876323922e-05, + "loss": 0.0238, + "step": 293380 + }, + { + "epoch": 1.89, + "learning_rate": 1.595874452196699e-05, + "loss": 0.0254, + "step": 293390 + }, + { + "epoch": 1.89, + "learning_rate": 1.594906316761006e-05, + "loss": 0.0292, + "step": 293400 + }, + { + "epoch": 1.89, + "learning_rate": 1.5939381813253128e-05, + "loss": 0.0249, + "step": 293410 + }, + { + "epoch": 1.89, + "learning_rate": 1.5929700458896194e-05, + "loss": 0.0204, + "step": 293420 + }, + { + "epoch": 1.89, + "learning_rate": 1.5920019104539263e-05, + "loss": 0.0236, + "step": 293430 + }, + { + "epoch": 1.89, + "learning_rate": 1.5910337750182333e-05, + "loss": 0.0198, + "step": 293440 + }, + { + "epoch": 1.89, + "learning_rate": 1.59006563958254e-05, + "loss": 0.0239, + "step": 293450 + }, + { + "epoch": 1.89, + "learning_rate": 1.5890975041468466e-05, + "loss": 0.0229, + "step": 293460 + }, + { + "epoch": 1.89, + "learning_rate": 1.5881293687111535e-05, + "loss": 0.0193, + "step": 293470 + }, + { + "epoch": 1.89, + "learning_rate": 1.58716123327546e-05, + "loss": 0.0259, + "step": 293480 + }, + { + "epoch": 1.89, + "learning_rate": 1.586193097839767e-05, + "loss": 0.0209, + "step": 293490 + }, + { + "epoch": 1.89, + "learning_rate": 1.5852249624040737e-05, + "loss": 0.0298, + "step": 293500 + }, + { + "epoch": 1.89, + "learning_rate": 1.5842568269683807e-05, + "loss": 0.0224, + "step": 293510 + }, + { + "epoch": 1.89, + "learning_rate": 1.5832886915326873e-05, + "loss": 0.0244, + "step": 293520 + }, + { + "epoch": 1.89, + "learning_rate": 1.5823205560969943e-05, + "loss": 0.0243, + "step": 293530 + }, + { + "epoch": 1.89, + "learning_rate": 1.581352420661301e-05, + "loss": 0.0213, + "step": 293540 + }, + { + "epoch": 1.89, + "learning_rate": 1.5803842852256075e-05, + "loss": 0.023, + "step": 293550 + }, + { + "epoch": 1.89, + "learning_rate": 1.5794161497899145e-05, + "loss": 0.0209, + "step": 293560 + }, + { + "epoch": 1.89, + "learning_rate": 1.5784480143542214e-05, + "loss": 0.0246, + "step": 293570 + }, + { + "epoch": 1.89, + "learning_rate": 1.577479878918528e-05, + "loss": 0.0198, + "step": 293580 + }, + { + "epoch": 1.89, + "learning_rate": 1.5765117434828347e-05, + "loss": 0.0204, + "step": 293590 + }, + { + "epoch": 1.89, + "learning_rate": 1.5755436080471417e-05, + "loss": 0.0205, + "step": 293600 + }, + { + "epoch": 1.9, + "learning_rate": 1.5745754726114486e-05, + "loss": 0.0215, + "step": 293610 + }, + { + "epoch": 1.9, + "learning_rate": 1.5736073371757552e-05, + "loss": 0.025, + "step": 293620 + }, + { + "epoch": 1.9, + "learning_rate": 1.572639201740062e-05, + "loss": 0.024, + "step": 293630 + }, + { + "epoch": 1.9, + "learning_rate": 1.571671066304369e-05, + "loss": 0.0229, + "step": 293640 + }, + { + "epoch": 1.9, + "learning_rate": 1.5707029308686755e-05, + "loss": 0.0253, + "step": 293650 + }, + { + "epoch": 1.9, + "learning_rate": 1.5697347954329824e-05, + "loss": 0.0234, + "step": 293660 + }, + { + "epoch": 1.9, + "learning_rate": 1.568766659997289e-05, + "loss": 0.0248, + "step": 293670 + }, + { + "epoch": 1.9, + "learning_rate": 1.567798524561596e-05, + "loss": 0.0159, + "step": 293680 + }, + { + "epoch": 1.9, + "learning_rate": 1.5668303891259026e-05, + "loss": 0.0213, + "step": 293690 + }, + { + "epoch": 1.9, + "learning_rate": 1.5658622536902093e-05, + "loss": 0.0265, + "step": 293700 + }, + { + "epoch": 1.9, + "learning_rate": 1.5648941182545162e-05, + "loss": 0.0239, + "step": 293710 + }, + { + "epoch": 1.9, + "learning_rate": 1.5639259828188232e-05, + "loss": 0.0218, + "step": 293720 + }, + { + "epoch": 1.9, + "learning_rate": 1.5629578473831298e-05, + "loss": 0.0185, + "step": 293730 + }, + { + "epoch": 1.9, + "learning_rate": 1.5619897119474364e-05, + "loss": 0.0259, + "step": 293740 + }, + { + "epoch": 1.9, + "learning_rate": 1.5610215765117434e-05, + "loss": 0.0274, + "step": 293750 + }, + { + "epoch": 1.9, + "learning_rate": 1.56005344107605e-05, + "loss": 0.0227, + "step": 293760 + }, + { + "epoch": 1.9, + "learning_rate": 1.559085305640357e-05, + "loss": 0.0248, + "step": 293770 + }, + { + "epoch": 1.9, + "learning_rate": 1.5581171702046636e-05, + "loss": 0.0241, + "step": 293780 + }, + { + "epoch": 1.9, + "learning_rate": 1.5571490347689702e-05, + "loss": 0.0255, + "step": 293790 + }, + { + "epoch": 1.9, + "learning_rate": 1.5561808993332772e-05, + "loss": 0.0191, + "step": 293800 + }, + { + "epoch": 1.9, + "learning_rate": 1.555212763897584e-05, + "loss": 0.0205, + "step": 293810 + }, + { + "epoch": 1.9, + "learning_rate": 1.5542446284618908e-05, + "loss": 0.0229, + "step": 293820 + }, + { + "epoch": 1.9, + "learning_rate": 1.5532764930261974e-05, + "loss": 0.0263, + "step": 293830 + }, + { + "epoch": 1.9, + "learning_rate": 1.5523083575905044e-05, + "loss": 0.0233, + "step": 293840 + }, + { + "epoch": 1.9, + "learning_rate": 1.5513402221548113e-05, + "loss": 0.0235, + "step": 293850 + }, + { + "epoch": 1.9, + "learning_rate": 1.550372086719118e-05, + "loss": 0.0222, + "step": 293860 + }, + { + "epoch": 1.9, + "learning_rate": 1.5494039512834246e-05, + "loss": 0.0243, + "step": 293870 + }, + { + "epoch": 1.9, + "learning_rate": 1.5484358158477315e-05, + "loss": 0.0223, + "step": 293880 + }, + { + "epoch": 1.9, + "learning_rate": 1.5474676804120385e-05, + "loss": 0.0273, + "step": 293890 + }, + { + "epoch": 1.9, + "learning_rate": 1.546499544976345e-05, + "loss": 0.0209, + "step": 293900 + }, + { + "epoch": 1.9, + "learning_rate": 1.5455314095406517e-05, + "loss": 0.0234, + "step": 293910 + }, + { + "epoch": 1.9, + "learning_rate": 1.5445632741049587e-05, + "loss": 0.0201, + "step": 293920 + }, + { + "epoch": 1.9, + "learning_rate": 1.5435951386692653e-05, + "loss": 0.0188, + "step": 293930 + }, + { + "epoch": 1.9, + "learning_rate": 1.5426270032335723e-05, + "loss": 0.0215, + "step": 293940 + }, + { + "epoch": 1.9, + "learning_rate": 1.541658867797879e-05, + "loss": 0.0254, + "step": 293950 + }, + { + "epoch": 1.9, + "learning_rate": 1.540690732362186e-05, + "loss": 0.0228, + "step": 293960 + }, + { + "epoch": 1.9, + "learning_rate": 1.5397225969264925e-05, + "loss": 0.0195, + "step": 293970 + }, + { + "epoch": 1.9, + "learning_rate": 1.5387544614907995e-05, + "loss": 0.0181, + "step": 293980 + }, + { + "epoch": 1.9, + "learning_rate": 1.537786326055106e-05, + "loss": 0.0216, + "step": 293990 + }, + { + "epoch": 1.9, + "learning_rate": 1.5368181906194127e-05, + "loss": 0.0223, + "step": 294000 + }, + { + "epoch": 1.9, + "eval_cer": 0.9198427296350695, + "eval_loss": 0.016799306496977806, + "eval_runtime": 120.1061, + "eval_samples_per_second": 16.652, + "eval_steps_per_second": 4.163, + "step": 294000 + }, + { + "epoch": 1.9, + "learning_rate": 1.5358500551837197e-05, + "loss": 0.0189, + "step": 294010 + }, + { + "epoch": 1.9, + "learning_rate": 1.5348819197480266e-05, + "loss": 0.0198, + "step": 294020 + }, + { + "epoch": 1.9, + "learning_rate": 1.5339137843123333e-05, + "loss": 0.0212, + "step": 294030 + }, + { + "epoch": 1.9, + "learning_rate": 1.53294564887664e-05, + "loss": 0.0218, + "step": 294040 + }, + { + "epoch": 1.9, + "learning_rate": 1.531977513440947e-05, + "loss": 0.0271, + "step": 294050 + }, + { + "epoch": 1.9, + "learning_rate": 1.5310093780052538e-05, + "loss": 0.0209, + "step": 294060 + }, + { + "epoch": 1.9, + "learning_rate": 1.5300412425695604e-05, + "loss": 0.0185, + "step": 294070 + }, + { + "epoch": 1.9, + "learning_rate": 1.529073107133867e-05, + "loss": 0.0206, + "step": 294080 + }, + { + "epoch": 1.9, + "learning_rate": 1.528104971698174e-05, + "loss": 0.0236, + "step": 294090 + }, + { + "epoch": 1.9, + "learning_rate": 1.527136836262481e-05, + "loss": 0.0239, + "step": 294100 + }, + { + "epoch": 1.9, + "learning_rate": 1.5261687008267876e-05, + "loss": 0.0236, + "step": 294110 + }, + { + "epoch": 1.9, + "learning_rate": 1.5252005653910944e-05, + "loss": 0.0239, + "step": 294120 + }, + { + "epoch": 1.9, + "learning_rate": 1.5242324299554012e-05, + "loss": 0.0235, + "step": 294130 + }, + { + "epoch": 1.9, + "learning_rate": 1.5232642945197078e-05, + "loss": 0.0193, + "step": 294140 + }, + { + "epoch": 1.9, + "learning_rate": 1.5222961590840146e-05, + "loss": 0.0219, + "step": 294150 + }, + { + "epoch": 1.9, + "learning_rate": 1.5213280236483214e-05, + "loss": 0.0251, + "step": 294160 + }, + { + "epoch": 1.9, + "learning_rate": 1.5203598882126282e-05, + "loss": 0.0234, + "step": 294170 + }, + { + "epoch": 1.9, + "learning_rate": 1.519391752776935e-05, + "loss": 0.0215, + "step": 294180 + }, + { + "epoch": 1.9, + "learning_rate": 1.5184236173412418e-05, + "loss": 0.023, + "step": 294190 + }, + { + "epoch": 1.9, + "learning_rate": 1.5174554819055486e-05, + "loss": 0.0259, + "step": 294200 + }, + { + "epoch": 1.9, + "learning_rate": 1.5164873464698552e-05, + "loss": 0.0252, + "step": 294210 + }, + { + "epoch": 1.9, + "learning_rate": 1.5155192110341622e-05, + "loss": 0.0205, + "step": 294220 + }, + { + "epoch": 1.9, + "learning_rate": 1.514551075598469e-05, + "loss": 0.022, + "step": 294230 + }, + { + "epoch": 1.9, + "learning_rate": 1.5135829401627756e-05, + "loss": 0.0242, + "step": 294240 + }, + { + "epoch": 1.9, + "learning_rate": 1.5126148047270824e-05, + "loss": 0.0217, + "step": 294250 + }, + { + "epoch": 1.9, + "learning_rate": 1.5116466692913893e-05, + "loss": 0.0223, + "step": 294260 + }, + { + "epoch": 1.9, + "learning_rate": 1.5106785338556961e-05, + "loss": 0.0193, + "step": 294270 + }, + { + "epoch": 1.9, + "learning_rate": 1.5097103984200028e-05, + "loss": 0.0217, + "step": 294280 + }, + { + "epoch": 1.9, + "learning_rate": 1.5087422629843096e-05, + "loss": 0.0219, + "step": 294290 + }, + { + "epoch": 1.9, + "learning_rate": 1.5077741275486165e-05, + "loss": 0.0219, + "step": 294300 + }, + { + "epoch": 1.9, + "learning_rate": 1.5068059921129231e-05, + "loss": 0.0244, + "step": 294310 + }, + { + "epoch": 1.9, + "learning_rate": 1.50583785667723e-05, + "loss": 0.0259, + "step": 294320 + }, + { + "epoch": 1.9, + "learning_rate": 1.5048697212415367e-05, + "loss": 0.0258, + "step": 294330 + }, + { + "epoch": 1.9, + "learning_rate": 1.5039015858058437e-05, + "loss": 0.0204, + "step": 294340 + }, + { + "epoch": 1.9, + "learning_rate": 1.5029334503701503e-05, + "loss": 0.0239, + "step": 294350 + }, + { + "epoch": 1.9, + "learning_rate": 1.5019653149344571e-05, + "loss": 0.0234, + "step": 294360 + }, + { + "epoch": 1.9, + "learning_rate": 1.5009971794987639e-05, + "loss": 0.0226, + "step": 294370 + }, + { + "epoch": 1.9, + "learning_rate": 1.5000290440630705e-05, + "loss": 0.0237, + "step": 294380 + }, + { + "epoch": 1.9, + "learning_rate": 1.4990609086273775e-05, + "loss": 0.0248, + "step": 294390 + }, + { + "epoch": 1.9, + "learning_rate": 1.4980927731916843e-05, + "loss": 0.0215, + "step": 294400 + }, + { + "epoch": 1.9, + "learning_rate": 1.497124637755991e-05, + "loss": 0.0266, + "step": 294410 + }, + { + "epoch": 1.9, + "learning_rate": 1.4961565023202977e-05, + "loss": 0.0231, + "step": 294420 + }, + { + "epoch": 1.9, + "learning_rate": 1.4951883668846047e-05, + "loss": 0.0203, + "step": 294430 + }, + { + "epoch": 1.9, + "learning_rate": 1.4942202314489115e-05, + "loss": 0.0192, + "step": 294440 + }, + { + "epoch": 1.9, + "learning_rate": 1.493252096013218e-05, + "loss": 0.02, + "step": 294450 + }, + { + "epoch": 1.9, + "learning_rate": 1.4922839605775249e-05, + "loss": 0.0191, + "step": 294460 + }, + { + "epoch": 1.9, + "learning_rate": 1.4913158251418318e-05, + "loss": 0.0229, + "step": 294470 + }, + { + "epoch": 1.9, + "learning_rate": 1.4903476897061386e-05, + "loss": 0.0265, + "step": 294480 + }, + { + "epoch": 1.9, + "learning_rate": 1.4893795542704452e-05, + "loss": 0.0199, + "step": 294490 + }, + { + "epoch": 1.9, + "learning_rate": 1.488411418834752e-05, + "loss": 0.0245, + "step": 294500 + }, + { + "epoch": 1.9, + "learning_rate": 1.4874432833990588e-05, + "loss": 0.0206, + "step": 294510 + }, + { + "epoch": 1.9, + "learning_rate": 1.4864751479633656e-05, + "loss": 0.025, + "step": 294520 + }, + { + "epoch": 1.9, + "learning_rate": 1.4855070125276724e-05, + "loss": 0.0252, + "step": 294530 + }, + { + "epoch": 1.9, + "learning_rate": 1.4845388770919792e-05, + "loss": 0.0242, + "step": 294540 + }, + { + "epoch": 1.9, + "learning_rate": 1.483570741656286e-05, + "loss": 0.0219, + "step": 294550 + }, + { + "epoch": 1.9, + "learning_rate": 1.4826026062205926e-05, + "loss": 0.0205, + "step": 294560 + }, + { + "epoch": 1.9, + "learning_rate": 1.4816344707848996e-05, + "loss": 0.0214, + "step": 294570 + }, + { + "epoch": 1.9, + "learning_rate": 1.4806663353492064e-05, + "loss": 0.0242, + "step": 294580 + }, + { + "epoch": 1.9, + "learning_rate": 1.479698199913513e-05, + "loss": 0.0186, + "step": 294590 + }, + { + "epoch": 1.9, + "learning_rate": 1.4787300644778198e-05, + "loss": 0.0216, + "step": 294600 + }, + { + "epoch": 1.9, + "learning_rate": 1.4777619290421268e-05, + "loss": 0.0236, + "step": 294610 + }, + { + "epoch": 1.9, + "learning_rate": 1.4767937936064334e-05, + "loss": 0.0214, + "step": 294620 + }, + { + "epoch": 1.9, + "learning_rate": 1.4758256581707402e-05, + "loss": 0.022, + "step": 294630 + }, + { + "epoch": 1.9, + "learning_rate": 1.474857522735047e-05, + "loss": 0.0226, + "step": 294640 + }, + { + "epoch": 1.9, + "learning_rate": 1.473889387299354e-05, + "loss": 0.0231, + "step": 294650 + }, + { + "epoch": 1.9, + "learning_rate": 1.4729212518636606e-05, + "loss": 0.0217, + "step": 294660 + }, + { + "epoch": 1.9, + "learning_rate": 1.4719531164279674e-05, + "loss": 0.023, + "step": 294670 + }, + { + "epoch": 1.9, + "learning_rate": 1.4709849809922742e-05, + "loss": 0.0267, + "step": 294680 + }, + { + "epoch": 1.9, + "learning_rate": 1.4700168455565808e-05, + "loss": 0.0244, + "step": 294690 + }, + { + "epoch": 1.9, + "learning_rate": 1.4690487101208877e-05, + "loss": 0.0223, + "step": 294700 + }, + { + "epoch": 1.9, + "learning_rate": 1.4680805746851945e-05, + "loss": 0.017, + "step": 294710 + }, + { + "epoch": 1.9, + "learning_rate": 1.4671124392495013e-05, + "loss": 0.0246, + "step": 294720 + }, + { + "epoch": 1.9, + "learning_rate": 1.466144303813808e-05, + "loss": 0.0259, + "step": 294730 + }, + { + "epoch": 1.9, + "learning_rate": 1.4651761683781149e-05, + "loss": 0.0227, + "step": 294740 + }, + { + "epoch": 1.9, + "learning_rate": 1.4642080329424217e-05, + "loss": 0.0205, + "step": 294750 + }, + { + "epoch": 1.9, + "learning_rate": 1.4632398975067283e-05, + "loss": 0.0237, + "step": 294760 + }, + { + "epoch": 1.9, + "learning_rate": 1.4622717620710351e-05, + "loss": 0.0226, + "step": 294770 + }, + { + "epoch": 1.9, + "learning_rate": 1.461303626635342e-05, + "loss": 0.0194, + "step": 294780 + }, + { + "epoch": 1.9, + "learning_rate": 1.4603354911996489e-05, + "loss": 0.0226, + "step": 294790 + }, + { + "epoch": 1.9, + "learning_rate": 1.4593673557639555e-05, + "loss": 0.021, + "step": 294800 + }, + { + "epoch": 1.9, + "learning_rate": 1.4583992203282623e-05, + "loss": 0.0214, + "step": 294810 + }, + { + "epoch": 1.9, + "learning_rate": 1.4574310848925691e-05, + "loss": 0.0273, + "step": 294820 + }, + { + "epoch": 1.9, + "learning_rate": 1.4564629494568759e-05, + "loss": 0.0273, + "step": 294830 + }, + { + "epoch": 1.9, + "learning_rate": 1.4554948140211827e-05, + "loss": 0.019, + "step": 294840 + }, + { + "epoch": 1.9, + "learning_rate": 1.4545266785854895e-05, + "loss": 0.0231, + "step": 294850 + }, + { + "epoch": 1.9, + "learning_rate": 1.4535585431497963e-05, + "loss": 0.0226, + "step": 294860 + }, + { + "epoch": 1.9, + "learning_rate": 1.4525904077141029e-05, + "loss": 0.0174, + "step": 294870 + }, + { + "epoch": 1.9, + "learning_rate": 1.4516222722784098e-05, + "loss": 0.0191, + "step": 294880 + }, + { + "epoch": 1.9, + "learning_rate": 1.4506541368427166e-05, + "loss": 0.0197, + "step": 294890 + }, + { + "epoch": 1.9, + "learning_rate": 1.4496860014070233e-05, + "loss": 0.0235, + "step": 294900 + }, + { + "epoch": 1.9, + "learning_rate": 1.44871786597133e-05, + "loss": 0.0209, + "step": 294910 + }, + { + "epoch": 1.9, + "learning_rate": 1.447749730535637e-05, + "loss": 0.0242, + "step": 294920 + }, + { + "epoch": 1.9, + "learning_rate": 1.4467815950999438e-05, + "loss": 0.0241, + "step": 294930 + }, + { + "epoch": 1.9, + "learning_rate": 1.4458134596642504e-05, + "loss": 0.0216, + "step": 294940 + }, + { + "epoch": 1.9, + "learning_rate": 1.4448453242285572e-05, + "loss": 0.0205, + "step": 294950 + }, + { + "epoch": 1.9, + "learning_rate": 1.4438771887928642e-05, + "loss": 0.0194, + "step": 294960 + }, + { + "epoch": 1.9, + "learning_rate": 1.4429090533571708e-05, + "loss": 0.0201, + "step": 294970 + }, + { + "epoch": 1.9, + "learning_rate": 1.4419409179214776e-05, + "loss": 0.0347, + "step": 294980 + }, + { + "epoch": 1.9, + "learning_rate": 1.4409727824857844e-05, + "loss": 0.0224, + "step": 294990 + }, + { + "epoch": 1.9, + "learning_rate": 1.4400046470500914e-05, + "loss": 0.0255, + "step": 295000 + }, + { + "epoch": 1.9, + "eval_cer": 0.9198345949610214, + "eval_loss": 0.01676587574183941, + "eval_runtime": 120.4368, + "eval_samples_per_second": 16.606, + "eval_steps_per_second": 4.152, + "step": 295000 + }, + { + "epoch": 1.9, + "learning_rate": 1.439036511614398e-05, + "loss": 0.0216, + "step": 295010 + }, + { + "epoch": 1.9, + "learning_rate": 1.4380683761787048e-05, + "loss": 0.0258, + "step": 295020 + }, + { + "epoch": 1.9, + "learning_rate": 1.4371002407430116e-05, + "loss": 0.0238, + "step": 295030 + }, + { + "epoch": 1.9, + "learning_rate": 1.4361321053073182e-05, + "loss": 0.0207, + "step": 295040 + }, + { + "epoch": 1.9, + "learning_rate": 1.4351639698716252e-05, + "loss": 0.0224, + "step": 295050 + }, + { + "epoch": 1.9, + "learning_rate": 1.434195834435932e-05, + "loss": 0.0238, + "step": 295060 + }, + { + "epoch": 1.9, + "learning_rate": 1.4332276990002386e-05, + "loss": 0.022, + "step": 295070 + }, + { + "epoch": 1.9, + "learning_rate": 1.4322595635645454e-05, + "loss": 0.0232, + "step": 295080 + }, + { + "epoch": 1.9, + "learning_rate": 1.4312914281288523e-05, + "loss": 0.0234, + "step": 295090 + }, + { + "epoch": 1.9, + "learning_rate": 1.4303232926931591e-05, + "loss": 0.0184, + "step": 295100 + }, + { + "epoch": 1.9, + "learning_rate": 1.4293551572574658e-05, + "loss": 0.0217, + "step": 295110 + }, + { + "epoch": 1.9, + "learning_rate": 1.4283870218217725e-05, + "loss": 0.0216, + "step": 295120 + }, + { + "epoch": 1.9, + "learning_rate": 1.4274188863860795e-05, + "loss": 0.0229, + "step": 295130 + }, + { + "epoch": 1.9, + "learning_rate": 1.4264507509503861e-05, + "loss": 0.0217, + "step": 295140 + }, + { + "epoch": 1.9, + "learning_rate": 1.425482615514693e-05, + "loss": 0.0242, + "step": 295150 + }, + { + "epoch": 1.91, + "learning_rate": 1.4245144800789997e-05, + "loss": 0.0233, + "step": 295160 + }, + { + "epoch": 1.91, + "learning_rate": 1.4235463446433065e-05, + "loss": 0.0173, + "step": 295170 + }, + { + "epoch": 1.91, + "learning_rate": 1.4225782092076133e-05, + "loss": 0.0195, + "step": 295180 + }, + { + "epoch": 1.91, + "learning_rate": 1.4216100737719201e-05, + "loss": 0.0249, + "step": 295190 + }, + { + "epoch": 1.91, + "learning_rate": 1.4206419383362269e-05, + "loss": 0.0236, + "step": 295200 + }, + { + "epoch": 1.91, + "learning_rate": 1.4196738029005335e-05, + "loss": 0.0262, + "step": 295210 + }, + { + "epoch": 1.91, + "learning_rate": 1.4187056674648403e-05, + "loss": 0.0204, + "step": 295220 + }, + { + "epoch": 1.91, + "learning_rate": 1.4177375320291473e-05, + "loss": 0.0212, + "step": 295230 + }, + { + "epoch": 1.91, + "learning_rate": 1.416769396593454e-05, + "loss": 0.0172, + "step": 295240 + }, + { + "epoch": 1.91, + "learning_rate": 1.4158012611577607e-05, + "loss": 0.022, + "step": 295250 + }, + { + "epoch": 1.91, + "learning_rate": 1.4148331257220675e-05, + "loss": 0.0229, + "step": 295260 + }, + { + "epoch": 1.91, + "learning_rate": 1.4138649902863744e-05, + "loss": 0.0218, + "step": 295270 + }, + { + "epoch": 1.91, + "learning_rate": 1.412896854850681e-05, + "loss": 0.0215, + "step": 295280 + }, + { + "epoch": 1.91, + "learning_rate": 1.4119287194149879e-05, + "loss": 0.0217, + "step": 295290 + }, + { + "epoch": 1.91, + "learning_rate": 1.4109605839792947e-05, + "loss": 0.024, + "step": 295300 + }, + { + "epoch": 1.91, + "learning_rate": 1.4099924485436016e-05, + "loss": 0.0238, + "step": 295310 + }, + { + "epoch": 1.91, + "learning_rate": 1.4090243131079082e-05, + "loss": 0.0222, + "step": 295320 + }, + { + "epoch": 1.91, + "learning_rate": 1.408056177672215e-05, + "loss": 0.0244, + "step": 295330 + }, + { + "epoch": 1.91, + "learning_rate": 1.4070880422365218e-05, + "loss": 0.026, + "step": 295340 + }, + { + "epoch": 1.91, + "learning_rate": 1.4061199068008285e-05, + "loss": 0.0169, + "step": 295350 + }, + { + "epoch": 1.91, + "learning_rate": 1.4051517713651354e-05, + "loss": 0.0232, + "step": 295360 + }, + { + "epoch": 1.91, + "learning_rate": 1.4041836359294422e-05, + "loss": 0.0263, + "step": 295370 + }, + { + "epoch": 1.91, + "learning_rate": 1.403215500493749e-05, + "loss": 0.021, + "step": 295380 + }, + { + "epoch": 1.91, + "learning_rate": 1.4022473650580556e-05, + "loss": 0.0195, + "step": 295390 + }, + { + "epoch": 1.91, + "learning_rate": 1.4012792296223626e-05, + "loss": 0.0211, + "step": 295400 + }, + { + "epoch": 1.91, + "learning_rate": 1.4003110941866694e-05, + "loss": 0.0251, + "step": 295410 + }, + { + "epoch": 1.91, + "learning_rate": 1.399342958750976e-05, + "loss": 0.0182, + "step": 295420 + }, + { + "epoch": 1.91, + "learning_rate": 1.3983748233152828e-05, + "loss": 0.0245, + "step": 295430 + }, + { + "epoch": 1.91, + "learning_rate": 1.3974066878795898e-05, + "loss": 0.0169, + "step": 295440 + }, + { + "epoch": 1.91, + "learning_rate": 1.3964385524438966e-05, + "loss": 0.0232, + "step": 295450 + }, + { + "epoch": 1.91, + "learning_rate": 1.3954704170082032e-05, + "loss": 0.0275, + "step": 295460 + }, + { + "epoch": 1.91, + "learning_rate": 1.39450228157251e-05, + "loss": 0.021, + "step": 295470 + }, + { + "epoch": 1.91, + "learning_rate": 1.3935341461368168e-05, + "loss": 0.0209, + "step": 295480 + }, + { + "epoch": 1.91, + "learning_rate": 1.3925660107011236e-05, + "loss": 0.0231, + "step": 295490 + }, + { + "epoch": 1.91, + "learning_rate": 1.3915978752654304e-05, + "loss": 0.0224, + "step": 295500 + }, + { + "epoch": 1.91, + "learning_rate": 1.3906297398297371e-05, + "loss": 0.0223, + "step": 295510 + }, + { + "epoch": 1.91, + "learning_rate": 1.3896616043940438e-05, + "loss": 0.0236, + "step": 295520 + }, + { + "epoch": 1.91, + "learning_rate": 1.3886934689583507e-05, + "loss": 0.0213, + "step": 295530 + }, + { + "epoch": 1.91, + "learning_rate": 1.3877253335226575e-05, + "loss": 0.0248, + "step": 295540 + }, + { + "epoch": 1.91, + "learning_rate": 1.3867571980869643e-05, + "loss": 0.0185, + "step": 295550 + }, + { + "epoch": 1.91, + "learning_rate": 1.385789062651271e-05, + "loss": 0.0218, + "step": 295560 + }, + { + "epoch": 1.91, + "learning_rate": 1.3848209272155777e-05, + "loss": 0.0201, + "step": 295570 + }, + { + "epoch": 1.91, + "learning_rate": 1.3838527917798847e-05, + "loss": 0.025, + "step": 295580 + }, + { + "epoch": 1.91, + "learning_rate": 1.3828846563441913e-05, + "loss": 0.0227, + "step": 295590 + }, + { + "epoch": 1.91, + "learning_rate": 1.3819165209084981e-05, + "loss": 0.0216, + "step": 295600 + }, + { + "epoch": 1.91, + "learning_rate": 1.3809483854728049e-05, + "loss": 0.0252, + "step": 295610 + }, + { + "epoch": 1.91, + "learning_rate": 1.3799802500371119e-05, + "loss": 0.0195, + "step": 295620 + }, + { + "epoch": 1.91, + "learning_rate": 1.3790121146014185e-05, + "loss": 0.0214, + "step": 295630 + }, + { + "epoch": 1.91, + "learning_rate": 1.3780439791657253e-05, + "loss": 0.0253, + "step": 295640 + }, + { + "epoch": 1.91, + "learning_rate": 1.3770758437300321e-05, + "loss": 0.0209, + "step": 295650 + }, + { + "epoch": 1.91, + "learning_rate": 1.3761077082943387e-05, + "loss": 0.0204, + "step": 295660 + }, + { + "epoch": 1.91, + "learning_rate": 1.3751395728586457e-05, + "loss": 0.0229, + "step": 295670 + }, + { + "epoch": 1.91, + "learning_rate": 1.3741714374229525e-05, + "loss": 0.0265, + "step": 295680 + }, + { + "epoch": 1.91, + "learning_rate": 1.3732033019872593e-05, + "loss": 0.02, + "step": 295690 + }, + { + "epoch": 1.91, + "learning_rate": 1.3722351665515659e-05, + "loss": 0.0211, + "step": 295700 + }, + { + "epoch": 1.91, + "learning_rate": 1.3712670311158728e-05, + "loss": 0.0232, + "step": 295710 + }, + { + "epoch": 1.91, + "learning_rate": 1.3702988956801796e-05, + "loss": 0.0233, + "step": 295720 + }, + { + "epoch": 1.91, + "learning_rate": 1.3693307602444863e-05, + "loss": 0.028, + "step": 295730 + }, + { + "epoch": 1.91, + "learning_rate": 1.368362624808793e-05, + "loss": 0.0224, + "step": 295740 + }, + { + "epoch": 1.91, + "learning_rate": 1.3673944893731e-05, + "loss": 0.0186, + "step": 295750 + }, + { + "epoch": 1.91, + "learning_rate": 1.3664263539374068e-05, + "loss": 0.0215, + "step": 295760 + }, + { + "epoch": 1.91, + "learning_rate": 1.3654582185017134e-05, + "loss": 0.0232, + "step": 295770 + }, + { + "epoch": 1.91, + "learning_rate": 1.3644900830660202e-05, + "loss": 0.0194, + "step": 295780 + }, + { + "epoch": 1.91, + "learning_rate": 1.3635219476303272e-05, + "loss": 0.026, + "step": 295790 + }, + { + "epoch": 1.91, + "learning_rate": 1.3625538121946338e-05, + "loss": 0.0231, + "step": 295800 + }, + { + "epoch": 1.91, + "learning_rate": 1.3615856767589406e-05, + "loss": 0.0199, + "step": 295810 + }, + { + "epoch": 1.91, + "learning_rate": 1.3606175413232474e-05, + "loss": 0.0206, + "step": 295820 + }, + { + "epoch": 1.91, + "learning_rate": 1.3596494058875542e-05, + "loss": 0.0272, + "step": 295830 + }, + { + "epoch": 1.91, + "learning_rate": 1.358681270451861e-05, + "loss": 0.0242, + "step": 295840 + }, + { + "epoch": 1.91, + "learning_rate": 1.3577131350161678e-05, + "loss": 0.0236, + "step": 295850 + }, + { + "epoch": 1.91, + "learning_rate": 1.3567449995804746e-05, + "loss": 0.0206, + "step": 295860 + }, + { + "epoch": 1.91, + "learning_rate": 1.3557768641447812e-05, + "loss": 0.0184, + "step": 295870 + }, + { + "epoch": 1.91, + "learning_rate": 1.354808728709088e-05, + "loss": 0.0213, + "step": 295880 + }, + { + "epoch": 1.91, + "learning_rate": 1.353840593273395e-05, + "loss": 0.0209, + "step": 295890 + }, + { + "epoch": 1.91, + "learning_rate": 1.3528724578377016e-05, + "loss": 0.0225, + "step": 295900 + }, + { + "epoch": 1.91, + "learning_rate": 1.3519043224020084e-05, + "loss": 0.0203, + "step": 295910 + }, + { + "epoch": 1.91, + "learning_rate": 1.3509361869663152e-05, + "loss": 0.0206, + "step": 295920 + }, + { + "epoch": 1.91, + "learning_rate": 1.3499680515306221e-05, + "loss": 0.0246, + "step": 295930 + }, + { + "epoch": 1.91, + "learning_rate": 1.3489999160949288e-05, + "loss": 0.0189, + "step": 295940 + }, + { + "epoch": 1.91, + "learning_rate": 1.3480317806592355e-05, + "loss": 0.0229, + "step": 295950 + }, + { + "epoch": 1.91, + "learning_rate": 1.3470636452235423e-05, + "loss": 0.023, + "step": 295960 + }, + { + "epoch": 1.91, + "learning_rate": 1.346095509787849e-05, + "loss": 0.0237, + "step": 295970 + }, + { + "epoch": 1.91, + "learning_rate": 1.345127374352156e-05, + "loss": 0.0212, + "step": 295980 + }, + { + "epoch": 1.91, + "learning_rate": 1.3441592389164627e-05, + "loss": 0.0192, + "step": 295990 + }, + { + "epoch": 1.91, + "learning_rate": 1.3431911034807695e-05, + "loss": 0.0248, + "step": 296000 + }, + { + "epoch": 1.91, + "eval_cer": 0.9198454411930855, + "eval_loss": 0.0166392233222723, + "eval_runtime": 120.6295, + "eval_samples_per_second": 16.58, + "eval_steps_per_second": 4.145, + "step": 296000 + }, + { + "epoch": 1.91, + "learning_rate": 1.3422229680450761e-05, + "loss": 0.0237, + "step": 296010 + }, + { + "epoch": 1.91, + "learning_rate": 1.3412548326093831e-05, + "loss": 0.0253, + "step": 296020 + }, + { + "epoch": 1.91, + "learning_rate": 1.3402866971736899e-05, + "loss": 0.0262, + "step": 296030 + }, + { + "epoch": 1.91, + "learning_rate": 1.3393185617379965e-05, + "loss": 0.0233, + "step": 296040 + }, + { + "epoch": 1.91, + "learning_rate": 1.3383504263023033e-05, + "loss": 0.0249, + "step": 296050 + }, + { + "epoch": 1.91, + "learning_rate": 1.3373822908666103e-05, + "loss": 0.0229, + "step": 296060 + }, + { + "epoch": 1.91, + "learning_rate": 1.336414155430917e-05, + "loss": 0.0212, + "step": 296070 + }, + { + "epoch": 1.91, + "learning_rate": 1.3354460199952237e-05, + "loss": 0.0217, + "step": 296080 + }, + { + "epoch": 1.91, + "learning_rate": 1.3344778845595305e-05, + "loss": 0.0225, + "step": 296090 + }, + { + "epoch": 1.91, + "learning_rate": 1.3335097491238374e-05, + "loss": 0.0216, + "step": 296100 + }, + { + "epoch": 1.91, + "learning_rate": 1.332541613688144e-05, + "loss": 0.0338, + "step": 296110 + }, + { + "epoch": 1.91, + "learning_rate": 1.3315734782524509e-05, + "loss": 0.0252, + "step": 296120 + }, + { + "epoch": 1.91, + "learning_rate": 1.3306053428167577e-05, + "loss": 0.026, + "step": 296130 + }, + { + "epoch": 1.91, + "learning_rate": 1.3296372073810646e-05, + "loss": 0.0255, + "step": 296140 + }, + { + "epoch": 1.91, + "learning_rate": 1.3286690719453712e-05, + "loss": 0.02, + "step": 296150 + }, + { + "epoch": 1.91, + "learning_rate": 1.327700936509678e-05, + "loss": 0.0219, + "step": 296160 + }, + { + "epoch": 1.91, + "learning_rate": 1.3267328010739848e-05, + "loss": 0.029, + "step": 296170 + }, + { + "epoch": 1.91, + "learning_rate": 1.3257646656382915e-05, + "loss": 0.0295, + "step": 296180 + }, + { + "epoch": 1.91, + "learning_rate": 1.3247965302025984e-05, + "loss": 0.019, + "step": 296190 + }, + { + "epoch": 1.91, + "learning_rate": 1.3238283947669052e-05, + "loss": 0.023, + "step": 296200 + }, + { + "epoch": 1.91, + "learning_rate": 1.322860259331212e-05, + "loss": 0.0252, + "step": 296210 + }, + { + "epoch": 1.91, + "learning_rate": 1.3218921238955186e-05, + "loss": 0.023, + "step": 296220 + }, + { + "epoch": 1.91, + "learning_rate": 1.3209239884598254e-05, + "loss": 0.0218, + "step": 296230 + }, + { + "epoch": 1.91, + "learning_rate": 1.3199558530241324e-05, + "loss": 0.0235, + "step": 296240 + }, + { + "epoch": 1.91, + "learning_rate": 1.318987717588439e-05, + "loss": 0.0208, + "step": 296250 + }, + { + "epoch": 1.91, + "learning_rate": 1.3180195821527458e-05, + "loss": 0.0291, + "step": 296260 + }, + { + "epoch": 1.91, + "learning_rate": 1.3170514467170526e-05, + "loss": 0.0206, + "step": 296270 + }, + { + "epoch": 1.91, + "learning_rate": 1.3160833112813596e-05, + "loss": 0.02, + "step": 296280 + }, + { + "epoch": 1.91, + "learning_rate": 1.3151151758456662e-05, + "loss": 0.0203, + "step": 296290 + }, + { + "epoch": 1.91, + "learning_rate": 1.314147040409973e-05, + "loss": 0.0185, + "step": 296300 + }, + { + "epoch": 1.91, + "learning_rate": 1.3131789049742798e-05, + "loss": 0.0194, + "step": 296310 + }, + { + "epoch": 1.91, + "learning_rate": 1.3122107695385864e-05, + "loss": 0.02, + "step": 296320 + }, + { + "epoch": 1.91, + "learning_rate": 1.3112426341028934e-05, + "loss": 0.0204, + "step": 296330 + }, + { + "epoch": 1.91, + "learning_rate": 1.3102744986672001e-05, + "loss": 0.0233, + "step": 296340 + }, + { + "epoch": 1.91, + "learning_rate": 1.3093063632315068e-05, + "loss": 0.0207, + "step": 296350 + }, + { + "epoch": 1.91, + "learning_rate": 1.3083382277958136e-05, + "loss": 0.0237, + "step": 296360 + }, + { + "epoch": 1.91, + "learning_rate": 1.3073700923601205e-05, + "loss": 0.0223, + "step": 296370 + }, + { + "epoch": 1.91, + "learning_rate": 1.3064019569244273e-05, + "loss": 0.0239, + "step": 296380 + }, + { + "epoch": 1.91, + "learning_rate": 1.305433821488734e-05, + "loss": 0.0223, + "step": 296390 + }, + { + "epoch": 1.91, + "learning_rate": 1.3044656860530407e-05, + "loss": 0.0195, + "step": 296400 + }, + { + "epoch": 1.91, + "learning_rate": 1.3034975506173477e-05, + "loss": 0.0217, + "step": 296410 + }, + { + "epoch": 1.91, + "learning_rate": 1.3025294151816543e-05, + "loss": 0.0233, + "step": 296420 + }, + { + "epoch": 1.91, + "learning_rate": 1.3015612797459611e-05, + "loss": 0.0239, + "step": 296430 + }, + { + "epoch": 1.91, + "learning_rate": 1.3005931443102679e-05, + "loss": 0.0224, + "step": 296440 + }, + { + "epoch": 1.91, + "learning_rate": 1.2996250088745749e-05, + "loss": 0.0272, + "step": 296450 + }, + { + "epoch": 1.91, + "learning_rate": 1.2986568734388815e-05, + "loss": 0.0196, + "step": 296460 + }, + { + "epoch": 1.91, + "learning_rate": 1.2976887380031883e-05, + "loss": 0.0212, + "step": 296470 + }, + { + "epoch": 1.91, + "learning_rate": 1.2967206025674951e-05, + "loss": 0.0231, + "step": 296480 + }, + { + "epoch": 1.91, + "learning_rate": 1.2957524671318017e-05, + "loss": 0.0241, + "step": 296490 + }, + { + "epoch": 1.91, + "learning_rate": 1.2947843316961087e-05, + "loss": 0.0253, + "step": 296500 + }, + { + "epoch": 1.91, + "learning_rate": 1.2938161962604155e-05, + "loss": 0.0226, + "step": 296510 + }, + { + "epoch": 1.91, + "learning_rate": 1.2928480608247223e-05, + "loss": 0.0209, + "step": 296520 + }, + { + "epoch": 1.91, + "learning_rate": 1.2918799253890289e-05, + "loss": 0.022, + "step": 296530 + }, + { + "epoch": 1.91, + "learning_rate": 1.2909117899533357e-05, + "loss": 0.0267, + "step": 296540 + }, + { + "epoch": 1.91, + "learning_rate": 1.2899436545176426e-05, + "loss": 0.0271, + "step": 296550 + }, + { + "epoch": 1.91, + "learning_rate": 1.2889755190819493e-05, + "loss": 0.0235, + "step": 296560 + }, + { + "epoch": 1.91, + "learning_rate": 1.288007383646256e-05, + "loss": 0.0216, + "step": 296570 + }, + { + "epoch": 1.91, + "learning_rate": 1.2870392482105628e-05, + "loss": 0.0209, + "step": 296580 + }, + { + "epoch": 1.91, + "learning_rate": 1.2860711127748698e-05, + "loss": 0.0203, + "step": 296590 + }, + { + "epoch": 1.91, + "learning_rate": 1.2851029773391764e-05, + "loss": 0.0266, + "step": 296600 + }, + { + "epoch": 1.91, + "learning_rate": 1.2841348419034832e-05, + "loss": 0.0207, + "step": 296610 + }, + { + "epoch": 1.91, + "learning_rate": 1.28316670646779e-05, + "loss": 0.0193, + "step": 296620 + }, + { + "epoch": 1.91, + "learning_rate": 1.2821985710320966e-05, + "loss": 0.0222, + "step": 296630 + }, + { + "epoch": 1.91, + "learning_rate": 1.2812304355964036e-05, + "loss": 0.0186, + "step": 296640 + }, + { + "epoch": 1.91, + "learning_rate": 1.2802623001607104e-05, + "loss": 0.0234, + "step": 296650 + }, + { + "epoch": 1.91, + "learning_rate": 1.2792941647250172e-05, + "loss": 0.0251, + "step": 296660 + }, + { + "epoch": 1.91, + "learning_rate": 1.2783260292893238e-05, + "loss": 0.0232, + "step": 296670 + }, + { + "epoch": 1.91, + "learning_rate": 1.2773578938536308e-05, + "loss": 0.0194, + "step": 296680 + }, + { + "epoch": 1.91, + "learning_rate": 1.2763897584179376e-05, + "loss": 0.0199, + "step": 296690 + }, + { + "epoch": 1.91, + "learning_rate": 1.2754216229822442e-05, + "loss": 0.0249, + "step": 296700 + }, + { + "epoch": 1.92, + "learning_rate": 1.274453487546551e-05, + "loss": 0.0237, + "step": 296710 + }, + { + "epoch": 1.92, + "learning_rate": 1.273485352110858e-05, + "loss": 0.0235, + "step": 296720 + }, + { + "epoch": 1.92, + "learning_rate": 1.2725172166751647e-05, + "loss": 0.0201, + "step": 296730 + }, + { + "epoch": 1.92, + "learning_rate": 1.2715490812394714e-05, + "loss": 0.0235, + "step": 296740 + }, + { + "epoch": 1.92, + "learning_rate": 1.2705809458037782e-05, + "loss": 0.0195, + "step": 296750 + }, + { + "epoch": 1.92, + "learning_rate": 1.2696128103680851e-05, + "loss": 0.0235, + "step": 296760 + }, + { + "epoch": 1.92, + "learning_rate": 1.2686446749323918e-05, + "loss": 0.0216, + "step": 296770 + }, + { + "epoch": 1.92, + "learning_rate": 1.2676765394966985e-05, + "loss": 0.0268, + "step": 296780 + }, + { + "epoch": 1.92, + "learning_rate": 1.2667084040610053e-05, + "loss": 0.0176, + "step": 296790 + }, + { + "epoch": 1.92, + "learning_rate": 1.265740268625312e-05, + "loss": 0.024, + "step": 296800 + }, + { + "epoch": 1.92, + "learning_rate": 1.264772133189619e-05, + "loss": 0.0251, + "step": 296810 + }, + { + "epoch": 1.92, + "learning_rate": 1.2638039977539257e-05, + "loss": 0.0245, + "step": 296820 + }, + { + "epoch": 1.92, + "learning_rate": 1.2628358623182325e-05, + "loss": 0.0282, + "step": 296830 + }, + { + "epoch": 1.92, + "learning_rate": 1.2618677268825391e-05, + "loss": 0.0229, + "step": 296840 + }, + { + "epoch": 1.92, + "learning_rate": 1.2608995914468461e-05, + "loss": 0.0189, + "step": 296850 + }, + { + "epoch": 1.92, + "learning_rate": 1.2599314560111529e-05, + "loss": 0.0247, + "step": 296860 + }, + { + "epoch": 1.92, + "learning_rate": 1.2589633205754595e-05, + "loss": 0.0258, + "step": 296870 + }, + { + "epoch": 1.92, + "learning_rate": 1.2579951851397663e-05, + "loss": 0.0289, + "step": 296880 + }, + { + "epoch": 1.92, + "learning_rate": 1.2570270497040731e-05, + "loss": 0.0298, + "step": 296890 + }, + { + "epoch": 1.92, + "learning_rate": 1.25605891426838e-05, + "loss": 0.0228, + "step": 296900 + }, + { + "epoch": 1.92, + "learning_rate": 1.2550907788326867e-05, + "loss": 0.0247, + "step": 296910 + }, + { + "epoch": 1.92, + "learning_rate": 1.2541226433969935e-05, + "loss": 0.0251, + "step": 296920 + }, + { + "epoch": 1.92, + "learning_rate": 1.2531545079613003e-05, + "loss": 0.0191, + "step": 296930 + }, + { + "epoch": 1.92, + "learning_rate": 1.2521863725256069e-05, + "loss": 0.0229, + "step": 296940 + }, + { + "epoch": 1.92, + "learning_rate": 1.2512182370899139e-05, + "loss": 0.0236, + "step": 296950 + }, + { + "epoch": 1.92, + "learning_rate": 1.2502501016542207e-05, + "loss": 0.0159, + "step": 296960 + }, + { + "epoch": 1.92, + "learning_rate": 1.2492819662185275e-05, + "loss": 0.0254, + "step": 296970 + }, + { + "epoch": 1.92, + "learning_rate": 1.248313830782834e-05, + "loss": 0.0226, + "step": 296980 + }, + { + "epoch": 1.92, + "learning_rate": 1.247345695347141e-05, + "loss": 0.0248, + "step": 296990 + }, + { + "epoch": 1.92, + "learning_rate": 1.2463775599114478e-05, + "loss": 0.0216, + "step": 297000 + }, + { + "epoch": 1.92, + "eval_cer": 0.9198427296350695, + "eval_loss": 0.016580868512392044, + "eval_runtime": 120.5977, + "eval_samples_per_second": 16.584, + "eval_steps_per_second": 4.146, + "step": 297000 + }, + { + "epoch": 1.92, + "learning_rate": 1.2454094244757545e-05, + "loss": 0.0207, + "step": 297010 + }, + { + "epoch": 1.92, + "learning_rate": 1.2444412890400612e-05, + "loss": 0.0212, + "step": 297020 + }, + { + "epoch": 1.92, + "learning_rate": 1.2434731536043682e-05, + "loss": 0.0192, + "step": 297030 + }, + { + "epoch": 1.92, + "learning_rate": 1.242505018168675e-05, + "loss": 0.0201, + "step": 297040 + }, + { + "epoch": 1.92, + "learning_rate": 1.2415368827329816e-05, + "loss": 0.0199, + "step": 297050 + }, + { + "epoch": 1.92, + "learning_rate": 1.2405687472972884e-05, + "loss": 0.024, + "step": 297060 + }, + { + "epoch": 1.92, + "learning_rate": 1.2396006118615954e-05, + "loss": 0.0193, + "step": 297070 + }, + { + "epoch": 1.92, + "learning_rate": 1.238632476425902e-05, + "loss": 0.0257, + "step": 297080 + }, + { + "epoch": 1.92, + "learning_rate": 1.2376643409902088e-05, + "loss": 0.0252, + "step": 297090 + }, + { + "epoch": 1.92, + "learning_rate": 1.2366962055545156e-05, + "loss": 0.0248, + "step": 297100 + }, + { + "epoch": 1.92, + "learning_rate": 1.2357280701188226e-05, + "loss": 0.026, + "step": 297110 + }, + { + "epoch": 1.92, + "learning_rate": 1.2347599346831292e-05, + "loss": 0.0227, + "step": 297120 + }, + { + "epoch": 1.92, + "learning_rate": 1.233791799247436e-05, + "loss": 0.0298, + "step": 297130 + }, + { + "epoch": 1.92, + "learning_rate": 1.2328236638117428e-05, + "loss": 0.0227, + "step": 297140 + }, + { + "epoch": 1.92, + "learning_rate": 1.2318555283760494e-05, + "loss": 0.019, + "step": 297150 + }, + { + "epoch": 1.92, + "learning_rate": 1.2308873929403564e-05, + "loss": 0.0174, + "step": 297160 + }, + { + "epoch": 1.92, + "learning_rate": 1.2299192575046631e-05, + "loss": 0.021, + "step": 297170 + }, + { + "epoch": 1.92, + "learning_rate": 1.2289511220689698e-05, + "loss": 0.0208, + "step": 297180 + }, + { + "epoch": 1.92, + "learning_rate": 1.2279829866332766e-05, + "loss": 0.0207, + "step": 297190 + }, + { + "epoch": 1.92, + "learning_rate": 1.2270148511975835e-05, + "loss": 0.0237, + "step": 297200 + }, + { + "epoch": 1.92, + "learning_rate": 1.2260467157618903e-05, + "loss": 0.0219, + "step": 297210 + }, + { + "epoch": 1.92, + "learning_rate": 1.225078580326197e-05, + "loss": 0.0228, + "step": 297220 + }, + { + "epoch": 1.92, + "learning_rate": 1.2241104448905037e-05, + "loss": 0.0237, + "step": 297230 + }, + { + "epoch": 1.92, + "learning_rate": 1.2231423094548105e-05, + "loss": 0.0242, + "step": 297240 + }, + { + "epoch": 1.92, + "learning_rate": 1.2221741740191173e-05, + "loss": 0.0247, + "step": 297250 + }, + { + "epoch": 1.92, + "learning_rate": 1.2212060385834241e-05, + "loss": 0.0206, + "step": 297260 + }, + { + "epoch": 1.92, + "learning_rate": 1.2202379031477309e-05, + "loss": 0.0212, + "step": 297270 + }, + { + "epoch": 1.92, + "learning_rate": 1.2192697677120377e-05, + "loss": 0.0199, + "step": 297280 + }, + { + "epoch": 1.92, + "learning_rate": 1.2183016322763443e-05, + "loss": 0.0243, + "step": 297290 + }, + { + "epoch": 1.92, + "learning_rate": 1.2173334968406513e-05, + "loss": 0.0228, + "step": 297300 + }, + { + "epoch": 1.92, + "learning_rate": 1.216365361404958e-05, + "loss": 0.0194, + "step": 297310 + }, + { + "epoch": 1.92, + "learning_rate": 1.2153972259692647e-05, + "loss": 0.0244, + "step": 297320 + }, + { + "epoch": 1.92, + "learning_rate": 1.2144290905335715e-05, + "loss": 0.018, + "step": 297330 + }, + { + "epoch": 1.92, + "learning_rate": 1.2134609550978785e-05, + "loss": 0.0212, + "step": 297340 + }, + { + "epoch": 1.92, + "learning_rate": 1.2124928196621853e-05, + "loss": 0.0193, + "step": 297350 + }, + { + "epoch": 1.92, + "learning_rate": 1.2115246842264919e-05, + "loss": 0.0216, + "step": 297360 + }, + { + "epoch": 1.92, + "learning_rate": 1.2105565487907987e-05, + "loss": 0.0212, + "step": 297370 + }, + { + "epoch": 1.92, + "learning_rate": 1.2095884133551056e-05, + "loss": 0.02, + "step": 297380 + }, + { + "epoch": 1.92, + "learning_rate": 1.2086202779194123e-05, + "loss": 0.0264, + "step": 297390 + }, + { + "epoch": 1.92, + "learning_rate": 1.207652142483719e-05, + "loss": 0.0254, + "step": 297400 + }, + { + "epoch": 1.92, + "learning_rate": 1.2066840070480258e-05, + "loss": 0.0188, + "step": 297410 + }, + { + "epoch": 1.92, + "learning_rate": 1.2057158716123328e-05, + "loss": 0.021, + "step": 297420 + }, + { + "epoch": 1.92, + "learning_rate": 1.2047477361766394e-05, + "loss": 0.0204, + "step": 297430 + }, + { + "epoch": 1.92, + "learning_rate": 1.2037796007409462e-05, + "loss": 0.0217, + "step": 297440 + }, + { + "epoch": 1.92, + "learning_rate": 1.202811465305253e-05, + "loss": 0.0248, + "step": 297450 + }, + { + "epoch": 1.92, + "learning_rate": 1.2018433298695596e-05, + "loss": 0.0178, + "step": 297460 + }, + { + "epoch": 1.92, + "learning_rate": 1.2008751944338666e-05, + "loss": 0.0229, + "step": 297470 + }, + { + "epoch": 1.92, + "learning_rate": 1.1999070589981734e-05, + "loss": 0.0255, + "step": 297480 + }, + { + "epoch": 1.92, + "learning_rate": 1.1989389235624802e-05, + "loss": 0.0208, + "step": 297490 + }, + { + "epoch": 1.92, + "learning_rate": 1.1979707881267868e-05, + "loss": 0.0227, + "step": 297500 + }, + { + "epoch": 1.92, + "learning_rate": 1.1970026526910938e-05, + "loss": 0.0264, + "step": 297510 + }, + { + "epoch": 1.92, + "learning_rate": 1.1960345172554006e-05, + "loss": 0.0219, + "step": 297520 + }, + { + "epoch": 1.92, + "learning_rate": 1.1950663818197072e-05, + "loss": 0.0216, + "step": 297530 + }, + { + "epoch": 1.92, + "learning_rate": 1.194098246384014e-05, + "loss": 0.0235, + "step": 297540 + }, + { + "epoch": 1.92, + "learning_rate": 1.1931301109483208e-05, + "loss": 0.0202, + "step": 297550 + }, + { + "epoch": 1.92, + "learning_rate": 1.1921619755126277e-05, + "loss": 0.021, + "step": 297560 + }, + { + "epoch": 1.92, + "learning_rate": 1.1911938400769344e-05, + "loss": 0.0188, + "step": 297570 + }, + { + "epoch": 1.92, + "learning_rate": 1.1902257046412412e-05, + "loss": 0.02, + "step": 297580 + }, + { + "epoch": 1.92, + "learning_rate": 1.189257569205548e-05, + "loss": 0.0232, + "step": 297590 + }, + { + "epoch": 1.92, + "learning_rate": 1.1882894337698546e-05, + "loss": 0.0186, + "step": 297600 + }, + { + "epoch": 1.92, + "learning_rate": 1.1873212983341615e-05, + "loss": 0.0199, + "step": 297610 + }, + { + "epoch": 1.92, + "learning_rate": 1.1863531628984683e-05, + "loss": 0.0213, + "step": 297620 + }, + { + "epoch": 1.92, + "learning_rate": 1.185385027462775e-05, + "loss": 0.0192, + "step": 297630 + }, + { + "epoch": 1.92, + "learning_rate": 1.1844168920270818e-05, + "loss": 0.0224, + "step": 297640 + }, + { + "epoch": 1.92, + "learning_rate": 1.1834487565913887e-05, + "loss": 0.0207, + "step": 297650 + }, + { + "epoch": 1.92, + "learning_rate": 1.1824806211556955e-05, + "loss": 0.0227, + "step": 297660 + }, + { + "epoch": 1.92, + "learning_rate": 1.1815124857200021e-05, + "loss": 0.0211, + "step": 297670 + }, + { + "epoch": 1.92, + "learning_rate": 1.180544350284309e-05, + "loss": 0.0216, + "step": 297680 + }, + { + "epoch": 1.92, + "learning_rate": 1.1795762148486159e-05, + "loss": 0.0202, + "step": 297690 + }, + { + "epoch": 1.92, + "learning_rate": 1.1786080794129225e-05, + "loss": 0.022, + "step": 297700 + }, + { + "epoch": 1.92, + "learning_rate": 1.1776399439772293e-05, + "loss": 0.0207, + "step": 297710 + }, + { + "epoch": 1.92, + "learning_rate": 1.1766718085415361e-05, + "loss": 0.022, + "step": 297720 + }, + { + "epoch": 1.92, + "learning_rate": 1.175703673105843e-05, + "loss": 0.0235, + "step": 297730 + }, + { + "epoch": 1.92, + "learning_rate": 1.1747355376701497e-05, + "loss": 0.0213, + "step": 297740 + }, + { + "epoch": 1.92, + "learning_rate": 1.1737674022344565e-05, + "loss": 0.0201, + "step": 297750 + }, + { + "epoch": 1.92, + "learning_rate": 1.1727992667987633e-05, + "loss": 0.0202, + "step": 297760 + }, + { + "epoch": 1.92, + "learning_rate": 1.1718311313630699e-05, + "loss": 0.0219, + "step": 297770 + }, + { + "epoch": 1.92, + "learning_rate": 1.1708629959273769e-05, + "loss": 0.023, + "step": 297780 + }, + { + "epoch": 1.92, + "learning_rate": 1.1698948604916837e-05, + "loss": 0.0198, + "step": 297790 + }, + { + "epoch": 1.92, + "learning_rate": 1.1689267250559904e-05, + "loss": 0.0198, + "step": 297800 + }, + { + "epoch": 1.92, + "learning_rate": 1.167958589620297e-05, + "loss": 0.0183, + "step": 297810 + }, + { + "epoch": 1.92, + "learning_rate": 1.166990454184604e-05, + "loss": 0.0251, + "step": 297820 + }, + { + "epoch": 1.92, + "learning_rate": 1.1660223187489108e-05, + "loss": 0.0203, + "step": 297830 + }, + { + "epoch": 1.92, + "learning_rate": 1.1650541833132175e-05, + "loss": 0.0233, + "step": 297840 + }, + { + "epoch": 1.92, + "learning_rate": 1.1640860478775242e-05, + "loss": 0.0203, + "step": 297850 + }, + { + "epoch": 1.92, + "learning_rate": 1.1631179124418312e-05, + "loss": 0.0225, + "step": 297860 + }, + { + "epoch": 1.92, + "learning_rate": 1.162149777006138e-05, + "loss": 0.0213, + "step": 297870 + }, + { + "epoch": 1.92, + "learning_rate": 1.1611816415704446e-05, + "loss": 0.0226, + "step": 297880 + }, + { + "epoch": 1.92, + "learning_rate": 1.1602135061347514e-05, + "loss": 0.0193, + "step": 297890 + }, + { + "epoch": 1.92, + "learning_rate": 1.1592453706990582e-05, + "loss": 0.0256, + "step": 297900 + }, + { + "epoch": 1.92, + "learning_rate": 1.158277235263365e-05, + "loss": 0.0239, + "step": 297910 + }, + { + "epoch": 1.92, + "learning_rate": 1.1573090998276718e-05, + "loss": 0.0244, + "step": 297920 + }, + { + "epoch": 1.92, + "learning_rate": 1.1563409643919786e-05, + "loss": 0.0176, + "step": 297930 + }, + { + "epoch": 1.92, + "learning_rate": 1.1553728289562854e-05, + "loss": 0.0206, + "step": 297940 + }, + { + "epoch": 1.92, + "learning_rate": 1.154404693520592e-05, + "loss": 0.0201, + "step": 297950 + }, + { + "epoch": 1.92, + "learning_rate": 1.153436558084899e-05, + "loss": 0.0205, + "step": 297960 + }, + { + "epoch": 1.92, + "learning_rate": 1.1524684226492058e-05, + "loss": 0.0181, + "step": 297970 + }, + { + "epoch": 1.92, + "learning_rate": 1.1515002872135124e-05, + "loss": 0.0254, + "step": 297980 + }, + { + "epoch": 1.92, + "learning_rate": 1.1505321517778192e-05, + "loss": 0.0255, + "step": 297990 + }, + { + "epoch": 1.92, + "learning_rate": 1.1495640163421261e-05, + "loss": 0.0219, + "step": 298000 + }, + { + "epoch": 1.92, + "eval_cer": 0.9198427296350695, + "eval_loss": 0.016680259257555008, + "eval_runtime": 120.6259, + "eval_samples_per_second": 16.58, + "eval_steps_per_second": 4.145, + "step": 298000 + }, + { + "epoch": 1.92, + "learning_rate": 1.148595880906433e-05, + "loss": 0.0187, + "step": 298010 + }, + { + "epoch": 1.92, + "learning_rate": 1.1476277454707396e-05, + "loss": 0.03, + "step": 298020 + }, + { + "epoch": 1.92, + "learning_rate": 1.1466596100350464e-05, + "loss": 0.0263, + "step": 298030 + }, + { + "epoch": 1.92, + "learning_rate": 1.1456914745993533e-05, + "loss": 0.0191, + "step": 298040 + }, + { + "epoch": 1.92, + "learning_rate": 1.14472333916366e-05, + "loss": 0.0175, + "step": 298050 + }, + { + "epoch": 1.92, + "learning_rate": 1.1437552037279667e-05, + "loss": 0.0223, + "step": 298060 + }, + { + "epoch": 1.92, + "learning_rate": 1.1427870682922735e-05, + "loss": 0.0195, + "step": 298070 + }, + { + "epoch": 1.92, + "learning_rate": 1.1418189328565802e-05, + "loss": 0.0282, + "step": 298080 + }, + { + "epoch": 1.92, + "learning_rate": 1.1408507974208871e-05, + "loss": 0.0231, + "step": 298090 + }, + { + "epoch": 1.92, + "learning_rate": 1.1398826619851939e-05, + "loss": 0.0211, + "step": 298100 + }, + { + "epoch": 1.92, + "learning_rate": 1.1389145265495007e-05, + "loss": 0.0215, + "step": 298110 + }, + { + "epoch": 1.92, + "learning_rate": 1.1379463911138073e-05, + "loss": 0.0199, + "step": 298120 + }, + { + "epoch": 1.92, + "learning_rate": 1.1369782556781143e-05, + "loss": 0.0235, + "step": 298130 + }, + { + "epoch": 1.92, + "learning_rate": 1.136010120242421e-05, + "loss": 0.0212, + "step": 298140 + }, + { + "epoch": 1.92, + "learning_rate": 1.1350419848067277e-05, + "loss": 0.0223, + "step": 298150 + }, + { + "epoch": 1.92, + "learning_rate": 1.1340738493710345e-05, + "loss": 0.0227, + "step": 298160 + }, + { + "epoch": 1.92, + "learning_rate": 1.1331057139353415e-05, + "loss": 0.0268, + "step": 298170 + }, + { + "epoch": 1.92, + "learning_rate": 1.1321375784996483e-05, + "loss": 0.0245, + "step": 298180 + }, + { + "epoch": 1.92, + "learning_rate": 1.1311694430639549e-05, + "loss": 0.0241, + "step": 298190 + }, + { + "epoch": 1.92, + "learning_rate": 1.1302013076282617e-05, + "loss": 0.0235, + "step": 298200 + }, + { + "epoch": 1.92, + "learning_rate": 1.1292331721925685e-05, + "loss": 0.0226, + "step": 298210 + }, + { + "epoch": 1.92, + "learning_rate": 1.1282650367568753e-05, + "loss": 0.0226, + "step": 298220 + }, + { + "epoch": 1.92, + "learning_rate": 1.127296901321182e-05, + "loss": 0.0215, + "step": 298230 + }, + { + "epoch": 1.92, + "learning_rate": 1.1263287658854888e-05, + "loss": 0.0207, + "step": 298240 + }, + { + "epoch": 1.92, + "learning_rate": 1.1253606304497956e-05, + "loss": 0.0263, + "step": 298250 + }, + { + "epoch": 1.93, + "learning_rate": 1.1243924950141024e-05, + "loss": 0.017, + "step": 298260 + }, + { + "epoch": 1.93, + "learning_rate": 1.1234243595784092e-05, + "loss": 0.0208, + "step": 298270 + }, + { + "epoch": 1.93, + "learning_rate": 1.122456224142716e-05, + "loss": 0.0195, + "step": 298280 + }, + { + "epoch": 1.93, + "learning_rate": 1.1214880887070226e-05, + "loss": 0.0226, + "step": 298290 + }, + { + "epoch": 1.93, + "learning_rate": 1.1205199532713294e-05, + "loss": 0.0227, + "step": 298300 + }, + { + "epoch": 1.93, + "learning_rate": 1.1195518178356364e-05, + "loss": 0.0214, + "step": 298310 + }, + { + "epoch": 1.93, + "learning_rate": 1.1185836823999432e-05, + "loss": 0.0223, + "step": 298320 + }, + { + "epoch": 1.93, + "learning_rate": 1.1176155469642498e-05, + "loss": 0.0196, + "step": 298330 + }, + { + "epoch": 1.93, + "learning_rate": 1.1166474115285566e-05, + "loss": 0.0201, + "step": 298340 + }, + { + "epoch": 1.93, + "learning_rate": 1.1156792760928636e-05, + "loss": 0.0247, + "step": 298350 + }, + { + "epoch": 1.93, + "learning_rate": 1.1147111406571702e-05, + "loss": 0.0213, + "step": 298360 + }, + { + "epoch": 1.93, + "learning_rate": 1.113743005221477e-05, + "loss": 0.0186, + "step": 298370 + }, + { + "epoch": 1.93, + "learning_rate": 1.1127748697857838e-05, + "loss": 0.0248, + "step": 298380 + }, + { + "epoch": 1.93, + "learning_rate": 1.1118067343500907e-05, + "loss": 0.0233, + "step": 298390 + }, + { + "epoch": 1.93, + "learning_rate": 1.1108385989143974e-05, + "loss": 0.0223, + "step": 298400 + }, + { + "epoch": 1.93, + "learning_rate": 1.1098704634787042e-05, + "loss": 0.0181, + "step": 298410 + }, + { + "epoch": 1.93, + "learning_rate": 1.108902328043011e-05, + "loss": 0.028, + "step": 298420 + }, + { + "epoch": 1.93, + "learning_rate": 1.1079341926073176e-05, + "loss": 0.0232, + "step": 298430 + }, + { + "epoch": 1.93, + "learning_rate": 1.1069660571716245e-05, + "loss": 0.0208, + "step": 298440 + }, + { + "epoch": 1.93, + "learning_rate": 1.1059979217359313e-05, + "loss": 0.0208, + "step": 298450 + }, + { + "epoch": 1.93, + "learning_rate": 1.1050297863002381e-05, + "loss": 0.0261, + "step": 298460 + }, + { + "epoch": 1.93, + "learning_rate": 1.1040616508645448e-05, + "loss": 0.0188, + "step": 298470 + }, + { + "epoch": 1.93, + "learning_rate": 1.1030935154288517e-05, + "loss": 0.0239, + "step": 298480 + }, + { + "epoch": 1.93, + "learning_rate": 1.1021253799931585e-05, + "loss": 0.0229, + "step": 298490 + }, + { + "epoch": 1.93, + "learning_rate": 1.1011572445574651e-05, + "loss": 0.0221, + "step": 298500 + }, + { + "epoch": 1.93, + "learning_rate": 1.100189109121772e-05, + "loss": 0.0272, + "step": 298510 + }, + { + "epoch": 1.93, + "learning_rate": 1.0992209736860789e-05, + "loss": 0.0209, + "step": 298520 + }, + { + "epoch": 1.93, + "learning_rate": 1.0982528382503855e-05, + "loss": 0.0198, + "step": 298530 + }, + { + "epoch": 1.93, + "learning_rate": 1.0972847028146923e-05, + "loss": 0.0294, + "step": 298540 + }, + { + "epoch": 1.93, + "learning_rate": 1.0963165673789991e-05, + "loss": 0.0203, + "step": 298550 + }, + { + "epoch": 1.93, + "learning_rate": 1.0953484319433059e-05, + "loss": 0.0201, + "step": 298560 + }, + { + "epoch": 1.93, + "learning_rate": 1.0943802965076127e-05, + "loss": 0.0175, + "step": 298570 + }, + { + "epoch": 1.93, + "learning_rate": 1.0934121610719195e-05, + "loss": 0.0222, + "step": 298580 + }, + { + "epoch": 1.93, + "learning_rate": 1.0924440256362263e-05, + "loss": 0.0197, + "step": 298590 + }, + { + "epoch": 1.93, + "learning_rate": 1.0914758902005329e-05, + "loss": 0.0225, + "step": 298600 + }, + { + "epoch": 1.93, + "learning_rate": 1.0905077547648397e-05, + "loss": 0.0239, + "step": 298610 + }, + { + "epoch": 1.93, + "learning_rate": 1.0895396193291467e-05, + "loss": 0.0198, + "step": 298620 + }, + { + "epoch": 1.93, + "learning_rate": 1.0885714838934534e-05, + "loss": 0.0211, + "step": 298630 + }, + { + "epoch": 1.93, + "learning_rate": 1.08760334845776e-05, + "loss": 0.0175, + "step": 298640 + }, + { + "epoch": 1.93, + "learning_rate": 1.0866352130220669e-05, + "loss": 0.0241, + "step": 298650 + }, + { + "epoch": 1.93, + "learning_rate": 1.0856670775863738e-05, + "loss": 0.0235, + "step": 298660 + }, + { + "epoch": 1.93, + "learning_rate": 1.0846989421506805e-05, + "loss": 0.0159, + "step": 298670 + }, + { + "epoch": 1.93, + "learning_rate": 1.0837308067149872e-05, + "loss": 0.0202, + "step": 298680 + }, + { + "epoch": 1.93, + "learning_rate": 1.082762671279294e-05, + "loss": 0.0204, + "step": 298690 + }, + { + "epoch": 1.93, + "learning_rate": 1.081794535843601e-05, + "loss": 0.0171, + "step": 298700 + }, + { + "epoch": 1.93, + "learning_rate": 1.0808264004079076e-05, + "loss": 0.0228, + "step": 298710 + }, + { + "epoch": 1.93, + "learning_rate": 1.0798582649722144e-05, + "loss": 0.0224, + "step": 298720 + }, + { + "epoch": 1.93, + "learning_rate": 1.0788901295365212e-05, + "loss": 0.0227, + "step": 298730 + }, + { + "epoch": 1.93, + "learning_rate": 1.0779219941008278e-05, + "loss": 0.0221, + "step": 298740 + }, + { + "epoch": 1.93, + "learning_rate": 1.0769538586651348e-05, + "loss": 0.0221, + "step": 298750 + }, + { + "epoch": 1.93, + "learning_rate": 1.0759857232294416e-05, + "loss": 0.0202, + "step": 298760 + }, + { + "epoch": 1.93, + "learning_rate": 1.0750175877937484e-05, + "loss": 0.0215, + "step": 298770 + }, + { + "epoch": 1.93, + "learning_rate": 1.074049452358055e-05, + "loss": 0.0203, + "step": 298780 + }, + { + "epoch": 1.93, + "learning_rate": 1.073081316922362e-05, + "loss": 0.0256, + "step": 298790 + }, + { + "epoch": 1.93, + "learning_rate": 1.0721131814866688e-05, + "loss": 0.0236, + "step": 298800 + }, + { + "epoch": 1.93, + "learning_rate": 1.0711450460509754e-05, + "loss": 0.0193, + "step": 298810 + }, + { + "epoch": 1.93, + "learning_rate": 1.0701769106152822e-05, + "loss": 0.0202, + "step": 298820 + }, + { + "epoch": 1.93, + "learning_rate": 1.0692087751795891e-05, + "loss": 0.0255, + "step": 298830 + }, + { + "epoch": 1.93, + "learning_rate": 1.068240639743896e-05, + "loss": 0.0237, + "step": 298840 + }, + { + "epoch": 1.93, + "learning_rate": 1.0672725043082026e-05, + "loss": 0.025, + "step": 298850 + }, + { + "epoch": 1.93, + "learning_rate": 1.0663043688725094e-05, + "loss": 0.022, + "step": 298860 + }, + { + "epoch": 1.93, + "learning_rate": 1.0653362334368163e-05, + "loss": 0.0226, + "step": 298870 + }, + { + "epoch": 1.93, + "learning_rate": 1.064368098001123e-05, + "loss": 0.0225, + "step": 298880 + }, + { + "epoch": 1.93, + "learning_rate": 1.0633999625654297e-05, + "loss": 0.02, + "step": 298890 + }, + { + "epoch": 1.93, + "learning_rate": 1.0624318271297365e-05, + "loss": 0.0225, + "step": 298900 + }, + { + "epoch": 1.93, + "learning_rate": 1.0614636916940432e-05, + "loss": 0.0183, + "step": 298910 + }, + { + "epoch": 1.93, + "learning_rate": 1.0604955562583501e-05, + "loss": 0.0266, + "step": 298920 + }, + { + "epoch": 1.93, + "learning_rate": 1.0595274208226569e-05, + "loss": 0.0196, + "step": 298930 + }, + { + "epoch": 1.93, + "learning_rate": 1.0585592853869637e-05, + "loss": 0.0203, + "step": 298940 + }, + { + "epoch": 1.93, + "learning_rate": 1.0575911499512703e-05, + "loss": 0.0192, + "step": 298950 + }, + { + "epoch": 1.93, + "learning_rate": 1.0566230145155771e-05, + "loss": 0.0213, + "step": 298960 + }, + { + "epoch": 1.93, + "learning_rate": 1.055654879079884e-05, + "loss": 0.0228, + "step": 298970 + }, + { + "epoch": 1.93, + "learning_rate": 1.0546867436441907e-05, + "loss": 0.0177, + "step": 298980 + }, + { + "epoch": 1.93, + "learning_rate": 1.0537186082084975e-05, + "loss": 0.023, + "step": 298990 + }, + { + "epoch": 1.93, + "learning_rate": 1.0527504727728043e-05, + "loss": 0.0196, + "step": 299000 + }, + { + "epoch": 1.93, + "eval_cer": 0.919811998644221, + "eval_loss": 0.016669558361172676, + "eval_runtime": 120.4327, + "eval_samples_per_second": 16.607, + "eval_steps_per_second": 4.152, + "step": 299000 + }, + { + "epoch": 1.93, + "learning_rate": 1.0517823373371113e-05, + "loss": 0.0249, + "step": 299010 + }, + { + "epoch": 1.93, + "learning_rate": 1.0508142019014179e-05, + "loss": 0.0218, + "step": 299020 + }, + { + "epoch": 1.93, + "learning_rate": 1.0498460664657247e-05, + "loss": 0.0258, + "step": 299030 + }, + { + "epoch": 1.93, + "learning_rate": 1.0488779310300315e-05, + "loss": 0.0226, + "step": 299040 + }, + { + "epoch": 1.93, + "learning_rate": 1.0479097955943381e-05, + "loss": 0.021, + "step": 299050 + }, + { + "epoch": 1.93, + "learning_rate": 1.046941660158645e-05, + "loss": 0.0235, + "step": 299060 + }, + { + "epoch": 1.93, + "learning_rate": 1.0459735247229518e-05, + "loss": 0.0238, + "step": 299070 + }, + { + "epoch": 1.93, + "learning_rate": 1.0450053892872586e-05, + "loss": 0.0196, + "step": 299080 + }, + { + "epoch": 1.93, + "learning_rate": 1.0440372538515653e-05, + "loss": 0.0235, + "step": 299090 + }, + { + "epoch": 1.93, + "learning_rate": 1.0430691184158722e-05, + "loss": 0.0226, + "step": 299100 + }, + { + "epoch": 1.93, + "learning_rate": 1.042100982980179e-05, + "loss": 0.0227, + "step": 299110 + }, + { + "epoch": 1.93, + "learning_rate": 1.0411328475444856e-05, + "loss": 0.0225, + "step": 299120 + }, + { + "epoch": 1.93, + "learning_rate": 1.0401647121087924e-05, + "loss": 0.0226, + "step": 299130 + }, + { + "epoch": 1.93, + "learning_rate": 1.0391965766730994e-05, + "loss": 0.0221, + "step": 299140 + }, + { + "epoch": 1.93, + "learning_rate": 1.0382284412374062e-05, + "loss": 0.0198, + "step": 299150 + }, + { + "epoch": 1.93, + "learning_rate": 1.0372603058017128e-05, + "loss": 0.029, + "step": 299160 + }, + { + "epoch": 1.93, + "learning_rate": 1.0362921703660196e-05, + "loss": 0.0228, + "step": 299170 + }, + { + "epoch": 1.93, + "learning_rate": 1.0353240349303266e-05, + "loss": 0.0252, + "step": 299180 + }, + { + "epoch": 1.93, + "learning_rate": 1.0343558994946332e-05, + "loss": 0.0205, + "step": 299190 + }, + { + "epoch": 1.93, + "learning_rate": 1.03338776405894e-05, + "loss": 0.0195, + "step": 299200 + }, + { + "epoch": 1.93, + "learning_rate": 1.0324196286232468e-05, + "loss": 0.0276, + "step": 299210 + }, + { + "epoch": 1.93, + "learning_rate": 1.0314514931875536e-05, + "loss": 0.0237, + "step": 299220 + }, + { + "epoch": 1.93, + "learning_rate": 1.0304833577518604e-05, + "loss": 0.0195, + "step": 299230 + }, + { + "epoch": 1.93, + "learning_rate": 1.0295152223161672e-05, + "loss": 0.0185, + "step": 299240 + }, + { + "epoch": 1.93, + "learning_rate": 1.028547086880474e-05, + "loss": 0.0194, + "step": 299250 + }, + { + "epoch": 1.93, + "learning_rate": 1.0275789514447806e-05, + "loss": 0.0213, + "step": 299260 + }, + { + "epoch": 1.93, + "learning_rate": 1.0266108160090874e-05, + "loss": 0.0206, + "step": 299270 + }, + { + "epoch": 1.93, + "learning_rate": 1.0256426805733943e-05, + "loss": 0.0218, + "step": 299280 + }, + { + "epoch": 1.93, + "learning_rate": 1.0246745451377011e-05, + "loss": 0.0202, + "step": 299290 + }, + { + "epoch": 1.93, + "learning_rate": 1.0237064097020078e-05, + "loss": 0.0252, + "step": 299300 + }, + { + "epoch": 1.93, + "learning_rate": 1.0227382742663145e-05, + "loss": 0.0254, + "step": 299310 + }, + { + "epoch": 1.93, + "learning_rate": 1.0217701388306215e-05, + "loss": 0.019, + "step": 299320 + }, + { + "epoch": 1.93, + "learning_rate": 1.0208020033949281e-05, + "loss": 0.0212, + "step": 299330 + }, + { + "epoch": 1.93, + "learning_rate": 1.019833867959235e-05, + "loss": 0.0197, + "step": 299340 + }, + { + "epoch": 1.93, + "learning_rate": 1.0188657325235417e-05, + "loss": 0.0245, + "step": 299350 + }, + { + "epoch": 1.93, + "learning_rate": 1.0178975970878483e-05, + "loss": 0.0308, + "step": 299360 + }, + { + "epoch": 1.93, + "learning_rate": 1.0169294616521553e-05, + "loss": 0.0203, + "step": 299370 + }, + { + "epoch": 1.93, + "learning_rate": 1.0159613262164621e-05, + "loss": 0.0215, + "step": 299380 + }, + { + "epoch": 1.93, + "learning_rate": 1.0149931907807689e-05, + "loss": 0.0187, + "step": 299390 + }, + { + "epoch": 1.93, + "learning_rate": 1.0140250553450755e-05, + "loss": 0.0223, + "step": 299400 + }, + { + "epoch": 1.93, + "learning_rate": 1.0130569199093825e-05, + "loss": 0.0214, + "step": 299410 + }, + { + "epoch": 1.93, + "learning_rate": 1.0120887844736893e-05, + "loss": 0.0221, + "step": 299420 + }, + { + "epoch": 1.93, + "learning_rate": 1.0111206490379959e-05, + "loss": 0.0227, + "step": 299430 + }, + { + "epoch": 1.93, + "learning_rate": 1.0101525136023027e-05, + "loss": 0.0228, + "step": 299440 + }, + { + "epoch": 1.93, + "learning_rate": 1.0091843781666097e-05, + "loss": 0.0213, + "step": 299450 + }, + { + "epoch": 1.93, + "learning_rate": 1.0082162427309164e-05, + "loss": 0.0255, + "step": 299460 + }, + { + "epoch": 1.93, + "learning_rate": 1.007248107295223e-05, + "loss": 0.0215, + "step": 299470 + }, + { + "epoch": 1.93, + "learning_rate": 1.0062799718595299e-05, + "loss": 0.0209, + "step": 299480 + }, + { + "epoch": 1.93, + "learning_rate": 1.0053118364238368e-05, + "loss": 0.0244, + "step": 299490 + }, + { + "epoch": 1.93, + "learning_rate": 1.0043437009881434e-05, + "loss": 0.0229, + "step": 299500 + }, + { + "epoch": 1.93, + "learning_rate": 1.0033755655524502e-05, + "loss": 0.0275, + "step": 299510 + }, + { + "epoch": 1.93, + "learning_rate": 1.002407430116757e-05, + "loss": 0.02, + "step": 299520 + }, + { + "epoch": 1.93, + "learning_rate": 1.001439294681064e-05, + "loss": 0.025, + "step": 299530 + }, + { + "epoch": 1.93, + "learning_rate": 1.0004711592453706e-05, + "loss": 0.0264, + "step": 299540 + }, + { + "epoch": 1.93, + "learning_rate": 9.995030238096774e-06, + "loss": 0.0209, + "step": 299550 + }, + { + "epoch": 1.93, + "learning_rate": 9.985348883739842e-06, + "loss": 0.0187, + "step": 299560 + }, + { + "epoch": 1.93, + "learning_rate": 9.975667529382908e-06, + "loss": 0.019, + "step": 299570 + }, + { + "epoch": 1.93, + "learning_rate": 9.965986175025978e-06, + "loss": 0.0196, + "step": 299580 + }, + { + "epoch": 1.93, + "learning_rate": 9.956304820669046e-06, + "loss": 0.0232, + "step": 299590 + }, + { + "epoch": 1.93, + "learning_rate": 9.946623466312114e-06, + "loss": 0.0209, + "step": 299600 + }, + { + "epoch": 1.93, + "learning_rate": 9.93694211195518e-06, + "loss": 0.0211, + "step": 299610 + }, + { + "epoch": 1.93, + "learning_rate": 9.927260757598248e-06, + "loss": 0.0172, + "step": 299620 + }, + { + "epoch": 1.93, + "learning_rate": 9.917579403241318e-06, + "loss": 0.021, + "step": 299630 + }, + { + "epoch": 1.93, + "learning_rate": 9.907898048884384e-06, + "loss": 0.0214, + "step": 299640 + }, + { + "epoch": 1.93, + "learning_rate": 9.898216694527452e-06, + "loss": 0.0213, + "step": 299650 + }, + { + "epoch": 1.93, + "learning_rate": 9.88853534017052e-06, + "loss": 0.0216, + "step": 299660 + }, + { + "epoch": 1.93, + "learning_rate": 9.87885398581359e-06, + "loss": 0.0284, + "step": 299670 + }, + { + "epoch": 1.93, + "learning_rate": 9.869172631456656e-06, + "loss": 0.0238, + "step": 299680 + }, + { + "epoch": 1.93, + "learning_rate": 9.859491277099724e-06, + "loss": 0.0211, + "step": 299690 + }, + { + "epoch": 1.93, + "learning_rate": 9.849809922742791e-06, + "loss": 0.0198, + "step": 299700 + }, + { + "epoch": 1.93, + "learning_rate": 9.840128568385858e-06, + "loss": 0.0171, + "step": 299710 + }, + { + "epoch": 1.93, + "learning_rate": 9.830447214028927e-06, + "loss": 0.0264, + "step": 299720 + }, + { + "epoch": 1.93, + "learning_rate": 9.820765859671995e-06, + "loss": 0.0279, + "step": 299730 + }, + { + "epoch": 1.93, + "learning_rate": 9.811084505315063e-06, + "loss": 0.0213, + "step": 299740 + }, + { + "epoch": 1.93, + "learning_rate": 9.80140315095813e-06, + "loss": 0.0204, + "step": 299750 + }, + { + "epoch": 1.93, + "learning_rate": 9.791721796601199e-06, + "loss": 0.0217, + "step": 299760 + }, + { + "epoch": 1.93, + "learning_rate": 9.782040442244267e-06, + "loss": 0.022, + "step": 299770 + }, + { + "epoch": 1.93, + "learning_rate": 9.772359087887333e-06, + "loss": 0.0297, + "step": 299780 + }, + { + "epoch": 1.93, + "learning_rate": 9.762677733530401e-06, + "loss": 0.0209, + "step": 299790 + }, + { + "epoch": 1.93, + "learning_rate": 9.75299637917347e-06, + "loss": 0.0226, + "step": 299800 + }, + { + "epoch": 1.94, + "learning_rate": 9.743315024816537e-06, + "loss": 0.021, + "step": 299810 + }, + { + "epoch": 1.94, + "learning_rate": 9.733633670459605e-06, + "loss": 0.0204, + "step": 299820 + }, + { + "epoch": 1.94, + "learning_rate": 9.723952316102673e-06, + "loss": 0.0222, + "step": 299830 + }, + { + "epoch": 1.94, + "learning_rate": 9.714270961745743e-06, + "loss": 0.0261, + "step": 299840 + }, + { + "epoch": 1.94, + "learning_rate": 9.704589607388809e-06, + "loss": 0.0181, + "step": 299850 + }, + { + "epoch": 1.94, + "learning_rate": 9.694908253031877e-06, + "loss": 0.0233, + "step": 299860 + }, + { + "epoch": 1.94, + "learning_rate": 9.685226898674945e-06, + "loss": 0.0263, + "step": 299870 + }, + { + "epoch": 1.94, + "learning_rate": 9.675545544318011e-06, + "loss": 0.0203, + "step": 299880 + }, + { + "epoch": 1.94, + "learning_rate": 9.66586418996108e-06, + "loss": 0.0187, + "step": 299890 + }, + { + "epoch": 1.94, + "learning_rate": 9.656182835604148e-06, + "loss": 0.0226, + "step": 299900 + }, + { + "epoch": 1.94, + "learning_rate": 9.646501481247216e-06, + "loss": 0.0194, + "step": 299910 + }, + { + "epoch": 1.94, + "learning_rate": 9.636820126890283e-06, + "loss": 0.0197, + "step": 299920 + }, + { + "epoch": 1.94, + "learning_rate": 9.62713877253335e-06, + "loss": 0.0212, + "step": 299930 + }, + { + "epoch": 1.94, + "learning_rate": 9.61745741817642e-06, + "loss": 0.0205, + "step": 299940 + }, + { + "epoch": 1.94, + "learning_rate": 9.607776063819486e-06, + "loss": 0.0221, + "step": 299950 + }, + { + "epoch": 1.94, + "learning_rate": 9.598094709462554e-06, + "loss": 0.0207, + "step": 299960 + }, + { + "epoch": 1.94, + "learning_rate": 9.588413355105622e-06, + "loss": 0.0157, + "step": 299970 + }, + { + "epoch": 1.94, + "learning_rate": 9.578732000748692e-06, + "loss": 0.0219, + "step": 299980 + }, + { + "epoch": 1.94, + "learning_rate": 9.569050646391758e-06, + "loss": 0.0325, + "step": 299990 + }, + { + "epoch": 1.94, + "learning_rate": 9.559369292034826e-06, + "loss": 0.0175, + "step": 300000 + }, + { + "epoch": 1.94, + "eval_cer": 0.9198219410236131, + "eval_loss": 0.0166050735861063, + "eval_runtime": 120.2268, + "eval_samples_per_second": 16.635, + "eval_steps_per_second": 4.159, + "step": 300000 + }, + { + "epoch": 1.94, + "learning_rate": 9.549687937677894e-06, + "loss": 0.0235, + "step": 300010 + }, + { + "epoch": 1.94, + "learning_rate": 9.54000658332096e-06, + "loss": 0.0249, + "step": 300020 + }, + { + "epoch": 1.94, + "learning_rate": 9.53032522896403e-06, + "loss": 0.022, + "step": 300030 + }, + { + "epoch": 1.94, + "learning_rate": 9.520643874607098e-06, + "loss": 0.0221, + "step": 300040 + }, + { + "epoch": 1.94, + "learning_rate": 9.510962520250166e-06, + "loss": 0.0196, + "step": 300050 + }, + { + "epoch": 1.94, + "learning_rate": 9.501281165893232e-06, + "loss": 0.0206, + "step": 300060 + }, + { + "epoch": 1.94, + "learning_rate": 9.491599811536302e-06, + "loss": 0.0238, + "step": 300070 + }, + { + "epoch": 1.94, + "learning_rate": 9.48191845717937e-06, + "loss": 0.021, + "step": 300080 + }, + { + "epoch": 1.94, + "learning_rate": 9.472237102822436e-06, + "loss": 0.0202, + "step": 300090 + }, + { + "epoch": 1.94, + "learning_rate": 9.462555748465504e-06, + "loss": 0.0199, + "step": 300100 + }, + { + "epoch": 1.94, + "learning_rate": 9.452874394108573e-06, + "loss": 0.0233, + "step": 300110 + }, + { + "epoch": 1.94, + "learning_rate": 9.443193039751641e-06, + "loss": 0.019, + "step": 300120 + }, + { + "epoch": 1.94, + "learning_rate": 9.433511685394708e-06, + "loss": 0.0239, + "step": 300130 + }, + { + "epoch": 1.94, + "learning_rate": 9.423830331037775e-06, + "loss": 0.0219, + "step": 300140 + }, + { + "epoch": 1.94, + "learning_rate": 9.414148976680845e-06, + "loss": 0.0188, + "step": 300150 + }, + { + "epoch": 1.94, + "learning_rate": 9.404467622323911e-06, + "loss": 0.0245, + "step": 300160 + }, + { + "epoch": 1.94, + "learning_rate": 9.39478626796698e-06, + "loss": 0.0241, + "step": 300170 + }, + { + "epoch": 1.94, + "learning_rate": 9.385104913610047e-06, + "loss": 0.0225, + "step": 300180 + }, + { + "epoch": 1.94, + "learning_rate": 9.375423559253117e-06, + "loss": 0.0221, + "step": 300190 + }, + { + "epoch": 1.94, + "learning_rate": 9.365742204896183e-06, + "loss": 0.0216, + "step": 300200 + }, + { + "epoch": 1.94, + "learning_rate": 9.356060850539251e-06, + "loss": 0.0229, + "step": 300210 + }, + { + "epoch": 1.94, + "learning_rate": 9.346379496182319e-06, + "loss": 0.0218, + "step": 300220 + }, + { + "epoch": 1.94, + "learning_rate": 9.336698141825387e-06, + "loss": 0.0259, + "step": 300230 + }, + { + "epoch": 1.94, + "learning_rate": 9.327016787468455e-06, + "loss": 0.0233, + "step": 300240 + }, + { + "epoch": 1.94, + "learning_rate": 9.317335433111523e-06, + "loss": 0.0209, + "step": 300250 + }, + { + "epoch": 1.94, + "learning_rate": 9.30765407875459e-06, + "loss": 0.0232, + "step": 300260 + }, + { + "epoch": 1.94, + "learning_rate": 9.297972724397657e-06, + "loss": 0.0207, + "step": 300270 + }, + { + "epoch": 1.94, + "learning_rate": 9.288291370040725e-06, + "loss": 0.0225, + "step": 300280 + }, + { + "epoch": 1.94, + "learning_rate": 9.278610015683793e-06, + "loss": 0.0227, + "step": 300290 + }, + { + "epoch": 1.94, + "learning_rate": 9.26892866132686e-06, + "loss": 0.0223, + "step": 300300 + }, + { + "epoch": 1.94, + "learning_rate": 9.259247306969929e-06, + "loss": 0.0194, + "step": 300310 + }, + { + "epoch": 1.94, + "learning_rate": 9.249565952612997e-06, + "loss": 0.0244, + "step": 300320 + }, + { + "epoch": 1.94, + "learning_rate": 9.239884598256064e-06, + "loss": 0.02, + "step": 300330 + }, + { + "epoch": 1.94, + "learning_rate": 9.230203243899132e-06, + "loss": 0.0211, + "step": 300340 + }, + { + "epoch": 1.94, + "learning_rate": 9.2205218895422e-06, + "loss": 0.0286, + "step": 300350 + }, + { + "epoch": 1.94, + "learning_rate": 9.210840535185268e-06, + "loss": 0.0202, + "step": 300360 + }, + { + "epoch": 1.94, + "learning_rate": 9.201159180828336e-06, + "loss": 0.0267, + "step": 300370 + }, + { + "epoch": 1.94, + "learning_rate": 9.191477826471404e-06, + "loss": 0.0251, + "step": 300380 + }, + { + "epoch": 1.94, + "learning_rate": 9.18179647211447e-06, + "loss": 0.0234, + "step": 300390 + }, + { + "epoch": 1.94, + "learning_rate": 9.17211511775754e-06, + "loss": 0.0164, + "step": 300400 + }, + { + "epoch": 1.94, + "learning_rate": 9.162433763400606e-06, + "loss": 0.0235, + "step": 300410 + }, + { + "epoch": 1.94, + "learning_rate": 9.152752409043676e-06, + "loss": 0.022, + "step": 300420 + }, + { + "epoch": 1.94, + "learning_rate": 9.143071054686742e-06, + "loss": 0.0216, + "step": 300430 + }, + { + "epoch": 1.94, + "learning_rate": 9.133389700329812e-06, + "loss": 0.0224, + "step": 300440 + }, + { + "epoch": 1.94, + "learning_rate": 9.123708345972878e-06, + "loss": 0.0252, + "step": 300450 + }, + { + "epoch": 1.94, + "learning_rate": 9.114026991615946e-06, + "loss": 0.0243, + "step": 300460 + }, + { + "epoch": 1.94, + "learning_rate": 9.104345637259014e-06, + "loss": 0.0189, + "step": 300470 + }, + { + "epoch": 1.94, + "learning_rate": 9.094664282902082e-06, + "loss": 0.0218, + "step": 300480 + }, + { + "epoch": 1.94, + "learning_rate": 9.08498292854515e-06, + "loss": 0.0277, + "step": 300490 + }, + { + "epoch": 1.94, + "learning_rate": 9.075301574188218e-06, + "loss": 0.0231, + "step": 300500 + }, + { + "epoch": 1.94, + "learning_rate": 9.065620219831286e-06, + "loss": 0.0197, + "step": 300510 + }, + { + "epoch": 1.94, + "learning_rate": 9.055938865474354e-06, + "loss": 0.019, + "step": 300520 + }, + { + "epoch": 1.94, + "learning_rate": 9.046257511117421e-06, + "loss": 0.018, + "step": 300530 + }, + { + "epoch": 1.94, + "learning_rate": 9.03657615676049e-06, + "loss": 0.0211, + "step": 300540 + }, + { + "epoch": 1.94, + "learning_rate": 9.026894802403557e-06, + "loss": 0.0223, + "step": 300550 + }, + { + "epoch": 1.94, + "learning_rate": 9.017213448046625e-06, + "loss": 0.0226, + "step": 300560 + }, + { + "epoch": 1.94, + "learning_rate": 9.007532093689693e-06, + "loss": 0.0251, + "step": 300570 + }, + { + "epoch": 1.94, + "learning_rate": 8.99785073933276e-06, + "loss": 0.021, + "step": 300580 + }, + { + "epoch": 1.94, + "learning_rate": 8.988169384975829e-06, + "loss": 0.0199, + "step": 300590 + }, + { + "epoch": 1.94, + "learning_rate": 8.978488030618895e-06, + "loss": 0.0205, + "step": 300600 + }, + { + "epoch": 1.94, + "learning_rate": 8.968806676261963e-06, + "loss": 0.0211, + "step": 300610 + }, + { + "epoch": 1.94, + "learning_rate": 8.959125321905031e-06, + "loss": 0.0235, + "step": 300620 + }, + { + "epoch": 1.94, + "learning_rate": 8.949443967548099e-06, + "loss": 0.0243, + "step": 300630 + }, + { + "epoch": 1.94, + "learning_rate": 8.939762613191167e-06, + "loss": 0.0227, + "step": 300640 + }, + { + "epoch": 1.94, + "learning_rate": 8.930081258834235e-06, + "loss": 0.02, + "step": 300650 + }, + { + "epoch": 1.94, + "learning_rate": 8.920399904477303e-06, + "loss": 0.0282, + "step": 300660 + }, + { + "epoch": 1.94, + "learning_rate": 8.91071855012037e-06, + "loss": 0.0227, + "step": 300670 + }, + { + "epoch": 1.94, + "learning_rate": 8.901037195763439e-06, + "loss": 0.0221, + "step": 300680 + }, + { + "epoch": 1.94, + "learning_rate": 8.891355841406507e-06, + "loss": 0.018, + "step": 300690 + }, + { + "epoch": 1.94, + "learning_rate": 8.881674487049575e-06, + "loss": 0.0226, + "step": 300700 + }, + { + "epoch": 1.94, + "learning_rate": 8.871993132692643e-06, + "loss": 0.0224, + "step": 300710 + }, + { + "epoch": 1.94, + "learning_rate": 8.862311778335709e-06, + "loss": 0.0217, + "step": 300720 + }, + { + "epoch": 1.94, + "learning_rate": 8.852630423978778e-06, + "loss": 0.0228, + "step": 300730 + }, + { + "epoch": 1.94, + "learning_rate": 8.842949069621845e-06, + "loss": 0.0198, + "step": 300740 + }, + { + "epoch": 1.94, + "learning_rate": 8.833267715264914e-06, + "loss": 0.0189, + "step": 300750 + }, + { + "epoch": 1.94, + "learning_rate": 8.82358636090798e-06, + "loss": 0.0208, + "step": 300760 + }, + { + "epoch": 1.94, + "learning_rate": 8.813905006551048e-06, + "loss": 0.0215, + "step": 300770 + }, + { + "epoch": 1.94, + "learning_rate": 8.804223652194116e-06, + "loss": 0.0198, + "step": 300780 + }, + { + "epoch": 1.94, + "learning_rate": 8.794542297837184e-06, + "loss": 0.026, + "step": 300790 + }, + { + "epoch": 1.94, + "learning_rate": 8.784860943480252e-06, + "loss": 0.0216, + "step": 300800 + }, + { + "epoch": 1.94, + "learning_rate": 8.77517958912332e-06, + "loss": 0.0183, + "step": 300810 + }, + { + "epoch": 1.94, + "learning_rate": 8.765498234766388e-06, + "loss": 0.0227, + "step": 300820 + }, + { + "epoch": 1.94, + "learning_rate": 8.755816880409456e-06, + "loss": 0.0188, + "step": 300830 + }, + { + "epoch": 1.94, + "learning_rate": 8.746135526052524e-06, + "loss": 0.0172, + "step": 300840 + }, + { + "epoch": 1.94, + "learning_rate": 8.736454171695592e-06, + "loss": 0.0198, + "step": 300850 + }, + { + "epoch": 1.94, + "learning_rate": 8.72677281733866e-06, + "loss": 0.0239, + "step": 300860 + }, + { + "epoch": 1.94, + "learning_rate": 8.717091462981728e-06, + "loss": 0.0201, + "step": 300870 + }, + { + "epoch": 1.94, + "learning_rate": 8.707410108624796e-06, + "loss": 0.0209, + "step": 300880 + }, + { + "epoch": 1.94, + "learning_rate": 8.697728754267864e-06, + "loss": 0.0226, + "step": 300890 + }, + { + "epoch": 1.94, + "learning_rate": 8.688047399910932e-06, + "loss": 0.0259, + "step": 300900 + }, + { + "epoch": 1.94, + "learning_rate": 8.678366045553998e-06, + "loss": 0.0199, + "step": 300910 + }, + { + "epoch": 1.94, + "learning_rate": 8.668684691197067e-06, + "loss": 0.02, + "step": 300920 + }, + { + "epoch": 1.94, + "learning_rate": 8.659003336840134e-06, + "loss": 0.0237, + "step": 300930 + }, + { + "epoch": 1.94, + "learning_rate": 8.649321982483202e-06, + "loss": 0.0182, + "step": 300940 + }, + { + "epoch": 1.94, + "learning_rate": 8.63964062812627e-06, + "loss": 0.0203, + "step": 300950 + }, + { + "epoch": 1.94, + "learning_rate": 8.629959273769338e-06, + "loss": 0.0232, + "step": 300960 + }, + { + "epoch": 1.94, + "learning_rate": 8.620277919412405e-06, + "loss": 0.0219, + "step": 300970 + }, + { + "epoch": 1.94, + "learning_rate": 8.610596565055473e-06, + "loss": 0.0239, + "step": 300980 + }, + { + "epoch": 1.94, + "learning_rate": 8.600915210698541e-06, + "loss": 0.0189, + "step": 300990 + }, + { + "epoch": 1.94, + "learning_rate": 8.59123385634161e-06, + "loss": 0.0228, + "step": 301000 + }, + { + "epoch": 1.94, + "eval_cer": 0.9198273641396453, + "eval_loss": 0.016501974314451218, + "eval_runtime": 120.1039, + "eval_samples_per_second": 16.652, + "eval_steps_per_second": 4.163, + "step": 301000 + }, + { + "epoch": 1.94, + "learning_rate": 8.581552501984677e-06, + "loss": 0.0258, + "step": 301010 + }, + { + "epoch": 1.94, + "learning_rate": 8.571871147627745e-06, + "loss": 0.0265, + "step": 301020 + }, + { + "epoch": 1.94, + "learning_rate": 8.562189793270811e-06, + "loss": 0.0176, + "step": 301030 + }, + { + "epoch": 1.94, + "learning_rate": 8.552508438913881e-06, + "loss": 0.0223, + "step": 301040 + }, + { + "epoch": 1.94, + "learning_rate": 8.542827084556947e-06, + "loss": 0.0191, + "step": 301050 + }, + { + "epoch": 1.94, + "learning_rate": 8.533145730200017e-06, + "loss": 0.0207, + "step": 301060 + }, + { + "epoch": 1.94, + "learning_rate": 8.523464375843083e-06, + "loss": 0.0229, + "step": 301070 + }, + { + "epoch": 1.94, + "learning_rate": 8.513783021486153e-06, + "loss": 0.0203, + "step": 301080 + }, + { + "epoch": 1.94, + "learning_rate": 8.504101667129219e-06, + "loss": 0.0241, + "step": 301090 + }, + { + "epoch": 1.94, + "learning_rate": 8.494420312772287e-06, + "loss": 0.0182, + "step": 301100 + }, + { + "epoch": 1.94, + "learning_rate": 8.484738958415355e-06, + "loss": 0.023, + "step": 301110 + }, + { + "epoch": 1.94, + "learning_rate": 8.475057604058423e-06, + "loss": 0.0234, + "step": 301120 + }, + { + "epoch": 1.94, + "learning_rate": 8.46537624970149e-06, + "loss": 0.0217, + "step": 301130 + }, + { + "epoch": 1.94, + "learning_rate": 8.455694895344559e-06, + "loss": 0.0247, + "step": 301140 + }, + { + "epoch": 1.94, + "learning_rate": 8.446013540987627e-06, + "loss": 0.0193, + "step": 301150 + }, + { + "epoch": 1.94, + "learning_rate": 8.436332186630694e-06, + "loss": 0.0227, + "step": 301160 + }, + { + "epoch": 1.94, + "learning_rate": 8.426650832273762e-06, + "loss": 0.0252, + "step": 301170 + }, + { + "epoch": 1.94, + "learning_rate": 8.41696947791683e-06, + "loss": 0.0224, + "step": 301180 + }, + { + "epoch": 1.94, + "learning_rate": 8.407288123559898e-06, + "loss": 0.0198, + "step": 301190 + }, + { + "epoch": 1.94, + "learning_rate": 8.397606769202966e-06, + "loss": 0.02, + "step": 301200 + }, + { + "epoch": 1.94, + "learning_rate": 8.387925414846034e-06, + "loss": 0.0231, + "step": 301210 + }, + { + "epoch": 1.94, + "learning_rate": 8.3782440604891e-06, + "loss": 0.0193, + "step": 301220 + }, + { + "epoch": 1.94, + "learning_rate": 8.36856270613217e-06, + "loss": 0.0238, + "step": 301230 + }, + { + "epoch": 1.94, + "learning_rate": 8.358881351775236e-06, + "loss": 0.0221, + "step": 301240 + }, + { + "epoch": 1.94, + "learning_rate": 8.349199997418306e-06, + "loss": 0.0231, + "step": 301250 + }, + { + "epoch": 1.94, + "learning_rate": 8.339518643061372e-06, + "loss": 0.0173, + "step": 301260 + }, + { + "epoch": 1.94, + "learning_rate": 8.32983728870444e-06, + "loss": 0.0232, + "step": 301270 + }, + { + "epoch": 1.94, + "learning_rate": 8.320155934347508e-06, + "loss": 0.0226, + "step": 301280 + }, + { + "epoch": 1.94, + "learning_rate": 8.310474579990576e-06, + "loss": 0.0244, + "step": 301290 + }, + { + "epoch": 1.94, + "learning_rate": 8.300793225633644e-06, + "loss": 0.0197, + "step": 301300 + }, + { + "epoch": 1.94, + "learning_rate": 8.291111871276712e-06, + "loss": 0.0222, + "step": 301310 + }, + { + "epoch": 1.94, + "learning_rate": 8.28143051691978e-06, + "loss": 0.0229, + "step": 301320 + }, + { + "epoch": 1.94, + "learning_rate": 8.271749162562848e-06, + "loss": 0.0195, + "step": 301330 + }, + { + "epoch": 1.94, + "learning_rate": 8.262067808205916e-06, + "loss": 0.0209, + "step": 301340 + }, + { + "epoch": 1.94, + "learning_rate": 8.252386453848984e-06, + "loss": 0.0215, + "step": 301350 + }, + { + "epoch": 1.95, + "learning_rate": 8.24270509949205e-06, + "loss": 0.0286, + "step": 301360 + }, + { + "epoch": 1.95, + "learning_rate": 8.23302374513512e-06, + "loss": 0.0278, + "step": 301370 + }, + { + "epoch": 1.95, + "learning_rate": 8.223342390778186e-06, + "loss": 0.026, + "step": 301380 + }, + { + "epoch": 1.95, + "learning_rate": 8.213661036421255e-06, + "loss": 0.0212, + "step": 301390 + }, + { + "epoch": 1.95, + "learning_rate": 8.203979682064321e-06, + "loss": 0.0235, + "step": 301400 + }, + { + "epoch": 1.95, + "learning_rate": 8.19429832770739e-06, + "loss": 0.0252, + "step": 301410 + }, + { + "epoch": 1.95, + "learning_rate": 8.184616973350457e-06, + "loss": 0.022, + "step": 301420 + }, + { + "epoch": 1.95, + "learning_rate": 8.174935618993525e-06, + "loss": 0.02, + "step": 301430 + }, + { + "epoch": 1.95, + "learning_rate": 8.165254264636593e-06, + "loss": 0.0219, + "step": 301440 + }, + { + "epoch": 1.95, + "learning_rate": 8.155572910279661e-06, + "loss": 0.0277, + "step": 301450 + }, + { + "epoch": 1.95, + "learning_rate": 8.145891555922729e-06, + "loss": 0.0205, + "step": 301460 + }, + { + "epoch": 1.95, + "learning_rate": 8.136210201565797e-06, + "loss": 0.0184, + "step": 301470 + }, + { + "epoch": 1.95, + "learning_rate": 8.126528847208865e-06, + "loss": 0.02, + "step": 301480 + }, + { + "epoch": 1.95, + "learning_rate": 8.116847492851933e-06, + "loss": 0.0276, + "step": 301490 + }, + { + "epoch": 1.95, + "learning_rate": 8.107166138495e-06, + "loss": 0.0236, + "step": 301500 + }, + { + "epoch": 1.95, + "learning_rate": 8.097484784138069e-06, + "loss": 0.0206, + "step": 301510 + }, + { + "epoch": 1.95, + "learning_rate": 8.087803429781137e-06, + "loss": 0.024, + "step": 301520 + }, + { + "epoch": 1.95, + "learning_rate": 8.078122075424205e-06, + "loss": 0.0234, + "step": 301530 + }, + { + "epoch": 1.95, + "learning_rate": 8.068440721067273e-06, + "loss": 0.0227, + "step": 301540 + }, + { + "epoch": 1.95, + "learning_rate": 8.058759366710339e-06, + "loss": 0.0225, + "step": 301550 + }, + { + "epoch": 1.95, + "learning_rate": 8.049078012353408e-06, + "loss": 0.023, + "step": 301560 + }, + { + "epoch": 1.95, + "learning_rate": 8.039396657996475e-06, + "loss": 0.0216, + "step": 301570 + }, + { + "epoch": 1.95, + "learning_rate": 8.029715303639544e-06, + "loss": 0.0222, + "step": 301580 + }, + { + "epoch": 1.95, + "learning_rate": 8.02003394928261e-06, + "loss": 0.0238, + "step": 301590 + }, + { + "epoch": 1.95, + "learning_rate": 8.010352594925678e-06, + "loss": 0.0198, + "step": 301600 + }, + { + "epoch": 1.95, + "learning_rate": 8.000671240568746e-06, + "loss": 0.0249, + "step": 301610 + }, + { + "epoch": 1.95, + "learning_rate": 7.990989886211814e-06, + "loss": 0.023, + "step": 301620 + }, + { + "epoch": 1.95, + "learning_rate": 7.981308531854882e-06, + "loss": 0.0211, + "step": 301630 + }, + { + "epoch": 1.95, + "learning_rate": 7.97162717749795e-06, + "loss": 0.0187, + "step": 301640 + }, + { + "epoch": 1.95, + "learning_rate": 7.961945823141018e-06, + "loss": 0.0206, + "step": 301650 + }, + { + "epoch": 1.95, + "learning_rate": 7.952264468784086e-06, + "loss": 0.02, + "step": 301660 + }, + { + "epoch": 1.95, + "learning_rate": 7.942583114427152e-06, + "loss": 0.0293, + "step": 301670 + }, + { + "epoch": 1.95, + "learning_rate": 7.932901760070222e-06, + "loss": 0.0278, + "step": 301680 + }, + { + "epoch": 1.95, + "learning_rate": 7.923220405713288e-06, + "loss": 0.021, + "step": 301690 + }, + { + "epoch": 1.95, + "learning_rate": 7.913539051356358e-06, + "loss": 0.0225, + "step": 301700 + }, + { + "epoch": 1.95, + "learning_rate": 7.903857696999424e-06, + "loss": 0.0301, + "step": 301710 + }, + { + "epoch": 1.95, + "learning_rate": 7.894176342642494e-06, + "loss": 0.0218, + "step": 301720 + }, + { + "epoch": 1.95, + "learning_rate": 7.88449498828556e-06, + "loss": 0.0186, + "step": 301730 + }, + { + "epoch": 1.95, + "learning_rate": 7.874813633928628e-06, + "loss": 0.0204, + "step": 301740 + }, + { + "epoch": 1.95, + "learning_rate": 7.865132279571696e-06, + "loss": 0.0202, + "step": 301750 + }, + { + "epoch": 1.95, + "learning_rate": 7.855450925214764e-06, + "loss": 0.0221, + "step": 301760 + }, + { + "epoch": 1.95, + "learning_rate": 7.845769570857832e-06, + "loss": 0.0236, + "step": 301770 + }, + { + "epoch": 1.95, + "learning_rate": 7.8360882165009e-06, + "loss": 0.0242, + "step": 301780 + }, + { + "epoch": 1.95, + "learning_rate": 7.826406862143967e-06, + "loss": 0.02, + "step": 301790 + }, + { + "epoch": 1.95, + "learning_rate": 7.816725507787035e-06, + "loss": 0.0223, + "step": 301800 + }, + { + "epoch": 1.95, + "learning_rate": 7.807044153430103e-06, + "loss": 0.0202, + "step": 301810 + }, + { + "epoch": 1.95, + "learning_rate": 7.797362799073171e-06, + "loss": 0.0218, + "step": 301820 + }, + { + "epoch": 1.95, + "learning_rate": 7.78768144471624e-06, + "loss": 0.0189, + "step": 301830 + }, + { + "epoch": 1.95, + "learning_rate": 7.778000090359307e-06, + "loss": 0.0213, + "step": 301840 + }, + { + "epoch": 1.95, + "learning_rate": 7.768318736002375e-06, + "loss": 0.0206, + "step": 301850 + }, + { + "epoch": 1.95, + "learning_rate": 7.758637381645441e-06, + "loss": 0.021, + "step": 301860 + }, + { + "epoch": 1.95, + "learning_rate": 7.748956027288511e-06, + "loss": 0.0247, + "step": 301870 + }, + { + "epoch": 1.95, + "learning_rate": 7.739274672931577e-06, + "loss": 0.0215, + "step": 301880 + }, + { + "epoch": 1.95, + "learning_rate": 7.729593318574647e-06, + "loss": 0.0201, + "step": 301890 + }, + { + "epoch": 1.95, + "learning_rate": 7.719911964217713e-06, + "loss": 0.02, + "step": 301900 + }, + { + "epoch": 1.95, + "learning_rate": 7.710230609860783e-06, + "loss": 0.0268, + "step": 301910 + }, + { + "epoch": 1.95, + "learning_rate": 7.700549255503849e-06, + "loss": 0.0201, + "step": 301920 + }, + { + "epoch": 1.95, + "learning_rate": 7.690867901146917e-06, + "loss": 0.0227, + "step": 301930 + }, + { + "epoch": 1.95, + "learning_rate": 7.681186546789985e-06, + "loss": 0.0288, + "step": 301940 + }, + { + "epoch": 1.95, + "learning_rate": 7.671505192433053e-06, + "loss": 0.0219, + "step": 301950 + }, + { + "epoch": 1.95, + "learning_rate": 7.66182383807612e-06, + "loss": 0.0248, + "step": 301960 + }, + { + "epoch": 1.95, + "learning_rate": 7.652142483719189e-06, + "loss": 0.0197, + "step": 301970 + }, + { + "epoch": 1.95, + "learning_rate": 7.642461129362257e-06, + "loss": 0.02, + "step": 301980 + }, + { + "epoch": 1.95, + "learning_rate": 7.632779775005324e-06, + "loss": 0.0198, + "step": 301990 + }, + { + "epoch": 1.95, + "learning_rate": 7.6230984206483915e-06, + "loss": 0.019, + "step": 302000 + }, + { + "epoch": 1.95, + "eval_cer": 0.9198327872556773, + "eval_loss": 0.016491882503032684, + "eval_runtime": 120.5919, + "eval_samples_per_second": 16.585, + "eval_steps_per_second": 4.146, + "step": 302000 + }, + { + "epoch": 1.95, + "learning_rate": 7.61341706629146e-06, + "loss": 0.0247, + "step": 302010 + }, + { + "epoch": 1.95, + "learning_rate": 7.603735711934527e-06, + "loss": 0.0204, + "step": 302020 + }, + { + "epoch": 1.95, + "learning_rate": 7.594054357577595e-06, + "loss": 0.0265, + "step": 302030 + }, + { + "epoch": 1.95, + "learning_rate": 7.584373003220663e-06, + "loss": 0.0241, + "step": 302040 + }, + { + "epoch": 1.95, + "learning_rate": 7.57469164886373e-06, + "loss": 0.0178, + "step": 302050 + }, + { + "epoch": 1.95, + "learning_rate": 7.565010294506799e-06, + "loss": 0.0224, + "step": 302060 + }, + { + "epoch": 1.95, + "learning_rate": 7.555328940149866e-06, + "loss": 0.0218, + "step": 302070 + }, + { + "epoch": 1.95, + "learning_rate": 7.545647585792935e-06, + "loss": 0.0254, + "step": 302080 + }, + { + "epoch": 1.95, + "learning_rate": 7.535966231436002e-06, + "loss": 0.0221, + "step": 302090 + }, + { + "epoch": 1.95, + "learning_rate": 7.526284877079071e-06, + "loss": 0.0216, + "step": 302100 + }, + { + "epoch": 1.95, + "learning_rate": 7.516603522722138e-06, + "loss": 0.0237, + "step": 302110 + }, + { + "epoch": 1.95, + "learning_rate": 7.506922168365205e-06, + "loss": 0.0195, + "step": 302120 + }, + { + "epoch": 1.95, + "learning_rate": 7.497240814008274e-06, + "loss": 0.0225, + "step": 302130 + }, + { + "epoch": 1.95, + "learning_rate": 7.487559459651341e-06, + "loss": 0.024, + "step": 302140 + }, + { + "epoch": 1.95, + "learning_rate": 7.47787810529441e-06, + "loss": 0.0201, + "step": 302150 + }, + { + "epoch": 1.95, + "learning_rate": 7.468196750937477e-06, + "loss": 0.0201, + "step": 302160 + }, + { + "epoch": 1.95, + "learning_rate": 7.4585153965805456e-06, + "loss": 0.0238, + "step": 302170 + }, + { + "epoch": 1.95, + "learning_rate": 7.448834042223613e-06, + "loss": 0.0229, + "step": 302180 + }, + { + "epoch": 1.95, + "learning_rate": 7.439152687866681e-06, + "loss": 0.0205, + "step": 302190 + }, + { + "epoch": 1.95, + "learning_rate": 7.4294713335097485e-06, + "loss": 0.024, + "step": 302200 + }, + { + "epoch": 1.95, + "learning_rate": 7.4197899791528164e-06, + "loss": 0.0164, + "step": 302210 + }, + { + "epoch": 1.95, + "learning_rate": 7.410108624795884e-06, + "loss": 0.0188, + "step": 302220 + }, + { + "epoch": 1.95, + "learning_rate": 7.4004272704389515e-06, + "loss": 0.0207, + "step": 302230 + }, + { + "epoch": 1.95, + "learning_rate": 7.390745916082019e-06, + "loss": 0.0199, + "step": 302240 + }, + { + "epoch": 1.95, + "learning_rate": 7.381064561725087e-06, + "loss": 0.0204, + "step": 302250 + }, + { + "epoch": 1.95, + "learning_rate": 7.371383207368155e-06, + "loss": 0.0192, + "step": 302260 + }, + { + "epoch": 1.95, + "learning_rate": 7.361701853011223e-06, + "loss": 0.0264, + "step": 302270 + }, + { + "epoch": 1.95, + "learning_rate": 7.352020498654291e-06, + "loss": 0.022, + "step": 302280 + }, + { + "epoch": 1.95, + "learning_rate": 7.342339144297359e-06, + "loss": 0.0201, + "step": 302290 + }, + { + "epoch": 1.95, + "learning_rate": 7.332657789940427e-06, + "loss": 0.0184, + "step": 302300 + }, + { + "epoch": 1.95, + "learning_rate": 7.322976435583494e-06, + "loss": 0.0199, + "step": 302310 + }, + { + "epoch": 1.95, + "learning_rate": 7.313295081226563e-06, + "loss": 0.0244, + "step": 302320 + }, + { + "epoch": 1.95, + "learning_rate": 7.30361372686963e-06, + "loss": 0.0236, + "step": 302330 + }, + { + "epoch": 1.95, + "learning_rate": 7.293932372512699e-06, + "loss": 0.0209, + "step": 302340 + }, + { + "epoch": 1.95, + "learning_rate": 7.284251018155766e-06, + "loss": 0.0242, + "step": 302350 + }, + { + "epoch": 1.95, + "learning_rate": 7.274569663798835e-06, + "loss": 0.0245, + "step": 302360 + }, + { + "epoch": 1.95, + "learning_rate": 7.264888309441902e-06, + "loss": 0.0243, + "step": 302370 + }, + { + "epoch": 1.95, + "learning_rate": 7.255206955084969e-06, + "loss": 0.0235, + "step": 302380 + }, + { + "epoch": 1.95, + "learning_rate": 7.2455256007280376e-06, + "loss": 0.0237, + "step": 302390 + }, + { + "epoch": 1.95, + "learning_rate": 7.235844246371105e-06, + "loss": 0.0198, + "step": 302400 + }, + { + "epoch": 1.95, + "learning_rate": 7.226162892014173e-06, + "loss": 0.0282, + "step": 302410 + }, + { + "epoch": 1.95, + "learning_rate": 7.2164815376572405e-06, + "loss": 0.0246, + "step": 302420 + }, + { + "epoch": 1.95, + "learning_rate": 7.206800183300309e-06, + "loss": 0.0172, + "step": 302430 + }, + { + "epoch": 1.95, + "learning_rate": 7.197118828943376e-06, + "loss": 0.0215, + "step": 302440 + }, + { + "epoch": 1.95, + "learning_rate": 7.1874374745864435e-06, + "loss": 0.0207, + "step": 302450 + }, + { + "epoch": 1.95, + "learning_rate": 7.177756120229512e-06, + "loss": 0.0261, + "step": 302460 + }, + { + "epoch": 1.95, + "learning_rate": 7.168074765872579e-06, + "loss": 0.0179, + "step": 302470 + }, + { + "epoch": 1.95, + "learning_rate": 7.158393411515648e-06, + "loss": 0.0204, + "step": 302480 + }, + { + "epoch": 1.95, + "learning_rate": 7.148712057158715e-06, + "loss": 0.0267, + "step": 302490 + }, + { + "epoch": 1.95, + "learning_rate": 7.139030702801783e-06, + "loss": 0.0243, + "step": 302500 + }, + { + "epoch": 1.95, + "learning_rate": 7.129349348444851e-06, + "loss": 0.0241, + "step": 302510 + }, + { + "epoch": 1.95, + "learning_rate": 7.119667994087919e-06, + "loss": 0.022, + "step": 302520 + }, + { + "epoch": 1.95, + "learning_rate": 7.109986639730987e-06, + "loss": 0.0191, + "step": 302530 + }, + { + "epoch": 1.95, + "learning_rate": 7.100305285374055e-06, + "loss": 0.0237, + "step": 302540 + }, + { + "epoch": 1.95, + "learning_rate": 7.090623931017123e-06, + "loss": 0.0198, + "step": 302550 + }, + { + "epoch": 1.95, + "learning_rate": 7.08094257666019e-06, + "loss": 0.0222, + "step": 302560 + }, + { + "epoch": 1.95, + "learning_rate": 7.071261222303258e-06, + "loss": 0.0221, + "step": 302570 + }, + { + "epoch": 1.95, + "learning_rate": 7.061579867946326e-06, + "loss": 0.0268, + "step": 302580 + }, + { + "epoch": 1.95, + "learning_rate": 7.051898513589394e-06, + "loss": 0.0268, + "step": 302590 + }, + { + "epoch": 1.95, + "learning_rate": 7.042217159232462e-06, + "loss": 0.0207, + "step": 302600 + }, + { + "epoch": 1.95, + "learning_rate": 7.0325358048755295e-06, + "loss": 0.0163, + "step": 302610 + }, + { + "epoch": 1.95, + "learning_rate": 7.0228544505185975e-06, + "loss": 0.021, + "step": 302620 + }, + { + "epoch": 1.95, + "learning_rate": 7.013173096161665e-06, + "loss": 0.0189, + "step": 302630 + }, + { + "epoch": 1.95, + "learning_rate": 7.0034917418047325e-06, + "loss": 0.0187, + "step": 302640 + }, + { + "epoch": 1.95, + "learning_rate": 6.993810387447801e-06, + "loss": 0.0184, + "step": 302650 + }, + { + "epoch": 1.95, + "learning_rate": 6.984129033090868e-06, + "loss": 0.0207, + "step": 302660 + }, + { + "epoch": 1.95, + "learning_rate": 6.974447678733937e-06, + "loss": 0.0177, + "step": 302670 + }, + { + "epoch": 1.95, + "learning_rate": 6.964766324377004e-06, + "loss": 0.0195, + "step": 302680 + }, + { + "epoch": 1.95, + "learning_rate": 6.955084970020071e-06, + "loss": 0.0225, + "step": 302690 + }, + { + "epoch": 1.95, + "learning_rate": 6.94540361566314e-06, + "loss": 0.0173, + "step": 302700 + }, + { + "epoch": 1.95, + "learning_rate": 6.935722261306207e-06, + "loss": 0.0202, + "step": 302710 + }, + { + "epoch": 1.95, + "learning_rate": 6.926040906949276e-06, + "loss": 0.0231, + "step": 302720 + }, + { + "epoch": 1.95, + "learning_rate": 6.916359552592343e-06, + "loss": 0.0256, + "step": 302730 + }, + { + "epoch": 1.95, + "learning_rate": 6.906678198235412e-06, + "loss": 0.0205, + "step": 302740 + }, + { + "epoch": 1.95, + "learning_rate": 6.896996843878479e-06, + "loss": 0.0243, + "step": 302750 + }, + { + "epoch": 1.95, + "learning_rate": 6.887315489521546e-06, + "loss": 0.02, + "step": 302760 + }, + { + "epoch": 1.95, + "learning_rate": 6.877634135164615e-06, + "loss": 0.0161, + "step": 302770 + }, + { + "epoch": 1.95, + "learning_rate": 6.867952780807682e-06, + "loss": 0.0255, + "step": 302780 + }, + { + "epoch": 1.95, + "learning_rate": 6.858271426450751e-06, + "loss": 0.0215, + "step": 302790 + }, + { + "epoch": 1.95, + "learning_rate": 6.848590072093818e-06, + "loss": 0.0246, + "step": 302800 + }, + { + "epoch": 1.95, + "learning_rate": 6.8389087177368865e-06, + "loss": 0.0211, + "step": 302810 + }, + { + "epoch": 1.95, + "learning_rate": 6.829227363379954e-06, + "loss": 0.0218, + "step": 302820 + }, + { + "epoch": 1.95, + "learning_rate": 6.8195460090230215e-06, + "loss": 0.0247, + "step": 302830 + }, + { + "epoch": 1.95, + "learning_rate": 6.8098646546660895e-06, + "loss": 0.0232, + "step": 302840 + }, + { + "epoch": 1.95, + "learning_rate": 6.800183300309157e-06, + "loss": 0.0195, + "step": 302850 + }, + { + "epoch": 1.95, + "learning_rate": 6.790501945952225e-06, + "loss": 0.0236, + "step": 302860 + }, + { + "epoch": 1.95, + "learning_rate": 6.780820591595293e-06, + "loss": 0.021, + "step": 302870 + }, + { + "epoch": 1.95, + "learning_rate": 6.771139237238361e-06, + "loss": 0.0208, + "step": 302880 + }, + { + "epoch": 1.95, + "learning_rate": 6.761457882881429e-06, + "loss": 0.0209, + "step": 302890 + }, + { + "epoch": 1.95, + "learning_rate": 6.751776528524496e-06, + "loss": 0.0222, + "step": 302900 + }, + { + "epoch": 1.96, + "learning_rate": 6.742095174167564e-06, + "loss": 0.0233, + "step": 302910 + }, + { + "epoch": 1.96, + "learning_rate": 6.732413819810632e-06, + "loss": 0.023, + "step": 302920 + }, + { + "epoch": 1.96, + "learning_rate": 6.7227324654537e-06, + "loss": 0.0239, + "step": 302930 + }, + { + "epoch": 1.96, + "learning_rate": 6.713051111096768e-06, + "loss": 0.0314, + "step": 302940 + }, + { + "epoch": 1.96, + "learning_rate": 6.703369756739835e-06, + "loss": 0.0205, + "step": 302950 + }, + { + "epoch": 1.96, + "learning_rate": 6.693688402382904e-06, + "loss": 0.023, + "step": 302960 + }, + { + "epoch": 1.96, + "learning_rate": 6.684007048025971e-06, + "loss": 0.0217, + "step": 302970 + }, + { + "epoch": 1.96, + "learning_rate": 6.67432569366904e-06, + "loss": 0.025, + "step": 302980 + }, + { + "epoch": 1.96, + "learning_rate": 6.664644339312107e-06, + "loss": 0.02, + "step": 302990 + }, + { + "epoch": 1.96, + "learning_rate": 6.6549629849551756e-06, + "loss": 0.0191, + "step": 303000 + }, + { + "epoch": 1.96, + "eval_cer": 0.9198228448762852, + "eval_loss": 0.016516968607902527, + "eval_runtime": 120.4114, + "eval_samples_per_second": 16.61, + "eval_steps_per_second": 4.152, + "step": 303000 + }, + { + "epoch": 1.96, + "learning_rate": 6.645281630598243e-06, + "loss": 0.0222, + "step": 303010 + }, + { + "epoch": 1.96, + "learning_rate": 6.63560027624131e-06, + "loss": 0.025, + "step": 303020 + }, + { + "epoch": 1.96, + "learning_rate": 6.6259189218843785e-06, + "loss": 0.034, + "step": 303030 + }, + { + "epoch": 1.96, + "learning_rate": 6.616237567527446e-06, + "loss": 0.0218, + "step": 303040 + }, + { + "epoch": 1.96, + "learning_rate": 6.606556213170514e-06, + "loss": 0.0288, + "step": 303050 + }, + { + "epoch": 1.96, + "learning_rate": 6.5968748588135815e-06, + "loss": 0.0241, + "step": 303060 + }, + { + "epoch": 1.96, + "learning_rate": 6.58719350445665e-06, + "loss": 0.0191, + "step": 303070 + }, + { + "epoch": 1.96, + "learning_rate": 6.577512150099717e-06, + "loss": 0.0217, + "step": 303080 + }, + { + "epoch": 1.96, + "learning_rate": 6.567830795742784e-06, + "loss": 0.0176, + "step": 303090 + }, + { + "epoch": 1.96, + "learning_rate": 6.558149441385853e-06, + "loss": 0.027, + "step": 303100 + }, + { + "epoch": 1.96, + "learning_rate": 6.54846808702892e-06, + "loss": 0.0202, + "step": 303110 + }, + { + "epoch": 1.96, + "learning_rate": 6.538786732671989e-06, + "loss": 0.0166, + "step": 303120 + }, + { + "epoch": 1.96, + "learning_rate": 6.529105378315056e-06, + "loss": 0.0187, + "step": 303130 + }, + { + "epoch": 1.96, + "learning_rate": 6.519424023958124e-06, + "loss": 0.0176, + "step": 303140 + }, + { + "epoch": 1.96, + "learning_rate": 6.509742669601192e-06, + "loss": 0.0235, + "step": 303150 + }, + { + "epoch": 1.96, + "learning_rate": 6.50006131524426e-06, + "loss": 0.0218, + "step": 303160 + }, + { + "epoch": 1.96, + "learning_rate": 6.490379960887328e-06, + "loss": 0.0236, + "step": 303170 + }, + { + "epoch": 1.96, + "learning_rate": 6.480698606530396e-06, + "loss": 0.0216, + "step": 303180 + }, + { + "epoch": 1.96, + "learning_rate": 6.471017252173464e-06, + "loss": 0.0253, + "step": 303190 + }, + { + "epoch": 1.96, + "learning_rate": 6.461335897816532e-06, + "loss": 0.0214, + "step": 303200 + }, + { + "epoch": 1.96, + "learning_rate": 6.451654543459599e-06, + "loss": 0.024, + "step": 303210 + }, + { + "epoch": 1.96, + "learning_rate": 6.4419731891026675e-06, + "loss": 0.0214, + "step": 303220 + }, + { + "epoch": 1.96, + "learning_rate": 6.432291834745735e-06, + "loss": 0.024, + "step": 303230 + }, + { + "epoch": 1.96, + "learning_rate": 6.4226104803888026e-06, + "loss": 0.0227, + "step": 303240 + }, + { + "epoch": 1.96, + "learning_rate": 6.4129291260318705e-06, + "loss": 0.0268, + "step": 303250 + }, + { + "epoch": 1.96, + "learning_rate": 6.4032477716749384e-06, + "loss": 0.0191, + "step": 303260 + }, + { + "epoch": 1.96, + "learning_rate": 6.393566417318006e-06, + "loss": 0.0225, + "step": 303270 + }, + { + "epoch": 1.96, + "learning_rate": 6.3838850629610734e-06, + "loss": 0.0178, + "step": 303280 + }, + { + "epoch": 1.96, + "learning_rate": 6.374203708604142e-06, + "loss": 0.0193, + "step": 303290 + }, + { + "epoch": 1.96, + "learning_rate": 6.364522354247209e-06, + "loss": 0.023, + "step": 303300 + }, + { + "epoch": 1.96, + "learning_rate": 6.354840999890278e-06, + "loss": 0.0214, + "step": 303310 + }, + { + "epoch": 1.96, + "learning_rate": 6.345159645533345e-06, + "loss": 0.0218, + "step": 303320 + }, + { + "epoch": 1.96, + "learning_rate": 6.335478291176412e-06, + "loss": 0.0203, + "step": 303330 + }, + { + "epoch": 1.96, + "learning_rate": 6.325796936819481e-06, + "loss": 0.0205, + "step": 303340 + }, + { + "epoch": 1.96, + "learning_rate": 6.316115582462548e-06, + "loss": 0.0198, + "step": 303350 + }, + { + "epoch": 1.96, + "learning_rate": 6.306434228105617e-06, + "loss": 0.0274, + "step": 303360 + }, + { + "epoch": 1.96, + "learning_rate": 6.296752873748684e-06, + "loss": 0.0236, + "step": 303370 + }, + { + "epoch": 1.96, + "learning_rate": 6.287071519391753e-06, + "loss": 0.0258, + "step": 303380 + }, + { + "epoch": 1.96, + "learning_rate": 6.27739016503482e-06, + "loss": 0.0202, + "step": 303390 + }, + { + "epoch": 1.96, + "learning_rate": 6.267708810677888e-06, + "loss": 0.0242, + "step": 303400 + }, + { + "epoch": 1.96, + "learning_rate": 6.258027456320956e-06, + "loss": 0.0212, + "step": 303410 + }, + { + "epoch": 1.96, + "learning_rate": 6.248346101964024e-06, + "loss": 0.0197, + "step": 303420 + }, + { + "epoch": 1.96, + "learning_rate": 6.238664747607092e-06, + "loss": 0.021, + "step": 303430 + }, + { + "epoch": 1.96, + "learning_rate": 6.228983393250159e-06, + "loss": 0.0248, + "step": 303440 + }, + { + "epoch": 1.96, + "learning_rate": 6.2193020388932275e-06, + "loss": 0.0218, + "step": 303450 + }, + { + "epoch": 1.96, + "learning_rate": 6.2096206845362945e-06, + "loss": 0.0252, + "step": 303460 + }, + { + "epoch": 1.96, + "learning_rate": 6.1999393301793625e-06, + "loss": 0.022, + "step": 303470 + }, + { + "epoch": 1.96, + "learning_rate": 6.19025797582243e-06, + "loss": 0.0276, + "step": 303480 + }, + { + "epoch": 1.96, + "learning_rate": 6.180576621465498e-06, + "loss": 0.0211, + "step": 303490 + }, + { + "epoch": 1.96, + "learning_rate": 6.170895267108566e-06, + "loss": 0.0256, + "step": 303500 + }, + { + "epoch": 1.96, + "learning_rate": 6.161213912751634e-06, + "loss": 0.0204, + "step": 303510 + }, + { + "epoch": 1.96, + "learning_rate": 6.151532558394702e-06, + "loss": 0.021, + "step": 303520 + }, + { + "epoch": 1.96, + "learning_rate": 6.14185120403777e-06, + "loss": 0.0205, + "step": 303530 + }, + { + "epoch": 1.96, + "learning_rate": 6.132169849680837e-06, + "loss": 0.0233, + "step": 303540 + }, + { + "epoch": 1.96, + "learning_rate": 6.122488495323906e-06, + "loss": 0.0206, + "step": 303550 + }, + { + "epoch": 1.96, + "learning_rate": 6.112807140966973e-06, + "loss": 0.0201, + "step": 303560 + }, + { + "epoch": 1.96, + "learning_rate": 6.103125786610041e-06, + "loss": 0.0208, + "step": 303570 + }, + { + "epoch": 1.96, + "learning_rate": 6.093444432253109e-06, + "loss": 0.0183, + "step": 303580 + }, + { + "epoch": 1.96, + "learning_rate": 6.083763077896176e-06, + "loss": 0.0182, + "step": 303590 + }, + { + "epoch": 1.96, + "learning_rate": 6.074081723539245e-06, + "loss": 0.0176, + "step": 303600 + }, + { + "epoch": 1.96, + "learning_rate": 6.064400369182312e-06, + "loss": 0.0217, + "step": 303610 + }, + { + "epoch": 1.96, + "learning_rate": 6.054719014825381e-06, + "loss": 0.0189, + "step": 303620 + }, + { + "epoch": 1.96, + "learning_rate": 6.045037660468448e-06, + "loss": 0.0229, + "step": 303630 + }, + { + "epoch": 1.96, + "learning_rate": 6.0353563061115165e-06, + "loss": 0.0174, + "step": 303640 + }, + { + "epoch": 1.96, + "learning_rate": 6.025674951754584e-06, + "loss": 0.0206, + "step": 303650 + }, + { + "epoch": 1.96, + "learning_rate": 6.015993597397651e-06, + "loss": 0.0273, + "step": 303660 + }, + { + "epoch": 1.96, + "learning_rate": 6.0063122430407195e-06, + "loss": 0.0256, + "step": 303670 + }, + { + "epoch": 1.96, + "learning_rate": 5.9966308886837865e-06, + "loss": 0.0212, + "step": 303680 + }, + { + "epoch": 1.96, + "learning_rate": 5.986949534326855e-06, + "loss": 0.0185, + "step": 303690 + }, + { + "epoch": 1.96, + "learning_rate": 5.977268179969922e-06, + "loss": 0.0193, + "step": 303700 + }, + { + "epoch": 1.96, + "learning_rate": 5.967586825612991e-06, + "loss": 0.0241, + "step": 303710 + }, + { + "epoch": 1.96, + "learning_rate": 5.957905471256058e-06, + "loss": 0.0212, + "step": 303720 + }, + { + "epoch": 1.96, + "learning_rate": 5.948224116899126e-06, + "loss": 0.0203, + "step": 303730 + }, + { + "epoch": 1.96, + "learning_rate": 5.938542762542194e-06, + "loss": 0.0233, + "step": 303740 + }, + { + "epoch": 1.96, + "learning_rate": 5.928861408185262e-06, + "loss": 0.0252, + "step": 303750 + }, + { + "epoch": 1.96, + "learning_rate": 5.91918005382833e-06, + "loss": 0.0242, + "step": 303760 + }, + { + "epoch": 1.96, + "learning_rate": 5.909498699471397e-06, + "loss": 0.0236, + "step": 303770 + }, + { + "epoch": 1.96, + "learning_rate": 5.899817345114465e-06, + "loss": 0.0233, + "step": 303780 + }, + { + "epoch": 1.96, + "learning_rate": 5.890135990757533e-06, + "loss": 0.0187, + "step": 303790 + }, + { + "epoch": 1.96, + "learning_rate": 5.880454636400601e-06, + "loss": 0.0211, + "step": 303800 + }, + { + "epoch": 1.96, + "learning_rate": 5.870773282043669e-06, + "loss": 0.0237, + "step": 303810 + }, + { + "epoch": 1.96, + "learning_rate": 5.861091927686737e-06, + "loss": 0.0189, + "step": 303820 + }, + { + "epoch": 1.96, + "learning_rate": 5.851410573329805e-06, + "loss": 0.026, + "step": 303830 + }, + { + "epoch": 1.96, + "learning_rate": 5.841729218972873e-06, + "loss": 0.0194, + "step": 303840 + }, + { + "epoch": 1.96, + "learning_rate": 5.83204786461594e-06, + "loss": 0.0207, + "step": 303850 + }, + { + "epoch": 1.96, + "learning_rate": 5.8223665102590085e-06, + "loss": 0.0189, + "step": 303860 + }, + { + "epoch": 1.96, + "learning_rate": 5.8126851559020756e-06, + "loss": 0.0202, + "step": 303870 + }, + { + "epoch": 1.96, + "learning_rate": 5.803003801545144e-06, + "loss": 0.0174, + "step": 303880 + }, + { + "epoch": 1.96, + "learning_rate": 5.7933224471882114e-06, + "loss": 0.0226, + "step": 303890 + }, + { + "epoch": 1.96, + "learning_rate": 5.783641092831279e-06, + "loss": 0.0239, + "step": 303900 + }, + { + "epoch": 1.96, + "learning_rate": 5.773959738474347e-06, + "loss": 0.0195, + "step": 303910 + }, + { + "epoch": 1.96, + "learning_rate": 5.764278384117414e-06, + "loss": 0.0191, + "step": 303920 + }, + { + "epoch": 1.96, + "learning_rate": 5.754597029760483e-06, + "loss": 0.0192, + "step": 303930 + }, + { + "epoch": 1.96, + "learning_rate": 5.74491567540355e-06, + "loss": 0.0177, + "step": 303940 + }, + { + "epoch": 1.96, + "learning_rate": 5.735234321046619e-06, + "loss": 0.0204, + "step": 303950 + }, + { + "epoch": 1.96, + "learning_rate": 5.725552966689686e-06, + "loss": 0.0253, + "step": 303960 + }, + { + "epoch": 1.96, + "learning_rate": 5.715871612332753e-06, + "loss": 0.0227, + "step": 303970 + }, + { + "epoch": 1.96, + "learning_rate": 5.706190257975822e-06, + "loss": 0.0195, + "step": 303980 + }, + { + "epoch": 1.96, + "learning_rate": 5.696508903618889e-06, + "loss": 0.0247, + "step": 303990 + }, + { + "epoch": 1.96, + "learning_rate": 5.686827549261958e-06, + "loss": 0.0249, + "step": 304000 + }, + { + "epoch": 1.96, + "eval_cer": 0.9197939215907807, + "eval_loss": 0.016484426334500313, + "eval_runtime": 120.4979, + "eval_samples_per_second": 16.598, + "eval_steps_per_second": 4.149, + "step": 304000 + }, + { + "epoch": 1.96, + "learning_rate": 5.677146194905025e-06, + "loss": 0.0266, + "step": 304010 + }, + { + "epoch": 1.96, + "learning_rate": 5.667464840548094e-06, + "loss": 0.026, + "step": 304020 + }, + { + "epoch": 1.96, + "learning_rate": 5.657783486191161e-06, + "loss": 0.0257, + "step": 304030 + }, + { + "epoch": 1.96, + "learning_rate": 5.648102131834229e-06, + "loss": 0.0213, + "step": 304040 + }, + { + "epoch": 1.96, + "learning_rate": 5.638420777477297e-06, + "loss": 0.0222, + "step": 304050 + }, + { + "epoch": 1.96, + "learning_rate": 5.628739423120365e-06, + "loss": 0.0196, + "step": 304060 + }, + { + "epoch": 1.96, + "learning_rate": 5.6190580687634325e-06, + "loss": 0.0224, + "step": 304070 + }, + { + "epoch": 1.96, + "learning_rate": 5.6093767144065005e-06, + "loss": 0.0203, + "step": 304080 + }, + { + "epoch": 1.96, + "learning_rate": 5.599695360049568e-06, + "loss": 0.0242, + "step": 304090 + }, + { + "epoch": 1.96, + "learning_rate": 5.5900140056926355e-06, + "loss": 0.02, + "step": 304100 + }, + { + "epoch": 1.96, + "learning_rate": 5.5803326513357034e-06, + "loss": 0.0226, + "step": 304110 + }, + { + "epoch": 1.96, + "learning_rate": 5.570651296978771e-06, + "loss": 0.0185, + "step": 304120 + }, + { + "epoch": 1.96, + "learning_rate": 5.560969942621839e-06, + "loss": 0.0209, + "step": 304130 + }, + { + "epoch": 1.96, + "learning_rate": 5.551288588264907e-06, + "loss": 0.0199, + "step": 304140 + }, + { + "epoch": 1.96, + "learning_rate": 5.541607233907975e-06, + "loss": 0.0214, + "step": 304150 + }, + { + "epoch": 1.96, + "learning_rate": 5.531925879551043e-06, + "loss": 0.021, + "step": 304160 + }, + { + "epoch": 1.96, + "learning_rate": 5.522244525194111e-06, + "loss": 0.0191, + "step": 304170 + }, + { + "epoch": 1.96, + "learning_rate": 5.512563170837178e-06, + "loss": 0.0191, + "step": 304180 + }, + { + "epoch": 1.96, + "learning_rate": 5.502881816480247e-06, + "loss": 0.021, + "step": 304190 + }, + { + "epoch": 1.96, + "learning_rate": 5.493200462123314e-06, + "loss": 0.024, + "step": 304200 + }, + { + "epoch": 1.96, + "learning_rate": 5.483519107766383e-06, + "loss": 0.0205, + "step": 304210 + }, + { + "epoch": 1.96, + "learning_rate": 5.47383775340945e-06, + "loss": 0.0234, + "step": 304220 + }, + { + "epoch": 1.96, + "learning_rate": 5.464156399052517e-06, + "loss": 0.0206, + "step": 304230 + }, + { + "epoch": 1.96, + "learning_rate": 5.454475044695586e-06, + "loss": 0.028, + "step": 304240 + }, + { + "epoch": 1.96, + "learning_rate": 5.444793690338653e-06, + "loss": 0.0237, + "step": 304250 + }, + { + "epoch": 1.96, + "learning_rate": 5.435112335981722e-06, + "loss": 0.0238, + "step": 304260 + }, + { + "epoch": 1.96, + "learning_rate": 5.425430981624789e-06, + "loss": 0.0217, + "step": 304270 + }, + { + "epoch": 1.96, + "learning_rate": 5.4157496272678575e-06, + "loss": 0.0231, + "step": 304280 + }, + { + "epoch": 1.96, + "learning_rate": 5.4060682729109245e-06, + "loss": 0.0204, + "step": 304290 + }, + { + "epoch": 1.96, + "learning_rate": 5.396386918553992e-06, + "loss": 0.0223, + "step": 304300 + }, + { + "epoch": 1.96, + "learning_rate": 5.38670556419706e-06, + "loss": 0.0246, + "step": 304310 + }, + { + "epoch": 1.96, + "learning_rate": 5.3770242098401275e-06, + "loss": 0.0219, + "step": 304320 + }, + { + "epoch": 1.96, + "learning_rate": 5.367342855483196e-06, + "loss": 0.021, + "step": 304330 + }, + { + "epoch": 1.96, + "learning_rate": 5.357661501126263e-06, + "loss": 0.0193, + "step": 304340 + }, + { + "epoch": 1.96, + "learning_rate": 5.347980146769332e-06, + "loss": 0.0175, + "step": 304350 + }, + { + "epoch": 1.96, + "learning_rate": 5.338298792412399e-06, + "loss": 0.0216, + "step": 304360 + }, + { + "epoch": 1.96, + "learning_rate": 5.328617438055467e-06, + "loss": 0.021, + "step": 304370 + }, + { + "epoch": 1.96, + "learning_rate": 5.318936083698535e-06, + "loss": 0.0263, + "step": 304380 + }, + { + "epoch": 1.96, + "learning_rate": 5.309254729341603e-06, + "loss": 0.0212, + "step": 304390 + }, + { + "epoch": 1.96, + "learning_rate": 5.299573374984671e-06, + "loss": 0.023, + "step": 304400 + }, + { + "epoch": 1.96, + "learning_rate": 5.289892020627739e-06, + "loss": 0.0205, + "step": 304410 + }, + { + "epoch": 1.96, + "learning_rate": 5.280210666270806e-06, + "loss": 0.0215, + "step": 304420 + }, + { + "epoch": 1.96, + "learning_rate": 5.270529311913874e-06, + "loss": 0.0191, + "step": 304430 + }, + { + "epoch": 1.96, + "learning_rate": 5.260847957556942e-06, + "loss": 0.0206, + "step": 304440 + }, + { + "epoch": 1.96, + "learning_rate": 5.25116660320001e-06, + "loss": 0.0226, + "step": 304450 + }, + { + "epoch": 1.97, + "learning_rate": 5.241485248843078e-06, + "loss": 0.0258, + "step": 304460 + }, + { + "epoch": 1.97, + "learning_rate": 5.231803894486146e-06, + "loss": 0.0248, + "step": 304470 + }, + { + "epoch": 1.97, + "learning_rate": 5.2221225401292136e-06, + "loss": 0.018, + "step": 304480 + }, + { + "epoch": 1.97, + "learning_rate": 5.212441185772281e-06, + "loss": 0.0215, + "step": 304490 + }, + { + "epoch": 1.97, + "learning_rate": 5.2027598314153494e-06, + "loss": 0.0269, + "step": 304500 + }, + { + "epoch": 1.97, + "learning_rate": 5.1930784770584165e-06, + "loss": 0.0205, + "step": 304510 + }, + { + "epoch": 1.97, + "learning_rate": 5.183397122701485e-06, + "loss": 0.0201, + "step": 304520 + }, + { + "epoch": 1.97, + "learning_rate": 5.173715768344552e-06, + "loss": 0.0201, + "step": 304530 + }, + { + "epoch": 1.97, + "learning_rate": 5.164034413987621e-06, + "loss": 0.0184, + "step": 304540 + }, + { + "epoch": 1.97, + "learning_rate": 5.154353059630688e-06, + "loss": 0.0212, + "step": 304550 + }, + { + "epoch": 1.97, + "learning_rate": 5.144671705273755e-06, + "loss": 0.0215, + "step": 304560 + }, + { + "epoch": 1.97, + "learning_rate": 5.134990350916824e-06, + "loss": 0.0197, + "step": 304570 + }, + { + "epoch": 1.97, + "learning_rate": 5.125308996559891e-06, + "loss": 0.0199, + "step": 304580 + }, + { + "epoch": 1.97, + "learning_rate": 5.11562764220296e-06, + "loss": 0.0264, + "step": 304590 + }, + { + "epoch": 1.97, + "learning_rate": 5.105946287846027e-06, + "loss": 0.0186, + "step": 304600 + }, + { + "epoch": 1.97, + "learning_rate": 5.096264933489095e-06, + "loss": 0.0241, + "step": 304610 + }, + { + "epoch": 1.97, + "learning_rate": 5.086583579132163e-06, + "loss": 0.0219, + "step": 304620 + }, + { + "epoch": 1.97, + "learning_rate": 5.07690222477523e-06, + "loss": 0.0217, + "step": 304630 + }, + { + "epoch": 1.97, + "learning_rate": 5.067220870418299e-06, + "loss": 0.0203, + "step": 304640 + }, + { + "epoch": 1.97, + "learning_rate": 5.057539516061366e-06, + "loss": 0.0224, + "step": 304650 + }, + { + "epoch": 1.97, + "learning_rate": 5.047858161704435e-06, + "loss": 0.0243, + "step": 304660 + }, + { + "epoch": 1.97, + "learning_rate": 5.038176807347502e-06, + "loss": 0.0187, + "step": 304670 + }, + { + "epoch": 1.97, + "learning_rate": 5.02849545299057e-06, + "loss": 0.0217, + "step": 304680 + }, + { + "epoch": 1.97, + "learning_rate": 5.018814098633638e-06, + "loss": 0.0177, + "step": 304690 + }, + { + "epoch": 1.97, + "learning_rate": 5.0091327442767056e-06, + "loss": 0.0219, + "step": 304700 + }, + { + "epoch": 1.97, + "learning_rate": 4.9994513899197735e-06, + "loss": 0.0223, + "step": 304710 + }, + { + "epoch": 1.97, + "learning_rate": 4.9897700355628414e-06, + "loss": 0.0198, + "step": 304720 + }, + { + "epoch": 1.97, + "learning_rate": 4.980088681205909e-06, + "loss": 0.0262, + "step": 304730 + }, + { + "epoch": 1.97, + "learning_rate": 4.970407326848977e-06, + "loss": 0.0233, + "step": 304740 + }, + { + "epoch": 1.97, + "learning_rate": 4.960725972492044e-06, + "loss": 0.0198, + "step": 304750 + }, + { + "epoch": 1.97, + "learning_rate": 4.951044618135112e-06, + "loss": 0.0214, + "step": 304760 + }, + { + "epoch": 1.97, + "learning_rate": 4.94136326377818e-06, + "loss": 0.0252, + "step": 304770 + }, + { + "epoch": 1.97, + "learning_rate": 4.931681909421248e-06, + "loss": 0.0221, + "step": 304780 + }, + { + "epoch": 1.97, + "learning_rate": 4.922000555064316e-06, + "loss": 0.0255, + "step": 304790 + }, + { + "epoch": 1.97, + "learning_rate": 4.912319200707384e-06, + "loss": 0.0262, + "step": 304800 + }, + { + "epoch": 1.97, + "learning_rate": 4.902637846350452e-06, + "loss": 0.0242, + "step": 304810 + }, + { + "epoch": 1.97, + "learning_rate": 4.892956491993519e-06, + "loss": 0.0252, + "step": 304820 + }, + { + "epoch": 1.97, + "learning_rate": 4.883275137636588e-06, + "loss": 0.022, + "step": 304830 + }, + { + "epoch": 1.97, + "learning_rate": 4.873593783279655e-06, + "loss": 0.023, + "step": 304840 + }, + { + "epoch": 1.97, + "learning_rate": 4.863912428922724e-06, + "loss": 0.022, + "step": 304850 + }, + { + "epoch": 1.97, + "learning_rate": 4.854231074565791e-06, + "loss": 0.0195, + "step": 304860 + }, + { + "epoch": 1.97, + "learning_rate": 4.844549720208858e-06, + "loss": 0.0236, + "step": 304870 + }, + { + "epoch": 1.97, + "learning_rate": 4.834868365851927e-06, + "loss": 0.0259, + "step": 304880 + }, + { + "epoch": 1.97, + "learning_rate": 4.825187011494994e-06, + "loss": 0.02, + "step": 304890 + }, + { + "epoch": 1.97, + "learning_rate": 4.8155056571380625e-06, + "loss": 0.0194, + "step": 304900 + }, + { + "epoch": 1.97, + "learning_rate": 4.80582430278113e-06, + "loss": 0.0256, + "step": 304910 + }, + { + "epoch": 1.97, + "learning_rate": 4.796142948424198e-06, + "loss": 0.024, + "step": 304920 + }, + { + "epoch": 1.97, + "learning_rate": 4.7864615940672655e-06, + "loss": 0.0261, + "step": 304930 + }, + { + "epoch": 1.97, + "learning_rate": 4.776780239710333e-06, + "loss": 0.0206, + "step": 304940 + }, + { + "epoch": 1.97, + "learning_rate": 4.767098885353401e-06, + "loss": 0.0223, + "step": 304950 + }, + { + "epoch": 1.97, + "learning_rate": 4.7574175309964684e-06, + "loss": 0.0175, + "step": 304960 + }, + { + "epoch": 1.97, + "learning_rate": 4.747736176639537e-06, + "loss": 0.0189, + "step": 304970 + }, + { + "epoch": 1.97, + "learning_rate": 4.738054822282604e-06, + "loss": 0.0245, + "step": 304980 + }, + { + "epoch": 1.97, + "learning_rate": 4.728373467925673e-06, + "loss": 0.0249, + "step": 304990 + }, + { + "epoch": 1.97, + "learning_rate": 4.71869211356874e-06, + "loss": 0.0233, + "step": 305000 + }, + { + "epoch": 1.97, + "eval_cer": 0.9198092870862049, + "eval_loss": 0.016421254724264145, + "eval_runtime": 120.2527, + "eval_samples_per_second": 16.632, + "eval_steps_per_second": 4.158, + "step": 305000 + }, + { + "epoch": 1.97, + "learning_rate": 4.709010759211808e-06, + "loss": 0.0207, + "step": 305010 + }, + { + "epoch": 1.97, + "learning_rate": 4.699329404854876e-06, + "loss": 0.0231, + "step": 305020 + }, + { + "epoch": 1.97, + "learning_rate": 4.689648050497944e-06, + "loss": 0.0218, + "step": 305030 + }, + { + "epoch": 1.97, + "learning_rate": 4.679966696141012e-06, + "loss": 0.0242, + "step": 305040 + }, + { + "epoch": 1.97, + "learning_rate": 4.67028534178408e-06, + "loss": 0.021, + "step": 305050 + }, + { + "epoch": 1.97, + "learning_rate": 4.660603987427148e-06, + "loss": 0.024, + "step": 305060 + }, + { + "epoch": 1.97, + "learning_rate": 4.650922633070216e-06, + "loss": 0.0197, + "step": 305070 + }, + { + "epoch": 1.97, + "learning_rate": 4.641241278713284e-06, + "loss": 0.0237, + "step": 305080 + }, + { + "epoch": 1.97, + "learning_rate": 4.631559924356351e-06, + "loss": 0.022, + "step": 305090 + }, + { + "epoch": 1.97, + "learning_rate": 4.621878569999419e-06, + "loss": 0.0203, + "step": 305100 + }, + { + "epoch": 1.97, + "learning_rate": 4.612197215642487e-06, + "loss": 0.0221, + "step": 305110 + }, + { + "epoch": 1.97, + "learning_rate": 4.6025158612855545e-06, + "loss": 0.0183, + "step": 305120 + }, + { + "epoch": 1.97, + "learning_rate": 4.5928345069286225e-06, + "loss": 0.0192, + "step": 305130 + }, + { + "epoch": 1.97, + "learning_rate": 4.58315315257169e-06, + "loss": 0.0199, + "step": 305140 + }, + { + "epoch": 1.97, + "learning_rate": 4.573471798214758e-06, + "loss": 0.0198, + "step": 305150 + }, + { + "epoch": 1.97, + "learning_rate": 4.563790443857825e-06, + "loss": 0.0196, + "step": 305160 + }, + { + "epoch": 1.97, + "learning_rate": 4.554109089500893e-06, + "loss": 0.0188, + "step": 305170 + }, + { + "epoch": 1.97, + "learning_rate": 4.544427735143961e-06, + "loss": 0.0219, + "step": 305180 + }, + { + "epoch": 1.97, + "learning_rate": 4.534746380787029e-06, + "loss": 0.0215, + "step": 305190 + }, + { + "epoch": 1.97, + "learning_rate": 4.525065026430097e-06, + "loss": 0.0199, + "step": 305200 + }, + { + "epoch": 1.97, + "learning_rate": 4.515383672073165e-06, + "loss": 0.0207, + "step": 305210 + }, + { + "epoch": 1.97, + "learning_rate": 4.505702317716232e-06, + "loss": 0.0194, + "step": 305220 + }, + { + "epoch": 1.97, + "learning_rate": 4.4960209633593e-06, + "loss": 0.0184, + "step": 305230 + }, + { + "epoch": 1.97, + "learning_rate": 4.486339609002368e-06, + "loss": 0.0194, + "step": 305240 + }, + { + "epoch": 1.97, + "learning_rate": 4.476658254645436e-06, + "loss": 0.0232, + "step": 305250 + }, + { + "epoch": 1.97, + "learning_rate": 4.466976900288504e-06, + "loss": 0.0205, + "step": 305260 + }, + { + "epoch": 1.97, + "learning_rate": 4.457295545931572e-06, + "loss": 0.0234, + "step": 305270 + }, + { + "epoch": 1.97, + "learning_rate": 4.44761419157464e-06, + "loss": 0.021, + "step": 305280 + }, + { + "epoch": 1.97, + "learning_rate": 4.437932837217707e-06, + "loss": 0.0198, + "step": 305290 + }, + { + "epoch": 1.97, + "learning_rate": 4.428251482860775e-06, + "loss": 0.0227, + "step": 305300 + }, + { + "epoch": 1.97, + "learning_rate": 4.418570128503843e-06, + "loss": 0.0213, + "step": 305310 + }, + { + "epoch": 1.97, + "learning_rate": 4.408888774146911e-06, + "loss": 0.0226, + "step": 305320 + }, + { + "epoch": 1.97, + "learning_rate": 4.399207419789979e-06, + "loss": 0.0206, + "step": 305330 + }, + { + "epoch": 1.97, + "learning_rate": 4.3895260654330465e-06, + "loss": 0.0185, + "step": 305340 + }, + { + "epoch": 1.97, + "learning_rate": 4.3798447110761144e-06, + "loss": 0.0236, + "step": 305350 + }, + { + "epoch": 1.97, + "learning_rate": 4.370163356719182e-06, + "loss": 0.019, + "step": 305360 + }, + { + "epoch": 1.97, + "learning_rate": 4.36048200236225e-06, + "loss": 0.0223, + "step": 305370 + }, + { + "epoch": 1.97, + "learning_rate": 4.350800648005318e-06, + "loss": 0.0217, + "step": 305380 + }, + { + "epoch": 1.97, + "learning_rate": 4.341119293648386e-06, + "loss": 0.0244, + "step": 305390 + }, + { + "epoch": 1.97, + "learning_rate": 4.331437939291454e-06, + "loss": 0.0212, + "step": 305400 + }, + { + "epoch": 1.97, + "learning_rate": 4.321756584934521e-06, + "loss": 0.0231, + "step": 305410 + }, + { + "epoch": 1.97, + "learning_rate": 4.312075230577589e-06, + "loss": 0.0204, + "step": 305420 + }, + { + "epoch": 1.97, + "learning_rate": 4.302393876220657e-06, + "loss": 0.0221, + "step": 305430 + }, + { + "epoch": 1.97, + "learning_rate": 4.292712521863725e-06, + "loss": 0.0214, + "step": 305440 + }, + { + "epoch": 1.97, + "learning_rate": 4.283031167506793e-06, + "loss": 0.0174, + "step": 305450 + }, + { + "epoch": 1.97, + "learning_rate": 4.273349813149861e-06, + "loss": 0.0223, + "step": 305460 + }, + { + "epoch": 1.97, + "learning_rate": 4.263668458792929e-06, + "loss": 0.0198, + "step": 305470 + }, + { + "epoch": 1.97, + "learning_rate": 4.253987104435996e-06, + "loss": 0.0189, + "step": 305480 + }, + { + "epoch": 1.97, + "learning_rate": 4.244305750079064e-06, + "loss": 0.0188, + "step": 305490 + }, + { + "epoch": 1.97, + "learning_rate": 4.234624395722132e-06, + "loss": 0.0225, + "step": 305500 + }, + { + "epoch": 1.97, + "learning_rate": 4.2249430413652e-06, + "loss": 0.0249, + "step": 305510 + }, + { + "epoch": 1.97, + "learning_rate": 4.215261687008268e-06, + "loss": 0.024, + "step": 305520 + }, + { + "epoch": 1.97, + "learning_rate": 4.2055803326513355e-06, + "loss": 0.0232, + "step": 305530 + }, + { + "epoch": 1.97, + "learning_rate": 4.195898978294403e-06, + "loss": 0.021, + "step": 305540 + }, + { + "epoch": 1.97, + "learning_rate": 4.1862176239374706e-06, + "loss": 0.0287, + "step": 305550 + }, + { + "epoch": 1.97, + "learning_rate": 4.1765362695805385e-06, + "loss": 0.0214, + "step": 305560 + }, + { + "epoch": 1.97, + "learning_rate": 4.1668549152236064e-06, + "loss": 0.0226, + "step": 305570 + }, + { + "epoch": 1.97, + "learning_rate": 4.157173560866674e-06, + "loss": 0.0225, + "step": 305580 + }, + { + "epoch": 1.97, + "learning_rate": 4.147492206509742e-06, + "loss": 0.0216, + "step": 305590 + }, + { + "epoch": 1.97, + "learning_rate": 4.13781085215281e-06, + "loss": 0.0194, + "step": 305600 + }, + { + "epoch": 1.97, + "learning_rate": 4.128129497795878e-06, + "loss": 0.0238, + "step": 305610 + }, + { + "epoch": 1.97, + "learning_rate": 4.118448143438945e-06, + "loss": 0.0225, + "step": 305620 + }, + { + "epoch": 1.97, + "learning_rate": 4.108766789082013e-06, + "loss": 0.0186, + "step": 305630 + }, + { + "epoch": 1.97, + "learning_rate": 4.099085434725081e-06, + "loss": 0.0222, + "step": 305640 + }, + { + "epoch": 1.97, + "learning_rate": 4.089404080368149e-06, + "loss": 0.0197, + "step": 305650 + }, + { + "epoch": 1.97, + "learning_rate": 4.079722726011217e-06, + "loss": 0.033, + "step": 305660 + }, + { + "epoch": 1.97, + "learning_rate": 4.070041371654285e-06, + "loss": 0.0229, + "step": 305670 + }, + { + "epoch": 1.97, + "learning_rate": 4.060360017297353e-06, + "loss": 0.0186, + "step": 305680 + }, + { + "epoch": 1.97, + "learning_rate": 4.050678662940421e-06, + "loss": 0.0266, + "step": 305690 + }, + { + "epoch": 1.97, + "learning_rate": 4.040997308583489e-06, + "loss": 0.0243, + "step": 305700 + }, + { + "epoch": 1.97, + "learning_rate": 4.031315954226557e-06, + "loss": 0.0238, + "step": 305710 + }, + { + "epoch": 1.97, + "learning_rate": 4.021634599869625e-06, + "loss": 0.0239, + "step": 305720 + }, + { + "epoch": 1.97, + "learning_rate": 4.0119532455126925e-06, + "loss": 0.0202, + "step": 305730 + }, + { + "epoch": 1.97, + "learning_rate": 4.00227189115576e-06, + "loss": 0.0238, + "step": 305740 + }, + { + "epoch": 1.97, + "learning_rate": 3.9925905367988275e-06, + "loss": 0.0162, + "step": 305750 + }, + { + "epoch": 1.97, + "learning_rate": 3.9829091824418955e-06, + "loss": 0.0218, + "step": 305760 + }, + { + "epoch": 1.97, + "learning_rate": 3.973227828084963e-06, + "loss": 0.0195, + "step": 305770 + }, + { + "epoch": 1.97, + "learning_rate": 3.963546473728031e-06, + "loss": 0.0203, + "step": 305780 + }, + { + "epoch": 1.97, + "learning_rate": 3.953865119371099e-06, + "loss": 0.0214, + "step": 305790 + }, + { + "epoch": 1.97, + "learning_rate": 3.944183765014166e-06, + "loss": 0.021, + "step": 305800 + }, + { + "epoch": 1.97, + "learning_rate": 3.934502410657234e-06, + "loss": 0.0216, + "step": 305810 + }, + { + "epoch": 1.97, + "learning_rate": 3.924821056300302e-06, + "loss": 0.0274, + "step": 305820 + }, + { + "epoch": 1.97, + "learning_rate": 3.91513970194337e-06, + "loss": 0.0205, + "step": 305830 + }, + { + "epoch": 1.97, + "learning_rate": 3.905458347586438e-06, + "loss": 0.0159, + "step": 305840 + }, + { + "epoch": 1.97, + "learning_rate": 3.895776993229506e-06, + "loss": 0.0267, + "step": 305850 + }, + { + "epoch": 1.97, + "learning_rate": 3.886095638872573e-06, + "loss": 0.0217, + "step": 305860 + }, + { + "epoch": 1.97, + "learning_rate": 3.876414284515641e-06, + "loss": 0.0197, + "step": 305870 + }, + { + "epoch": 1.97, + "learning_rate": 3.866732930158709e-06, + "loss": 0.0238, + "step": 305880 + }, + { + "epoch": 1.97, + "learning_rate": 3.857051575801777e-06, + "loss": 0.0221, + "step": 305890 + }, + { + "epoch": 1.97, + "learning_rate": 3.847370221444845e-06, + "loss": 0.0273, + "step": 305900 + }, + { + "epoch": 1.97, + "learning_rate": 3.837688867087913e-06, + "loss": 0.0239, + "step": 305910 + }, + { + "epoch": 1.97, + "learning_rate": 3.828007512730981e-06, + "loss": 0.0252, + "step": 305920 + }, + { + "epoch": 1.97, + "learning_rate": 3.818326158374049e-06, + "loss": 0.0186, + "step": 305930 + }, + { + "epoch": 1.97, + "learning_rate": 3.808644804017116e-06, + "loss": 0.0226, + "step": 305940 + }, + { + "epoch": 1.97, + "learning_rate": 3.798963449660184e-06, + "loss": 0.0198, + "step": 305950 + }, + { + "epoch": 1.97, + "learning_rate": 3.789282095303252e-06, + "loss": 0.0268, + "step": 305960 + }, + { + "epoch": 1.97, + "learning_rate": 3.77960074094632e-06, + "loss": 0.025, + "step": 305970 + }, + { + "epoch": 1.97, + "learning_rate": 3.769919386589388e-06, + "loss": 0.0217, + "step": 305980 + }, + { + "epoch": 1.97, + "learning_rate": 3.7602380322324554e-06, + "loss": 0.0207, + "step": 305990 + }, + { + "epoch": 1.97, + "learning_rate": 3.7505566778755233e-06, + "loss": 0.0211, + "step": 306000 + }, + { + "epoch": 1.97, + "eval_cer": 0.919808383233533, + "eval_loss": 0.01641755923628807, + "eval_runtime": 120.3007, + "eval_samples_per_second": 16.625, + "eval_steps_per_second": 4.156, + "step": 306000 + }, + { + "epoch": 1.98, + "learning_rate": 3.740875323518591e-06, + "loss": 0.0277, + "step": 306010 + }, + { + "epoch": 1.98, + "learning_rate": 3.7311939691616588e-06, + "loss": 0.0268, + "step": 306020 + }, + { + "epoch": 1.98, + "learning_rate": 3.7215126148047267e-06, + "loss": 0.023, + "step": 306030 + }, + { + "epoch": 1.98, + "learning_rate": 3.7118312604477946e-06, + "loss": 0.0248, + "step": 306040 + }, + { + "epoch": 1.98, + "learning_rate": 3.7021499060908626e-06, + "loss": 0.0182, + "step": 306050 + }, + { + "epoch": 1.98, + "learning_rate": 3.69246855173393e-06, + "loss": 0.0163, + "step": 306060 + }, + { + "epoch": 1.98, + "learning_rate": 3.682787197376998e-06, + "loss": 0.021, + "step": 306070 + }, + { + "epoch": 1.98, + "learning_rate": 3.673105843020066e-06, + "loss": 0.023, + "step": 306080 + }, + { + "epoch": 1.98, + "learning_rate": 3.663424488663134e-06, + "loss": 0.0205, + "step": 306090 + }, + { + "epoch": 1.98, + "learning_rate": 3.653743134306202e-06, + "loss": 0.0184, + "step": 306100 + }, + { + "epoch": 1.98, + "learning_rate": 3.6440617799492697e-06, + "loss": 0.0239, + "step": 306110 + }, + { + "epoch": 1.98, + "learning_rate": 3.634380425592337e-06, + "loss": 0.0217, + "step": 306120 + }, + { + "epoch": 1.98, + "learning_rate": 3.6246990712354048e-06, + "loss": 0.0224, + "step": 306130 + }, + { + "epoch": 1.98, + "learning_rate": 3.6150177168784727e-06, + "loss": 0.0256, + "step": 306140 + }, + { + "epoch": 1.98, + "learning_rate": 3.6053363625215406e-06, + "loss": 0.0191, + "step": 306150 + }, + { + "epoch": 1.98, + "learning_rate": 3.5956550081646086e-06, + "loss": 0.0208, + "step": 306160 + }, + { + "epoch": 1.98, + "learning_rate": 3.5859736538076765e-06, + "loss": 0.0193, + "step": 306170 + }, + { + "epoch": 1.98, + "learning_rate": 3.576292299450744e-06, + "loss": 0.0213, + "step": 306180 + }, + { + "epoch": 1.98, + "learning_rate": 3.566610945093812e-06, + "loss": 0.0213, + "step": 306190 + }, + { + "epoch": 1.98, + "learning_rate": 3.55692959073688e-06, + "loss": 0.0223, + "step": 306200 + }, + { + "epoch": 1.98, + "learning_rate": 3.547248236379948e-06, + "loss": 0.0171, + "step": 306210 + }, + { + "epoch": 1.98, + "learning_rate": 3.5375668820230157e-06, + "loss": 0.0223, + "step": 306220 + }, + { + "epoch": 1.98, + "learning_rate": 3.5278855276660837e-06, + "loss": 0.0204, + "step": 306230 + }, + { + "epoch": 1.98, + "learning_rate": 3.518204173309151e-06, + "loss": 0.0236, + "step": 306240 + }, + { + "epoch": 1.98, + "learning_rate": 3.5085228189522187e-06, + "loss": 0.0223, + "step": 306250 + }, + { + "epoch": 1.98, + "learning_rate": 3.4988414645952866e-06, + "loss": 0.0224, + "step": 306260 + }, + { + "epoch": 1.98, + "learning_rate": 3.4891601102383546e-06, + "loss": 0.024, + "step": 306270 + }, + { + "epoch": 1.98, + "learning_rate": 3.4794787558814225e-06, + "loss": 0.0245, + "step": 306280 + }, + { + "epoch": 1.98, + "learning_rate": 3.4697974015244904e-06, + "loss": 0.0195, + "step": 306290 + }, + { + "epoch": 1.98, + "learning_rate": 3.4601160471675584e-06, + "loss": 0.0284, + "step": 306300 + }, + { + "epoch": 1.98, + "learning_rate": 3.450434692810626e-06, + "loss": 0.0191, + "step": 306310 + }, + { + "epoch": 1.98, + "learning_rate": 3.440753338453694e-06, + "loss": 0.0194, + "step": 306320 + }, + { + "epoch": 1.98, + "learning_rate": 3.4310719840967617e-06, + "loss": 0.0212, + "step": 306330 + }, + { + "epoch": 1.98, + "learning_rate": 3.4213906297398292e-06, + "loss": 0.02, + "step": 306340 + }, + { + "epoch": 1.98, + "learning_rate": 3.411709275382897e-06, + "loss": 0.0256, + "step": 306350 + }, + { + "epoch": 1.98, + "learning_rate": 3.402027921025965e-06, + "loss": 0.0208, + "step": 306360 + }, + { + "epoch": 1.98, + "learning_rate": 3.392346566669033e-06, + "loss": 0.0183, + "step": 306370 + }, + { + "epoch": 1.98, + "learning_rate": 3.3826652123121006e-06, + "loss": 0.025, + "step": 306380 + }, + { + "epoch": 1.98, + "learning_rate": 3.3729838579551685e-06, + "loss": 0.0246, + "step": 306390 + }, + { + "epoch": 1.98, + "learning_rate": 3.3633025035982364e-06, + "loss": 0.0194, + "step": 306400 + }, + { + "epoch": 1.98, + "learning_rate": 3.3536211492413044e-06, + "loss": 0.0214, + "step": 306410 + }, + { + "epoch": 1.98, + "learning_rate": 3.3439397948843723e-06, + "loss": 0.0199, + "step": 306420 + }, + { + "epoch": 1.98, + "learning_rate": 3.3342584405274402e-06, + "loss": 0.0201, + "step": 306430 + }, + { + "epoch": 1.98, + "learning_rate": 3.3245770861705073e-06, + "loss": 0.0208, + "step": 306440 + }, + { + "epoch": 1.98, + "learning_rate": 3.3148957318135752e-06, + "loss": 0.0197, + "step": 306450 + }, + { + "epoch": 1.98, + "learning_rate": 3.305214377456643e-06, + "loss": 0.0263, + "step": 306460 + }, + { + "epoch": 1.98, + "learning_rate": 3.295533023099711e-06, + "loss": 0.029, + "step": 306470 + }, + { + "epoch": 1.98, + "learning_rate": 3.285851668742779e-06, + "loss": 0.0262, + "step": 306480 + }, + { + "epoch": 1.98, + "learning_rate": 3.276170314385847e-06, + "loss": 0.0186, + "step": 306490 + }, + { + "epoch": 1.98, + "learning_rate": 3.2664889600289145e-06, + "loss": 0.0271, + "step": 306500 + }, + { + "epoch": 1.98, + "learning_rate": 3.2568076056719824e-06, + "loss": 0.0225, + "step": 306510 + }, + { + "epoch": 1.98, + "learning_rate": 3.2471262513150504e-06, + "loss": 0.0255, + "step": 306520 + }, + { + "epoch": 1.98, + "learning_rate": 3.2374448969581183e-06, + "loss": 0.0212, + "step": 306530 + }, + { + "epoch": 1.98, + "learning_rate": 3.2277635426011862e-06, + "loss": 0.0204, + "step": 306540 + }, + { + "epoch": 1.98, + "learning_rate": 3.218082188244254e-06, + "loss": 0.0208, + "step": 306550 + }, + { + "epoch": 1.98, + "learning_rate": 3.208400833887322e-06, + "loss": 0.0259, + "step": 306560 + }, + { + "epoch": 1.98, + "learning_rate": 3.198719479530389e-06, + "loss": 0.023, + "step": 306570 + }, + { + "epoch": 1.98, + "learning_rate": 3.189038125173457e-06, + "loss": 0.0219, + "step": 306580 + }, + { + "epoch": 1.98, + "learning_rate": 3.179356770816525e-06, + "loss": 0.0238, + "step": 306590 + }, + { + "epoch": 1.98, + "learning_rate": 3.169675416459593e-06, + "loss": 0.021, + "step": 306600 + }, + { + "epoch": 1.98, + "learning_rate": 3.159994062102661e-06, + "loss": 0.024, + "step": 306610 + }, + { + "epoch": 1.98, + "learning_rate": 3.150312707745729e-06, + "loss": 0.02, + "step": 306620 + }, + { + "epoch": 1.98, + "learning_rate": 3.1406313533887963e-06, + "loss": 0.0239, + "step": 306630 + }, + { + "epoch": 1.98, + "learning_rate": 3.1309499990318643e-06, + "loss": 0.0211, + "step": 306640 + }, + { + "epoch": 1.98, + "learning_rate": 3.1212686446749322e-06, + "loss": 0.0256, + "step": 306650 + }, + { + "epoch": 1.98, + "learning_rate": 3.111587290318e-06, + "loss": 0.0259, + "step": 306660 + }, + { + "epoch": 1.98, + "learning_rate": 3.1019059359610677e-06, + "loss": 0.0184, + "step": 306670 + }, + { + "epoch": 1.98, + "learning_rate": 3.0922245816041356e-06, + "loss": 0.0199, + "step": 306680 + }, + { + "epoch": 1.98, + "learning_rate": 3.0825432272472035e-06, + "loss": 0.0294, + "step": 306690 + }, + { + "epoch": 1.98, + "learning_rate": 3.072861872890271e-06, + "loss": 0.0211, + "step": 306700 + }, + { + "epoch": 1.98, + "learning_rate": 3.063180518533339e-06, + "loss": 0.0236, + "step": 306710 + }, + { + "epoch": 1.98, + "learning_rate": 3.053499164176407e-06, + "loss": 0.0247, + "step": 306720 + }, + { + "epoch": 1.98, + "learning_rate": 3.043817809819475e-06, + "loss": 0.029, + "step": 306730 + }, + { + "epoch": 1.98, + "learning_rate": 3.0341364554625428e-06, + "loss": 0.0216, + "step": 306740 + }, + { + "epoch": 1.98, + "learning_rate": 3.0244551011056107e-06, + "loss": 0.0204, + "step": 306750 + }, + { + "epoch": 1.98, + "learning_rate": 3.014773746748678e-06, + "loss": 0.0322, + "step": 306760 + }, + { + "epoch": 1.98, + "learning_rate": 3.0050923923917457e-06, + "loss": 0.0234, + "step": 306770 + }, + { + "epoch": 1.98, + "learning_rate": 2.9954110380348136e-06, + "loss": 0.0216, + "step": 306780 + }, + { + "epoch": 1.98, + "learning_rate": 2.9857296836778816e-06, + "loss": 0.0215, + "step": 306790 + }, + { + "epoch": 1.98, + "learning_rate": 2.9760483293209495e-06, + "loss": 0.0241, + "step": 306800 + }, + { + "epoch": 1.98, + "learning_rate": 2.9663669749640174e-06, + "loss": 0.0231, + "step": 306810 + }, + { + "epoch": 1.98, + "learning_rate": 2.956685620607085e-06, + "loss": 0.0328, + "step": 306820 + }, + { + "epoch": 1.98, + "learning_rate": 2.947004266250153e-06, + "loss": 0.024, + "step": 306830 + }, + { + "epoch": 1.98, + "learning_rate": 2.937322911893221e-06, + "loss": 0.0216, + "step": 306840 + }, + { + "epoch": 1.98, + "learning_rate": 2.9276415575362888e-06, + "loss": 0.0194, + "step": 306850 + }, + { + "epoch": 1.98, + "learning_rate": 2.9179602031793567e-06, + "loss": 0.0242, + "step": 306860 + }, + { + "epoch": 1.98, + "learning_rate": 2.9082788488224246e-06, + "loss": 0.0194, + "step": 306870 + }, + { + "epoch": 1.98, + "learning_rate": 2.8985974944654926e-06, + "loss": 0.0215, + "step": 306880 + }, + { + "epoch": 1.98, + "learning_rate": 2.8889161401085596e-06, + "loss": 0.027, + "step": 306890 + }, + { + "epoch": 1.98, + "learning_rate": 2.8792347857516276e-06, + "loss": 0.0241, + "step": 306900 + }, + { + "epoch": 1.98, + "learning_rate": 2.8695534313946955e-06, + "loss": 0.0198, + "step": 306910 + }, + { + "epoch": 1.98, + "learning_rate": 2.8598720770377634e-06, + "loss": 0.018, + "step": 306920 + }, + { + "epoch": 1.98, + "learning_rate": 2.8501907226808314e-06, + "loss": 0.0218, + "step": 306930 + }, + { + "epoch": 1.98, + "learning_rate": 2.8405093683238993e-06, + "loss": 0.0239, + "step": 306940 + }, + { + "epoch": 1.98, + "learning_rate": 2.830828013966967e-06, + "loss": 0.0226, + "step": 306950 + }, + { + "epoch": 1.98, + "learning_rate": 2.8211466596100348e-06, + "loss": 0.0225, + "step": 306960 + }, + { + "epoch": 1.98, + "learning_rate": 2.8114653052531027e-06, + "loss": 0.0217, + "step": 306970 + }, + { + "epoch": 1.98, + "learning_rate": 2.8017839508961706e-06, + "loss": 0.0192, + "step": 306980 + }, + { + "epoch": 1.98, + "learning_rate": 2.7921025965392386e-06, + "loss": 0.0219, + "step": 306990 + }, + { + "epoch": 1.98, + "learning_rate": 2.7824212421823065e-06, + "loss": 0.02, + "step": 307000 + }, + { + "epoch": 1.98, + "eval_cer": 0.9198192294655971, + "eval_loss": 0.016391895711421967, + "eval_runtime": 120.1873, + "eval_samples_per_second": 16.641, + "eval_steps_per_second": 4.16, + "step": 307000 + }, + { + "epoch": 1.98, + "learning_rate": 2.772739887825374e-06, + "loss": 0.0237, + "step": 307010 + }, + { + "epoch": 1.98, + "learning_rate": 2.7630585334684415e-06, + "loss": 0.0232, + "step": 307020 + }, + { + "epoch": 1.98, + "learning_rate": 2.7533771791115094e-06, + "loss": 0.0225, + "step": 307030 + }, + { + "epoch": 1.98, + "learning_rate": 2.7436958247545774e-06, + "loss": 0.0165, + "step": 307040 + }, + { + "epoch": 1.98, + "learning_rate": 2.7340144703976453e-06, + "loss": 0.0203, + "step": 307050 + }, + { + "epoch": 1.98, + "learning_rate": 2.7243331160407132e-06, + "loss": 0.0196, + "step": 307060 + }, + { + "epoch": 1.98, + "learning_rate": 2.714651761683781e-06, + "loss": 0.022, + "step": 307070 + }, + { + "epoch": 1.98, + "learning_rate": 2.7049704073268487e-06, + "loss": 0.0179, + "step": 307080 + }, + { + "epoch": 1.98, + "learning_rate": 2.6952890529699166e-06, + "loss": 0.0221, + "step": 307090 + }, + { + "epoch": 1.98, + "learning_rate": 2.6856076986129845e-06, + "loss": 0.022, + "step": 307100 + }, + { + "epoch": 1.98, + "learning_rate": 2.675926344256052e-06, + "loss": 0.0234, + "step": 307110 + }, + { + "epoch": 1.98, + "learning_rate": 2.66624498989912e-06, + "loss": 0.0239, + "step": 307120 + }, + { + "epoch": 1.98, + "learning_rate": 2.656563635542188e-06, + "loss": 0.0224, + "step": 307130 + }, + { + "epoch": 1.98, + "learning_rate": 2.6468822811852554e-06, + "loss": 0.0225, + "step": 307140 + }, + { + "epoch": 1.98, + "learning_rate": 2.6372009268283234e-06, + "loss": 0.0196, + "step": 307150 + }, + { + "epoch": 1.98, + "learning_rate": 2.6275195724713913e-06, + "loss": 0.0194, + "step": 307160 + }, + { + "epoch": 1.98, + "learning_rate": 2.6178382181144592e-06, + "loss": 0.0168, + "step": 307170 + }, + { + "epoch": 1.98, + "learning_rate": 2.608156863757527e-06, + "loss": 0.0236, + "step": 307180 + }, + { + "epoch": 1.98, + "learning_rate": 2.598475509400595e-06, + "loss": 0.0165, + "step": 307190 + }, + { + "epoch": 1.98, + "learning_rate": 2.588794155043663e-06, + "loss": 0.0216, + "step": 307200 + }, + { + "epoch": 1.98, + "learning_rate": 2.57911280068673e-06, + "loss": 0.0235, + "step": 307210 + }, + { + "epoch": 1.98, + "learning_rate": 2.569431446329798e-06, + "loss": 0.0205, + "step": 307220 + }, + { + "epoch": 1.98, + "learning_rate": 2.559750091972866e-06, + "loss": 0.0214, + "step": 307230 + }, + { + "epoch": 1.98, + "learning_rate": 2.550068737615934e-06, + "loss": 0.0201, + "step": 307240 + }, + { + "epoch": 1.98, + "learning_rate": 2.540387383259002e-06, + "loss": 0.022, + "step": 307250 + }, + { + "epoch": 1.98, + "learning_rate": 2.5307060289020698e-06, + "loss": 0.0254, + "step": 307260 + }, + { + "epoch": 1.98, + "learning_rate": 2.5210246745451373e-06, + "loss": 0.0237, + "step": 307270 + }, + { + "epoch": 1.98, + "learning_rate": 2.5113433201882052e-06, + "loss": 0.0289, + "step": 307280 + }, + { + "epoch": 1.98, + "learning_rate": 2.501661965831273e-06, + "loss": 0.0205, + "step": 307290 + }, + { + "epoch": 1.98, + "learning_rate": 2.491980611474341e-06, + "loss": 0.0266, + "step": 307300 + }, + { + "epoch": 1.98, + "learning_rate": 2.482299257117409e-06, + "loss": 0.022, + "step": 307310 + }, + { + "epoch": 1.98, + "learning_rate": 2.472617902760477e-06, + "loss": 0.031, + "step": 307320 + }, + { + "epoch": 1.98, + "learning_rate": 2.462936548403545e-06, + "loss": 0.0198, + "step": 307330 + }, + { + "epoch": 1.98, + "learning_rate": 2.453255194046612e-06, + "loss": 0.0244, + "step": 307340 + }, + { + "epoch": 1.98, + "learning_rate": 2.44357383968968e-06, + "loss": 0.0232, + "step": 307350 + }, + { + "epoch": 1.98, + "learning_rate": 2.433892485332748e-06, + "loss": 0.0248, + "step": 307360 + }, + { + "epoch": 1.98, + "learning_rate": 2.4242111309758158e-06, + "loss": 0.0275, + "step": 307370 + }, + { + "epoch": 1.98, + "learning_rate": 2.4145297766188837e-06, + "loss": 0.0207, + "step": 307380 + }, + { + "epoch": 1.98, + "learning_rate": 2.4048484222619516e-06, + "loss": 0.0201, + "step": 307390 + }, + { + "epoch": 1.98, + "learning_rate": 2.395167067905019e-06, + "loss": 0.0244, + "step": 307400 + }, + { + "epoch": 1.98, + "learning_rate": 2.385485713548087e-06, + "loss": 0.0229, + "step": 307410 + }, + { + "epoch": 1.98, + "learning_rate": 2.375804359191155e-06, + "loss": 0.0194, + "step": 307420 + }, + { + "epoch": 1.98, + "learning_rate": 2.366123004834223e-06, + "loss": 0.0232, + "step": 307430 + }, + { + "epoch": 1.98, + "learning_rate": 2.3564416504772905e-06, + "loss": 0.019, + "step": 307440 + }, + { + "epoch": 1.98, + "learning_rate": 2.3467602961203584e-06, + "loss": 0.0234, + "step": 307450 + }, + { + "epoch": 1.98, + "learning_rate": 2.3370789417634263e-06, + "loss": 0.0244, + "step": 307460 + }, + { + "epoch": 1.98, + "learning_rate": 2.3273975874064943e-06, + "loss": 0.0217, + "step": 307470 + }, + { + "epoch": 1.98, + "learning_rate": 2.3177162330495618e-06, + "loss": 0.0207, + "step": 307480 + }, + { + "epoch": 1.98, + "learning_rate": 2.3080348786926297e-06, + "loss": 0.0169, + "step": 307490 + }, + { + "epoch": 1.98, + "learning_rate": 2.2983535243356976e-06, + "loss": 0.0218, + "step": 307500 + }, + { + "epoch": 1.98, + "learning_rate": 2.288672169978765e-06, + "loss": 0.0197, + "step": 307510 + }, + { + "epoch": 1.98, + "learning_rate": 2.278990815621833e-06, + "loss": 0.0186, + "step": 307520 + }, + { + "epoch": 1.98, + "learning_rate": 2.269309461264901e-06, + "loss": 0.0226, + "step": 307530 + }, + { + "epoch": 1.98, + "learning_rate": 2.2596281069079685e-06, + "loss": 0.027, + "step": 307540 + }, + { + "epoch": 1.98, + "learning_rate": 2.2499467525510365e-06, + "loss": 0.0291, + "step": 307550 + }, + { + "epoch": 1.99, + "learning_rate": 2.2402653981941044e-06, + "loss": 0.0182, + "step": 307560 + }, + { + "epoch": 1.99, + "learning_rate": 2.2305840438371723e-06, + "loss": 0.0224, + "step": 307570 + }, + { + "epoch": 1.99, + "learning_rate": 2.2209026894802403e-06, + "loss": 0.0224, + "step": 307580 + }, + { + "epoch": 1.99, + "learning_rate": 2.211221335123308e-06, + "loss": 0.02, + "step": 307590 + }, + { + "epoch": 1.99, + "learning_rate": 2.201539980766376e-06, + "loss": 0.0218, + "step": 307600 + }, + { + "epoch": 1.99, + "learning_rate": 2.1918586264094436e-06, + "loss": 0.022, + "step": 307610 + }, + { + "epoch": 1.99, + "learning_rate": 2.1821772720525116e-06, + "loss": 0.0229, + "step": 307620 + }, + { + "epoch": 1.99, + "learning_rate": 2.1724959176955795e-06, + "loss": 0.03, + "step": 307630 + }, + { + "epoch": 1.99, + "learning_rate": 2.162814563338647e-06, + "loss": 0.0274, + "step": 307640 + }, + { + "epoch": 1.99, + "learning_rate": 2.153133208981715e-06, + "loss": 0.0185, + "step": 307650 + }, + { + "epoch": 1.99, + "learning_rate": 2.143451854624783e-06, + "loss": 0.0198, + "step": 307660 + }, + { + "epoch": 1.99, + "learning_rate": 2.1337705002678504e-06, + "loss": 0.0229, + "step": 307670 + }, + { + "epoch": 1.99, + "learning_rate": 2.1240891459109183e-06, + "loss": 0.0179, + "step": 307680 + }, + { + "epoch": 1.99, + "learning_rate": 2.1144077915539863e-06, + "loss": 0.0231, + "step": 307690 + }, + { + "epoch": 1.99, + "learning_rate": 2.1047264371970538e-06, + "loss": 0.0207, + "step": 307700 + }, + { + "epoch": 1.99, + "learning_rate": 2.0950450828401217e-06, + "loss": 0.0213, + "step": 307710 + }, + { + "epoch": 1.99, + "learning_rate": 2.0853637284831896e-06, + "loss": 0.022, + "step": 307720 + }, + { + "epoch": 1.99, + "learning_rate": 2.0756823741262576e-06, + "loss": 0.0191, + "step": 307730 + }, + { + "epoch": 1.99, + "learning_rate": 2.0660010197693255e-06, + "loss": 0.0195, + "step": 307740 + }, + { + "epoch": 1.99, + "learning_rate": 2.0563196654123934e-06, + "loss": 0.0229, + "step": 307750 + }, + { + "epoch": 1.99, + "learning_rate": 2.0466383110554614e-06, + "loss": 0.0205, + "step": 307760 + }, + { + "epoch": 1.99, + "learning_rate": 2.036956956698529e-06, + "loss": 0.0214, + "step": 307770 + }, + { + "epoch": 1.99, + "learning_rate": 2.027275602341597e-06, + "loss": 0.0193, + "step": 307780 + }, + { + "epoch": 1.99, + "learning_rate": 2.0175942479846647e-06, + "loss": 0.0196, + "step": 307790 + }, + { + "epoch": 1.99, + "learning_rate": 2.0079128936277322e-06, + "loss": 0.0221, + "step": 307800 + }, + { + "epoch": 1.99, + "learning_rate": 1.9982315392708e-06, + "loss": 0.0232, + "step": 307810 + }, + { + "epoch": 1.99, + "learning_rate": 1.988550184913868e-06, + "loss": 0.0241, + "step": 307820 + }, + { + "epoch": 1.99, + "learning_rate": 1.9788688305569356e-06, + "loss": 0.0244, + "step": 307830 + }, + { + "epoch": 1.99, + "learning_rate": 1.9691874762000036e-06, + "loss": 0.0232, + "step": 307840 + }, + { + "epoch": 1.99, + "learning_rate": 1.9595061218430715e-06, + "loss": 0.0206, + "step": 307850 + }, + { + "epoch": 1.99, + "learning_rate": 1.9498247674861394e-06, + "loss": 0.0219, + "step": 307860 + }, + { + "epoch": 1.99, + "learning_rate": 1.940143413129207e-06, + "loss": 0.0202, + "step": 307870 + }, + { + "epoch": 1.99, + "learning_rate": 1.930462058772275e-06, + "loss": 0.0223, + "step": 307880 + }, + { + "epoch": 1.99, + "learning_rate": 1.920780704415343e-06, + "loss": 0.0241, + "step": 307890 + }, + { + "epoch": 1.99, + "learning_rate": 1.9110993500584107e-06, + "loss": 0.0186, + "step": 307900 + }, + { + "epoch": 1.99, + "learning_rate": 1.9014179957014785e-06, + "loss": 0.0193, + "step": 307910 + }, + { + "epoch": 1.99, + "learning_rate": 1.8917366413445464e-06, + "loss": 0.0212, + "step": 307920 + }, + { + "epoch": 1.99, + "learning_rate": 1.8820552869876141e-06, + "loss": 0.0203, + "step": 307930 + }, + { + "epoch": 1.99, + "learning_rate": 1.872373932630682e-06, + "loss": 0.0236, + "step": 307940 + }, + { + "epoch": 1.99, + "learning_rate": 1.86269257827375e-06, + "loss": 0.0195, + "step": 307950 + }, + { + "epoch": 1.99, + "learning_rate": 1.8530112239168175e-06, + "loss": 0.0214, + "step": 307960 + }, + { + "epoch": 1.99, + "learning_rate": 1.8433298695598854e-06, + "loss": 0.0229, + "step": 307970 + }, + { + "epoch": 1.99, + "learning_rate": 1.8336485152029534e-06, + "loss": 0.0215, + "step": 307980 + }, + { + "epoch": 1.99, + "learning_rate": 1.823967160846021e-06, + "loss": 0.023, + "step": 307990 + }, + { + "epoch": 1.99, + "learning_rate": 1.814285806489089e-06, + "loss": 0.0191, + "step": 308000 + }, + { + "epoch": 1.99, + "eval_cer": 0.9198192294655971, + "eval_loss": 0.01642085798084736, + "eval_runtime": 120.209, + "eval_samples_per_second": 16.638, + "eval_steps_per_second": 4.159, + "step": 308000 + }, + { + "epoch": 1.99, + "learning_rate": 1.8046044521321567e-06, + "loss": 0.018, + "step": 308010 + }, + { + "epoch": 1.99, + "learning_rate": 1.7949230977752245e-06, + "loss": 0.0222, + "step": 308020 + }, + { + "epoch": 1.99, + "learning_rate": 1.7852417434182924e-06, + "loss": 0.0233, + "step": 308030 + }, + { + "epoch": 1.99, + "learning_rate": 1.7755603890613603e-06, + "loss": 0.0199, + "step": 308040 + }, + { + "epoch": 1.99, + "learning_rate": 1.7658790347044283e-06, + "loss": 0.0227, + "step": 308050 + }, + { + "epoch": 1.99, + "learning_rate": 1.7561976803474958e-06, + "loss": 0.0196, + "step": 308060 + }, + { + "epoch": 1.99, + "learning_rate": 1.7465163259905637e-06, + "loss": 0.0246, + "step": 308070 + }, + { + "epoch": 1.99, + "learning_rate": 1.7368349716336316e-06, + "loss": 0.0237, + "step": 308080 + }, + { + "epoch": 1.99, + "learning_rate": 1.7271536172766993e-06, + "loss": 0.0187, + "step": 308090 + }, + { + "epoch": 1.99, + "learning_rate": 1.7174722629197673e-06, + "loss": 0.0234, + "step": 308100 + }, + { + "epoch": 1.99, + "learning_rate": 1.7077909085628352e-06, + "loss": 0.0291, + "step": 308110 + }, + { + "epoch": 1.99, + "learning_rate": 1.6981095542059027e-06, + "loss": 0.0203, + "step": 308120 + }, + { + "epoch": 1.99, + "learning_rate": 1.6884281998489707e-06, + "loss": 0.0216, + "step": 308130 + }, + { + "epoch": 1.99, + "learning_rate": 1.6787468454920386e-06, + "loss": 0.0252, + "step": 308140 + }, + { + "epoch": 1.99, + "learning_rate": 1.6690654911351063e-06, + "loss": 0.0244, + "step": 308150 + }, + { + "epoch": 1.99, + "learning_rate": 1.6593841367781742e-06, + "loss": 0.0222, + "step": 308160 + }, + { + "epoch": 1.99, + "learning_rate": 1.6497027824212422e-06, + "loss": 0.0238, + "step": 308170 + }, + { + "epoch": 1.99, + "learning_rate": 1.6400214280643097e-06, + "loss": 0.0221, + "step": 308180 + }, + { + "epoch": 1.99, + "learning_rate": 1.6303400737073776e-06, + "loss": 0.0215, + "step": 308190 + }, + { + "epoch": 1.99, + "learning_rate": 1.6206587193504456e-06, + "loss": 0.0267, + "step": 308200 + }, + { + "epoch": 1.99, + "learning_rate": 1.6109773649935135e-06, + "loss": 0.023, + "step": 308210 + }, + { + "epoch": 1.99, + "learning_rate": 1.6012960106365812e-06, + "loss": 0.0217, + "step": 308220 + }, + { + "epoch": 1.99, + "learning_rate": 1.591614656279649e-06, + "loss": 0.0244, + "step": 308230 + }, { "epoch": 1.99, - "learning_rate": 2.235706405347524e-06, - "loss": 0.0229, - "step": 183530 + "learning_rate": 1.5819333019227169e-06, + "loss": 0.0263, + "step": 308240 }, { "epoch": 1.99, - "learning_rate": 2.2194821208384707e-06, - "loss": 0.0241, - "step": 183540 + "learning_rate": 1.5722519475657846e-06, + "loss": 0.0201, + "step": 308250 }, { "epoch": 1.99, - "learning_rate": 2.2032578363294176e-06, - "loss": 0.0213, - "step": 183550 + "learning_rate": 1.5625705932088525e-06, + "loss": 0.0188, + "step": 308260 }, { "epoch": 1.99, - "learning_rate": 2.1870335518203644e-06, - "loss": 0.0228, - "step": 183560 + "learning_rate": 1.5528892388519205e-06, + "loss": 0.0218, + "step": 308270 }, { "epoch": 1.99, - "learning_rate": 2.1708092673113116e-06, - "loss": 0.0202, - "step": 183570 + "learning_rate": 1.543207884494988e-06, + "loss": 0.0226, + "step": 308280 }, { "epoch": 1.99, - "learning_rate": 2.1545849828022584e-06, - "loss": 0.0267, - "step": 183580 + "learning_rate": 1.533526530138056e-06, + "loss": 0.0189, + "step": 308290 }, { "epoch": 1.99, - "learning_rate": 2.138360698293205e-06, - "loss": 0.0221, - "step": 183590 + "learning_rate": 1.5238451757811238e-06, + "loss": 0.0217, + "step": 308300 }, { "epoch": 1.99, - "learning_rate": 2.122136413784152e-06, - "loss": 0.0292, - "step": 183600 + "learning_rate": 1.5141638214241916e-06, + "loss": 0.0302, + "step": 308310 }, { "epoch": 1.99, - "learning_rate": 2.105912129275099e-06, - "loss": 0.0213, - "step": 183610 + "learning_rate": 1.5044824670672595e-06, + "loss": 0.0224, + "step": 308320 }, { "epoch": 1.99, - "learning_rate": 2.0896878447660456e-06, - "loss": 0.0238, - "step": 183620 + "learning_rate": 1.4948011127103274e-06, + "loss": 0.0195, + "step": 308330 }, { "epoch": 1.99, - "learning_rate": 2.0734635602569924e-06, - "loss": 0.0197, - "step": 183630 + "learning_rate": 1.4851197583533953e-06, + "loss": 0.0195, + "step": 308340 }, { "epoch": 1.99, - "learning_rate": 2.0572392757479392e-06, - "loss": 0.023, - "step": 183640 + "learning_rate": 1.4754384039964629e-06, + "loss": 0.0183, + "step": 308350 }, { "epoch": 1.99, - "learning_rate": 2.041014991238886e-06, - "loss": 0.0229, - "step": 183650 + "learning_rate": 1.4657570496395308e-06, + "loss": 0.0216, + "step": 308360 }, { "epoch": 1.99, - "learning_rate": 2.024790706729833e-06, - "loss": 0.023, - "step": 183660 + "learning_rate": 1.4560756952825987e-06, + "loss": 0.0282, + "step": 308370 }, { "epoch": 1.99, - "learning_rate": 2.0085664222207797e-06, - "loss": 0.0252, - "step": 183670 + "learning_rate": 1.4463943409256664e-06, + "loss": 0.0182, + "step": 308380 }, { "epoch": 1.99, - "learning_rate": 1.992342137711727e-06, - "loss": 0.0216, - "step": 183680 + "learning_rate": 1.4367129865687344e-06, + "loss": 0.0198, + "step": 308390 }, { "epoch": 1.99, - "learning_rate": 1.9761178532026737e-06, - "loss": 0.0236, - "step": 183690 + "learning_rate": 1.427031632211802e-06, + "loss": 0.0212, + "step": 308400 }, { "epoch": 1.99, - "learning_rate": 1.9598935686936205e-06, - "loss": 0.0211, - "step": 183700 + "learning_rate": 1.4173502778548698e-06, + "loss": 0.0228, + "step": 308410 }, { "epoch": 1.99, - "learning_rate": 1.9436692841845673e-06, - "loss": 0.0219, - "step": 183710 + "learning_rate": 1.4076689234979378e-06, + "loss": 0.0213, + "step": 308420 }, { "epoch": 1.99, - "learning_rate": 1.927444999675514e-06, - "loss": 0.0224, - "step": 183720 + "learning_rate": 1.3979875691410057e-06, + "loss": 0.0239, + "step": 308430 }, { "epoch": 1.99, - "learning_rate": 1.911220715166461e-06, - "loss": 0.0316, - "step": 183730 + "learning_rate": 1.3883062147840734e-06, + "loss": 0.0251, + "step": 308440 }, { "epoch": 1.99, - "learning_rate": 1.8949964306574077e-06, - "loss": 0.0201, - "step": 183740 + "learning_rate": 1.3786248604271411e-06, + "loss": 0.0245, + "step": 308450 }, { "epoch": 1.99, - "learning_rate": 1.8787721461483547e-06, - "loss": 0.0253, - "step": 183750 + "learning_rate": 1.368943506070209e-06, + "loss": 0.024, + "step": 308460 }, { "epoch": 1.99, - "learning_rate": 1.8625478616393015e-06, - "loss": 0.0211, - "step": 183760 + "learning_rate": 1.3592621517132768e-06, + "loss": 0.0225, + "step": 308470 }, { "epoch": 1.99, - "learning_rate": 1.8463235771302483e-06, - "loss": 0.0226, - "step": 183770 + "learning_rate": 1.3495807973563447e-06, + "loss": 0.0216, + "step": 308480 }, { "epoch": 1.99, - "learning_rate": 1.8300992926211952e-06, - "loss": 0.0242, - "step": 183780 + "learning_rate": 1.3398994429994127e-06, + "loss": 0.0208, + "step": 308490 }, { "epoch": 1.99, - "learning_rate": 1.8138750081121422e-06, - "loss": 0.0219, - "step": 183790 + "learning_rate": 1.3302180886424806e-06, + "loss": 0.0197, + "step": 308500 }, { "epoch": 1.99, - "learning_rate": 1.797650723603089e-06, - "loss": 0.022, - "step": 183800 + "learning_rate": 1.320536734285548e-06, + "loss": 0.0211, + "step": 308510 }, { "epoch": 1.99, - "learning_rate": 1.7814264390940358e-06, - "loss": 0.0223, - "step": 183810 + "learning_rate": 1.310855379928616e-06, + "loss": 0.0237, + "step": 308520 }, { "epoch": 1.99, - "learning_rate": 1.7652021545849828e-06, - "loss": 0.0208, - "step": 183820 + "learning_rate": 1.301174025571684e-06, + "loss": 0.0256, + "step": 308530 }, { "epoch": 1.99, - "learning_rate": 1.7489778700759296e-06, - "loss": 0.028, - "step": 183830 + "learning_rate": 1.2914926712147517e-06, + "loss": 0.0215, + "step": 308540 }, { "epoch": 1.99, - "learning_rate": 1.7327535855668764e-06, - "loss": 0.0231, - "step": 183840 + "learning_rate": 1.2818113168578196e-06, + "loss": 0.0227, + "step": 308550 }, { "epoch": 1.99, - "learning_rate": 1.716529301057823e-06, - "loss": 0.0252, - "step": 183850 + "learning_rate": 1.2721299625008873e-06, + "loss": 0.0238, + "step": 308560 }, { "epoch": 1.99, - "learning_rate": 1.7003050165487702e-06, - "loss": 0.0249, - "step": 183860 + "learning_rate": 1.262448608143955e-06, + "loss": 0.0237, + "step": 308570 }, { "epoch": 1.99, - "learning_rate": 1.6840807320397168e-06, - "loss": 0.0268, - "step": 183870 + "learning_rate": 1.252767253787023e-06, + "loss": 0.024, + "step": 308580 }, { "epoch": 1.99, - "learning_rate": 1.6678564475306636e-06, - "loss": 0.0215, - "step": 183880 + "learning_rate": 1.243085899430091e-06, + "loss": 0.0259, + "step": 308590 }, { "epoch": 1.99, - "learning_rate": 1.6516321630216104e-06, - "loss": 0.0198, - "step": 183890 + "learning_rate": 1.2334045450731586e-06, + "loss": 0.0283, + "step": 308600 }, { "epoch": 1.99, - "learning_rate": 1.6354078785125575e-06, - "loss": 0.0223, - "step": 183900 + "learning_rate": 1.2237231907162264e-06, + "loss": 0.0272, + "step": 308610 }, { "epoch": 1.99, - "learning_rate": 1.6191835940035043e-06, - "loss": 0.0239, - "step": 183910 + "learning_rate": 1.2140418363592943e-06, + "loss": 0.0203, + "step": 308620 }, { "epoch": 1.99, - "learning_rate": 1.602959309494451e-06, - "loss": 0.0285, - "step": 183920 + "learning_rate": 1.204360482002362e-06, + "loss": 0.0279, + "step": 308630 }, { "epoch": 1.99, - "learning_rate": 1.586735024985398e-06, - "loss": 0.0269, - "step": 183930 + "learning_rate": 1.19467912764543e-06, + "loss": 0.0195, + "step": 308640 }, { "epoch": 1.99, - "learning_rate": 1.570510740476345e-06, - "loss": 0.0271, - "step": 183940 + "learning_rate": 1.1849977732884979e-06, + "loss": 0.0172, + "step": 308650 }, { "epoch": 1.99, - "learning_rate": 1.5542864559672917e-06, - "loss": 0.0246, - "step": 183950 + "learning_rate": 1.1753164189315658e-06, + "loss": 0.0217, + "step": 308660 }, { "epoch": 1.99, - "learning_rate": 1.5380621714582385e-06, - "loss": 0.0199, - "step": 183960 + "learning_rate": 1.1656350645746333e-06, + "loss": 0.021, + "step": 308670 }, { "epoch": 1.99, - "learning_rate": 1.5218378869491855e-06, - "loss": 0.027, - "step": 183970 + "learning_rate": 1.1559537102177013e-06, + "loss": 0.0214, + "step": 308680 }, { "epoch": 1.99, - "learning_rate": 1.5056136024401323e-06, - "loss": 0.0219, - "step": 183980 + "learning_rate": 1.1462723558607692e-06, + "loss": 0.0228, + "step": 308690 }, { "epoch": 1.99, - "learning_rate": 1.4893893179310791e-06, - "loss": 0.0288, - "step": 183990 + "learning_rate": 1.136591001503837e-06, + "loss": 0.0208, + "step": 308700 }, { "epoch": 1.99, - "learning_rate": 1.473165033422026e-06, - "loss": 0.0259, - "step": 184000 + "learning_rate": 1.1269096471469049e-06, + "loss": 0.0196, + "step": 308710 }, { "epoch": 1.99, - "eval_cer": 0.9210889474344499, - "eval_loss": 0.020046746358275414, - "eval_runtime": 118.9151, - "eval_samples_per_second": 16.819, - "eval_steps_per_second": 4.205, - "step": 184000 + "learning_rate": 1.1172282927899726e-06, + "loss": 0.0195, + "step": 308720 }, { "epoch": 1.99, - "learning_rate": 1.456940748912973e-06, - "loss": 0.0244, - "step": 184010 + "learning_rate": 1.1075469384330405e-06, + "loss": 0.0187, + "step": 308730 }, { "epoch": 1.99, - "learning_rate": 1.4407164644039198e-06, - "loss": 0.0287, - "step": 184020 + "learning_rate": 1.0978655840761082e-06, + "loss": 0.0224, + "step": 308740 }, { "epoch": 1.99, - "learning_rate": 1.4244921798948664e-06, - "loss": 0.026, - "step": 184030 + "learning_rate": 1.088184229719176e-06, + "loss": 0.0282, + "step": 308750 }, { "epoch": 1.99, - "learning_rate": 1.4082678953858134e-06, - "loss": 0.0211, - "step": 184040 + "learning_rate": 1.0785028753622439e-06, + "loss": 0.0201, + "step": 308760 }, { "epoch": 1.99, - "learning_rate": 1.3920436108767602e-06, - "loss": 0.0267, - "step": 184050 + "learning_rate": 1.0688215210053118e-06, + "loss": 0.0205, + "step": 308770 }, { "epoch": 1.99, - "learning_rate": 1.375819326367707e-06, - "loss": 0.0271, - "step": 184060 + "learning_rate": 1.0591401666483795e-06, + "loss": 0.023, + "step": 308780 }, { "epoch": 1.99, - "learning_rate": 1.3595950418586538e-06, - "loss": 0.019, - "step": 184070 + "learning_rate": 1.0494588122914475e-06, + "loss": 0.0209, + "step": 308790 }, { "epoch": 1.99, - "learning_rate": 1.3433707573496008e-06, - "loss": 0.0218, - "step": 184080 + "learning_rate": 1.0397774579345152e-06, + "loss": 0.0205, + "step": 308800 }, { "epoch": 1.99, - "learning_rate": 1.3271464728405476e-06, - "loss": 0.0213, - "step": 184090 + "learning_rate": 1.0300961035775831e-06, + "loss": 0.0243, + "step": 308810 }, { "epoch": 1.99, - "learning_rate": 1.3109221883314944e-06, - "loss": 0.024, - "step": 184100 + "learning_rate": 1.0204147492206509e-06, + "loss": 0.017, + "step": 308820 }, { "epoch": 1.99, - "learning_rate": 1.2946979038224412e-06, - "loss": 0.0192, - "step": 184110 + "learning_rate": 1.0107333948637186e-06, + "loss": 0.0207, + "step": 308830 }, { "epoch": 1.99, - "learning_rate": 1.2784736193133883e-06, - "loss": 0.0257, - "step": 184120 + "learning_rate": 1.0010520405067865e-06, + "loss": 0.0254, + "step": 308840 }, { "epoch": 1.99, - "learning_rate": 1.262249334804335e-06, - "loss": 0.0191, - "step": 184130 + "learning_rate": 9.913706861498544e-07, + "loss": 0.0208, + "step": 308850 }, { "epoch": 1.99, - "learning_rate": 1.2460250502952819e-06, - "loss": 0.0237, - "step": 184140 + "learning_rate": 9.816893317929222e-07, + "loss": 0.0217, + "step": 308860 }, { "epoch": 1.99, - "learning_rate": 1.2298007657862289e-06, - "loss": 0.0244, - "step": 184150 + "learning_rate": 9.7200797743599e-07, + "loss": 0.0231, + "step": 308870 }, { "epoch": 1.99, - "learning_rate": 1.2135764812771757e-06, - "loss": 0.0249, - "step": 184160 + "learning_rate": 9.623266230790578e-07, + "loss": 0.0256, + "step": 308880 }, { "epoch": 1.99, - "learning_rate": 1.1973521967681225e-06, - "loss": 0.0262, - "step": 184170 + "learning_rate": 9.526452687221257e-07, + "loss": 0.0196, + "step": 308890 }, { "epoch": 1.99, - "learning_rate": 1.181127912259069e-06, - "loss": 0.0283, - "step": 184180 + "learning_rate": 9.429639143651935e-07, + "loss": 0.022, + "step": 308900 }, { "epoch": 1.99, - "learning_rate": 1.1649036277500161e-06, - "loss": 0.0216, - "step": 184190 + "learning_rate": 9.332825600082613e-07, + "loss": 0.0212, + "step": 308910 }, { "epoch": 1.99, - "learning_rate": 1.148679343240963e-06, - "loss": 0.0253, - "step": 184200 + "learning_rate": 9.236012056513292e-07, + "loss": 0.0233, + "step": 308920 }, { "epoch": 1.99, - "learning_rate": 1.1324550587319097e-06, - "loss": 0.0213, - "step": 184210 + "learning_rate": 9.13919851294397e-07, + "loss": 0.0182, + "step": 308930 }, { "epoch": 1.99, - "learning_rate": 1.1162307742228567e-06, - "loss": 0.0313, - "step": 184220 + "learning_rate": 9.042384969374649e-07, + "loss": 0.0243, + "step": 308940 }, { "epoch": 1.99, - "learning_rate": 1.1000064897138035e-06, - "loss": 0.0257, - "step": 184230 + "learning_rate": 8.945571425805327e-07, + "loss": 0.0216, + "step": 308950 }, { "epoch": 1.99, - "learning_rate": 1.0837822052047503e-06, - "loss": 0.0264, - "step": 184240 + "learning_rate": 8.848757882236004e-07, + "loss": 0.0222, + "step": 308960 }, { "epoch": 1.99, - "learning_rate": 1.0675579206956974e-06, - "loss": 0.0231, - "step": 184250 + "learning_rate": 8.751944338666684e-07, + "loss": 0.0233, + "step": 308970 }, { "epoch": 1.99, - "learning_rate": 1.0513336361866442e-06, - "loss": 0.0237, - "step": 184260 + "learning_rate": 8.655130795097361e-07, + "loss": 0.0198, + "step": 308980 }, { "epoch": 1.99, - "learning_rate": 1.035109351677591e-06, - "loss": 0.0252, - "step": 184270 + "learning_rate": 8.558317251528039e-07, + "loss": 0.0205, + "step": 308990 }, { "epoch": 1.99, - "learning_rate": 1.0188850671685378e-06, - "loss": 0.0206, - "step": 184280 + "learning_rate": 8.461503707958718e-07, + "loss": 0.0214, + "step": 309000 }, { "epoch": 1.99, - "learning_rate": 1.0026607826594846e-06, - "loss": 0.0237, - "step": 184290 + "eval_cer": 0.919811094791549, + "eval_loss": 0.016410965472459793, + "eval_runtime": 120.1413, + "eval_samples_per_second": 16.647, + "eval_steps_per_second": 4.162, + "step": 309000 }, { "epoch": 1.99, - "learning_rate": 9.864364981504314e-07, - "loss": 0.0218, - "step": 184300 + "learning_rate": 8.364690164389396e-07, + "loss": 0.022, + "step": 309010 }, { "epoch": 1.99, - "learning_rate": 9.702122136413784e-07, - "loss": 0.0228, - "step": 184310 + "learning_rate": 8.267876620820075e-07, + "loss": 0.0201, + "step": 309020 }, { "epoch": 1.99, - "learning_rate": 9.539879291323252e-07, - "loss": 0.0222, - "step": 184320 + "learning_rate": 8.171063077250753e-07, + "loss": 0.0271, + "step": 309030 }, { "epoch": 1.99, - "learning_rate": 9.37763644623272e-07, - "loss": 0.0193, - "step": 184330 + "learning_rate": 8.07424953368143e-07, + "loss": 0.0189, + "step": 309040 }, { "epoch": 1.99, - "learning_rate": 9.215393601142188e-07, - "loss": 0.0225, - "step": 184340 + "learning_rate": 7.97743599011211e-07, + "loss": 0.0204, + "step": 309050 }, { "epoch": 1.99, - "learning_rate": 9.053150756051657e-07, - "loss": 0.0223, - "step": 184350 + "learning_rate": 7.880622446542788e-07, + "loss": 0.0211, + "step": 309060 }, { "epoch": 1.99, - "learning_rate": 8.890907910961127e-07, - "loss": 0.0241, - "step": 184360 + "learning_rate": 7.783808902973465e-07, + "loss": 0.0202, + "step": 309070 }, { "epoch": 1.99, - "learning_rate": 8.728665065870595e-07, - "loss": 0.0236, - "step": 184370 + "learning_rate": 7.686995359404145e-07, + "loss": 0.0188, + "step": 309080 }, { "epoch": 1.99, - "learning_rate": 8.566422220780064e-07, - "loss": 0.024, - "step": 184380 + "learning_rate": 7.590181815834822e-07, + "loss": 0.0189, + "step": 309090 }, { "epoch": 1.99, - "learning_rate": 8.404179375689531e-07, - "loss": 0.0259, - "step": 184390 + "learning_rate": 7.493368272265501e-07, + "loss": 0.0161, + "step": 309100 }, { - "epoch": 1.99, - "learning_rate": 8.241936530599e-07, - "loss": 0.025, - "step": 184400 + "epoch": 2.0, + "learning_rate": 7.39655472869618e-07, + "loss": 0.0226, + "step": 309110 }, { - "epoch": 1.99, - "learning_rate": 8.079693685508468e-07, - "loss": 0.0217, - "step": 184410 + "epoch": 2.0, + "learning_rate": 7.299741185126857e-07, + "loss": 0.0187, + "step": 309120 }, { - "epoch": 1.99, - "learning_rate": 7.917450840417937e-07, - "loss": 0.0254, - "step": 184420 + "epoch": 2.0, + "learning_rate": 7.202927641557536e-07, + "loss": 0.02, + "step": 309130 }, { - "epoch": 1.99, - "learning_rate": 7.755207995327405e-07, - "loss": 0.0196, - "step": 184430 + "epoch": 2.0, + "learning_rate": 7.106114097988214e-07, + "loss": 0.0207, + "step": 309140 }, { - "epoch": 1.99, - "learning_rate": 7.592965150236874e-07, - "loss": 0.0251, - "step": 184440 + "epoch": 2.0, + "learning_rate": 7.009300554418892e-07, + "loss": 0.0258, + "step": 309150 }, { "epoch": 2.0, - "learning_rate": 7.430722305146342e-07, - "loss": 0.0254, - "step": 184450 + "learning_rate": 6.912487010849571e-07, + "loss": 0.0249, + "step": 309160 }, { "epoch": 2.0, - "learning_rate": 7.268479460055811e-07, - "loss": 0.0256, - "step": 184460 + "learning_rate": 6.815673467280248e-07, + "loss": 0.0228, + "step": 309170 }, { "epoch": 2.0, - "learning_rate": 7.10623661496528e-07, - "loss": 0.0252, - "step": 184470 + "learning_rate": 6.718859923710927e-07, + "loss": 0.0217, + "step": 309180 }, { "epoch": 2.0, - "learning_rate": 6.943993769874748e-07, - "loss": 0.0242, - "step": 184480 + "learning_rate": 6.622046380141606e-07, + "loss": 0.0216, + "step": 309190 }, { "epoch": 2.0, - "learning_rate": 6.781750924784217e-07, + "learning_rate": 6.525232836572283e-07, "loss": 0.0192, - "step": 184490 + "step": 309200 }, { "epoch": 2.0, - "learning_rate": 6.619508079693685e-07, + "learning_rate": 6.428419293002962e-07, "loss": 0.0241, - "step": 184500 + "step": 309210 }, { "epoch": 2.0, - "learning_rate": 6.457265234603154e-07, - "loss": 0.0209, - "step": 184510 + "learning_rate": 6.33160574943364e-07, + "loss": 0.0195, + "step": 309220 }, { "epoch": 2.0, - "learning_rate": 6.295022389512622e-07, - "loss": 0.0279, - "step": 184520 + "learning_rate": 6.234792205864318e-07, + "loss": 0.0193, + "step": 309230 }, { "epoch": 2.0, - "learning_rate": 6.132779544422091e-07, - "loss": 0.0233, - "step": 184530 + "learning_rate": 6.137978662294997e-07, + "loss": 0.021, + "step": 309240 }, { "epoch": 2.0, - "learning_rate": 5.970536699331558e-07, - "loss": 0.022, - "step": 184540 + "learning_rate": 6.041165118725675e-07, + "loss": 0.0211, + "step": 309250 }, { "epoch": 2.0, - "learning_rate": 5.808293854241027e-07, - "loss": 0.024, - "step": 184550 + "learning_rate": 5.944351575156354e-07, + "loss": 0.0178, + "step": 309260 + }, + { + "epoch": 2.0, + "learning_rate": 5.847538031587032e-07, + "loss": 0.0253, + "step": 309270 + }, + { + "epoch": 2.0, + "learning_rate": 5.75072448801771e-07, + "loss": 0.0181, + "step": 309280 + }, + { + "epoch": 2.0, + "learning_rate": 5.653910944448388e-07, + "loss": 0.0175, + "step": 309290 + }, + { + "epoch": 2.0, + "learning_rate": 5.557097400879067e-07, + "loss": 0.0185, + "step": 309300 }, { "epoch": 2.0, - "learning_rate": 5.646051009150496e-07, + "learning_rate": 5.460283857309745e-07, "loss": 0.0199, - "step": 184560 + "step": 309310 }, { "epoch": 2.0, - "learning_rate": 5.483808164059964e-07, - "loss": 0.0233, - "step": 184570 + "learning_rate": 5.363470313740423e-07, + "loss": 0.02, + "step": 309320 }, { "epoch": 2.0, - "learning_rate": 5.321565318969433e-07, - "loss": 0.0201, - "step": 184580 + "learning_rate": 5.266656770171102e-07, + "loss": 0.0195, + "step": 309330 }, { "epoch": 2.0, - "learning_rate": 5.159322473878901e-07, - "loss": 0.0202, - "step": 184590 + "learning_rate": 5.16984322660178e-07, + "loss": 0.0241, + "step": 309340 }, { "epoch": 2.0, - "learning_rate": 4.99707962878837e-07, - "loss": 0.0256, - "step": 184600 + "learning_rate": 5.073029683032458e-07, + "loss": 0.0263, + "step": 309350 }, { "epoch": 2.0, - "learning_rate": 4.834836783697839e-07, - "loss": 0.0262, - "step": 184610 + "learning_rate": 4.976216139463136e-07, + "loss": 0.0194, + "step": 309360 }, { "epoch": 2.0, - "learning_rate": 4.6725939386073067e-07, - "loss": 0.03, - "step": 184620 + "learning_rate": 4.879402595893815e-07, + "loss": 0.018, + "step": 309370 }, { "epoch": 2.0, - "learning_rate": 4.5103510935167753e-07, + "learning_rate": 4.782589052324493e-07, "loss": 0.0213, - "step": 184630 + "step": 309380 + }, + { + "epoch": 2.0, + "learning_rate": 4.685775508755171e-07, + "loss": 0.0267, + "step": 309390 + }, + { + "epoch": 2.0, + "learning_rate": 4.5889619651858494e-07, + "loss": 0.0219, + "step": 309400 + }, + { + "epoch": 2.0, + "learning_rate": 4.492148421616527e-07, + "loss": 0.0181, + "step": 309410 + }, + { + "epoch": 2.0, + "learning_rate": 4.395334878047206e-07, + "loss": 0.0169, + "step": 309420 + }, + { + "epoch": 2.0, + "learning_rate": 4.298521334477884e-07, + "loss": 0.02, + "step": 309430 }, { "epoch": 2.0, - "learning_rate": 4.3481082484262444e-07, + "learning_rate": 4.2017077909085625e-07, + "loss": 0.0221, + "step": 309440 + }, + { + "epoch": 2.0, + "learning_rate": 4.10489424733924e-07, "loss": 0.0243, - "step": 184640 + "step": 309450 }, { "epoch": 2.0, - "learning_rate": 4.1858654033357125e-07, - "loss": 0.0296, - "step": 184650 + "learning_rate": 4.008080703769919e-07, + "loss": 0.0244, + "step": 309460 }, { "epoch": 2.0, - "learning_rate": 4.023622558245181e-07, - "loss": 0.0216, - "step": 184660 + "learning_rate": 3.9112671602005973e-07, + "loss": 0.0197, + "step": 309470 }, { "epoch": 2.0, - "learning_rate": 3.8613797131546497e-07, - "loss": 0.0265, - "step": 184670 + "learning_rate": 3.8144536166312756e-07, + "loss": 0.0207, + "step": 309480 }, { "epoch": 2.0, - "learning_rate": 3.6991368680641183e-07, - "loss": 0.0223, - "step": 184680 + "learning_rate": 3.717640073061954e-07, + "loss": 0.0229, + "step": 309490 }, { "epoch": 2.0, - "learning_rate": 3.5368940229735863e-07, - "loss": 0.0259, - "step": 184690 + "learning_rate": 3.620826529492632e-07, + "loss": 0.0178, + "step": 309500 }, { "epoch": 2.0, - "learning_rate": 3.374651177883055e-07, - "loss": 0.0216, - "step": 184700 + "learning_rate": 3.5240129859233104e-07, + "loss": 0.0212, + "step": 309510 }, { "epoch": 2.0, - "learning_rate": 3.2124083327925235e-07, - "loss": 0.0217, - "step": 184710 + "learning_rate": 3.427199442353989e-07, + "loss": 0.026, + "step": 309520 }, { "epoch": 2.0, - "learning_rate": 3.050165487701992e-07, - "loss": 0.0262, - "step": 184720 + "learning_rate": 3.330385898784667e-07, + "loss": 0.0204, + "step": 309530 }, { "epoch": 2.0, - "learning_rate": 2.8879226426114607e-07, - "loss": 0.0255, - "step": 184730 + "learning_rate": 3.233572355215345e-07, + "loss": 0.0204, + "step": 309540 }, { "epoch": 2.0, - "learning_rate": 2.7256797975209293e-07, - "loss": 0.0293, - "step": 184740 + "learning_rate": 3.1367588116460235e-07, + "loss": 0.024, + "step": 309550 }, { "epoch": 2.0, - "learning_rate": 2.5634369524303973e-07, - "loss": 0.0232, - "step": 184750 + "learning_rate": 3.0399452680767023e-07, + "loss": 0.0198, + "step": 309560 }, { "epoch": 2.0, - "learning_rate": 2.401194107339866e-07, - "loss": 0.0318, - "step": 184760 + "learning_rate": 2.94313172450738e-07, + "loss": 0.0202, + "step": 309570 }, { "epoch": 2.0, - "learning_rate": 2.2389512622493345e-07, - "loss": 0.0237, - "step": 184770 + "learning_rate": 2.8463181809380583e-07, + "loss": 0.023, + "step": 309580 }, { "epoch": 2.0, - "learning_rate": 2.076708417158803e-07, - "loss": 0.0247, - "step": 184780 + "learning_rate": 2.7495046373687366e-07, + "loss": 0.0253, + "step": 309590 }, { "epoch": 2.0, - "learning_rate": 1.9144655720682717e-07, - "loss": 0.0197, - "step": 184790 + "learning_rate": 2.652691093799415e-07, + "loss": 0.0201, + "step": 309600 }, { "epoch": 2.0, - "learning_rate": 1.75222272697774e-07, - "loss": 0.0238, - "step": 184800 + "learning_rate": 2.555877550230093e-07, + "loss": 0.0198, + "step": 309610 }, { "epoch": 2.0, - "learning_rate": 1.5899798818872086e-07, - "loss": 0.0224, - "step": 184810 + "learning_rate": 2.4590640066607714e-07, + "loss": 0.0246, + "step": 309620 }, { "epoch": 2.0, - "learning_rate": 1.4277370367966772e-07, - "loss": 0.0304, - "step": 184820 + "learning_rate": 2.36225046309145e-07, + "loss": 0.021, + "step": 309630 }, { "epoch": 2.0, - "learning_rate": 1.2654941917061455e-07, - "loss": 0.026, - "step": 184830 + "learning_rate": 2.265436919522128e-07, + "loss": 0.0251, + "step": 309640 }, { "epoch": 2.0, - "learning_rate": 1.1032513466156142e-07, - "loss": 0.0277, - "step": 184840 + "learning_rate": 2.1686233759528065e-07, + "loss": 0.0274, + "step": 309650 }, { "epoch": 2.0, - "learning_rate": 9.410085015250827e-08, - "loss": 0.0268, - "step": 184850 + "learning_rate": 2.0718098323834845e-07, + "loss": 0.0197, + "step": 309660 + }, + { + "epoch": 2.0, + "learning_rate": 1.974996288814163e-07, + "loss": 0.0201, + "step": 309670 }, { "epoch": 2.0, - "learning_rate": 7.787656564345512e-08, + "learning_rate": 1.878182745244841e-07, + "loss": 0.0232, + "step": 309680 + }, + { + "epoch": 2.0, + "learning_rate": 1.7813692016755196e-07, "loss": 0.0234, - "step": 184860 + "step": 309690 }, { "epoch": 2.0, - "learning_rate": 6.165228113440196e-08, - "loss": 0.0261, - "step": 184870 + "learning_rate": 1.684555658106198e-07, + "loss": 0.0169, + "step": 309700 }, { "epoch": 2.0, - "learning_rate": 4.542799662534882e-08, - "loss": 0.0211, - "step": 184880 + "learning_rate": 1.5877421145368762e-07, + "loss": 0.024, + "step": 309710 }, { "epoch": 2.0, - "learning_rate": 2.9203712116295667e-08, - "loss": 0.0258, - "step": 184890 + "learning_rate": 1.4909285709675544e-07, + "loss": 0.02, + "step": 309720 }, { "epoch": 2.0, - "learning_rate": 1.297942760724252e-08, - "loss": 0.0224, - "step": 184900 + "learning_rate": 1.3941150273982327e-07, + "loss": 0.0213, + "step": 309730 + }, + { + "epoch": 2.0, + "learning_rate": 1.297301483828911e-07, + "loss": 0.0179, + "step": 309740 + }, + { + "epoch": 2.0, + "learning_rate": 1.2004879402595893e-07, + "loss": 0.0265, + "step": 309750 + }, + { + "epoch": 2.0, + "learning_rate": 1.1036743966902677e-07, + "loss": 0.0202, + "step": 309760 + }, + { + "epoch": 2.0, + "learning_rate": 1.0068608531209459e-07, + "loss": 0.0183, + "step": 309770 + }, + { + "epoch": 2.0, + "learning_rate": 9.100473095516242e-08, + "loss": 0.0225, + "step": 309780 + }, + { + "epoch": 2.0, + "learning_rate": 8.132337659823025e-08, + "loss": 0.0196, + "step": 309790 + }, + { + "epoch": 2.0, + "learning_rate": 7.164202224129808e-08, + "loss": 0.0184, + "step": 309800 + }, + { + "epoch": 2.0, + "learning_rate": 6.19606678843659e-08, + "loss": 0.0256, + "step": 309810 + }, + { + "epoch": 2.0, + "learning_rate": 5.227931352743372e-08, + "loss": 0.0201, + "step": 309820 + }, + { + "epoch": 2.0, + "learning_rate": 4.259795917050155e-08, + "loss": 0.0249, + "step": 309830 + }, + { + "epoch": 2.0, + "learning_rate": 3.2916604813569384e-08, + "loss": 0.0227, + "step": 309840 + }, + { + "epoch": 2.0, + "learning_rate": 2.3235250456637212e-08, + "loss": 0.0218, + "step": 309850 + }, + { + "epoch": 2.0, + "learning_rate": 1.355389609970504e-08, + "loss": 0.0212, + "step": 309860 + }, + { + "epoch": 2.0, + "learning_rate": 3.872541742772869e-09, + "loss": 0.0204, + "step": 309870 }, { "epoch": 2.0, - "step": 184908, - "total_flos": 9.984146296023245e+17, - "train_loss": 0.05150384478483596, - "train_runtime": 204639.736, - "train_samples_per_second": 28.915, - "train_steps_per_second": 0.904 + "step": 309874, + "total_flos": 1.6340823463826534e+18, + "train_loss": 0.047053869794253175, + "train_runtime": 343177.6492, + "train_samples_per_second": 28.895, + "train_steps_per_second": 0.903 } ], - "max_steps": 184908, + "max_steps": 309874, "num_train_epochs": 2, - "total_flos": 9.984146296023245e+17, + "total_flos": 1.6340823463826534e+18, "trial_name": null, "trial_params": null } diff --git a/training_args.bin b/training_args.bin index c43af0d9d130b03471d90f4b15dadb727b241fca..5acaa885d201afedac42166e2c44637fc99f3831 100644 --- a/training_args.bin +++ b/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:dcaa8fb3e6403c3f1d958c15d97817380cca47833d439484dd2f38a0a53f4340 +oid sha256:c1aad804f228e120d28bf4be176a8fd53fb1a8d0a742145b5d195d7bdff2768b size 3707