diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,49216 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.999968595825129, + "global_step": 79606, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 0.002999623143984122, + "loss": 3.9921, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 0.0029992462879682436, + "loss": 1.5317, + "step": 20 + }, + { + "epoch": 0.0, + "learning_rate": 0.0029988694319523653, + "loss": 1.2121, + "step": 30 + }, + { + "epoch": 0.0, + "learning_rate": 0.0029984925759364875, + "loss": 1.0693, + "step": 40 + }, + { + "epoch": 0.0, + "learning_rate": 0.0029981157199206092, + "loss": 0.9832, + "step": 50 + }, + { + "epoch": 0.0, + "learning_rate": 0.0029977388639047305, + "loss": 0.925, + "step": 60 + }, + { + "epoch": 0.0, + "learning_rate": 0.0029973620078888527, + "loss": 0.8599, + "step": 70 + }, + { + "epoch": 0.0, + "learning_rate": 0.0029969851518729745, + "loss": 0.8426, + "step": 80 + }, + { + "epoch": 0.0, + "learning_rate": 0.002996608295857096, + "loss": 0.8016, + "step": 90 + }, + { + "epoch": 0.0, + "learning_rate": 0.002996231439841218, + "loss": 0.7594, + "step": 100 + }, + { + "epoch": 0.0, + "learning_rate": 0.0029958545838253397, + "loss": 0.7358, + "step": 110 + }, + { + "epoch": 0.0, + "learning_rate": 0.002995477727809462, + "loss": 0.7094, + "step": 120 + }, + { + "epoch": 0.0, + "learning_rate": 0.0029951008717935836, + "loss": 0.7043, + "step": 130 + }, + { + "epoch": 0.0, + "learning_rate": 0.0029947240157777054, + "loss": 0.6813, + "step": 140 + }, + { + "epoch": 0.0, + "learning_rate": 0.002994347159761827, + "loss": 0.671, + "step": 150 + }, + { + "epoch": 0.0, + "learning_rate": 0.002993970303745949, + "loss": 0.6486, + "step": 160 + }, + { + "epoch": 0.0, + "learning_rate": 0.002993593447730071, + "loss": 0.6395, + "step": 170 + }, + { + "epoch": 0.0, + "learning_rate": 0.0029932165917141923, + "loss": 0.6361, + "step": 180 + }, + { + "epoch": 0.0, + "learning_rate": 0.002992839735698314, + "loss": 0.6132, + "step": 190 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029924628796824363, + "loss": 0.6038, + "step": 200 + }, + { + "epoch": 0.01, + "learning_rate": 0.002992086023666558, + "loss": 0.5928, + "step": 210 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029917091676506797, + "loss": 0.5775, + "step": 220 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029913323116348015, + "loss": 0.5844, + "step": 230 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029909554556189232, + "loss": 0.561, + "step": 240 + }, + { + "epoch": 0.01, + "learning_rate": 0.002990578599603045, + "loss": 0.5629, + "step": 250 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029902017435871667, + "loss": 0.5413, + "step": 260 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029898248875712885, + "loss": 0.5516, + "step": 270 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029894480315554106, + "loss": 0.5345, + "step": 280 + }, + { + "epoch": 0.01, + "learning_rate": 0.002989071175539532, + "loss": 0.5332, + "step": 290 + }, + { + "epoch": 0.01, + "learning_rate": 0.002988694319523654, + "loss": 0.5317, + "step": 300 + }, + { + "epoch": 0.01, + "learning_rate": 0.002988317463507776, + "loss": 0.521, + "step": 310 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029879406074918976, + "loss": 0.5091, + "step": 320 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029875637514760194, + "loss": 0.5108, + "step": 330 + }, + { + "epoch": 0.01, + "learning_rate": 0.002987186895460141, + "loss": 0.4999, + "step": 340 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029868100394442633, + "loss": 0.5046, + "step": 350 + }, + { + "epoch": 0.01, + "learning_rate": 0.002986433183428385, + "loss": 0.4958, + "step": 360 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029860563274125063, + "loss": 0.4948, + "step": 370 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029856794713966285, + "loss": 0.4778, + "step": 380 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029853026153807503, + "loss": 0.4669, + "step": 390 + }, + { + "epoch": 0.01, + "learning_rate": 0.002984925759364872, + "loss": 0.4694, + "step": 400 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029845489033489938, + "loss": 0.4669, + "step": 410 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029841720473331155, + "loss": 0.4618, + "step": 420 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029837951913172377, + "loss": 0.4561, + "step": 430 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029834183353013594, + "loss": 0.4558, + "step": 440 + }, + { + "epoch": 0.01, + "learning_rate": 0.002983041479285481, + "loss": 0.4625, + "step": 450 + }, + { + "epoch": 0.01, + "learning_rate": 0.002982664623269603, + "loss": 0.4507, + "step": 460 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029822877672537247, + "loss": 0.4496, + "step": 470 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029819109112378464, + "loss": 0.4435, + "step": 480 + }, + { + "epoch": 0.01, + "learning_rate": 0.002981534055221968, + "loss": 0.4396, + "step": 490 + }, + { + "epoch": 0.01, + "learning_rate": 0.00298115719920609, + "loss": 0.444, + "step": 500 + }, + { + "epoch": 0.01, + "eval_cer": 0.6732715529832191, + "eval_loss": 0.33886468410491943, + "eval_runtime": 90.4817, + "eval_samples_per_second": 110.508, + "eval_steps_per_second": 6.907, + "step": 500 + }, + { + "epoch": 0.01, + "learning_rate": 0.002980780343190212, + "loss": 0.4308, + "step": 510 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029804034871743334, + "loss": 0.4287, + "step": 520 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029800266311584556, + "loss": 0.4156, + "step": 530 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029796497751425773, + "loss": 0.4347, + "step": 540 + }, + { + "epoch": 0.01, + "learning_rate": 0.002979272919126699, + "loss": 0.4347, + "step": 550 + }, + { + "epoch": 0.01, + "learning_rate": 0.002978896063110821, + "loss": 0.4227, + "step": 560 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029785192070949425, + "loss": 0.4235, + "step": 570 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029781423510790647, + "loss": 0.4185, + "step": 580 + }, + { + "epoch": 0.01, + "learning_rate": 0.0029777654950631865, + "loss": 0.419, + "step": 590 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029773886390473078, + "loss": 0.4138, + "step": 600 + }, + { + "epoch": 0.02, + "learning_rate": 0.00297701178303143, + "loss": 0.4028, + "step": 610 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029766349270155517, + "loss": 0.4085, + "step": 620 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029762580709996734, + "loss": 0.4033, + "step": 630 + }, + { + "epoch": 0.02, + "learning_rate": 0.002975881214983795, + "loss": 0.3989, + "step": 640 + }, + { + "epoch": 0.02, + "learning_rate": 0.002975504358967917, + "loss": 0.3959, + "step": 650 + }, + { + "epoch": 0.02, + "learning_rate": 0.002975127502952039, + "loss": 0.3925, + "step": 660 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029747506469361604, + "loss": 0.395, + "step": 670 + }, + { + "epoch": 0.02, + "learning_rate": 0.002974373790920282, + "loss": 0.3885, + "step": 680 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029739969349044043, + "loss": 0.3886, + "step": 690 + }, + { + "epoch": 0.02, + "learning_rate": 0.002973620078888526, + "loss": 0.3905, + "step": 700 + }, + { + "epoch": 0.02, + "learning_rate": 0.002973243222872648, + "loss": 0.3884, + "step": 710 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029728663668567696, + "loss": 0.3947, + "step": 720 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029724895108408913, + "loss": 0.3868, + "step": 730 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029721126548250135, + "loss": 0.3832, + "step": 740 + }, + { + "epoch": 0.02, + "learning_rate": 0.002971735798809135, + "loss": 0.3848, + "step": 750 + }, + { + "epoch": 0.02, + "learning_rate": 0.002971358942793257, + "loss": 0.3766, + "step": 760 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029709820867773787, + "loss": 0.3797, + "step": 770 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029706052307615005, + "loss": 0.3786, + "step": 780 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029702283747456222, + "loss": 0.3694, + "step": 790 + }, + { + "epoch": 0.02, + "learning_rate": 0.002969851518729744, + "loss": 0.373, + "step": 800 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029694746627138657, + "loss": 0.371, + "step": 810 + }, + { + "epoch": 0.02, + "learning_rate": 0.002969097806697988, + "loss": 0.3584, + "step": 820 + }, + { + "epoch": 0.02, + "learning_rate": 0.002968720950682109, + "loss": 0.3691, + "step": 830 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029683440946662314, + "loss": 0.3656, + "step": 840 + }, + { + "epoch": 0.02, + "learning_rate": 0.002967967238650353, + "loss": 0.3662, + "step": 850 + }, + { + "epoch": 0.02, + "learning_rate": 0.002967590382634475, + "loss": 0.3619, + "step": 860 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029672135266185966, + "loss": 0.3613, + "step": 870 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029668366706027184, + "loss": 0.3551, + "step": 880 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029664598145868405, + "loss": 0.371, + "step": 890 + }, + { + "epoch": 0.02, + "learning_rate": 0.002966082958570962, + "loss": 0.35, + "step": 900 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029657061025550836, + "loss": 0.3464, + "step": 910 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029653292465392058, + "loss": 0.3441, + "step": 920 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029649523905233275, + "loss": 0.3513, + "step": 930 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029645755345074493, + "loss": 0.3452, + "step": 940 + }, + { + "epoch": 0.02, + "learning_rate": 0.002964198678491571, + "loss": 0.3483, + "step": 950 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029638218224756928, + "loss": 0.3463, + "step": 960 + }, + { + "epoch": 0.02, + "learning_rate": 0.002963444966459815, + "loss": 0.3423, + "step": 970 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029630681104439362, + "loss": 0.3441, + "step": 980 + }, + { + "epoch": 0.02, + "learning_rate": 0.0029626912544280584, + "loss": 0.3489, + "step": 990 + }, + { + "epoch": 0.03, + "learning_rate": 0.00296231439841218, + "loss": 0.3429, + "step": 1000 + }, + { + "epoch": 0.03, + "eval_cer": 0.6705959123333078, + "eval_loss": 0.26553666591644287, + "eval_runtime": 90.2108, + "eval_samples_per_second": 110.84, + "eval_steps_per_second": 6.928, + "step": 1000 + }, + { + "epoch": 0.03, + "learning_rate": 0.002961937542396302, + "loss": 0.3388, + "step": 1010 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029615606863804237, + "loss": 0.3408, + "step": 1020 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029611838303645454, + "loss": 0.3431, + "step": 1030 + }, + { + "epoch": 0.03, + "learning_rate": 0.002960806974348667, + "loss": 0.3392, + "step": 1040 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029604301183327893, + "loss": 0.3382, + "step": 1050 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029600532623169106, + "loss": 0.3425, + "step": 1060 + }, + { + "epoch": 0.03, + "learning_rate": 0.002959676406301033, + "loss": 0.3345, + "step": 1070 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029592995502851546, + "loss": 0.3368, + "step": 1080 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029589226942692763, + "loss": 0.3377, + "step": 1090 + }, + { + "epoch": 0.03, + "learning_rate": 0.002958545838253398, + "loss": 0.3267, + "step": 1100 + }, + { + "epoch": 0.03, + "learning_rate": 0.00295816898223752, + "loss": 0.332, + "step": 1110 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029577921262216415, + "loss": 0.3262, + "step": 1120 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029574152702057633, + "loss": 0.3305, + "step": 1130 + }, + { + "epoch": 0.03, + "learning_rate": 0.002957038414189885, + "loss": 0.3259, + "step": 1140 + }, + { + "epoch": 0.03, + "learning_rate": 0.002956661558174007, + "loss": 0.3221, + "step": 1150 + }, + { + "epoch": 0.03, + "learning_rate": 0.002956284702158129, + "loss": 0.3286, + "step": 1160 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029559078461422507, + "loss": 0.3246, + "step": 1170 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029555309901263724, + "loss": 0.3159, + "step": 1180 + }, + { + "epoch": 0.03, + "learning_rate": 0.002955154134110494, + "loss": 0.3159, + "step": 1190 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029547772780946164, + "loss": 0.3244, + "step": 1200 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029544004220787377, + "loss": 0.3265, + "step": 1210 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029540235660628594, + "loss": 0.317, + "step": 1220 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029536467100469816, + "loss": 0.3051, + "step": 1230 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029532698540311033, + "loss": 0.3192, + "step": 1240 + }, + { + "epoch": 0.03, + "learning_rate": 0.002952892998015225, + "loss": 0.3194, + "step": 1250 + }, + { + "epoch": 0.03, + "learning_rate": 0.002952516141999347, + "loss": 0.3129, + "step": 1260 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029521392859834686, + "loss": 0.3141, + "step": 1270 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029517624299675907, + "loss": 0.3176, + "step": 1280 + }, + { + "epoch": 0.03, + "learning_rate": 0.002951385573951712, + "loss": 0.3152, + "step": 1290 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029510087179358342, + "loss": 0.311, + "step": 1300 + }, + { + "epoch": 0.03, + "learning_rate": 0.002950631861919956, + "loss": 0.3164, + "step": 1310 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029502550059040777, + "loss": 0.3056, + "step": 1320 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029498781498881995, + "loss": 0.3124, + "step": 1330 + }, + { + "epoch": 0.03, + "learning_rate": 0.002949501293872321, + "loss": 0.3016, + "step": 1340 + }, + { + "epoch": 0.03, + "learning_rate": 0.002949124437856443, + "loss": 0.2999, + "step": 1350 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029487475818405647, + "loss": 0.3043, + "step": 1360 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029483707258246864, + "loss": 0.3036, + "step": 1370 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029479938698088086, + "loss": 0.305, + "step": 1380 + }, + { + "epoch": 0.03, + "learning_rate": 0.0029476170137929304, + "loss": 0.3019, + "step": 1390 + }, + { + "epoch": 0.04, + "learning_rate": 0.002947240157777052, + "loss": 0.3098, + "step": 1400 + }, + { + "epoch": 0.04, + "learning_rate": 0.002946863301761174, + "loss": 0.2971, + "step": 1410 + }, + { + "epoch": 0.04, + "learning_rate": 0.0029464864457452956, + "loss": 0.3018, + "step": 1420 + }, + { + "epoch": 0.04, + "learning_rate": 0.0029461095897294174, + "loss": 0.3037, + "step": 1430 + }, + { + "epoch": 0.04, + "learning_rate": 0.002945732733713539, + "loss": 0.3026, + "step": 1440 + }, + { + "epoch": 0.04, + "learning_rate": 0.002945355877697661, + "loss": 0.2994, + "step": 1450 + }, + { + "epoch": 0.04, + "learning_rate": 0.002944979021681783, + "loss": 0.3042, + "step": 1460 + }, + { + "epoch": 0.04, + "learning_rate": 0.0029446021656659048, + "loss": 0.3, + "step": 1470 + }, + { + "epoch": 0.04, + "learning_rate": 0.0029442253096500265, + "loss": 0.2954, + "step": 1480 + }, + { + "epoch": 0.04, + "learning_rate": 0.0029438484536341483, + "loss": 0.2995, + "step": 1490 + }, + { + "epoch": 0.04, + "learning_rate": 0.00294347159761827, + "loss": 0.2914, + "step": 1500 + }, + { + "epoch": 0.04, + "eval_cer": 0.6704616490704796, + "eval_loss": 0.22774317860603333, + "eval_runtime": 90.4054, + "eval_samples_per_second": 110.602, + "eval_steps_per_second": 6.913, + "step": 1500 + }, + { + "epoch": 0.04, + "learning_rate": 0.002943094741602392, + "loss": 0.2932, + "step": 1510 + }, + { + "epoch": 0.04, + "learning_rate": 0.0029427178855865135, + "loss": 0.2942, + "step": 1520 + }, + { + "epoch": 0.04, + "learning_rate": 0.0029423410295706352, + "loss": 0.2952, + "step": 1530 + }, + { + "epoch": 0.04, + "learning_rate": 0.0029419641735547574, + "loss": 0.2902, + "step": 1540 + }, + { + "epoch": 0.04, + "learning_rate": 0.002941587317538879, + "loss": 0.2969, + "step": 1550 + }, + { + "epoch": 0.04, + "learning_rate": 0.002941210461523001, + "loss": 0.2905, + "step": 1560 + }, + { + "epoch": 0.04, + "learning_rate": 0.0029408336055071226, + "loss": 0.2959, + "step": 1570 + }, + { + "epoch": 0.04, + "learning_rate": 0.0029404567494912444, + "loss": 0.2942, + "step": 1580 + }, + { + "epoch": 0.04, + "learning_rate": 0.002940079893475366, + "loss": 0.2969, + "step": 1590 + }, + { + "epoch": 0.04, + "learning_rate": 0.002939703037459488, + "loss": 0.2973, + "step": 1600 + }, + { + "epoch": 0.04, + "learning_rate": 0.00293932618144361, + "loss": 0.2976, + "step": 1610 + }, + { + "epoch": 0.04, + "learning_rate": 0.002938949325427732, + "loss": 0.2824, + "step": 1620 + }, + { + "epoch": 0.04, + "learning_rate": 0.002938572469411853, + "loss": 0.2918, + "step": 1630 + }, + { + "epoch": 0.04, + "learning_rate": 0.0029381956133959753, + "loss": 0.2897, + "step": 1640 + }, + { + "epoch": 0.04, + "learning_rate": 0.002937818757380097, + "loss": 0.2859, + "step": 1650 + }, + { + "epoch": 0.04, + "learning_rate": 0.0029374419013642188, + "loss": 0.279, + "step": 1660 + }, + { + "epoch": 0.04, + "learning_rate": 0.0029370650453483405, + "loss": 0.2871, + "step": 1670 + }, + { + "epoch": 0.04, + "learning_rate": 0.0029366881893324623, + "loss": 0.2826, + "step": 1680 + }, + { + "epoch": 0.04, + "learning_rate": 0.0029363113333165844, + "loss": 0.2859, + "step": 1690 + }, + { + "epoch": 0.04, + "learning_rate": 0.002935934477300706, + "loss": 0.2864, + "step": 1700 + }, + { + "epoch": 0.04, + "learning_rate": 0.002935557621284828, + "loss": 0.2808, + "step": 1710 + }, + { + "epoch": 0.04, + "learning_rate": 0.0029351807652689497, + "loss": 0.2775, + "step": 1720 + }, + { + "epoch": 0.04, + "learning_rate": 0.0029348039092530714, + "loss": 0.2812, + "step": 1730 + }, + { + "epoch": 0.04, + "learning_rate": 0.0029344270532371936, + "loss": 0.2762, + "step": 1740 + }, + { + "epoch": 0.04, + "learning_rate": 0.002934050197221315, + "loss": 0.281, + "step": 1750 + }, + { + "epoch": 0.04, + "learning_rate": 0.0029336733412054367, + "loss": 0.2811, + "step": 1760 + }, + { + "epoch": 0.04, + "learning_rate": 0.002933296485189559, + "loss": 0.2765, + "step": 1770 + }, + { + "epoch": 0.04, + "learning_rate": 0.00293291962917368, + "loss": 0.2847, + "step": 1780 + }, + { + "epoch": 0.04, + "learning_rate": 0.0029325427731578023, + "loss": 0.2843, + "step": 1790 + }, + { + "epoch": 0.05, + "learning_rate": 0.002932165917141924, + "loss": 0.2789, + "step": 1800 + }, + { + "epoch": 0.05, + "learning_rate": 0.002931789061126046, + "loss": 0.2844, + "step": 1810 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029314122051101676, + "loss": 0.2748, + "step": 1820 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029310353490942893, + "loss": 0.2743, + "step": 1830 + }, + { + "epoch": 0.05, + "learning_rate": 0.002930658493078411, + "loss": 0.2745, + "step": 1840 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029302816370625332, + "loss": 0.2697, + "step": 1850 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029299047810466545, + "loss": 0.273, + "step": 1860 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029295279250307767, + "loss": 0.2713, + "step": 1870 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029291510690148985, + "loss": 0.2791, + "step": 1880 + }, + { + "epoch": 0.05, + "learning_rate": 0.00292877421299902, + "loss": 0.2731, + "step": 1890 + }, + { + "epoch": 0.05, + "learning_rate": 0.002928397356983142, + "loss": 0.2713, + "step": 1900 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029280205009672637, + "loss": 0.2793, + "step": 1910 + }, + { + "epoch": 0.05, + "learning_rate": 0.002927643644951386, + "loss": 0.2729, + "step": 1920 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029272667889355076, + "loss": 0.2725, + "step": 1930 + }, + { + "epoch": 0.05, + "learning_rate": 0.002926889932919629, + "loss": 0.2697, + "step": 1940 + }, + { + "epoch": 0.05, + "learning_rate": 0.002926513076903751, + "loss": 0.2684, + "step": 1950 + }, + { + "epoch": 0.05, + "learning_rate": 0.002926136220887873, + "loss": 0.276, + "step": 1960 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029257593648719946, + "loss": 0.2778, + "step": 1970 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029253825088561163, + "loss": 0.2716, + "step": 1980 + }, + { + "epoch": 0.05, + "learning_rate": 0.002925005652840238, + "loss": 0.2677, + "step": 1990 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029246287968243603, + "loss": 0.264, + "step": 2000 + }, + { + "epoch": 0.05, + "eval_cer": 0.6698235376492957, + "eval_loss": 0.20776917040348053, + "eval_runtime": 90.9557, + "eval_samples_per_second": 109.933, + "eval_steps_per_second": 6.871, + "step": 2000 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029242519408084816, + "loss": 0.2685, + "step": 2010 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029238750847926038, + "loss": 0.2688, + "step": 2020 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029234982287767255, + "loss": 0.2665, + "step": 2030 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029231213727608472, + "loss": 0.2673, + "step": 2040 + }, + { + "epoch": 0.05, + "learning_rate": 0.002922744516744969, + "loss": 0.2602, + "step": 2050 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029223676607290907, + "loss": 0.2632, + "step": 2060 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029219908047132125, + "loss": 0.2626, + "step": 2070 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029216139486973347, + "loss": 0.2667, + "step": 2080 + }, + { + "epoch": 0.05, + "learning_rate": 0.002921237092681456, + "loss": 0.2591, + "step": 2090 + }, + { + "epoch": 0.05, + "learning_rate": 0.002920860236665578, + "loss": 0.2577, + "step": 2100 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029204833806497, + "loss": 0.2624, + "step": 2110 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029201065246338216, + "loss": 0.257, + "step": 2120 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029197296686179434, + "loss": 0.2583, + "step": 2130 + }, + { + "epoch": 0.05, + "learning_rate": 0.002919352812602065, + "loss": 0.2672, + "step": 2140 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029189759565861873, + "loss": 0.2578, + "step": 2150 + }, + { + "epoch": 0.05, + "learning_rate": 0.002918599100570309, + "loss": 0.2549, + "step": 2160 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029182222445544304, + "loss": 0.2643, + "step": 2170 + }, + { + "epoch": 0.05, + "learning_rate": 0.0029178453885385525, + "loss": 0.2617, + "step": 2180 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029174685325226743, + "loss": 0.2536, + "step": 2190 + }, + { + "epoch": 0.06, + "learning_rate": 0.002917091676506796, + "loss": 0.2598, + "step": 2200 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029167148204909178, + "loss": 0.2618, + "step": 2210 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029163379644750395, + "loss": 0.2543, + "step": 2220 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029159611084591617, + "loss": 0.2563, + "step": 2230 + }, + { + "epoch": 0.06, + "learning_rate": 0.002915584252443283, + "loss": 0.2618, + "step": 2240 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029152073964274047, + "loss": 0.256, + "step": 2250 + }, + { + "epoch": 0.06, + "learning_rate": 0.002914830540411527, + "loss": 0.2554, + "step": 2260 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029144536843956487, + "loss": 0.2555, + "step": 2270 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029140768283797704, + "loss": 0.2533, + "step": 2280 + }, + { + "epoch": 0.06, + "learning_rate": 0.002913699972363892, + "loss": 0.2577, + "step": 2290 + }, + { + "epoch": 0.06, + "learning_rate": 0.002913323116348014, + "loss": 0.2526, + "step": 2300 + }, + { + "epoch": 0.06, + "learning_rate": 0.002912946260332136, + "loss": 0.2536, + "step": 2310 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029125694043162574, + "loss": 0.2562, + "step": 2320 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029121925483003796, + "loss": 0.2537, + "step": 2330 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029118156922845013, + "loss": 0.2543, + "step": 2340 + }, + { + "epoch": 0.06, + "learning_rate": 0.002911438836268623, + "loss": 0.2562, + "step": 2350 + }, + { + "epoch": 0.06, + "learning_rate": 0.002911061980252745, + "loss": 0.2556, + "step": 2360 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029106851242368665, + "loss": 0.2523, + "step": 2370 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029103082682209883, + "loss": 0.253, + "step": 2380 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029099314122051105, + "loss": 0.2479, + "step": 2390 + }, + { + "epoch": 0.06, + "learning_rate": 0.002909554556189232, + "loss": 0.2521, + "step": 2400 + }, + { + "epoch": 0.06, + "learning_rate": 0.002909177700173354, + "loss": 0.2561, + "step": 2410 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029088008441574757, + "loss": 0.2518, + "step": 2420 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029084239881415975, + "loss": 0.2552, + "step": 2430 + }, + { + "epoch": 0.06, + "learning_rate": 0.002908047132125719, + "loss": 0.2483, + "step": 2440 + }, + { + "epoch": 0.06, + "learning_rate": 0.002907670276109841, + "loss": 0.2593, + "step": 2450 + }, + { + "epoch": 0.06, + "learning_rate": 0.002907293420093963, + "loss": 0.2491, + "step": 2460 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029069165640780844, + "loss": 0.2454, + "step": 2470 + }, + { + "epoch": 0.06, + "learning_rate": 0.002906539708062206, + "loss": 0.2516, + "step": 2480 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029061628520463284, + "loss": 0.2493, + "step": 2490 + }, + { + "epoch": 0.06, + "learning_rate": 0.00290578599603045, + "loss": 0.2506, + "step": 2500 + }, + { + "epoch": 0.06, + "eval_cer": 0.6693986112655058, + "eval_loss": 0.18936096131801605, + "eval_runtime": 90.6775, + "eval_samples_per_second": 110.27, + "eval_steps_per_second": 6.893, + "step": 2500 + }, + { + "epoch": 0.06, + "learning_rate": 0.002905409140014572, + "loss": 0.2495, + "step": 2510 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029050322839986936, + "loss": 0.2504, + "step": 2520 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029046554279828153, + "loss": 0.2385, + "step": 2530 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029042785719669375, + "loss": 0.2492, + "step": 2540 + }, + { + "epoch": 0.06, + "learning_rate": 0.002903901715951059, + "loss": 0.2449, + "step": 2550 + }, + { + "epoch": 0.06, + "learning_rate": 0.002903524859935181, + "loss": 0.2387, + "step": 2560 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029031480039193027, + "loss": 0.2418, + "step": 2570 + }, + { + "epoch": 0.06, + "learning_rate": 0.0029027711479034245, + "loss": 0.2452, + "step": 2580 + }, + { + "epoch": 0.07, + "learning_rate": 0.0029023942918875462, + "loss": 0.2497, + "step": 2590 + }, + { + "epoch": 0.07, + "learning_rate": 0.002902017435871668, + "loss": 0.2436, + "step": 2600 + }, + { + "epoch": 0.07, + "learning_rate": 0.0029016405798557897, + "loss": 0.2504, + "step": 2610 + }, + { + "epoch": 0.07, + "learning_rate": 0.002901263723839912, + "loss": 0.2471, + "step": 2620 + }, + { + "epoch": 0.07, + "learning_rate": 0.002900886867824033, + "loss": 0.2429, + "step": 2630 + }, + { + "epoch": 0.07, + "learning_rate": 0.0029005100118081554, + "loss": 0.2513, + "step": 2640 + }, + { + "epoch": 0.07, + "learning_rate": 0.002900133155792277, + "loss": 0.2373, + "step": 2650 + }, + { + "epoch": 0.07, + "learning_rate": 0.002899756299776399, + "loss": 0.2415, + "step": 2660 + }, + { + "epoch": 0.07, + "learning_rate": 0.0028993794437605206, + "loss": 0.2429, + "step": 2670 + }, + { + "epoch": 0.07, + "learning_rate": 0.0028990025877446424, + "loss": 0.2436, + "step": 2680 + }, + { + "epoch": 0.07, + "learning_rate": 0.002898625731728764, + "loss": 0.2379, + "step": 2690 + }, + { + "epoch": 0.07, + "learning_rate": 0.002898248875712886, + "loss": 0.2465, + "step": 2700 + }, + { + "epoch": 0.07, + "learning_rate": 0.0028978720196970076, + "loss": 0.2431, + "step": 2710 + }, + { + "epoch": 0.07, + "learning_rate": 0.0028974951636811298, + "loss": 0.24, + "step": 2720 + }, + { + "epoch": 0.07, + "learning_rate": 0.0028971183076652515, + "loss": 0.2464, + "step": 2730 + }, + { + "epoch": 0.07, + "learning_rate": 0.0028967414516493733, + "loss": 0.2404, + "step": 2740 + }, + { + "epoch": 0.07, + "learning_rate": 0.002896364595633495, + "loss": 0.2333, + "step": 2750 + }, + { + "epoch": 0.07, + "learning_rate": 0.0028959877396176168, + "loss": 0.2332, + "step": 2760 + }, + { + "epoch": 0.07, + "learning_rate": 0.002895610883601739, + "loss": 0.2387, + "step": 2770 + }, + { + "epoch": 0.07, + "learning_rate": 0.0028952340275858602, + "loss": 0.2393, + "step": 2780 + }, + { + "epoch": 0.07, + "learning_rate": 0.002894857171569982, + "loss": 0.2314, + "step": 2790 + }, + { + "epoch": 0.07, + "learning_rate": 0.002894480315554104, + "loss": 0.2372, + "step": 2800 + }, + { + "epoch": 0.07, + "learning_rate": 0.002894103459538226, + "loss": 0.2377, + "step": 2810 + }, + { + "epoch": 0.07, + "learning_rate": 0.0028937266035223477, + "loss": 0.2341, + "step": 2820 + }, + { + "epoch": 0.07, + "learning_rate": 0.0028933497475064694, + "loss": 0.2339, + "step": 2830 + }, + { + "epoch": 0.07, + "learning_rate": 0.002892972891490591, + "loss": 0.2373, + "step": 2840 + }, + { + "epoch": 0.07, + "learning_rate": 0.0028925960354747133, + "loss": 0.2328, + "step": 2850 + }, + { + "epoch": 0.07, + "learning_rate": 0.0028922191794588346, + "loss": 0.2343, + "step": 2860 + }, + { + "epoch": 0.07, + "learning_rate": 0.002891842323442957, + "loss": 0.2344, + "step": 2870 + }, + { + "epoch": 0.07, + "learning_rate": 0.0028914654674270786, + "loss": 0.2309, + "step": 2880 + }, + { + "epoch": 0.07, + "learning_rate": 0.0028910886114112003, + "loss": 0.234, + "step": 2890 + }, + { + "epoch": 0.07, + "learning_rate": 0.002890711755395322, + "loss": 0.2315, + "step": 2900 + }, + { + "epoch": 0.07, + "learning_rate": 0.002890334899379444, + "loss": 0.2377, + "step": 2910 + }, + { + "epoch": 0.07, + "learning_rate": 0.0028899580433635655, + "loss": 0.24, + "step": 2920 + }, + { + "epoch": 0.07, + "learning_rate": 0.0028895811873476873, + "loss": 0.2387, + "step": 2930 + }, + { + "epoch": 0.07, + "learning_rate": 0.002889204331331809, + "loss": 0.2373, + "step": 2940 + }, + { + "epoch": 0.07, + "learning_rate": 0.002888827475315931, + "loss": 0.2401, + "step": 2950 + }, + { + "epoch": 0.07, + "learning_rate": 0.002888450619300053, + "loss": 0.2361, + "step": 2960 + }, + { + "epoch": 0.07, + "learning_rate": 0.0028880737632841747, + "loss": 0.233, + "step": 2970 + }, + { + "epoch": 0.07, + "learning_rate": 0.0028876969072682964, + "loss": 0.2341, + "step": 2980 + }, + { + "epoch": 0.08, + "learning_rate": 0.002887320051252418, + "loss": 0.229, + "step": 2990 + }, + { + "epoch": 0.08, + "learning_rate": 0.00288694319523654, + "loss": 0.2305, + "step": 3000 + }, + { + "epoch": 0.08, + "eval_cer": 0.6684963043916599, + "eval_loss": 0.17874853312969208, + "eval_runtime": 90.9659, + "eval_samples_per_second": 109.92, + "eval_steps_per_second": 6.871, + "step": 3000 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028865663392206617, + "loss": 0.2329, + "step": 3010 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028861894832047834, + "loss": 0.2329, + "step": 3020 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028858126271889056, + "loss": 0.2329, + "step": 3030 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028854357711730273, + "loss": 0.2301, + "step": 3040 + }, + { + "epoch": 0.08, + "learning_rate": 0.002885058915157149, + "loss": 0.2323, + "step": 3050 + }, + { + "epoch": 0.08, + "learning_rate": 0.002884682059141271, + "loss": 0.2234, + "step": 3060 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028843052031253926, + "loss": 0.2317, + "step": 3070 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028839283471095148, + "loss": 0.2335, + "step": 3080 + }, + { + "epoch": 0.08, + "learning_rate": 0.002883551491093636, + "loss": 0.2269, + "step": 3090 + }, + { + "epoch": 0.08, + "learning_rate": 0.002883174635077758, + "loss": 0.2328, + "step": 3100 + }, + { + "epoch": 0.08, + "learning_rate": 0.00288279777906188, + "loss": 0.2229, + "step": 3110 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028824209230460013, + "loss": 0.227, + "step": 3120 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028820440670301235, + "loss": 0.2255, + "step": 3130 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028816672110142452, + "loss": 0.2209, + "step": 3140 + }, + { + "epoch": 0.08, + "learning_rate": 0.002881290354998367, + "loss": 0.2268, + "step": 3150 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028809134989824887, + "loss": 0.2293, + "step": 3160 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028805366429666105, + "loss": 0.2217, + "step": 3170 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028801597869507326, + "loss": 0.2275, + "step": 3180 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028797829309348544, + "loss": 0.2229, + "step": 3190 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028794060749189757, + "loss": 0.2225, + "step": 3200 + }, + { + "epoch": 0.08, + "learning_rate": 0.002879029218903098, + "loss": 0.226, + "step": 3210 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028786523628872196, + "loss": 0.226, + "step": 3220 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028782755068713414, + "loss": 0.2239, + "step": 3230 + }, + { + "epoch": 0.08, + "learning_rate": 0.002877898650855463, + "loss": 0.2209, + "step": 3240 + }, + { + "epoch": 0.08, + "learning_rate": 0.002877521794839585, + "loss": 0.2225, + "step": 3250 + }, + { + "epoch": 0.08, + "learning_rate": 0.002877144938823707, + "loss": 0.2221, + "step": 3260 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028767680828078288, + "loss": 0.2255, + "step": 3270 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028763912267919505, + "loss": 0.2274, + "step": 3280 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028760143707760723, + "loss": 0.2235, + "step": 3290 + }, + { + "epoch": 0.08, + "learning_rate": 0.002875637514760194, + "loss": 0.2264, + "step": 3300 + }, + { + "epoch": 0.08, + "learning_rate": 0.002875260658744316, + "loss": 0.2243, + "step": 3310 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028748838027284375, + "loss": 0.2303, + "step": 3320 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028745069467125592, + "loss": 0.2169, + "step": 3330 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028741300906966814, + "loss": 0.2245, + "step": 3340 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028737532346808027, + "loss": 0.219, + "step": 3350 + }, + { + "epoch": 0.08, + "learning_rate": 0.002873376378664925, + "loss": 0.2223, + "step": 3360 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028729995226490466, + "loss": 0.2171, + "step": 3370 + }, + { + "epoch": 0.08, + "learning_rate": 0.0028726226666331684, + "loss": 0.2232, + "step": 3380 + }, + { + "epoch": 0.09, + "learning_rate": 0.00287224581061729, + "loss": 0.2228, + "step": 3390 + }, + { + "epoch": 0.09, + "learning_rate": 0.002871868954601412, + "loss": 0.2229, + "step": 3400 + }, + { + "epoch": 0.09, + "learning_rate": 0.0028714920985855336, + "loss": 0.2141, + "step": 3410 + }, + { + "epoch": 0.09, + "learning_rate": 0.002871115242569656, + "loss": 0.2212, + "step": 3420 + }, + { + "epoch": 0.09, + "learning_rate": 0.002870738386553777, + "loss": 0.2329, + "step": 3430 + }, + { + "epoch": 0.09, + "learning_rate": 0.0028703615305378993, + "loss": 0.2172, + "step": 3440 + }, + { + "epoch": 0.09, + "learning_rate": 0.002869984674522021, + "loss": 0.2235, + "step": 3450 + }, + { + "epoch": 0.09, + "learning_rate": 0.002869607818506143, + "loss": 0.2143, + "step": 3460 + }, + { + "epoch": 0.09, + "learning_rate": 0.0028692309624902645, + "loss": 0.2202, + "step": 3470 + }, + { + "epoch": 0.09, + "learning_rate": 0.0028688541064743863, + "loss": 0.2187, + "step": 3480 + }, + { + "epoch": 0.09, + "learning_rate": 0.0028684772504585085, + "loss": 0.2181, + "step": 3490 + }, + { + "epoch": 0.09, + "learning_rate": 0.00286810039444263, + "loss": 0.2206, + "step": 3500 + }, + { + "epoch": 0.09, + "eval_cer": 0.668782636439627, + "eval_loss": 0.1685170978307724, + "eval_runtime": 90.6789, + "eval_samples_per_second": 110.268, + "eval_steps_per_second": 6.892, + "step": 3500 + }, + { + "epoch": 0.09, + "learning_rate": 0.0028677235384267515, + "loss": 0.2217, + "step": 3510 + }, + { + "epoch": 0.09, + "learning_rate": 0.0028673466824108737, + "loss": 0.2118, + "step": 3520 + }, + { + "epoch": 0.09, + "learning_rate": 0.0028669698263949954, + "loss": 0.2129, + "step": 3530 + }, + { + "epoch": 0.09, + "learning_rate": 0.002866592970379117, + "loss": 0.2189, + "step": 3540 + }, + { + "epoch": 0.09, + "learning_rate": 0.002866216114363239, + "loss": 0.2166, + "step": 3550 + }, + { + "epoch": 0.09, + "learning_rate": 0.0028658392583473607, + "loss": 0.2116, + "step": 3560 + }, + { + "epoch": 0.09, + "learning_rate": 0.002865462402331483, + "loss": 0.216, + "step": 3570 + }, + { + "epoch": 0.09, + "learning_rate": 0.002865085546315604, + "loss": 0.2173, + "step": 3580 + }, + { + "epoch": 0.09, + "learning_rate": 0.0028647086902997263, + "loss": 0.2213, + "step": 3590 + }, + { + "epoch": 0.09, + "learning_rate": 0.002864331834283848, + "loss": 0.213, + "step": 3600 + }, + { + "epoch": 0.09, + "learning_rate": 0.00286395497826797, + "loss": 0.2191, + "step": 3610 + }, + { + "epoch": 0.09, + "learning_rate": 0.0028635781222520916, + "loss": 0.2171, + "step": 3620 + }, + { + "epoch": 0.09, + "learning_rate": 0.0028632012662362133, + "loss": 0.2139, + "step": 3630 + }, + { + "epoch": 0.09, + "learning_rate": 0.002862824410220335, + "loss": 0.2152, + "step": 3640 + }, + { + "epoch": 0.09, + "learning_rate": 0.0028624475542044572, + "loss": 0.211, + "step": 3650 + }, + { + "epoch": 0.09, + "learning_rate": 0.0028620706981885785, + "loss": 0.2191, + "step": 3660 + }, + { + "epoch": 0.09, + "learning_rate": 0.0028616938421727007, + "loss": 0.2133, + "step": 3670 + }, + { + "epoch": 0.09, + "learning_rate": 0.0028613169861568225, + "loss": 0.2183, + "step": 3680 + }, + { + "epoch": 0.09, + "learning_rate": 0.002860940130140944, + "loss": 0.2118, + "step": 3690 + }, + { + "epoch": 0.09, + "learning_rate": 0.002860563274125066, + "loss": 0.2134, + "step": 3700 + }, + { + "epoch": 0.09, + "learning_rate": 0.0028601864181091877, + "loss": 0.2145, + "step": 3710 + }, + { + "epoch": 0.09, + "learning_rate": 0.00285980956209331, + "loss": 0.212, + "step": 3720 + }, + { + "epoch": 0.09, + "learning_rate": 0.0028594327060774316, + "loss": 0.2155, + "step": 3730 + }, + { + "epoch": 0.09, + "learning_rate": 0.002859055850061553, + "loss": 0.2131, + "step": 3740 + }, + { + "epoch": 0.09, + "learning_rate": 0.002858678994045675, + "loss": 0.2177, + "step": 3750 + }, + { + "epoch": 0.09, + "learning_rate": 0.002858302138029797, + "loss": 0.2219, + "step": 3760 + }, + { + "epoch": 0.09, + "learning_rate": 0.0028579252820139186, + "loss": 0.2193, + "step": 3770 + }, + { + "epoch": 0.09, + "learning_rate": 0.0028575484259980403, + "loss": 0.2107, + "step": 3780 + }, + { + "epoch": 0.1, + "learning_rate": 0.002857171569982162, + "loss": 0.2127, + "step": 3790 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028567947139662843, + "loss": 0.2178, + "step": 3800 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028564178579504056, + "loss": 0.2128, + "step": 3810 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028560410019345273, + "loss": 0.2121, + "step": 3820 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028556641459186495, + "loss": 0.2094, + "step": 3830 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028552872899027712, + "loss": 0.2158, + "step": 3840 + }, + { + "epoch": 0.1, + "learning_rate": 0.002854910433886893, + "loss": 0.2161, + "step": 3850 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028545335778710147, + "loss": 0.2145, + "step": 3860 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028541567218551365, + "loss": 0.2089, + "step": 3870 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028537798658392587, + "loss": 0.2088, + "step": 3880 + }, + { + "epoch": 0.1, + "learning_rate": 0.00285340300982338, + "loss": 0.2081, + "step": 3890 + }, + { + "epoch": 0.1, + "learning_rate": 0.002853026153807502, + "loss": 0.2111, + "step": 3900 + }, + { + "epoch": 0.1, + "learning_rate": 0.002852649297791624, + "loss": 0.2113, + "step": 3910 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028522724417757456, + "loss": 0.2072, + "step": 3920 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028518955857598674, + "loss": 0.2127, + "step": 3930 + }, + { + "epoch": 0.1, + "learning_rate": 0.002851518729743989, + "loss": 0.207, + "step": 3940 + }, + { + "epoch": 0.1, + "learning_rate": 0.002851141873728111, + "loss": 0.2079, + "step": 3950 + }, + { + "epoch": 0.1, + "learning_rate": 0.002850765017712233, + "loss": 0.2096, + "step": 3960 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028503881616963544, + "loss": 0.2078, + "step": 3970 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028500113056804765, + "loss": 0.2067, + "step": 3980 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028496344496645983, + "loss": 0.2043, + "step": 3990 + }, + { + "epoch": 0.1, + "learning_rate": 0.00284925759364872, + "loss": 0.2086, + "step": 4000 + }, + { + "epoch": 0.1, + "eval_cer": 0.6684727241053567, + "eval_loss": 0.16068455576896667, + "eval_runtime": 90.6058, + "eval_samples_per_second": 110.357, + "eval_steps_per_second": 6.898, + "step": 4000 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028488807376328418, + "loss": 0.2033, + "step": 4010 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028485038816169635, + "loss": 0.2086, + "step": 4020 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028481270256010857, + "loss": 0.2048, + "step": 4030 + }, + { + "epoch": 0.1, + "learning_rate": 0.002847750169585207, + "loss": 0.2071, + "step": 4040 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028473733135693288, + "loss": 0.2062, + "step": 4050 + }, + { + "epoch": 0.1, + "learning_rate": 0.002846996457553451, + "loss": 0.2096, + "step": 4060 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028466196015375727, + "loss": 0.2108, + "step": 4070 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028462427455216944, + "loss": 0.2058, + "step": 4080 + }, + { + "epoch": 0.1, + "learning_rate": 0.002845865889505816, + "loss": 0.2098, + "step": 4090 + }, + { + "epoch": 0.1, + "learning_rate": 0.002845489033489938, + "loss": 0.2044, + "step": 4100 + }, + { + "epoch": 0.1, + "learning_rate": 0.00284511217747406, + "loss": 0.2129, + "step": 4110 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028447353214581814, + "loss": 0.2055, + "step": 4120 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028443584654423036, + "loss": 0.2078, + "step": 4130 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028439816094264253, + "loss": 0.2015, + "step": 4140 + }, + { + "epoch": 0.1, + "learning_rate": 0.002843604753410547, + "loss": 0.2001, + "step": 4150 + }, + { + "epoch": 0.1, + "learning_rate": 0.002843227897394669, + "loss": 0.2105, + "step": 4160 + }, + { + "epoch": 0.1, + "learning_rate": 0.0028428510413787906, + "loss": 0.2061, + "step": 4170 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028424741853629123, + "loss": 0.2102, + "step": 4180 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028420973293470345, + "loss": 0.2072, + "step": 4190 + }, + { + "epoch": 0.11, + "learning_rate": 0.002841720473331156, + "loss": 0.2004, + "step": 4200 + }, + { + "epoch": 0.11, + "learning_rate": 0.002841343617315278, + "loss": 0.2048, + "step": 4210 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028409667612993997, + "loss": 0.2045, + "step": 4220 + }, + { + "epoch": 0.11, + "learning_rate": 0.002840589905283521, + "loss": 0.212, + "step": 4230 + }, + { + "epoch": 0.11, + "learning_rate": 0.002840213049267643, + "loss": 0.2036, + "step": 4240 + }, + { + "epoch": 0.11, + "learning_rate": 0.002839836193251765, + "loss": 0.2055, + "step": 4250 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028394593372358867, + "loss": 0.2057, + "step": 4260 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028390824812200084, + "loss": 0.202, + "step": 4270 + }, + { + "epoch": 0.11, + "learning_rate": 0.00283870562520413, + "loss": 0.2116, + "step": 4280 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028383287691882524, + "loss": 0.2004, + "step": 4290 + }, + { + "epoch": 0.11, + "learning_rate": 0.002837951913172374, + "loss": 0.201, + "step": 4300 + }, + { + "epoch": 0.11, + "learning_rate": 0.002837575057156496, + "loss": 0.2058, + "step": 4310 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028371982011406176, + "loss": 0.2019, + "step": 4320 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028368213451247393, + "loss": 0.2054, + "step": 4330 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028364444891088615, + "loss": 0.2049, + "step": 4340 + }, + { + "epoch": 0.11, + "learning_rate": 0.002836067633092983, + "loss": 0.2036, + "step": 4350 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028356907770771046, + "loss": 0.1996, + "step": 4360 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028353139210612268, + "loss": 0.2033, + "step": 4370 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028349370650453485, + "loss": 0.2015, + "step": 4380 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028345602090294702, + "loss": 0.1991, + "step": 4390 + }, + { + "epoch": 0.11, + "learning_rate": 0.002834183353013592, + "loss": 0.206, + "step": 4400 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028338064969977137, + "loss": 0.2049, + "step": 4410 + }, + { + "epoch": 0.11, + "learning_rate": 0.002833429640981836, + "loss": 0.195, + "step": 4420 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028330527849659572, + "loss": 0.1996, + "step": 4430 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028326759289500794, + "loss": 0.1986, + "step": 4440 + }, + { + "epoch": 0.11, + "learning_rate": 0.002832299072934201, + "loss": 0.2058, + "step": 4450 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028319222169183225, + "loss": 0.1988, + "step": 4460 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028315453609024446, + "loss": 0.1954, + "step": 4470 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028311685048865664, + "loss": 0.2005, + "step": 4480 + }, + { + "epoch": 0.11, + "learning_rate": 0.002830791648870688, + "loss": 0.1986, + "step": 4490 + }, + { + "epoch": 0.11, + "learning_rate": 0.00283041479285481, + "loss": 0.1955, + "step": 4500 + }, + { + "epoch": 0.11, + "eval_cer": 0.6682609827589608, + "eval_loss": 0.15178607404232025, + "eval_runtime": 90.6612, + "eval_samples_per_second": 110.29, + "eval_steps_per_second": 6.894, + "step": 4500 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028300379368389316, + "loss": 0.1974, + "step": 4510 + }, + { + "epoch": 0.11, + "learning_rate": 0.002829661080823054, + "loss": 0.1988, + "step": 4520 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028292842248071755, + "loss": 0.2004, + "step": 4530 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028289073687912973, + "loss": 0.1999, + "step": 4540 + }, + { + "epoch": 0.11, + "learning_rate": 0.002828530512775419, + "loss": 0.1944, + "step": 4550 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028281536567595408, + "loss": 0.1953, + "step": 4560 + }, + { + "epoch": 0.11, + "learning_rate": 0.0028277768007436625, + "loss": 0.2002, + "step": 4570 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028273999447277843, + "loss": 0.1997, + "step": 4580 + }, + { + "epoch": 0.12, + "learning_rate": 0.002827023088711906, + "loss": 0.201, + "step": 4590 + }, + { + "epoch": 0.12, + "learning_rate": 0.002826646232696028, + "loss": 0.2003, + "step": 4600 + }, + { + "epoch": 0.12, + "learning_rate": 0.00282626937668015, + "loss": 0.2066, + "step": 4610 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028258925206642717, + "loss": 0.1923, + "step": 4620 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028255156646483934, + "loss": 0.199, + "step": 4630 + }, + { + "epoch": 0.12, + "learning_rate": 0.002825138808632515, + "loss": 0.1977, + "step": 4640 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028247619526166373, + "loss": 0.1968, + "step": 4650 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028243850966007586, + "loss": 0.1967, + "step": 4660 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028240082405848804, + "loss": 0.2042, + "step": 4670 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028236313845690026, + "loss": 0.2012, + "step": 4680 + }, + { + "epoch": 0.12, + "learning_rate": 0.002823254528553124, + "loss": 0.1981, + "step": 4690 + }, + { + "epoch": 0.12, + "learning_rate": 0.002822877672537246, + "loss": 0.1926, + "step": 4700 + }, + { + "epoch": 0.12, + "learning_rate": 0.002822500816521368, + "loss": 0.1958, + "step": 4710 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028221239605054895, + "loss": 0.1916, + "step": 4720 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028217471044896113, + "loss": 0.2, + "step": 4730 + }, + { + "epoch": 0.12, + "learning_rate": 0.002821370248473733, + "loss": 0.1958, + "step": 4740 + }, + { + "epoch": 0.12, + "learning_rate": 0.002820993392457855, + "loss": 0.1976, + "step": 4750 + }, + { + "epoch": 0.12, + "learning_rate": 0.002820616536441977, + "loss": 0.1966, + "step": 4760 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028202396804260983, + "loss": 0.1917, + "step": 4770 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028198628244102204, + "loss": 0.2017, + "step": 4780 + }, + { + "epoch": 0.12, + "learning_rate": 0.002819485968394342, + "loss": 0.1975, + "step": 4790 + }, + { + "epoch": 0.12, + "learning_rate": 0.002819109112378464, + "loss": 0.1965, + "step": 4800 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028187322563625857, + "loss": 0.1967, + "step": 4810 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028183554003467074, + "loss": 0.2022, + "step": 4820 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028179785443308296, + "loss": 0.1958, + "step": 4830 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028176016883149513, + "loss": 0.1923, + "step": 4840 + }, + { + "epoch": 0.12, + "learning_rate": 0.002817224832299073, + "loss": 0.2005, + "step": 4850 + }, + { + "epoch": 0.12, + "learning_rate": 0.002816847976283195, + "loss": 0.1913, + "step": 4860 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028164711202673166, + "loss": 0.1938, + "step": 4870 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028160942642514388, + "loss": 0.1997, + "step": 4880 + }, + { + "epoch": 0.12, + "learning_rate": 0.00281571740823556, + "loss": 0.1955, + "step": 4890 + }, + { + "epoch": 0.12, + "learning_rate": 0.002815340552219682, + "loss": 0.1907, + "step": 4900 + }, + { + "epoch": 0.12, + "learning_rate": 0.002814963696203804, + "loss": 0.1961, + "step": 4910 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028145868401879253, + "loss": 0.1959, + "step": 4920 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028142099841720475, + "loss": 0.1943, + "step": 4930 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028138331281561692, + "loss": 0.1934, + "step": 4940 + }, + { + "epoch": 0.12, + "learning_rate": 0.002813456272140291, + "loss": 0.2008, + "step": 4950 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028130794161244127, + "loss": 0.1866, + "step": 4960 + }, + { + "epoch": 0.12, + "learning_rate": 0.0028127025601085345, + "loss": 0.197, + "step": 4970 + }, + { + "epoch": 0.13, + "learning_rate": 0.002812325704092656, + "loss": 0.1916, + "step": 4980 + }, + { + "epoch": 0.13, + "learning_rate": 0.0028119488480767784, + "loss": 0.1928, + "step": 4990 + }, + { + "epoch": 0.13, + "learning_rate": 0.0028115719920608997, + "loss": 0.1903, + "step": 5000 + }, + { + "epoch": 0.13, + "eval_cer": 0.6685646390989058, + "eval_loss": 0.14745888113975525, + "eval_runtime": 90.6922, + "eval_samples_per_second": 110.252, + "eval_steps_per_second": 6.891, + "step": 5000 + }, + { + "epoch": 0.13, + "learning_rate": 0.002811195136045022, + "loss": 0.1923, + "step": 5010 + }, + { + "epoch": 0.13, + "learning_rate": 0.0028108182800291436, + "loss": 0.1937, + "step": 5020 + }, + { + "epoch": 0.13, + "learning_rate": 0.0028104414240132654, + "loss": 0.1935, + "step": 5030 + }, + { + "epoch": 0.13, + "learning_rate": 0.002810064567997387, + "loss": 0.1921, + "step": 5040 + }, + { + "epoch": 0.13, + "learning_rate": 0.002809687711981509, + "loss": 0.1966, + "step": 5050 + }, + { + "epoch": 0.13, + "learning_rate": 0.002809310855965631, + "loss": 0.1934, + "step": 5060 + }, + { + "epoch": 0.13, + "learning_rate": 0.0028089339999497528, + "loss": 0.1895, + "step": 5070 + }, + { + "epoch": 0.13, + "learning_rate": 0.002808557143933874, + "loss": 0.194, + "step": 5080 + }, + { + "epoch": 0.13, + "learning_rate": 0.0028081802879179963, + "loss": 0.1948, + "step": 5090 + }, + { + "epoch": 0.13, + "learning_rate": 0.002807803431902118, + "loss": 0.1917, + "step": 5100 + }, + { + "epoch": 0.13, + "learning_rate": 0.0028074265758862398, + "loss": 0.1955, + "step": 5110 + }, + { + "epoch": 0.13, + "learning_rate": 0.0028070497198703615, + "loss": 0.189, + "step": 5120 + }, + { + "epoch": 0.13, + "learning_rate": 0.0028066728638544832, + "loss": 0.1943, + "step": 5130 + }, + { + "epoch": 0.13, + "learning_rate": 0.0028062960078386054, + "loss": 0.1898, + "step": 5140 + }, + { + "epoch": 0.13, + "learning_rate": 0.0028059191518227267, + "loss": 0.1896, + "step": 5150 + }, + { + "epoch": 0.13, + "learning_rate": 0.002805542295806849, + "loss": 0.1919, + "step": 5160 + }, + { + "epoch": 0.13, + "learning_rate": 0.0028051654397909707, + "loss": 0.1935, + "step": 5170 + }, + { + "epoch": 0.13, + "learning_rate": 0.0028047885837750924, + "loss": 0.1876, + "step": 5180 + }, + { + "epoch": 0.13, + "learning_rate": 0.002804411727759214, + "loss": 0.1914, + "step": 5190 + }, + { + "epoch": 0.13, + "learning_rate": 0.002804034871743336, + "loss": 0.1891, + "step": 5200 + }, + { + "epoch": 0.13, + "learning_rate": 0.0028036580157274576, + "loss": 0.1908, + "step": 5210 + }, + { + "epoch": 0.13, + "learning_rate": 0.00280328115971158, + "loss": 0.1893, + "step": 5220 + }, + { + "epoch": 0.13, + "learning_rate": 0.002802904303695701, + "loss": 0.1848, + "step": 5230 + }, + { + "epoch": 0.13, + "learning_rate": 0.0028025274476798233, + "loss": 0.1922, + "step": 5240 + }, + { + "epoch": 0.13, + "learning_rate": 0.002802150591663945, + "loss": 0.1921, + "step": 5250 + }, + { + "epoch": 0.13, + "learning_rate": 0.002801773735648067, + "loss": 0.1927, + "step": 5260 + }, + { + "epoch": 0.13, + "learning_rate": 0.0028013968796321885, + "loss": 0.191, + "step": 5270 + }, + { + "epoch": 0.13, + "learning_rate": 0.0028010200236163103, + "loss": 0.1963, + "step": 5280 + }, + { + "epoch": 0.13, + "learning_rate": 0.0028006431676004325, + "loss": 0.1873, + "step": 5290 + }, + { + "epoch": 0.13, + "learning_rate": 0.002800266311584554, + "loss": 0.1908, + "step": 5300 + }, + { + "epoch": 0.13, + "learning_rate": 0.0027998894555686755, + "loss": 0.1866, + "step": 5310 + }, + { + "epoch": 0.13, + "learning_rate": 0.0027995125995527977, + "loss": 0.1935, + "step": 5320 + }, + { + "epoch": 0.13, + "learning_rate": 0.0027991357435369194, + "loss": 0.1892, + "step": 5330 + }, + { + "epoch": 0.13, + "learning_rate": 0.002798758887521041, + "loss": 0.1894, + "step": 5340 + }, + { + "epoch": 0.13, + "learning_rate": 0.002798382031505163, + "loss": 0.1812, + "step": 5350 + }, + { + "epoch": 0.13, + "learning_rate": 0.0027980051754892847, + "loss": 0.1868, + "step": 5360 + }, + { + "epoch": 0.13, + "learning_rate": 0.002797628319473407, + "loss": 0.1905, + "step": 5370 + }, + { + "epoch": 0.14, + "learning_rate": 0.002797251463457528, + "loss": 0.191, + "step": 5380 + }, + { + "epoch": 0.14, + "learning_rate": 0.00279687460744165, + "loss": 0.192, + "step": 5390 + }, + { + "epoch": 0.14, + "learning_rate": 0.002796497751425772, + "loss": 0.1865, + "step": 5400 + }, + { + "epoch": 0.14, + "learning_rate": 0.002796120895409894, + "loss": 0.1868, + "step": 5410 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027957440393940156, + "loss": 0.184, + "step": 5420 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027953671833781373, + "loss": 0.1909, + "step": 5430 + }, + { + "epoch": 0.14, + "learning_rate": 0.002794990327362259, + "loss": 0.1797, + "step": 5440 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027946134713463812, + "loss": 0.1846, + "step": 5450 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027942366153305026, + "loss": 0.1869, + "step": 5460 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027938597593146247, + "loss": 0.1831, + "step": 5470 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027934829032987465, + "loss": 0.1836, + "step": 5480 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027931060472828682, + "loss": 0.1878, + "step": 5490 + }, + { + "epoch": 0.14, + "learning_rate": 0.00279272919126699, + "loss": 0.1827, + "step": 5500 + }, + { + "epoch": 0.14, + "eval_cer": 0.6683553039041735, + "eval_loss": 0.14301101863384247, + "eval_runtime": 90.7398, + "eval_samples_per_second": 110.194, + "eval_steps_per_second": 6.888, + "step": 5500 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027923523352511117, + "loss": 0.1803, + "step": 5510 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027919754792352335, + "loss": 0.1819, + "step": 5520 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027915986232193556, + "loss": 0.1879, + "step": 5530 + }, + { + "epoch": 0.14, + "learning_rate": 0.002791221767203477, + "loss": 0.1881, + "step": 5540 + }, + { + "epoch": 0.14, + "learning_rate": 0.002790844911187599, + "loss": 0.1878, + "step": 5550 + }, + { + "epoch": 0.14, + "learning_rate": 0.002790468055171721, + "loss": 0.1852, + "step": 5560 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027900911991558426, + "loss": 0.1871, + "step": 5570 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027897143431399644, + "loss": 0.184, + "step": 5580 + }, + { + "epoch": 0.14, + "learning_rate": 0.002789337487124086, + "loss": 0.1865, + "step": 5590 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027889606311082083, + "loss": 0.1845, + "step": 5600 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027885837750923296, + "loss": 0.1866, + "step": 5610 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027882069190764513, + "loss": 0.185, + "step": 5620 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027878300630605735, + "loss": 0.1838, + "step": 5630 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027874532070446953, + "loss": 0.1822, + "step": 5640 + }, + { + "epoch": 0.14, + "learning_rate": 0.002787076351028817, + "loss": 0.1854, + "step": 5650 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027866994950129387, + "loss": 0.1828, + "step": 5660 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027863226389970605, + "loss": 0.1816, + "step": 5670 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027859457829811827, + "loss": 0.1771, + "step": 5680 + }, + { + "epoch": 0.14, + "learning_rate": 0.002785568926965304, + "loss": 0.1881, + "step": 5690 + }, + { + "epoch": 0.14, + "learning_rate": 0.002785192070949426, + "loss": 0.1787, + "step": 5700 + }, + { + "epoch": 0.14, + "learning_rate": 0.002784815214933548, + "loss": 0.1839, + "step": 5710 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027844383589176696, + "loss": 0.1817, + "step": 5720 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027840615029017914, + "loss": 0.1831, + "step": 5730 + }, + { + "epoch": 0.14, + "learning_rate": 0.002783684646885913, + "loss": 0.1844, + "step": 5740 + }, + { + "epoch": 0.14, + "learning_rate": 0.002783307790870035, + "loss": 0.1846, + "step": 5750 + }, + { + "epoch": 0.14, + "learning_rate": 0.002782930934854157, + "loss": 0.1784, + "step": 5760 + }, + { + "epoch": 0.14, + "learning_rate": 0.0027825540788382784, + "loss": 0.1817, + "step": 5770 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027821772228224005, + "loss": 0.1807, + "step": 5780 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027818003668065223, + "loss": 0.1805, + "step": 5790 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027814235107906436, + "loss": 0.1813, + "step": 5800 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027810466547747658, + "loss": 0.1821, + "step": 5810 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027806697987588875, + "loss": 0.1809, + "step": 5820 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027802929427430093, + "loss": 0.1834, + "step": 5830 + }, + { + "epoch": 0.15, + "learning_rate": 0.002779916086727131, + "loss": 0.1811, + "step": 5840 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027795392307112528, + "loss": 0.1823, + "step": 5850 + }, + { + "epoch": 0.15, + "learning_rate": 0.002779162374695375, + "loss": 0.1896, + "step": 5860 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027787855186794967, + "loss": 0.1767, + "step": 5870 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027784086626636184, + "loss": 0.1821, + "step": 5880 + }, + { + "epoch": 0.15, + "learning_rate": 0.00277803180664774, + "loss": 0.1769, + "step": 5890 + }, + { + "epoch": 0.15, + "learning_rate": 0.002777654950631862, + "loss": 0.185, + "step": 5900 + }, + { + "epoch": 0.15, + "learning_rate": 0.002777278094615984, + "loss": 0.1842, + "step": 5910 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027769012386001054, + "loss": 0.1786, + "step": 5920 + }, + { + "epoch": 0.15, + "learning_rate": 0.002776524382584227, + "loss": 0.1771, + "step": 5930 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027761475265683493, + "loss": 0.1717, + "step": 5940 + }, + { + "epoch": 0.15, + "learning_rate": 0.002775770670552471, + "loss": 0.1858, + "step": 5950 + }, + { + "epoch": 0.15, + "learning_rate": 0.002775393814536593, + "loss": 0.1809, + "step": 5960 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027750169585207146, + "loss": 0.1767, + "step": 5970 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027746401025048363, + "loss": 0.179, + "step": 5980 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027742632464889585, + "loss": 0.1799, + "step": 5990 + }, + { + "epoch": 0.15, + "learning_rate": 0.00277388639047308, + "loss": 0.1775, + "step": 6000 + }, + { + "epoch": 0.15, + "eval_cer": 0.6680800401538589, + "eval_loss": 0.13693051040172577, + "eval_runtime": 90.8542, + "eval_samples_per_second": 110.055, + "eval_steps_per_second": 6.879, + "step": 6000 + }, + { + "epoch": 0.15, + "learning_rate": 0.002773509534457202, + "loss": 0.1767, + "step": 6010 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027731326784413237, + "loss": 0.1782, + "step": 6020 + }, + { + "epoch": 0.15, + "learning_rate": 0.002772755822425445, + "loss": 0.1818, + "step": 6030 + }, + { + "epoch": 0.15, + "learning_rate": 0.002772378966409567, + "loss": 0.1827, + "step": 6040 + }, + { + "epoch": 0.15, + "learning_rate": 0.002772002110393689, + "loss": 0.1795, + "step": 6050 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027716252543778107, + "loss": 0.1785, + "step": 6060 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027712483983619324, + "loss": 0.1761, + "step": 6070 + }, + { + "epoch": 0.15, + "learning_rate": 0.002770871542346054, + "loss": 0.1768, + "step": 6080 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027704946863301764, + "loss": 0.1788, + "step": 6090 + }, + { + "epoch": 0.15, + "learning_rate": 0.002770117830314298, + "loss": 0.18, + "step": 6100 + }, + { + "epoch": 0.15, + "learning_rate": 0.00276974097429842, + "loss": 0.1763, + "step": 6110 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027693641182825416, + "loss": 0.1843, + "step": 6120 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027689872622666633, + "loss": 0.1754, + "step": 6130 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027686104062507855, + "loss": 0.1811, + "step": 6140 + }, + { + "epoch": 0.15, + "learning_rate": 0.002768233550234907, + "loss": 0.181, + "step": 6150 + }, + { + "epoch": 0.15, + "learning_rate": 0.0027678566942190286, + "loss": 0.1804, + "step": 6160 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027674798382031508, + "loss": 0.1789, + "step": 6170 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027671029821872725, + "loss": 0.181, + "step": 6180 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027667261261713942, + "loss": 0.1832, + "step": 6190 + }, + { + "epoch": 0.16, + "learning_rate": 0.002766349270155516, + "loss": 0.1808, + "step": 6200 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027659724141396377, + "loss": 0.1828, + "step": 6210 + }, + { + "epoch": 0.16, + "learning_rate": 0.00276559555812376, + "loss": 0.1813, + "step": 6220 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027652187021078812, + "loss": 0.1782, + "step": 6230 + }, + { + "epoch": 0.16, + "learning_rate": 0.002764841846092003, + "loss": 0.1724, + "step": 6240 + }, + { + "epoch": 0.16, + "learning_rate": 0.002764464990076125, + "loss": 0.1748, + "step": 6250 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027640881340602465, + "loss": 0.1731, + "step": 6260 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027637112780443686, + "loss": 0.177, + "step": 6270 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027633344220284904, + "loss": 0.175, + "step": 6280 + }, + { + "epoch": 0.16, + "learning_rate": 0.002762957566012612, + "loss": 0.1784, + "step": 6290 + }, + { + "epoch": 0.16, + "learning_rate": 0.002762580709996734, + "loss": 0.1754, + "step": 6300 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027622038539808556, + "loss": 0.1801, + "step": 6310 + }, + { + "epoch": 0.16, + "learning_rate": 0.002761826997964978, + "loss": 0.175, + "step": 6320 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027614501419490995, + "loss": 0.1724, + "step": 6330 + }, + { + "epoch": 0.16, + "learning_rate": 0.002761073285933221, + "loss": 0.1784, + "step": 6340 + }, + { + "epoch": 0.16, + "learning_rate": 0.002760696429917343, + "loss": 0.1811, + "step": 6350 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027603195739014648, + "loss": 0.1784, + "step": 6360 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027599427178855865, + "loss": 0.1747, + "step": 6370 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027595658618697083, + "loss": 0.1711, + "step": 6380 + }, + { + "epoch": 0.16, + "learning_rate": 0.00275918900585383, + "loss": 0.1755, + "step": 6390 + }, + { + "epoch": 0.16, + "learning_rate": 0.002758812149837952, + "loss": 0.175, + "step": 6400 + }, + { + "epoch": 0.16, + "learning_rate": 0.002758435293822074, + "loss": 0.1723, + "step": 6410 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027580584378061957, + "loss": 0.1707, + "step": 6420 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027576815817903174, + "loss": 0.1744, + "step": 6430 + }, + { + "epoch": 0.16, + "learning_rate": 0.002757304725774439, + "loss": 0.1719, + "step": 6440 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027569278697585613, + "loss": 0.1782, + "step": 6450 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027565510137426827, + "loss": 0.1684, + "step": 6460 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027561741577268044, + "loss": 0.171, + "step": 6470 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027557973017109266, + "loss": 0.1759, + "step": 6480 + }, + { + "epoch": 0.16, + "learning_rate": 0.002755420445695048, + "loss": 0.1723, + "step": 6490 + }, + { + "epoch": 0.16, + "learning_rate": 0.00275504358967917, + "loss": 0.1748, + "step": 6500 + }, + { + "epoch": 0.16, + "eval_cer": 0.6680973644458368, + "eval_loss": 0.13586829602718353, + "eval_runtime": 90.7366, + "eval_samples_per_second": 110.198, + "eval_steps_per_second": 6.888, + "step": 6500 + }, + { + "epoch": 0.16, + "learning_rate": 0.002754666733663292, + "loss": 0.1766, + "step": 6510 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027542898776474136, + "loss": 0.1798, + "step": 6520 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027539130216315353, + "loss": 0.1747, + "step": 6530 + }, + { + "epoch": 0.16, + "learning_rate": 0.002753536165615657, + "loss": 0.1724, + "step": 6540 + }, + { + "epoch": 0.16, + "learning_rate": 0.0027531593095997792, + "loss": 0.1781, + "step": 6550 + }, + { + "epoch": 0.16, + "learning_rate": 0.002752782453583901, + "loss": 0.1793, + "step": 6560 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027524055975680223, + "loss": 0.1741, + "step": 6570 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027520287415521445, + "loss": 0.1745, + "step": 6580 + }, + { + "epoch": 0.17, + "learning_rate": 0.002751651885536266, + "loss": 0.1749, + "step": 6590 + }, + { + "epoch": 0.17, + "learning_rate": 0.002751275029520388, + "loss": 0.1789, + "step": 6600 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027508981735045097, + "loss": 0.1792, + "step": 6610 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027505213174886314, + "loss": 0.1773, + "step": 6620 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027501444614727536, + "loss": 0.1733, + "step": 6630 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027497676054568754, + "loss": 0.1701, + "step": 6640 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027493907494409967, + "loss": 0.1755, + "step": 6650 + }, + { + "epoch": 0.17, + "learning_rate": 0.002749013893425119, + "loss": 0.1711, + "step": 6660 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027486370374092406, + "loss": 0.1697, + "step": 6670 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027482601813933623, + "loss": 0.1697, + "step": 6680 + }, + { + "epoch": 0.17, + "learning_rate": 0.002747883325377484, + "loss": 0.1699, + "step": 6690 + }, + { + "epoch": 0.17, + "learning_rate": 0.002747506469361606, + "loss": 0.1709, + "step": 6700 + }, + { + "epoch": 0.17, + "learning_rate": 0.002747129613345728, + "loss": 0.1693, + "step": 6710 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027467527573298493, + "loss": 0.1742, + "step": 6720 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027463759013139715, + "loss": 0.1763, + "step": 6730 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027459990452980932, + "loss": 0.1661, + "step": 6740 + }, + { + "epoch": 0.17, + "learning_rate": 0.002745622189282215, + "loss": 0.167, + "step": 6750 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027452453332663367, + "loss": 0.1745, + "step": 6760 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027448684772504585, + "loss": 0.1694, + "step": 6770 + }, + { + "epoch": 0.17, + "learning_rate": 0.00274449162123458, + "loss": 0.1685, + "step": 6780 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027441147652187024, + "loss": 0.1706, + "step": 6790 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027437379092028237, + "loss": 0.1723, + "step": 6800 + }, + { + "epoch": 0.17, + "learning_rate": 0.002743361053186946, + "loss": 0.1669, + "step": 6810 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027429841971710676, + "loss": 0.1722, + "step": 6820 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027426073411551894, + "loss": 0.1665, + "step": 6830 + }, + { + "epoch": 0.17, + "learning_rate": 0.002742230485139311, + "loss": 0.1748, + "step": 6840 + }, + { + "epoch": 0.17, + "learning_rate": 0.002741853629123433, + "loss": 0.1727, + "step": 6850 + }, + { + "epoch": 0.17, + "learning_rate": 0.002741476773107555, + "loss": 0.1731, + "step": 6860 + }, + { + "epoch": 0.17, + "learning_rate": 0.002741099917091677, + "loss": 0.1707, + "step": 6870 + }, + { + "epoch": 0.17, + "learning_rate": 0.002740723061075798, + "loss": 0.1672, + "step": 6880 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027403462050599203, + "loss": 0.1678, + "step": 6890 + }, + { + "epoch": 0.17, + "learning_rate": 0.002739969349044042, + "loss": 0.1673, + "step": 6900 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027395924930281638, + "loss": 0.181, + "step": 6910 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027392156370122855, + "loss": 0.1734, + "step": 6920 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027388387809964073, + "loss": 0.1664, + "step": 6930 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027384619249805294, + "loss": 0.1695, + "step": 6940 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027380850689646507, + "loss": 0.1669, + "step": 6950 + }, + { + "epoch": 0.17, + "learning_rate": 0.0027377082129487725, + "loss": 0.168, + "step": 6960 + }, + { + "epoch": 0.18, + "learning_rate": 0.0027373313569328947, + "loss": 0.1689, + "step": 6970 + }, + { + "epoch": 0.18, + "learning_rate": 0.0027369545009170164, + "loss": 0.1741, + "step": 6980 + }, + { + "epoch": 0.18, + "learning_rate": 0.002736577644901138, + "loss": 0.169, + "step": 6990 + }, + { + "epoch": 0.18, + "learning_rate": 0.00273620078888526, + "loss": 0.1725, + "step": 7000 + }, + { + "epoch": 0.18, + "eval_cer": 0.6677037180336736, + "eval_loss": 0.1311553418636322, + "eval_runtime": 90.7293, + "eval_samples_per_second": 110.207, + "eval_steps_per_second": 6.889, + "step": 7000 + }, + { + "epoch": 0.18, + "learning_rate": 0.0027358239328693816, + "loss": 0.165, + "step": 7010 + }, + { + "epoch": 0.18, + "learning_rate": 0.002735447076853504, + "loss": 0.1721, + "step": 7020 + }, + { + "epoch": 0.18, + "learning_rate": 0.002735070220837625, + "loss": 0.1703, + "step": 7030 + }, + { + "epoch": 0.18, + "learning_rate": 0.0027346933648217473, + "loss": 0.1648, + "step": 7040 + }, + { + "epoch": 0.18, + "learning_rate": 0.002734316508805869, + "loss": 0.1708, + "step": 7050 + }, + { + "epoch": 0.18, + "learning_rate": 0.002733939652789991, + "loss": 0.1714, + "step": 7060 + }, + { + "epoch": 0.18, + "learning_rate": 0.0027335627967741125, + "loss": 0.1664, + "step": 7070 + }, + { + "epoch": 0.18, + "learning_rate": 0.0027331859407582343, + "loss": 0.1664, + "step": 7080 + }, + { + "epoch": 0.18, + "learning_rate": 0.002732809084742356, + "loss": 0.1704, + "step": 7090 + }, + { + "epoch": 0.18, + "learning_rate": 0.002732432228726478, + "loss": 0.1641, + "step": 7100 + }, + { + "epoch": 0.18, + "learning_rate": 0.0027320553727105995, + "loss": 0.1701, + "step": 7110 + }, + { + "epoch": 0.18, + "learning_rate": 0.0027316785166947217, + "loss": 0.1656, + "step": 7120 + }, + { + "epoch": 0.18, + "learning_rate": 0.0027313016606788434, + "loss": 0.1751, + "step": 7130 + }, + { + "epoch": 0.18, + "learning_rate": 0.002730924804662965, + "loss": 0.1656, + "step": 7140 + }, + { + "epoch": 0.18, + "learning_rate": 0.002730547948647087, + "loss": 0.1692, + "step": 7150 + }, + { + "epoch": 0.18, + "learning_rate": 0.0027301710926312087, + "loss": 0.1725, + "step": 7160 + }, + { + "epoch": 0.18, + "learning_rate": 0.002729794236615331, + "loss": 0.174, + "step": 7170 + }, + { + "epoch": 0.18, + "learning_rate": 0.002729417380599452, + "loss": 0.1702, + "step": 7180 + }, + { + "epoch": 0.18, + "learning_rate": 0.002729040524583574, + "loss": 0.1714, + "step": 7190 + }, + { + "epoch": 0.18, + "learning_rate": 0.002728663668567696, + "loss": 0.1688, + "step": 7200 + }, + { + "epoch": 0.18, + "learning_rate": 0.002728286812551818, + "loss": 0.1692, + "step": 7210 + }, + { + "epoch": 0.18, + "learning_rate": 0.0027279099565359396, + "loss": 0.1651, + "step": 7220 + }, + { + "epoch": 0.18, + "learning_rate": 0.0027275331005200613, + "loss": 0.1707, + "step": 7230 + }, + { + "epoch": 0.18, + "learning_rate": 0.002727156244504183, + "loss": 0.1701, + "step": 7240 + }, + { + "epoch": 0.18, + "learning_rate": 0.0027267793884883052, + "loss": 0.1677, + "step": 7250 + }, + { + "epoch": 0.18, + "learning_rate": 0.0027264025324724266, + "loss": 0.1681, + "step": 7260 + }, + { + "epoch": 0.18, + "learning_rate": 0.0027260256764565487, + "loss": 0.1704, + "step": 7270 + }, + { + "epoch": 0.18, + "learning_rate": 0.0027256488204406705, + "loss": 0.1638, + "step": 7280 + }, + { + "epoch": 0.18, + "learning_rate": 0.0027252719644247922, + "loss": 0.1685, + "step": 7290 + }, + { + "epoch": 0.18, + "learning_rate": 0.002724895108408914, + "loss": 0.1696, + "step": 7300 + }, + { + "epoch": 0.18, + "learning_rate": 0.0027245182523930357, + "loss": 0.1719, + "step": 7310 + }, + { + "epoch": 0.18, + "learning_rate": 0.0027241413963771575, + "loss": 0.1699, + "step": 7320 + }, + { + "epoch": 0.18, + "learning_rate": 0.0027237645403612796, + "loss": 0.1745, + "step": 7330 + }, + { + "epoch": 0.18, + "learning_rate": 0.002723387684345401, + "loss": 0.1663, + "step": 7340 + }, + { + "epoch": 0.18, + "learning_rate": 0.002723010828329523, + "loss": 0.1715, + "step": 7350 + }, + { + "epoch": 0.18, + "learning_rate": 0.002722633972313645, + "loss": 0.1624, + "step": 7360 + }, + { + "epoch": 0.19, + "learning_rate": 0.002722257116297766, + "loss": 0.1615, + "step": 7370 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027218802602818884, + "loss": 0.1689, + "step": 7380 + }, + { + "epoch": 0.19, + "learning_rate": 0.00272150340426601, + "loss": 0.1653, + "step": 7390 + }, + { + "epoch": 0.19, + "learning_rate": 0.002721126548250132, + "loss": 0.1636, + "step": 7400 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027207496922342536, + "loss": 0.1663, + "step": 7410 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027203728362183753, + "loss": 0.1667, + "step": 7420 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027199959802024975, + "loss": 0.1652, + "step": 7430 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027196191241866193, + "loss": 0.1632, + "step": 7440 + }, + { + "epoch": 0.19, + "learning_rate": 0.002719242268170741, + "loss": 0.1662, + "step": 7450 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027188654121548628, + "loss": 0.1704, + "step": 7460 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027184885561389845, + "loss": 0.1654, + "step": 7470 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027181117001231067, + "loss": 0.1664, + "step": 7480 + }, + { + "epoch": 0.19, + "learning_rate": 0.002717734844107228, + "loss": 0.1684, + "step": 7490 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027173579880913497, + "loss": 0.1638, + "step": 7500 + }, + { + "epoch": 0.19, + "eval_cer": 0.6673577134244495, + "eval_loss": 0.12540632486343384, + "eval_runtime": 90.7183, + "eval_samples_per_second": 110.22, + "eval_steps_per_second": 6.889, + "step": 7500 + }, + { + "epoch": 0.19, + "learning_rate": 0.002716981132075472, + "loss": 0.1615, + "step": 7510 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027166042760595937, + "loss": 0.1672, + "step": 7520 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027162274200437154, + "loss": 0.1614, + "step": 7530 + }, + { + "epoch": 0.19, + "learning_rate": 0.002715850564027837, + "loss": 0.1683, + "step": 7540 + }, + { + "epoch": 0.19, + "learning_rate": 0.002715473708011959, + "loss": 0.1678, + "step": 7550 + }, + { + "epoch": 0.19, + "learning_rate": 0.002715096851996081, + "loss": 0.1719, + "step": 7560 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027147199959802024, + "loss": 0.1639, + "step": 7570 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027143431399643246, + "loss": 0.1657, + "step": 7580 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027139662839484463, + "loss": 0.1622, + "step": 7590 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027135894279325676, + "loss": 0.1608, + "step": 7600 + }, + { + "epoch": 0.19, + "learning_rate": 0.00271321257191669, + "loss": 0.1639, + "step": 7610 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027128357159008115, + "loss": 0.1637, + "step": 7620 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027124588598849333, + "loss": 0.1616, + "step": 7630 + }, + { + "epoch": 0.19, + "learning_rate": 0.002712082003869055, + "loss": 0.1625, + "step": 7640 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027117051478531768, + "loss": 0.1658, + "step": 7650 + }, + { + "epoch": 0.19, + "learning_rate": 0.002711328291837299, + "loss": 0.1619, + "step": 7660 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027109514358214207, + "loss": 0.1601, + "step": 7670 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027105745798055424, + "loss": 0.1628, + "step": 7680 + }, + { + "epoch": 0.19, + "learning_rate": 0.002710197723789664, + "loss": 0.1701, + "step": 7690 + }, + { + "epoch": 0.19, + "learning_rate": 0.002709820867773786, + "loss": 0.1665, + "step": 7700 + }, + { + "epoch": 0.19, + "learning_rate": 0.002709444011757908, + "loss": 0.1698, + "step": 7710 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027090671557420294, + "loss": 0.1634, + "step": 7720 + }, + { + "epoch": 0.19, + "learning_rate": 0.002708690299726151, + "loss": 0.1635, + "step": 7730 + }, + { + "epoch": 0.19, + "learning_rate": 0.0027083134437102733, + "loss": 0.1643, + "step": 7740 + }, + { + "epoch": 0.19, + "learning_rate": 0.002707936587694395, + "loss": 0.165, + "step": 7750 + }, + { + "epoch": 0.19, + "learning_rate": 0.002707559731678517, + "loss": 0.1601, + "step": 7760 + }, + { + "epoch": 0.2, + "learning_rate": 0.0027071828756626386, + "loss": 0.1633, + "step": 7770 + }, + { + "epoch": 0.2, + "learning_rate": 0.0027068060196467603, + "loss": 0.1602, + "step": 7780 + }, + { + "epoch": 0.2, + "learning_rate": 0.002706429163630882, + "loss": 0.1597, + "step": 7790 + }, + { + "epoch": 0.2, + "learning_rate": 0.002706052307615004, + "loss": 0.16, + "step": 7800 + }, + { + "epoch": 0.2, + "learning_rate": 0.0027056754515991255, + "loss": 0.1593, + "step": 7810 + }, + { + "epoch": 0.2, + "learning_rate": 0.0027052985955832477, + "loss": 0.1646, + "step": 7820 + }, + { + "epoch": 0.2, + "learning_rate": 0.002704921739567369, + "loss": 0.1648, + "step": 7830 + }, + { + "epoch": 0.2, + "learning_rate": 0.0027045448835514912, + "loss": 0.1686, + "step": 7840 + }, + { + "epoch": 0.2, + "learning_rate": 0.002704168027535613, + "loss": 0.1635, + "step": 7850 + }, + { + "epoch": 0.2, + "learning_rate": 0.0027037911715197347, + "loss": 0.1628, + "step": 7860 + }, + { + "epoch": 0.2, + "learning_rate": 0.0027034143155038565, + "loss": 0.1598, + "step": 7870 + }, + { + "epoch": 0.2, + "learning_rate": 0.002703037459487978, + "loss": 0.1633, + "step": 7880 + }, + { + "epoch": 0.2, + "learning_rate": 0.0027026606034721004, + "loss": 0.1604, + "step": 7890 + }, + { + "epoch": 0.2, + "learning_rate": 0.002702283747456222, + "loss": 0.1615, + "step": 7900 + }, + { + "epoch": 0.2, + "learning_rate": 0.0027019068914403434, + "loss": 0.1638, + "step": 7910 + }, + { + "epoch": 0.2, + "learning_rate": 0.0027015300354244656, + "loss": 0.1612, + "step": 7920 + }, + { + "epoch": 0.2, + "learning_rate": 0.0027011531794085874, + "loss": 0.1611, + "step": 7930 + }, + { + "epoch": 0.2, + "learning_rate": 0.002700776323392709, + "loss": 0.1629, + "step": 7940 + }, + { + "epoch": 0.2, + "learning_rate": 0.002700399467376831, + "loss": 0.1689, + "step": 7950 + }, + { + "epoch": 0.2, + "learning_rate": 0.0027000226113609526, + "loss": 0.1613, + "step": 7960 + }, + { + "epoch": 0.2, + "learning_rate": 0.0026996457553450748, + "loss": 0.166, + "step": 7970 + }, + { + "epoch": 0.2, + "learning_rate": 0.0026992688993291965, + "loss": 0.165, + "step": 7980 + }, + { + "epoch": 0.2, + "learning_rate": 0.0026988920433133183, + "loss": 0.1707, + "step": 7990 + }, + { + "epoch": 0.2, + "learning_rate": 0.00269851518729744, + "loss": 0.1575, + "step": 8000 + }, + { + "epoch": 0.2, + "eval_cer": 0.6680179614409384, + "eval_loss": 0.12548059225082397, + "eval_runtime": 90.4279, + "eval_samples_per_second": 110.574, + "eval_steps_per_second": 6.912, + "step": 8000 + }, + { + "epoch": 0.2, + "learning_rate": 0.0026981383312815617, + "loss": 0.1597, + "step": 8010 + }, + { + "epoch": 0.2, + "learning_rate": 0.0026977614752656835, + "loss": 0.1661, + "step": 8020 + }, + { + "epoch": 0.2, + "learning_rate": 0.0026973846192498052, + "loss": 0.1591, + "step": 8030 + }, + { + "epoch": 0.2, + "learning_rate": 0.002697007763233927, + "loss": 0.1668, + "step": 8040 + }, + { + "epoch": 0.2, + "learning_rate": 0.002696630907218049, + "loss": 0.1674, + "step": 8050 + }, + { + "epoch": 0.2, + "learning_rate": 0.0026962540512021705, + "loss": 0.1625, + "step": 8060 + }, + { + "epoch": 0.2, + "learning_rate": 0.0026958771951862926, + "loss": 0.1587, + "step": 8070 + }, + { + "epoch": 0.2, + "learning_rate": 0.0026955003391704144, + "loss": 0.1635, + "step": 8080 + }, + { + "epoch": 0.2, + "learning_rate": 0.002695123483154536, + "loss": 0.1636, + "step": 8090 + }, + { + "epoch": 0.2, + "learning_rate": 0.002694746627138658, + "loss": 0.1598, + "step": 8100 + }, + { + "epoch": 0.2, + "learning_rate": 0.0026943697711227796, + "loss": 0.1644, + "step": 8110 + }, + { + "epoch": 0.2, + "learning_rate": 0.002693992915106902, + "loss": 0.1574, + "step": 8120 + }, + { + "epoch": 0.2, + "learning_rate": 0.0026936160590910235, + "loss": 0.1608, + "step": 8130 + }, + { + "epoch": 0.2, + "learning_rate": 0.002693239203075145, + "loss": 0.1604, + "step": 8140 + }, + { + "epoch": 0.2, + "learning_rate": 0.002692862347059267, + "loss": 0.1629, + "step": 8150 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026924854910433888, + "loss": 0.1596, + "step": 8160 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026921086350275105, + "loss": 0.1584, + "step": 8170 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026917317790116323, + "loss": 0.1615, + "step": 8180 + }, + { + "epoch": 0.21, + "learning_rate": 0.002691354922995754, + "loss": 0.164, + "step": 8190 + }, + { + "epoch": 0.21, + "learning_rate": 0.002690978066979876, + "loss": 0.1634, + "step": 8200 + }, + { + "epoch": 0.21, + "learning_rate": 0.002690601210963998, + "loss": 0.156, + "step": 8210 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026902243549481192, + "loss": 0.1569, + "step": 8220 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026898474989322414, + "loss": 0.1591, + "step": 8230 + }, + { + "epoch": 0.21, + "learning_rate": 0.002689470642916363, + "loss": 0.1608, + "step": 8240 + }, + { + "epoch": 0.21, + "learning_rate": 0.002689093786900485, + "loss": 0.1595, + "step": 8250 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026887169308846067, + "loss": 0.1562, + "step": 8260 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026883400748687284, + "loss": 0.1594, + "step": 8270 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026879632188528506, + "loss": 0.1568, + "step": 8280 + }, + { + "epoch": 0.21, + "learning_rate": 0.002687586362836972, + "loss": 0.1591, + "step": 8290 + }, + { + "epoch": 0.21, + "learning_rate": 0.002687209506821094, + "loss": 0.1639, + "step": 8300 + }, + { + "epoch": 0.21, + "learning_rate": 0.002686832650805216, + "loss": 0.1567, + "step": 8310 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026864557947893376, + "loss": 0.1523, + "step": 8320 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026860789387734593, + "loss": 0.1588, + "step": 8330 + }, + { + "epoch": 0.21, + "learning_rate": 0.002685702082757581, + "loss": 0.1595, + "step": 8340 + }, + { + "epoch": 0.21, + "learning_rate": 0.002685325226741703, + "loss": 0.1538, + "step": 8350 + }, + { + "epoch": 0.21, + "learning_rate": 0.002684948370725825, + "loss": 0.1553, + "step": 8360 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026845715147099463, + "loss": 0.1606, + "step": 8370 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026841946586940685, + "loss": 0.1583, + "step": 8380 + }, + { + "epoch": 0.21, + "learning_rate": 0.00268381780267819, + "loss": 0.1617, + "step": 8390 + }, + { + "epoch": 0.21, + "learning_rate": 0.002683440946662312, + "loss": 0.1617, + "step": 8400 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026830640906464337, + "loss": 0.1655, + "step": 8410 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026826872346305554, + "loss": 0.1588, + "step": 8420 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026823103786146776, + "loss": 0.159, + "step": 8430 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026819335225987994, + "loss": 0.1575, + "step": 8440 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026815566665829207, + "loss": 0.1613, + "step": 8450 + }, + { + "epoch": 0.21, + "learning_rate": 0.002681179810567043, + "loss": 0.1639, + "step": 8460 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026808029545511646, + "loss": 0.1566, + "step": 8470 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026804260985352863, + "loss": 0.1544, + "step": 8480 + }, + { + "epoch": 0.21, + "learning_rate": 0.002680049242519408, + "loss": 0.1562, + "step": 8490 + }, + { + "epoch": 0.21, + "learning_rate": 0.00267967238650353, + "loss": 0.1537, + "step": 8500 + }, + { + "epoch": 0.21, + "eval_cer": 0.667791783184561, + "eval_loss": 0.12038606405258179, + "eval_runtime": 90.1852, + "eval_samples_per_second": 110.872, + "eval_steps_per_second": 6.93, + "step": 8500 + }, + { + "epoch": 0.21, + "learning_rate": 0.002679295530487652, + "loss": 0.157, + "step": 8510 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026789186744717733, + "loss": 0.1542, + "step": 8520 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026785418184558955, + "loss": 0.1577, + "step": 8530 + }, + { + "epoch": 0.21, + "learning_rate": 0.0026781649624400172, + "loss": 0.1522, + "step": 8540 + }, + { + "epoch": 0.21, + "learning_rate": 0.002677788106424139, + "loss": 0.1552, + "step": 8550 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026774112504082607, + "loss": 0.1594, + "step": 8560 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026770343943923825, + "loss": 0.1573, + "step": 8570 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026766575383765042, + "loss": 0.1579, + "step": 8580 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026762806823606264, + "loss": 0.1571, + "step": 8590 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026759038263447477, + "loss": 0.1538, + "step": 8600 + }, + { + "epoch": 0.22, + "learning_rate": 0.00267552697032887, + "loss": 0.1554, + "step": 8610 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026751501143129916, + "loss": 0.1599, + "step": 8620 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026747732582971134, + "loss": 0.1531, + "step": 8630 + }, + { + "epoch": 0.22, + "learning_rate": 0.002674396402281235, + "loss": 0.1559, + "step": 8640 + }, + { + "epoch": 0.22, + "learning_rate": 0.002674019546265357, + "loss": 0.1578, + "step": 8650 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026736426902494786, + "loss": 0.1547, + "step": 8660 + }, + { + "epoch": 0.22, + "learning_rate": 0.002673265834233601, + "loss": 0.1564, + "step": 8670 + }, + { + "epoch": 0.22, + "learning_rate": 0.002672888978217722, + "loss": 0.1585, + "step": 8680 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026725121222018443, + "loss": 0.1596, + "step": 8690 + }, + { + "epoch": 0.22, + "learning_rate": 0.002672135266185966, + "loss": 0.1595, + "step": 8700 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026717584101700878, + "loss": 0.1609, + "step": 8710 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026713815541542095, + "loss": 0.1543, + "step": 8720 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026710046981383313, + "loss": 0.1536, + "step": 8730 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026706278421224534, + "loss": 0.1575, + "step": 8740 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026702509861065747, + "loss": 0.1567, + "step": 8750 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026698741300906965, + "loss": 0.1524, + "step": 8760 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026694972740748187, + "loss": 0.1548, + "step": 8770 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026691204180589404, + "loss": 0.163, + "step": 8780 + }, + { + "epoch": 0.22, + "learning_rate": 0.002668743562043062, + "loss": 0.1542, + "step": 8790 + }, + { + "epoch": 0.22, + "learning_rate": 0.002668366706027184, + "loss": 0.1597, + "step": 8800 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026679898500113057, + "loss": 0.1549, + "step": 8810 + }, + { + "epoch": 0.22, + "learning_rate": 0.002667612993995428, + "loss": 0.1563, + "step": 8820 + }, + { + "epoch": 0.22, + "learning_rate": 0.002667236137979549, + "loss": 0.1545, + "step": 8830 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026668592819636713, + "loss": 0.1552, + "step": 8840 + }, + { + "epoch": 0.22, + "learning_rate": 0.002666482425947793, + "loss": 0.1593, + "step": 8850 + }, + { + "epoch": 0.22, + "learning_rate": 0.002666105569931915, + "loss": 0.157, + "step": 8860 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026657287139160366, + "loss": 0.1524, + "step": 8870 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026653518579001583, + "loss": 0.1548, + "step": 8880 + }, + { + "epoch": 0.22, + "learning_rate": 0.00266497500188428, + "loss": 0.1554, + "step": 8890 + }, + { + "epoch": 0.22, + "learning_rate": 0.002664598145868402, + "loss": 0.1548, + "step": 8900 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026642212898525235, + "loss": 0.1591, + "step": 8910 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026638444338366457, + "loss": 0.1623, + "step": 8920 + }, + { + "epoch": 0.22, + "learning_rate": 0.0026634675778207675, + "loss": 0.1566, + "step": 8930 + }, + { + "epoch": 0.22, + "learning_rate": 0.002663090721804889, + "loss": 0.1569, + "step": 8940 + }, + { + "epoch": 0.22, + "learning_rate": 0.002662713865789011, + "loss": 0.1552, + "step": 8950 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026623370097731327, + "loss": 0.1543, + "step": 8960 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026619601537572544, + "loss": 0.1516, + "step": 8970 + }, + { + "epoch": 0.23, + "learning_rate": 0.002661583297741376, + "loss": 0.1585, + "step": 8980 + }, + { + "epoch": 0.23, + "learning_rate": 0.002661206441725498, + "loss": 0.1547, + "step": 8990 + }, + { + "epoch": 0.23, + "learning_rate": 0.00266082958570962, + "loss": 0.1516, + "step": 9000 + }, + { + "epoch": 0.23, + "eval_cer": 0.6670555007755027, + "eval_loss": 0.1187540739774704, + "eval_runtime": 90.5351, + "eval_samples_per_second": 110.443, + "eval_steps_per_second": 6.903, + "step": 9000 + }, + { + "epoch": 0.23, + "learning_rate": 0.002660452729693742, + "loss": 0.1551, + "step": 9010 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026600758736778636, + "loss": 0.155, + "step": 9020 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026596990176619853, + "loss": 0.1571, + "step": 9030 + }, + { + "epoch": 0.23, + "learning_rate": 0.002659322161646107, + "loss": 0.1491, + "step": 9040 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026589453056302293, + "loss": 0.1536, + "step": 9050 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026585684496143506, + "loss": 0.1514, + "step": 9060 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026581915935984723, + "loss": 0.1523, + "step": 9070 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026578147375825945, + "loss": 0.1593, + "step": 9080 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026574378815667162, + "loss": 0.1543, + "step": 9090 + }, + { + "epoch": 0.23, + "learning_rate": 0.002657061025550838, + "loss": 0.159, + "step": 9100 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026566841695349597, + "loss": 0.1543, + "step": 9110 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026563073135190815, + "loss": 0.1497, + "step": 9120 + }, + { + "epoch": 0.23, + "learning_rate": 0.002655930457503203, + "loss": 0.1571, + "step": 9130 + }, + { + "epoch": 0.23, + "learning_rate": 0.002655553601487325, + "loss": 0.147, + "step": 9140 + }, + { + "epoch": 0.23, + "learning_rate": 0.002655176745471447, + "loss": 0.1499, + "step": 9150 + }, + { + "epoch": 0.23, + "learning_rate": 0.002654799889455569, + "loss": 0.1535, + "step": 9160 + }, + { + "epoch": 0.23, + "learning_rate": 0.00265442303343969, + "loss": 0.1488, + "step": 9170 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026540461774238124, + "loss": 0.1491, + "step": 9180 + }, + { + "epoch": 0.23, + "learning_rate": 0.002653669321407934, + "loss": 0.1522, + "step": 9190 + }, + { + "epoch": 0.23, + "learning_rate": 0.002653292465392056, + "loss": 0.1526, + "step": 9200 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026529156093761776, + "loss": 0.1534, + "step": 9210 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026525387533602993, + "loss": 0.1514, + "step": 9220 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026521618973444215, + "loss": 0.1523, + "step": 9230 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026517850413285433, + "loss": 0.1571, + "step": 9240 + }, + { + "epoch": 0.23, + "learning_rate": 0.002651408185312665, + "loss": 0.1532, + "step": 9250 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026510313292967868, + "loss": 0.1553, + "step": 9260 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026506544732809085, + "loss": 0.1542, + "step": 9270 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026502776172650307, + "loss": 0.1551, + "step": 9280 + }, + { + "epoch": 0.23, + "learning_rate": 0.002649900761249152, + "loss": 0.1512, + "step": 9290 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026495239052332737, + "loss": 0.1526, + "step": 9300 + }, + { + "epoch": 0.23, + "learning_rate": 0.002649147049217396, + "loss": 0.1514, + "step": 9310 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026487701932015177, + "loss": 0.1491, + "step": 9320 + }, + { + "epoch": 0.23, + "learning_rate": 0.0026483933371856394, + "loss": 0.1533, + "step": 9330 + }, + { + "epoch": 0.23, + "learning_rate": 0.002648016481169761, + "loss": 0.1565, + "step": 9340 + }, + { + "epoch": 0.23, + "learning_rate": 0.002647639625153883, + "loss": 0.1524, + "step": 9350 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026472627691380046, + "loss": 0.1549, + "step": 9360 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026468859131221264, + "loss": 0.1529, + "step": 9370 + }, + { + "epoch": 0.24, + "learning_rate": 0.002646509057106248, + "loss": 0.1491, + "step": 9380 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026461322010903703, + "loss": 0.1525, + "step": 9390 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026457553450744916, + "loss": 0.1459, + "step": 9400 + }, + { + "epoch": 0.24, + "learning_rate": 0.002645378489058614, + "loss": 0.1476, + "step": 9410 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026450016330427355, + "loss": 0.1494, + "step": 9420 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026446247770268573, + "loss": 0.1497, + "step": 9430 + }, + { + "epoch": 0.24, + "learning_rate": 0.002644247921010979, + "loss": 0.1502, + "step": 9440 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026438710649951008, + "loss": 0.15, + "step": 9450 + }, + { + "epoch": 0.24, + "learning_rate": 0.002643494208979223, + "loss": 0.1536, + "step": 9460 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026431173529633447, + "loss": 0.151, + "step": 9470 + }, + { + "epoch": 0.24, + "learning_rate": 0.002642740496947466, + "loss": 0.1478, + "step": 9480 + }, + { + "epoch": 0.24, + "learning_rate": 0.002642363640931588, + "loss": 0.1505, + "step": 9490 + }, + { + "epoch": 0.24, + "learning_rate": 0.00264198678491571, + "loss": 0.1526, + "step": 9500 + }, + { + "epoch": 0.24, + "eval_cer": 0.667285047644209, + "eval_loss": 0.11501982808113098, + "eval_runtime": 89.9198, + "eval_samples_per_second": 111.199, + "eval_steps_per_second": 6.951, + "step": 9500 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026416099288998317, + "loss": 0.1529, + "step": 9510 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026412330728839534, + "loss": 0.1544, + "step": 9520 + }, + { + "epoch": 0.24, + "learning_rate": 0.002640856216868075, + "loss": 0.1497, + "step": 9530 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026404793608521973, + "loss": 0.1521, + "step": 9540 + }, + { + "epoch": 0.24, + "learning_rate": 0.002640102504836319, + "loss": 0.1553, + "step": 9550 + }, + { + "epoch": 0.24, + "learning_rate": 0.002639725648820441, + "loss": 0.149, + "step": 9560 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026393487928045626, + "loss": 0.1555, + "step": 9570 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026389719367886843, + "loss": 0.1505, + "step": 9580 + }, + { + "epoch": 0.24, + "learning_rate": 0.002638595080772806, + "loss": 0.1515, + "step": 9590 + }, + { + "epoch": 0.24, + "learning_rate": 0.002638218224756928, + "loss": 0.1544, + "step": 9600 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026378413687410496, + "loss": 0.1442, + "step": 9610 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026374645127251717, + "loss": 0.1497, + "step": 9620 + }, + { + "epoch": 0.24, + "learning_rate": 0.002637087656709293, + "loss": 0.1522, + "step": 9630 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026367108006934152, + "loss": 0.1506, + "step": 9640 + }, + { + "epoch": 0.24, + "learning_rate": 0.002636333944677537, + "loss": 0.1538, + "step": 9650 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026359570886616587, + "loss": 0.1514, + "step": 9660 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026355802326457805, + "loss": 0.1471, + "step": 9670 + }, + { + "epoch": 0.24, + "learning_rate": 0.002635203376629902, + "loss": 0.1514, + "step": 9680 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026348265206140244, + "loss": 0.148, + "step": 9690 + }, + { + "epoch": 0.24, + "learning_rate": 0.002634449664598146, + "loss": 0.1483, + "step": 9700 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026340728085822674, + "loss": 0.1489, + "step": 9710 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026336959525663896, + "loss": 0.153, + "step": 9720 + }, + { + "epoch": 0.24, + "learning_rate": 0.0026333190965505114, + "loss": 0.1479, + "step": 9730 + }, + { + "epoch": 0.24, + "learning_rate": 0.002632942240534633, + "loss": 0.1529, + "step": 9740 + }, + { + "epoch": 0.24, + "learning_rate": 0.002632565384518755, + "loss": 0.152, + "step": 9750 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026321885285028766, + "loss": 0.147, + "step": 9760 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026318116724869988, + "loss": 0.1452, + "step": 9770 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026314348164711205, + "loss": 0.1497, + "step": 9780 + }, + { + "epoch": 0.25, + "learning_rate": 0.002631057960455242, + "loss": 0.1526, + "step": 9790 + }, + { + "epoch": 0.25, + "learning_rate": 0.002630681104439364, + "loss": 0.148, + "step": 9800 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026303042484234858, + "loss": 0.1471, + "step": 9810 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026299273924076075, + "loss": 0.1492, + "step": 9820 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026295505363917292, + "loss": 0.1562, + "step": 9830 + }, + { + "epoch": 0.25, + "learning_rate": 0.002629173680375851, + "loss": 0.1489, + "step": 9840 + }, + { + "epoch": 0.25, + "learning_rate": 0.002628796824359973, + "loss": 0.1514, + "step": 9850 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026284199683440945, + "loss": 0.1559, + "step": 9860 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026280431123282167, + "loss": 0.1519, + "step": 9870 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026276662563123384, + "loss": 0.1481, + "step": 9880 + }, + { + "epoch": 0.25, + "learning_rate": 0.00262728940029646, + "loss": 0.1425, + "step": 9890 + }, + { + "epoch": 0.25, + "learning_rate": 0.002626912544280582, + "loss": 0.1518, + "step": 9900 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026265356882647036, + "loss": 0.1476, + "step": 9910 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026261588322488254, + "loss": 0.1456, + "step": 9920 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026257819762329476, + "loss": 0.1481, + "step": 9930 + }, + { + "epoch": 0.25, + "learning_rate": 0.002625405120217069, + "loss": 0.146, + "step": 9940 + }, + { + "epoch": 0.25, + "learning_rate": 0.002625028264201191, + "loss": 0.155, + "step": 9950 + }, + { + "epoch": 0.25, + "learning_rate": 0.002624651408185313, + "loss": 0.1448, + "step": 9960 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026242745521694345, + "loss": 0.1575, + "step": 9970 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026238976961535563, + "loss": 0.1424, + "step": 9980 + }, + { + "epoch": 0.25, + "learning_rate": 0.002623520840137678, + "loss": 0.1496, + "step": 9990 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026231439841218, + "loss": 0.148, + "step": 10000 + }, + { + "epoch": 0.25, + "eval_cer": 0.6675872602931558, + "eval_loss": 0.11312033236026764, + "eval_runtime": 90.4563, + "eval_samples_per_second": 110.54, + "eval_steps_per_second": 6.909, + "step": 10000 + }, + { + "epoch": 0.25, + "learning_rate": 0.002622767128105922, + "loss": 0.1537, + "step": 10010 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026223902720900433, + "loss": 0.1447, + "step": 10020 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026220134160741654, + "loss": 0.1481, + "step": 10030 + }, + { + "epoch": 0.25, + "learning_rate": 0.002621636560058287, + "loss": 0.1485, + "step": 10040 + }, + { + "epoch": 0.25, + "learning_rate": 0.002621259704042409, + "loss": 0.1495, + "step": 10050 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026208828480265307, + "loss": 0.1483, + "step": 10060 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026205059920106524, + "loss": 0.1487, + "step": 10070 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026201291359947746, + "loss": 0.1462, + "step": 10080 + }, + { + "epoch": 0.25, + "learning_rate": 0.002619752279978896, + "loss": 0.1475, + "step": 10090 + }, + { + "epoch": 0.25, + "learning_rate": 0.002619375423963018, + "loss": 0.1431, + "step": 10100 + }, + { + "epoch": 0.25, + "learning_rate": 0.00261899856794714, + "loss": 0.1455, + "step": 10110 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026186217119312616, + "loss": 0.1504, + "step": 10120 + }, + { + "epoch": 0.25, + "learning_rate": 0.0026182448559153833, + "loss": 0.1509, + "step": 10130 + }, + { + "epoch": 0.25, + "learning_rate": 0.002617867999899505, + "loss": 0.1464, + "step": 10140 + }, + { + "epoch": 0.26, + "learning_rate": 0.002617491143883627, + "loss": 0.1461, + "step": 10150 + }, + { + "epoch": 0.26, + "learning_rate": 0.002617114287867749, + "loss": 0.1512, + "step": 10160 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026167374318518703, + "loss": 0.1487, + "step": 10170 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026163605758359925, + "loss": 0.1443, + "step": 10180 + }, + { + "epoch": 0.26, + "learning_rate": 0.002615983719820114, + "loss": 0.1492, + "step": 10190 + }, + { + "epoch": 0.26, + "learning_rate": 0.002615606863804236, + "loss": 0.1496, + "step": 10200 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026152300077883577, + "loss": 0.1457, + "step": 10210 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026148531517724794, + "loss": 0.1477, + "step": 10220 + }, + { + "epoch": 0.26, + "learning_rate": 0.002614476295756601, + "loss": 0.144, + "step": 10230 + }, + { + "epoch": 0.26, + "learning_rate": 0.002614099439740723, + "loss": 0.1474, + "step": 10240 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026137225837248447, + "loss": 0.1468, + "step": 10250 + }, + { + "epoch": 0.26, + "learning_rate": 0.002613345727708967, + "loss": 0.1448, + "step": 10260 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026129688716930886, + "loss": 0.1464, + "step": 10270 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026125920156772104, + "loss": 0.143, + "step": 10280 + }, + { + "epoch": 0.26, + "learning_rate": 0.002612215159661332, + "loss": 0.1482, + "step": 10290 + }, + { + "epoch": 0.26, + "learning_rate": 0.002611838303645454, + "loss": 0.1453, + "step": 10300 + }, + { + "epoch": 0.26, + "learning_rate": 0.002611461447629576, + "loss": 0.1499, + "step": 10310 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026110845916136973, + "loss": 0.1463, + "step": 10320 + }, + { + "epoch": 0.26, + "learning_rate": 0.002610707735597819, + "loss": 0.1485, + "step": 10330 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026103308795819413, + "loss": 0.1493, + "step": 10340 + }, + { + "epoch": 0.26, + "learning_rate": 0.002609954023566063, + "loss": 0.1432, + "step": 10350 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026095771675501847, + "loss": 0.1503, + "step": 10360 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026092003115343065, + "loss": 0.1481, + "step": 10370 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026088234555184282, + "loss": 0.1472, + "step": 10380 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026084465995025504, + "loss": 0.1439, + "step": 10390 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026080697434866717, + "loss": 0.1449, + "step": 10400 + }, + { + "epoch": 0.26, + "learning_rate": 0.002607692887470794, + "loss": 0.1412, + "step": 10410 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026073160314549156, + "loss": 0.1421, + "step": 10420 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026069391754390374, + "loss": 0.1427, + "step": 10430 + }, + { + "epoch": 0.26, + "learning_rate": 0.002606562319423159, + "loss": 0.1467, + "step": 10440 + }, + { + "epoch": 0.26, + "learning_rate": 0.002606185463407281, + "loss": 0.1415, + "step": 10450 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026058086073914026, + "loss": 0.1461, + "step": 10460 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026054317513755244, + "loss": 0.1455, + "step": 10470 + }, + { + "epoch": 0.26, + "learning_rate": 0.002605054895359646, + "loss": 0.1416, + "step": 10480 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026046780393437683, + "loss": 0.1482, + "step": 10490 + }, + { + "epoch": 0.26, + "learning_rate": 0.00260430118332789, + "loss": 0.1445, + "step": 10500 + }, + { + "epoch": 0.26, + "eval_cer": 0.667484758232287, + "eval_loss": 0.11072567105293274, + "eval_runtime": 90.1742, + "eval_samples_per_second": 110.885, + "eval_steps_per_second": 6.931, + "step": 10500 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026039243273120118, + "loss": 0.1448, + "step": 10510 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026035474712961335, + "loss": 0.1456, + "step": 10520 + }, + { + "epoch": 0.26, + "learning_rate": 0.0026031706152802553, + "loss": 0.1453, + "step": 10530 + }, + { + "epoch": 0.26, + "learning_rate": 0.002602793759264377, + "loss": 0.147, + "step": 10540 + }, + { + "epoch": 0.27, + "learning_rate": 0.0026024169032484988, + "loss": 0.1432, + "step": 10550 + }, + { + "epoch": 0.27, + "learning_rate": 0.0026020400472326205, + "loss": 0.1412, + "step": 10560 + }, + { + "epoch": 0.27, + "learning_rate": 0.0026016631912167427, + "loss": 0.143, + "step": 10570 + }, + { + "epoch": 0.27, + "learning_rate": 0.0026012863352008644, + "loss": 0.1455, + "step": 10580 + }, + { + "epoch": 0.27, + "learning_rate": 0.002600909479184986, + "loss": 0.1461, + "step": 10590 + }, + { + "epoch": 0.27, + "learning_rate": 0.002600532623169108, + "loss": 0.1469, + "step": 10600 + }, + { + "epoch": 0.27, + "learning_rate": 0.0026001557671532297, + "loss": 0.1434, + "step": 10610 + }, + { + "epoch": 0.27, + "learning_rate": 0.002599778911137352, + "loss": 0.1427, + "step": 10620 + }, + { + "epoch": 0.27, + "learning_rate": 0.002599402055121473, + "loss": 0.1433, + "step": 10630 + }, + { + "epoch": 0.27, + "learning_rate": 0.002599025199105595, + "loss": 0.1423, + "step": 10640 + }, + { + "epoch": 0.27, + "learning_rate": 0.002598648343089717, + "loss": 0.1437, + "step": 10650 + }, + { + "epoch": 0.27, + "learning_rate": 0.002598271487073839, + "loss": 0.1428, + "step": 10660 + }, + { + "epoch": 0.27, + "learning_rate": 0.0025978946310579606, + "loss": 0.1399, + "step": 10670 + }, + { + "epoch": 0.27, + "learning_rate": 0.0025975177750420823, + "loss": 0.1451, + "step": 10680 + }, + { + "epoch": 0.27, + "learning_rate": 0.002597140919026204, + "loss": 0.1415, + "step": 10690 + }, + { + "epoch": 0.27, + "learning_rate": 0.002596764063010326, + "loss": 0.1459, + "step": 10700 + }, + { + "epoch": 0.27, + "learning_rate": 0.0025963872069944475, + "loss": 0.1434, + "step": 10710 + }, + { + "epoch": 0.27, + "learning_rate": 0.0025960103509785697, + "loss": 0.1413, + "step": 10720 + }, + { + "epoch": 0.27, + "learning_rate": 0.0025956334949626915, + "loss": 0.1446, + "step": 10730 + }, + { + "epoch": 0.27, + "learning_rate": 0.0025952566389468128, + "loss": 0.1448, + "step": 10740 + }, + { + "epoch": 0.27, + "learning_rate": 0.002594879782930935, + "loss": 0.1407, + "step": 10750 + }, + { + "epoch": 0.27, + "learning_rate": 0.0025945029269150567, + "loss": 0.1408, + "step": 10760 + }, + { + "epoch": 0.27, + "learning_rate": 0.0025941260708991784, + "loss": 0.1419, + "step": 10770 + }, + { + "epoch": 0.27, + "learning_rate": 0.0025937492148833, + "loss": 0.1484, + "step": 10780 + }, + { + "epoch": 0.27, + "learning_rate": 0.002593372358867422, + "loss": 0.143, + "step": 10790 + }, + { + "epoch": 0.27, + "learning_rate": 0.002592995502851544, + "loss": 0.1421, + "step": 10800 + }, + { + "epoch": 0.27, + "learning_rate": 0.002592618646835666, + "loss": 0.1387, + "step": 10810 + }, + { + "epoch": 0.27, + "learning_rate": 0.0025922417908197876, + "loss": 0.1425, + "step": 10820 + }, + { + "epoch": 0.27, + "learning_rate": 0.0025918649348039093, + "loss": 0.1439, + "step": 10830 + }, + { + "epoch": 0.27, + "learning_rate": 0.002591488078788031, + "loss": 0.141, + "step": 10840 + }, + { + "epoch": 0.27, + "learning_rate": 0.0025911112227721533, + "loss": 0.1422, + "step": 10850 + }, + { + "epoch": 0.27, + "learning_rate": 0.0025907343667562746, + "loss": 0.1427, + "step": 10860 + }, + { + "epoch": 0.27, + "learning_rate": 0.0025903575107403963, + "loss": 0.1419, + "step": 10870 + }, + { + "epoch": 0.27, + "learning_rate": 0.0025899806547245185, + "loss": 0.1379, + "step": 10880 + }, + { + "epoch": 0.27, + "learning_rate": 0.0025896037987086402, + "loss": 0.1473, + "step": 10890 + }, + { + "epoch": 0.27, + "learning_rate": 0.002589226942692762, + "loss": 0.1432, + "step": 10900 + }, + { + "epoch": 0.27, + "learning_rate": 0.0025888500866768837, + "loss": 0.1424, + "step": 10910 + }, + { + "epoch": 0.27, + "learning_rate": 0.0025884732306610055, + "loss": 0.1451, + "step": 10920 + }, + { + "epoch": 0.27, + "learning_rate": 0.0025880963746451272, + "loss": 0.1381, + "step": 10930 + }, + { + "epoch": 0.27, + "learning_rate": 0.002587719518629249, + "loss": 0.1393, + "step": 10940 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025873426626133707, + "loss": 0.141, + "step": 10950 + }, + { + "epoch": 0.28, + "learning_rate": 0.002586965806597493, + "loss": 0.1405, + "step": 10960 + }, + { + "epoch": 0.28, + "learning_rate": 0.002586588950581614, + "loss": 0.1392, + "step": 10970 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025862120945657364, + "loss": 0.1428, + "step": 10980 + }, + { + "epoch": 0.28, + "learning_rate": 0.002585835238549858, + "loss": 0.1447, + "step": 10990 + }, + { + "epoch": 0.28, + "learning_rate": 0.00258545838253398, + "loss": 0.1378, + "step": 11000 + }, + { + "epoch": 0.28, + "eval_cer": 0.6664130582813244, + "eval_loss": 0.111346036195755, + "eval_runtime": 90.4938, + "eval_samples_per_second": 110.494, + "eval_steps_per_second": 6.907, + "step": 11000 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025850815265181016, + "loss": 0.1417, + "step": 11010 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025847046705022234, + "loss": 0.1412, + "step": 11020 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025843278144863455, + "loss": 0.1388, + "step": 11030 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025839509584704673, + "loss": 0.1448, + "step": 11040 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025835741024545886, + "loss": 0.1433, + "step": 11050 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025831972464387108, + "loss": 0.1429, + "step": 11060 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025828203904228325, + "loss": 0.1434, + "step": 11070 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025824435344069543, + "loss": 0.1394, + "step": 11080 + }, + { + "epoch": 0.28, + "learning_rate": 0.002582066678391076, + "loss": 0.1412, + "step": 11090 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025816898223751977, + "loss": 0.1464, + "step": 11100 + }, + { + "epoch": 0.28, + "learning_rate": 0.00258131296635932, + "loss": 0.1395, + "step": 11110 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025809361103434417, + "loss": 0.1418, + "step": 11120 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025805592543275634, + "loss": 0.1392, + "step": 11130 + }, + { + "epoch": 0.28, + "learning_rate": 0.002580182398311685, + "loss": 0.1393, + "step": 11140 + }, + { + "epoch": 0.28, + "learning_rate": 0.002579805542295807, + "loss": 0.1404, + "step": 11150 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025794286862799286, + "loss": 5.9387, + "step": 11160 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025790518302640504, + "loss": 7.2621, + "step": 11170 + }, + { + "epoch": 0.28, + "learning_rate": 0.002578674974248172, + "loss": 6.7929, + "step": 11180 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025782981182322943, + "loss": 7.9889, + "step": 11190 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025779212622164156, + "loss": 7.8188, + "step": 11200 + }, + { + "epoch": 0.28, + "learning_rate": 0.002577544406200538, + "loss": 7.1258, + "step": 11210 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025771675501846595, + "loss": 6.8801, + "step": 11220 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025767906941687813, + "loss": 6.7671, + "step": 11230 + }, + { + "epoch": 0.28, + "learning_rate": 0.002576413838152903, + "loss": 6.5726, + "step": 11240 + }, + { + "epoch": 0.28, + "learning_rate": 0.002576036982137025, + "loss": 6.2308, + "step": 11250 + }, + { + "epoch": 0.28, + "learning_rate": 0.002575660126121147, + "loss": 6.2539, + "step": 11260 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025752832701052687, + "loss": 7.1063, + "step": 11270 + }, + { + "epoch": 0.28, + "learning_rate": 0.00257490641408939, + "loss": 6.5323, + "step": 11280 + }, + { + "epoch": 0.28, + "learning_rate": 0.002574529558073512, + "loss": 6.2713, + "step": 11290 + }, + { + "epoch": 0.28, + "learning_rate": 0.002574152702057634, + "loss": 6.0892, + "step": 11300 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025737758460417557, + "loss": 6.2819, + "step": 11310 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025733989900258774, + "loss": 6.2821, + "step": 11320 + }, + { + "epoch": 0.28, + "learning_rate": 0.002573022134009999, + "loss": 6.1237, + "step": 11330 + }, + { + "epoch": 0.28, + "learning_rate": 0.0025726452779941214, + "loss": 6.0933, + "step": 11340 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025722684219782427, + "loss": 6.2318, + "step": 11350 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025718915659623644, + "loss": 6.0266, + "step": 11360 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025715147099464866, + "loss": 5.8218, + "step": 11370 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025711378539306083, + "loss": 5.8923, + "step": 11380 + }, + { + "epoch": 0.29, + "learning_rate": 0.00257076099791473, + "loss": 5.8399, + "step": 11390 + }, + { + "epoch": 0.29, + "learning_rate": 0.002570384141898852, + "loss": 5.9417, + "step": 11400 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025700072858829736, + "loss": 5.9609, + "step": 11410 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025696304298670957, + "loss": 6.7493, + "step": 11420 + }, + { + "epoch": 0.29, + "learning_rate": 0.002569253573851217, + "loss": 6.8029, + "step": 11430 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025688767178353392, + "loss": 6.3757, + "step": 11440 + }, + { + "epoch": 0.29, + "learning_rate": 0.002568499861819461, + "loss": 6.2486, + "step": 11450 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025681230058035827, + "loss": 6.15, + "step": 11460 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025677461497877045, + "loss": 6.1534, + "step": 11470 + }, + { + "epoch": 0.29, + "learning_rate": 0.002567369293771826, + "loss": 6.0945, + "step": 11480 + }, + { + "epoch": 0.29, + "learning_rate": 0.002566992437755948, + "loss": 6.1041, + "step": 11490 + }, + { + "epoch": 0.29, + "learning_rate": 0.00256661558174007, + "loss": 6.1099, + "step": 11500 + }, + { + "epoch": 0.29, + "eval_cer": 0.8805047336221677, + "eval_loss": 6.048417091369629, + "eval_runtime": 90.456, + "eval_samples_per_second": 110.54, + "eval_steps_per_second": 6.909, + "step": 11500 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025662387257241914, + "loss": 6.1748, + "step": 11510 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025658618697083136, + "loss": 6.2297, + "step": 11520 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025654850136924354, + "loss": 6.2931, + "step": 11530 + }, + { + "epoch": 0.29, + "learning_rate": 0.002565108157676557, + "loss": 6.3084, + "step": 11540 + }, + { + "epoch": 0.29, + "learning_rate": 0.002564731301660679, + "loss": 6.2893, + "step": 11550 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025643544456448006, + "loss": 6.273, + "step": 11560 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025639775896289228, + "loss": 6.2783, + "step": 11570 + }, + { + "epoch": 0.29, + "learning_rate": 0.002563600733613044, + "loss": 6.2444, + "step": 11580 + }, + { + "epoch": 0.29, + "learning_rate": 0.002563223877597166, + "loss": 6.2464, + "step": 11590 + }, + { + "epoch": 0.29, + "learning_rate": 0.002562847021581288, + "loss": 6.3133, + "step": 11600 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025624701655654098, + "loss": 6.1791, + "step": 11610 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025620933095495315, + "loss": 6.0017, + "step": 11620 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025617164535336532, + "loss": 5.9354, + "step": 11630 + }, + { + "epoch": 0.29, + "learning_rate": 0.002561339597517775, + "loss": 5.9088, + "step": 11640 + }, + { + "epoch": 0.29, + "learning_rate": 0.002560962741501897, + "loss": 5.8717, + "step": 11650 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025605858854860185, + "loss": 5.8255, + "step": 11660 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025602090294701407, + "loss": 5.7379, + "step": 11670 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025598321734542624, + "loss": 5.7158, + "step": 11680 + }, + { + "epoch": 0.29, + "learning_rate": 0.002559455317438384, + "loss": 5.667, + "step": 11690 + }, + { + "epoch": 0.29, + "learning_rate": 0.002559078461422506, + "loss": 5.62, + "step": 11700 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025587016054066276, + "loss": 5.5561, + "step": 11710 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025583247493907494, + "loss": 5.5272, + "step": 11720 + }, + { + "epoch": 0.29, + "learning_rate": 0.0025579478933748716, + "loss": 5.4919, + "step": 11730 + }, + { + "epoch": 0.29, + "learning_rate": 0.002557571037358993, + "loss": 5.4039, + "step": 11740 + }, + { + "epoch": 0.3, + "learning_rate": 0.002557194181343115, + "loss": 5.323, + "step": 11750 + }, + { + "epoch": 0.3, + "learning_rate": 0.002556817325327237, + "loss": 5.2373, + "step": 11760 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025564404693113585, + "loss": 5.1487, + "step": 11770 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025560636132954803, + "loss": 5.1224, + "step": 11780 + }, + { + "epoch": 0.3, + "learning_rate": 0.002555686757279602, + "loss": 5.408, + "step": 11790 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025553099012637238, + "loss": 6.0158, + "step": 11800 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025549330452478455, + "loss": 6.0681, + "step": 11810 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025545561892319673, + "loss": 5.6654, + "step": 11820 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025541793332160894, + "loss": 5.3601, + "step": 11830 + }, + { + "epoch": 0.3, + "learning_rate": 0.002553802477200211, + "loss": 5.2609, + "step": 11840 + }, + { + "epoch": 0.3, + "learning_rate": 0.002553425621184333, + "loss": 5.2451, + "step": 11850 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025530487651684547, + "loss": 5.208, + "step": 11860 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025526719091525764, + "loss": 5.1566, + "step": 11870 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025522950531366986, + "loss": 5.8534, + "step": 11880 + }, + { + "epoch": 0.3, + "learning_rate": 0.00255191819712082, + "loss": 6.3235, + "step": 11890 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025515413411049417, + "loss": 6.0392, + "step": 11900 + }, + { + "epoch": 0.3, + "learning_rate": 0.002551164485089064, + "loss": 5.5035, + "step": 11910 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025507876290731856, + "loss": 5.1853, + "step": 11920 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025504107730573073, + "loss": 5.0908, + "step": 11930 + }, + { + "epoch": 0.3, + "learning_rate": 0.002550033917041429, + "loss": 5.0612, + "step": 11940 + }, + { + "epoch": 0.3, + "learning_rate": 0.002549657061025551, + "loss": 5.1003, + "step": 11950 + }, + { + "epoch": 0.3, + "learning_rate": 0.002549280205009673, + "loss": 5.0377, + "step": 11960 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025489033489937943, + "loss": 4.9801, + "step": 11970 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025485264929779165, + "loss": 4.9317, + "step": 11980 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025481496369620382, + "loss": 4.9793, + "step": 11990 + }, + { + "epoch": 0.3, + "learning_rate": 0.00254777278094616, + "loss": 4.9528, + "step": 12000 + }, + { + "epoch": 0.3, + "eval_cer": 0.811528065112389, + "eval_loss": 4.661426067352295, + "eval_runtime": 90.744, + "eval_samples_per_second": 110.189, + "eval_steps_per_second": 6.888, + "step": 12000 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025473959249302817, + "loss": 4.9223, + "step": 12010 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025470190689144035, + "loss": 4.8947, + "step": 12020 + }, + { + "epoch": 0.3, + "learning_rate": 0.002546642212898525, + "loss": 4.8087, + "step": 12030 + }, + { + "epoch": 0.3, + "learning_rate": 0.002546265356882647, + "loss": 4.786, + "step": 12040 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025458885008667687, + "loss": 4.7338, + "step": 12050 + }, + { + "epoch": 0.3, + "learning_rate": 0.002545511644850891, + "loss": 4.7176, + "step": 12060 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025451347888350126, + "loss": 4.7573, + "step": 12070 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025447579328191344, + "loss": 4.7873, + "step": 12080 + }, + { + "epoch": 0.3, + "learning_rate": 0.002544381076803256, + "loss": 4.7283, + "step": 12090 + }, + { + "epoch": 0.3, + "learning_rate": 0.002544004220787378, + "loss": 4.674, + "step": 12100 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025436273647714996, + "loss": 4.7024, + "step": 12110 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025432505087556213, + "loss": 4.7434, + "step": 12120 + }, + { + "epoch": 0.3, + "learning_rate": 0.002542873652739743, + "loss": 4.6647, + "step": 12130 + }, + { + "epoch": 0.3, + "learning_rate": 0.0025424967967238653, + "loss": 4.6216, + "step": 12140 + }, + { + "epoch": 0.31, + "learning_rate": 0.002542119940707987, + "loss": 4.636, + "step": 12150 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025417430846921087, + "loss": 4.6511, + "step": 12160 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025413662286762305, + "loss": 4.5795, + "step": 12170 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025409893726603522, + "loss": 4.4972, + "step": 12180 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025406125166444744, + "loss": 4.435, + "step": 12190 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025402356606285957, + "loss": 4.379, + "step": 12200 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025398588046127175, + "loss": 4.3485, + "step": 12210 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025394819485968396, + "loss": 4.2845, + "step": 12220 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025391050925809614, + "loss": 4.1975, + "step": 12230 + }, + { + "epoch": 0.31, + "learning_rate": 0.002538728236565083, + "loss": 3.0927, + "step": 12240 + }, + { + "epoch": 0.31, + "learning_rate": 0.002538351380549205, + "loss": 1.1231, + "step": 12250 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025379745245333266, + "loss": 0.566, + "step": 12260 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025375976685174484, + "loss": 0.4869, + "step": 12270 + }, + { + "epoch": 0.31, + "learning_rate": 0.00253722081250157, + "loss": 0.4279, + "step": 12280 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025368439564856923, + "loss": 0.4044, + "step": 12290 + }, + { + "epoch": 0.31, + "learning_rate": 0.002536467100469814, + "loss": 0.3643, + "step": 12300 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025360902444539354, + "loss": 0.4048, + "step": 12310 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025357133884380575, + "loss": 0.3471, + "step": 12320 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025353365324221793, + "loss": 0.3162, + "step": 12330 + }, + { + "epoch": 0.31, + "learning_rate": 0.002534959676406301, + "loss": 0.2862, + "step": 12340 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025345828203904228, + "loss": 0.2789, + "step": 12350 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025342059643745445, + "loss": 0.2707, + "step": 12360 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025338291083586667, + "loss": 0.255, + "step": 12370 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025334522523427884, + "loss": 0.2596, + "step": 12380 + }, + { + "epoch": 0.31, + "learning_rate": 0.00253307539632691, + "loss": 0.2378, + "step": 12390 + }, + { + "epoch": 0.31, + "learning_rate": 0.002532698540311032, + "loss": 0.2396, + "step": 12400 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025323216842951537, + "loss": 0.2339, + "step": 12410 + }, + { + "epoch": 0.31, + "learning_rate": 0.002531944828279276, + "loss": 0.2316, + "step": 12420 + }, + { + "epoch": 0.31, + "learning_rate": 0.002531567972263397, + "loss": 0.2366, + "step": 12430 + }, + { + "epoch": 0.31, + "learning_rate": 0.002531191116247519, + "loss": 0.2309, + "step": 12440 + }, + { + "epoch": 0.31, + "learning_rate": 0.002530814260231641, + "loss": 0.2239, + "step": 12450 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025304374042157624, + "loss": 0.2195, + "step": 12460 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025300605481998846, + "loss": 0.2191, + "step": 12470 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025296836921840063, + "loss": 0.2128, + "step": 12480 + }, + { + "epoch": 0.31, + "learning_rate": 0.002529306836168128, + "loss": 0.209, + "step": 12490 + }, + { + "epoch": 0.31, + "learning_rate": 0.00252892998015225, + "loss": 0.2066, + "step": 12500 + }, + { + "epoch": 0.31, + "eval_cer": 0.6679375959753745, + "eval_loss": 0.14948998391628265, + "eval_runtime": 90.7588, + "eval_samples_per_second": 110.171, + "eval_steps_per_second": 6.886, + "step": 12500 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025285531241363715, + "loss": 0.2081, + "step": 12510 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025281762681204933, + "loss": 0.2056, + "step": 12520 + }, + { + "epoch": 0.31, + "learning_rate": 0.0025277994121046155, + "loss": 0.2009, + "step": 12530 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025274225560887368, + "loss": 0.1993, + "step": 12540 + }, + { + "epoch": 0.32, + "learning_rate": 0.002527045700072859, + "loss": 0.1974, + "step": 12550 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025266688440569807, + "loss": 0.1969, + "step": 12560 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025262919880411024, + "loss": 0.1976, + "step": 12570 + }, + { + "epoch": 0.32, + "learning_rate": 0.002525915132025224, + "loss": 0.1909, + "step": 12580 + }, + { + "epoch": 0.32, + "learning_rate": 0.002525538276009346, + "loss": 0.1953, + "step": 12590 + }, + { + "epoch": 0.32, + "learning_rate": 0.002525161419993468, + "loss": 0.1904, + "step": 12600 + }, + { + "epoch": 0.32, + "learning_rate": 0.00252478456397759, + "loss": 0.1923, + "step": 12610 + }, + { + "epoch": 0.32, + "learning_rate": 0.002524407707961711, + "loss": 0.1899, + "step": 12620 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025240308519458333, + "loss": 0.1873, + "step": 12630 + }, + { + "epoch": 0.32, + "learning_rate": 0.002523653995929955, + "loss": 0.1892, + "step": 12640 + }, + { + "epoch": 0.32, + "learning_rate": 0.002523277139914077, + "loss": 0.1862, + "step": 12650 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025229002838981986, + "loss": 0.186, + "step": 12660 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025225234278823203, + "loss": 0.182, + "step": 12670 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025221465718664425, + "loss": 0.1819, + "step": 12680 + }, + { + "epoch": 0.32, + "learning_rate": 0.002521769715850564, + "loss": 0.1777, + "step": 12690 + }, + { + "epoch": 0.32, + "learning_rate": 0.002521392859834686, + "loss": 0.1781, + "step": 12700 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025210160038188077, + "loss": 0.1827, + "step": 12710 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025206391478029295, + "loss": 0.1773, + "step": 12720 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025202622917870512, + "loss": 0.1813, + "step": 12730 + }, + { + "epoch": 0.32, + "learning_rate": 0.002519885435771173, + "loss": 0.1815, + "step": 12740 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025195085797552947, + "loss": 0.1758, + "step": 12750 + }, + { + "epoch": 0.32, + "learning_rate": 0.002519131723739417, + "loss": 0.1794, + "step": 12760 + }, + { + "epoch": 0.32, + "learning_rate": 0.002518754867723538, + "loss": 0.1755, + "step": 12770 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025183780117076604, + "loss": 0.1786, + "step": 12780 + }, + { + "epoch": 0.32, + "learning_rate": 0.002518001155691782, + "loss": 0.1749, + "step": 12790 + }, + { + "epoch": 0.32, + "learning_rate": 0.002517624299675904, + "loss": 0.174, + "step": 12800 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025172474436600256, + "loss": 0.1782, + "step": 12810 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025168705876441474, + "loss": 0.1763, + "step": 12820 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025164937316282695, + "loss": 0.1749, + "step": 12830 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025161168756123913, + "loss": 0.1728, + "step": 12840 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025157400195965126, + "loss": 0.17, + "step": 12850 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025153631635806348, + "loss": 0.1732, + "step": 12860 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025149863075647565, + "loss": 0.1685, + "step": 12870 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025146094515488783, + "loss": 0.1734, + "step": 12880 + }, + { + "epoch": 0.32, + "learning_rate": 0.002514232595533, + "loss": 0.1757, + "step": 12890 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025138557395171218, + "loss": 0.1672, + "step": 12900 + }, + { + "epoch": 0.32, + "learning_rate": 0.002513478883501244, + "loss": 0.1718, + "step": 12910 + }, + { + "epoch": 0.32, + "learning_rate": 0.0025131020274853652, + "loss": 0.1732, + "step": 12920 + }, + { + "epoch": 0.32, + "learning_rate": 0.002512725171469487, + "loss": 0.1701, + "step": 12930 + }, + { + "epoch": 0.33, + "learning_rate": 0.002512348315453609, + "loss": 0.1653, + "step": 12940 + }, + { + "epoch": 0.33, + "learning_rate": 0.002511971459437731, + "loss": 0.1674, + "step": 12950 + }, + { + "epoch": 0.33, + "learning_rate": 0.0025115946034218527, + "loss": 0.1712, + "step": 12960 + }, + { + "epoch": 0.33, + "learning_rate": 0.0025112177474059744, + "loss": 0.1643, + "step": 12970 + }, + { + "epoch": 0.33, + "learning_rate": 0.002510840891390096, + "loss": 0.1636, + "step": 12980 + }, + { + "epoch": 0.33, + "learning_rate": 0.0025104640353742183, + "loss": 0.1633, + "step": 12990 + }, + { + "epoch": 0.33, + "learning_rate": 0.0025100871793583396, + "loss": 0.1654, + "step": 13000 + }, + { + "epoch": 0.33, + "eval_cer": 0.6678427935998291, + "eval_loss": 0.12283774465322495, + "eval_runtime": 90.4365, + "eval_samples_per_second": 110.564, + "eval_steps_per_second": 6.911, + "step": 13000 + }, + { + "epoch": 0.33, + "learning_rate": 0.002509710323342462, + "loss": 0.169, + "step": 13010 + }, + { + "epoch": 0.33, + "learning_rate": 0.0025093334673265836, + "loss": 0.1637, + "step": 13020 + }, + { + "epoch": 0.33, + "learning_rate": 0.0025089566113107053, + "loss": 0.1614, + "step": 13030 + }, + { + "epoch": 0.33, + "learning_rate": 0.002508579755294827, + "loss": 0.1662, + "step": 13040 + }, + { + "epoch": 0.33, + "learning_rate": 0.002508202899278949, + "loss": 0.165, + "step": 13050 + }, + { + "epoch": 0.33, + "learning_rate": 0.0025078260432630705, + "loss": 0.1591, + "step": 13060 + }, + { + "epoch": 0.33, + "learning_rate": 0.0025074491872471927, + "loss": 0.1631, + "step": 13070 + }, + { + "epoch": 0.33, + "learning_rate": 0.002507072331231314, + "loss": 0.1596, + "step": 13080 + }, + { + "epoch": 0.33, + "learning_rate": 0.002506695475215436, + "loss": 0.1599, + "step": 13090 + }, + { + "epoch": 0.33, + "learning_rate": 0.002506318619199558, + "loss": 0.158, + "step": 13100 + }, + { + "epoch": 0.33, + "learning_rate": 0.0025059417631836797, + "loss": 0.1625, + "step": 13110 + }, + { + "epoch": 0.33, + "learning_rate": 0.0025055649071678014, + "loss": 0.1618, + "step": 13120 + }, + { + "epoch": 0.33, + "learning_rate": 0.002505188051151923, + "loss": 0.1655, + "step": 13130 + }, + { + "epoch": 0.33, + "learning_rate": 0.0025048111951360454, + "loss": 0.1585, + "step": 13140 + }, + { + "epoch": 0.33, + "learning_rate": 0.0025044343391201667, + "loss": 0.1597, + "step": 13150 + }, + { + "epoch": 0.33, + "learning_rate": 0.0025040574831042884, + "loss": 0.1604, + "step": 13160 + }, + { + "epoch": 0.33, + "learning_rate": 0.0025036806270884106, + "loss": 0.1563, + "step": 13170 + }, + { + "epoch": 0.33, + "learning_rate": 0.0025033037710725323, + "loss": 0.1571, + "step": 13180 + }, + { + "epoch": 0.33, + "learning_rate": 0.002502926915056654, + "loss": 0.1604, + "step": 13190 + }, + { + "epoch": 0.33, + "learning_rate": 0.002502550059040776, + "loss": 0.1669, + "step": 13200 + }, + { + "epoch": 0.33, + "learning_rate": 0.0025021732030248976, + "loss": 0.1606, + "step": 13210 + }, + { + "epoch": 0.33, + "learning_rate": 0.0025017963470090198, + "loss": 0.149, + "step": 13220 + }, + { + "epoch": 0.33, + "learning_rate": 0.002501419490993141, + "loss": 0.1592, + "step": 13230 + }, + { + "epoch": 0.33, + "learning_rate": 0.0025010426349772632, + "loss": 0.158, + "step": 13240 + }, + { + "epoch": 0.33, + "learning_rate": 0.002500665778961385, + "loss": 0.1601, + "step": 13250 + }, + { + "epoch": 0.33, + "learning_rate": 0.0025002889229455067, + "loss": 0.1525, + "step": 13260 + }, + { + "epoch": 0.33, + "learning_rate": 0.0024999120669296285, + "loss": 0.1606, + "step": 13270 + }, + { + "epoch": 0.33, + "learning_rate": 0.0024995352109137502, + "loss": 0.158, + "step": 13280 + }, + { + "epoch": 0.33, + "learning_rate": 0.002499158354897872, + "loss": 0.1574, + "step": 13290 + }, + { + "epoch": 0.33, + "learning_rate": 0.002498781498881994, + "loss": 0.1546, + "step": 13300 + }, + { + "epoch": 0.33, + "learning_rate": 0.0024984046428661155, + "loss": 0.1562, + "step": 13310 + }, + { + "epoch": 0.33, + "learning_rate": 0.0024980277868502376, + "loss": 0.1603, + "step": 13320 + }, + { + "epoch": 0.33, + "learning_rate": 0.0024976509308343594, + "loss": 0.1553, + "step": 13330 + }, + { + "epoch": 0.34, + "learning_rate": 0.002497274074818481, + "loss": 0.1568, + "step": 13340 + }, + { + "epoch": 0.34, + "learning_rate": 0.002496897218802603, + "loss": 0.1523, + "step": 13350 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024965203627867246, + "loss": 0.1544, + "step": 13360 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024961435067708464, + "loss": 0.1539, + "step": 13370 + }, + { + "epoch": 0.34, + "learning_rate": 0.002495766650754968, + "loss": 0.1557, + "step": 13380 + }, + { + "epoch": 0.34, + "learning_rate": 0.00249538979473909, + "loss": 0.1526, + "step": 13390 + }, + { + "epoch": 0.34, + "learning_rate": 0.002495012938723212, + "loss": 0.1537, + "step": 13400 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024946360827073338, + "loss": 0.1574, + "step": 13410 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024942592266914555, + "loss": 0.1555, + "step": 13420 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024938823706755773, + "loss": 0.1528, + "step": 13430 + }, + { + "epoch": 0.34, + "learning_rate": 0.002493505514659699, + "loss": 0.1517, + "step": 13440 + }, + { + "epoch": 0.34, + "learning_rate": 0.002493128658643821, + "loss": 0.1604, + "step": 13450 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024927518026279425, + "loss": 0.1541, + "step": 13460 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024923749466120642, + "loss": 0.1515, + "step": 13470 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024919980905961864, + "loss": 0.1506, + "step": 13480 + }, + { + "epoch": 0.34, + "learning_rate": 0.002491621234580308, + "loss": 0.1542, + "step": 13490 + }, + { + "epoch": 0.34, + "learning_rate": 0.00249124437856443, + "loss": 0.1552, + "step": 13500 + }, + { + "epoch": 0.34, + "eval_cer": 0.667002084208571, + "eval_loss": 0.11529998481273651, + "eval_runtime": 90.608, + "eval_samples_per_second": 110.355, + "eval_steps_per_second": 6.898, + "step": 13500 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024908675225485516, + "loss": 0.1555, + "step": 13510 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024904906665326734, + "loss": 0.1503, + "step": 13520 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024901138105167956, + "loss": 0.15, + "step": 13530 + }, + { + "epoch": 0.34, + "learning_rate": 0.002489736954500917, + "loss": 0.1545, + "step": 13540 + }, + { + "epoch": 0.34, + "learning_rate": 0.002489360098485039, + "loss": 0.1517, + "step": 13550 + }, + { + "epoch": 0.34, + "learning_rate": 0.002488983242469161, + "loss": 0.148, + "step": 13560 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024886063864532825, + "loss": 0.1488, + "step": 13570 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024882295304374043, + "loss": 0.1557, + "step": 13580 + }, + { + "epoch": 0.34, + "learning_rate": 0.002487852674421526, + "loss": 0.1546, + "step": 13590 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024874758184056478, + "loss": 0.1531, + "step": 13600 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024870989623897695, + "loss": 0.1531, + "step": 13610 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024867221063738913, + "loss": 0.1513, + "step": 13620 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024863452503580134, + "loss": 0.1519, + "step": 13630 + }, + { + "epoch": 0.34, + "learning_rate": 0.002485968394342135, + "loss": 0.1476, + "step": 13640 + }, + { + "epoch": 0.34, + "learning_rate": 0.002485591538326257, + "loss": 0.1527, + "step": 13650 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024852146823103787, + "loss": 0.1544, + "step": 13660 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024848378262945004, + "loss": 0.1496, + "step": 13670 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024844609702786226, + "loss": 0.1513, + "step": 13680 + }, + { + "epoch": 0.34, + "learning_rate": 0.002484084114262744, + "loss": 0.1478, + "step": 13690 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024837072582468657, + "loss": 0.1447, + "step": 13700 + }, + { + "epoch": 0.34, + "learning_rate": 0.002483330402230988, + "loss": 0.1524, + "step": 13710 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024829535462151096, + "loss": 0.1535, + "step": 13720 + }, + { + "epoch": 0.34, + "learning_rate": 0.0024825766901992313, + "loss": 0.1486, + "step": 13730 + }, + { + "epoch": 0.35, + "learning_rate": 0.002482199834183353, + "loss": 0.1468, + "step": 13740 + }, + { + "epoch": 0.35, + "learning_rate": 0.002481822978167475, + "loss": 0.1505, + "step": 13750 + }, + { + "epoch": 0.35, + "learning_rate": 0.002481446122151597, + "loss": 0.1439, + "step": 13760 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024810692661357183, + "loss": 0.1498, + "step": 13770 + }, + { + "epoch": 0.35, + "learning_rate": 0.00248069241011984, + "loss": 0.1507, + "step": 13780 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024803155541039622, + "loss": 0.1455, + "step": 13790 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024799386980880835, + "loss": 0.1438, + "step": 13800 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024795618420722057, + "loss": 0.1513, + "step": 13810 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024791849860563275, + "loss": 0.1477, + "step": 13820 + }, + { + "epoch": 0.35, + "learning_rate": 0.002478808130040449, + "loss": 0.1495, + "step": 13830 + }, + { + "epoch": 0.35, + "learning_rate": 0.002478431274024571, + "loss": 0.1464, + "step": 13840 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024780544180086927, + "loss": 0.1432, + "step": 13850 + }, + { + "epoch": 0.35, + "learning_rate": 0.002477677561992815, + "loss": 0.1406, + "step": 13860 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024773007059769366, + "loss": 0.1507, + "step": 13870 + }, + { + "epoch": 0.35, + "learning_rate": 0.002476923849961058, + "loss": 0.1433, + "step": 13880 + }, + { + "epoch": 0.35, + "learning_rate": 0.00247654699394518, + "loss": 0.1418, + "step": 13890 + }, + { + "epoch": 0.35, + "learning_rate": 0.002476170137929302, + "loss": 0.1437, + "step": 13900 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024757932819134236, + "loss": 0.1461, + "step": 13910 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024754164258975453, + "loss": 0.1473, + "step": 13920 + }, + { + "epoch": 0.35, + "learning_rate": 0.002475039569881667, + "loss": 0.1397, + "step": 13930 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024746627138657893, + "loss": 0.1499, + "step": 13940 + }, + { + "epoch": 0.35, + "learning_rate": 0.002474285857849911, + "loss": 0.1454, + "step": 13950 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024739090018340328, + "loss": 0.1452, + "step": 13960 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024735321458181545, + "loss": 0.142, + "step": 13970 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024731552898022762, + "loss": 0.1377, + "step": 13980 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024727784337863984, + "loss": 0.1454, + "step": 13990 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024724015777705197, + "loss": 0.1443, + "step": 14000 + }, + { + "epoch": 0.35, + "eval_cer": 0.6669525174843011, + "eval_loss": 0.11095242947340012, + "eval_runtime": 90.4686, + "eval_samples_per_second": 110.525, + "eval_steps_per_second": 6.908, + "step": 14000 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024720247217546415, + "loss": 0.1419, + "step": 14010 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024716478657387637, + "loss": 0.1433, + "step": 14020 + }, + { + "epoch": 0.35, + "learning_rate": 0.002471271009722885, + "loss": 0.1403, + "step": 14030 + }, + { + "epoch": 0.35, + "learning_rate": 0.002470894153707007, + "loss": 0.1411, + "step": 14040 + }, + { + "epoch": 0.35, + "learning_rate": 0.002470517297691129, + "loss": 0.1438, + "step": 14050 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024701404416752506, + "loss": 0.1491, + "step": 14060 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024697635856593724, + "loss": 0.144, + "step": 14070 + }, + { + "epoch": 0.35, + "learning_rate": 0.002469386729643494, + "loss": 0.1426, + "step": 14080 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024690098736276163, + "loss": 0.1418, + "step": 14090 + }, + { + "epoch": 0.35, + "learning_rate": 0.002468633017611738, + "loss": 0.1408, + "step": 14100 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024682561615958594, + "loss": 0.146, + "step": 14110 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024678793055799815, + "loss": 0.1426, + "step": 14120 + }, + { + "epoch": 0.35, + "learning_rate": 0.0024675024495641033, + "loss": 0.145, + "step": 14130 + }, + { + "epoch": 0.36, + "learning_rate": 0.002467125593548225, + "loss": 0.139, + "step": 14140 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024667487375323468, + "loss": 0.1381, + "step": 14150 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024663718815164685, + "loss": 0.1424, + "step": 14160 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024659950255005907, + "loss": 0.1467, + "step": 14170 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024656181694847124, + "loss": 0.1428, + "step": 14180 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024652413134688337, + "loss": 0.1394, + "step": 14190 + }, + { + "epoch": 0.36, + "learning_rate": 0.002464864457452956, + "loss": 0.1443, + "step": 14200 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024644876014370777, + "loss": 0.1398, + "step": 14210 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024641107454211994, + "loss": 0.1463, + "step": 14220 + }, + { + "epoch": 0.36, + "learning_rate": 0.002463733889405321, + "loss": 0.1442, + "step": 14230 + }, + { + "epoch": 0.36, + "learning_rate": 0.002463357033389443, + "loss": 0.1421, + "step": 14240 + }, + { + "epoch": 0.36, + "learning_rate": 0.002462980177373565, + "loss": 0.1414, + "step": 14250 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024626033213576864, + "loss": 0.1437, + "step": 14260 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024622264653418086, + "loss": 0.1367, + "step": 14270 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024618496093259303, + "loss": 0.1422, + "step": 14280 + }, + { + "epoch": 0.36, + "learning_rate": 0.002461472753310052, + "loss": 0.1452, + "step": 14290 + }, + { + "epoch": 0.36, + "learning_rate": 0.002461095897294174, + "loss": 0.1448, + "step": 14300 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024607190412782956, + "loss": 0.1426, + "step": 14310 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024603421852624173, + "loss": 0.138, + "step": 14320 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024599653292465395, + "loss": 0.1415, + "step": 14330 + }, + { + "epoch": 0.36, + "learning_rate": 0.002459588473230661, + "loss": 0.1401, + "step": 14340 + }, + { + "epoch": 0.36, + "learning_rate": 0.002459211617214783, + "loss": 0.1424, + "step": 14350 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024588347611989047, + "loss": 0.1391, + "step": 14360 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024584579051830265, + "loss": 0.1413, + "step": 14370 + }, + { + "epoch": 0.36, + "learning_rate": 0.002458081049167148, + "loss": 0.139, + "step": 14380 + }, + { + "epoch": 0.36, + "learning_rate": 0.00245770419315127, + "loss": 0.1355, + "step": 14390 + }, + { + "epoch": 0.36, + "learning_rate": 0.002457327337135392, + "loss": 0.1426, + "step": 14400 + }, + { + "epoch": 0.36, + "learning_rate": 0.002456950481119514, + "loss": 0.1404, + "step": 14410 + }, + { + "epoch": 0.36, + "learning_rate": 0.002456573625103635, + "loss": 0.1383, + "step": 14420 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024561967690877574, + "loss": 0.1378, + "step": 14430 + }, + { + "epoch": 0.36, + "learning_rate": 0.002455819913071879, + "loss": 0.1444, + "step": 14440 + }, + { + "epoch": 0.36, + "learning_rate": 0.002455443057056001, + "loss": 0.1368, + "step": 14450 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024550662010401226, + "loss": 0.1395, + "step": 14460 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024546893450242443, + "loss": 0.1366, + "step": 14470 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024543124890083665, + "loss": 0.141, + "step": 14480 + }, + { + "epoch": 0.36, + "learning_rate": 0.002453935632992488, + "loss": 0.1415, + "step": 14490 + }, + { + "epoch": 0.36, + "learning_rate": 0.00245355877697661, + "loss": 0.1397, + "step": 14500 + }, + { + "epoch": 0.36, + "eval_cer": 0.6669780226919351, + "eval_loss": 0.10726305842399597, + "eval_runtime": 90.529, + "eval_samples_per_second": 110.451, + "eval_steps_per_second": 6.904, + "step": 14500 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024531819209607317, + "loss": 0.1349, + "step": 14510 + }, + { + "epoch": 0.36, + "learning_rate": 0.0024528050649448535, + "loss": 0.1399, + "step": 14520 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024524282089289752, + "loss": 0.1368, + "step": 14530 + }, + { + "epoch": 0.37, + "learning_rate": 0.002452051352913097, + "loss": 0.1397, + "step": 14540 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024516744968972187, + "loss": 0.1375, + "step": 14550 + }, + { + "epoch": 0.37, + "learning_rate": 0.002451297640881341, + "loss": 0.1395, + "step": 14560 + }, + { + "epoch": 0.37, + "learning_rate": 0.002450920784865462, + "loss": 0.1377, + "step": 14570 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024505439288495844, + "loss": 0.1421, + "step": 14580 + }, + { + "epoch": 0.37, + "learning_rate": 0.002450167072833706, + "loss": 0.1413, + "step": 14590 + }, + { + "epoch": 0.37, + "learning_rate": 0.002449790216817828, + "loss": 0.1373, + "step": 14600 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024494133608019496, + "loss": 0.137, + "step": 14610 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024490365047860714, + "loss": 0.1361, + "step": 14620 + }, + { + "epoch": 0.37, + "learning_rate": 0.002448659648770193, + "loss": 0.1446, + "step": 14630 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024482827927543153, + "loss": 0.1364, + "step": 14640 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024479059367384366, + "loss": 0.141, + "step": 14650 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024475290807225588, + "loss": 0.1425, + "step": 14660 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024471522247066805, + "loss": 0.1365, + "step": 14670 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024467753686908023, + "loss": 0.1399, + "step": 14680 + }, + { + "epoch": 0.37, + "learning_rate": 0.002446398512674924, + "loss": 0.1381, + "step": 14690 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024460216566590458, + "loss": 0.1452, + "step": 14700 + }, + { + "epoch": 0.37, + "learning_rate": 0.002445644800643168, + "loss": 0.1399, + "step": 14710 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024452679446272893, + "loss": 0.1397, + "step": 14720 + }, + { + "epoch": 0.37, + "learning_rate": 0.002444891088611411, + "loss": 0.1376, + "step": 14730 + }, + { + "epoch": 0.37, + "learning_rate": 0.002444514232595533, + "loss": 0.1356, + "step": 14740 + }, + { + "epoch": 0.37, + "learning_rate": 0.002444137376579655, + "loss": 0.1392, + "step": 14750 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024437605205637767, + "loss": 0.1397, + "step": 14760 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024433836645478984, + "loss": 0.1373, + "step": 14770 + }, + { + "epoch": 0.37, + "learning_rate": 0.00244300680853202, + "loss": 0.1353, + "step": 14780 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024426299525161423, + "loss": 0.1384, + "step": 14790 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024422530965002636, + "loss": 0.1426, + "step": 14800 + }, + { + "epoch": 0.37, + "learning_rate": 0.002441876240484386, + "loss": 0.1405, + "step": 14810 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024414993844685076, + "loss": 0.1379, + "step": 14820 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024411225284526293, + "loss": 0.1372, + "step": 14830 + }, + { + "epoch": 0.37, + "learning_rate": 0.002440745672436751, + "loss": 0.1399, + "step": 14840 + }, + { + "epoch": 0.37, + "learning_rate": 0.002440368816420873, + "loss": 0.1396, + "step": 14850 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024399919604049945, + "loss": 0.1362, + "step": 14860 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024396151043891167, + "loss": 0.1322, + "step": 14870 + }, + { + "epoch": 0.37, + "learning_rate": 0.002439238248373238, + "loss": 0.1324, + "step": 14880 + }, + { + "epoch": 0.37, + "learning_rate": 0.00243886139235736, + "loss": 0.1387, + "step": 14890 + }, + { + "epoch": 0.37, + "learning_rate": 0.002438484536341482, + "loss": 0.1387, + "step": 14900 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024381076803256037, + "loss": 0.1393, + "step": 14910 + }, + { + "epoch": 0.37, + "learning_rate": 0.0024377308243097254, + "loss": 0.1387, + "step": 14920 + }, + { + "epoch": 0.38, + "learning_rate": 0.002437353968293847, + "loss": 0.1368, + "step": 14930 + }, + { + "epoch": 0.38, + "learning_rate": 0.002436977112277969, + "loss": 0.135, + "step": 14940 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024366002562620907, + "loss": 0.1357, + "step": 14950 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024362234002462124, + "loss": 0.1374, + "step": 14960 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024358465442303346, + "loss": 0.1352, + "step": 14970 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024354696882144563, + "loss": 0.1323, + "step": 14980 + }, + { + "epoch": 0.38, + "learning_rate": 0.002435092832198578, + "loss": 0.135, + "step": 14990 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024347159761827, + "loss": 0.1366, + "step": 15000 + }, + { + "epoch": 0.38, + "eval_cer": 0.666434232415964, + "eval_loss": 0.10666073858737946, + "eval_runtime": 90.0505, + "eval_samples_per_second": 111.038, + "eval_steps_per_second": 6.941, + "step": 15000 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024343391201668216, + "loss": 0.1368, + "step": 15010 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024339622641509438, + "loss": 0.1402, + "step": 15020 + }, + { + "epoch": 0.38, + "learning_rate": 0.002433585408135065, + "loss": 0.1406, + "step": 15030 + }, + { + "epoch": 0.38, + "learning_rate": 0.002433208552119187, + "loss": 0.1365, + "step": 15040 + }, + { + "epoch": 0.38, + "learning_rate": 0.002432831696103309, + "loss": 0.1391, + "step": 15050 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024324548400874307, + "loss": 0.1397, + "step": 15060 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024320779840715525, + "loss": 0.1336, + "step": 15070 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024317011280556742, + "loss": 0.1392, + "step": 15080 + }, + { + "epoch": 0.38, + "learning_rate": 0.002431324272039796, + "loss": 0.1363, + "step": 15090 + }, + { + "epoch": 0.38, + "learning_rate": 0.002430947416023918, + "loss": 0.1367, + "step": 15100 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024305705600080395, + "loss": 0.1324, + "step": 15110 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024301937039921616, + "loss": 0.1361, + "step": 15120 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024298168479762834, + "loss": 0.1381, + "step": 15130 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024294399919604047, + "loss": 0.1354, + "step": 15140 + }, + { + "epoch": 0.38, + "learning_rate": 0.002429063135944527, + "loss": 0.1386, + "step": 15150 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024286862799286486, + "loss": 0.132, + "step": 15160 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024283094239127704, + "loss": 0.136, + "step": 15170 + }, + { + "epoch": 0.38, + "learning_rate": 0.002427932567896892, + "loss": 0.1359, + "step": 15180 + }, + { + "epoch": 0.38, + "learning_rate": 0.002427555711881014, + "loss": 0.1348, + "step": 15190 + }, + { + "epoch": 0.38, + "learning_rate": 0.002427178855865136, + "loss": 0.1383, + "step": 15200 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024268019998492578, + "loss": 0.1339, + "step": 15210 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024264251438333795, + "loss": 0.1309, + "step": 15220 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024260482878175013, + "loss": 0.1417, + "step": 15230 + }, + { + "epoch": 0.38, + "learning_rate": 0.002425671431801623, + "loss": 0.138, + "step": 15240 + }, + { + "epoch": 0.38, + "learning_rate": 0.002425294575785745, + "loss": 0.1366, + "step": 15250 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024249177197698665, + "loss": 0.1383, + "step": 15260 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024245408637539882, + "loss": 0.1379, + "step": 15270 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024241640077381104, + "loss": 0.1375, + "step": 15280 + }, + { + "epoch": 0.38, + "learning_rate": 0.002423787151722232, + "loss": 0.1372, + "step": 15290 + }, + { + "epoch": 0.38, + "learning_rate": 0.002423410295706354, + "loss": 0.1375, + "step": 15300 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024230334396904757, + "loss": 0.1364, + "step": 15310 + }, + { + "epoch": 0.38, + "learning_rate": 0.0024226565836745974, + "loss": 0.1394, + "step": 15320 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024222797276587196, + "loss": 0.137, + "step": 15330 + }, + { + "epoch": 0.39, + "learning_rate": 0.002421902871642841, + "loss": 0.1363, + "step": 15340 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024215260156269626, + "loss": 0.1372, + "step": 15350 + }, + { + "epoch": 0.39, + "learning_rate": 0.002421149159611085, + "loss": 0.138, + "step": 15360 + }, + { + "epoch": 0.39, + "learning_rate": 0.002420772303595206, + "loss": 0.1351, + "step": 15370 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024203954475793283, + "loss": 0.1379, + "step": 15380 + }, + { + "epoch": 0.39, + "learning_rate": 0.00242001859156345, + "loss": 0.1336, + "step": 15390 + }, + { + "epoch": 0.39, + "learning_rate": 0.002419641735547572, + "loss": 0.1313, + "step": 15400 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024192648795316935, + "loss": 0.1377, + "step": 15410 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024188880235158153, + "loss": 0.1355, + "step": 15420 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024185111674999375, + "loss": 0.1379, + "step": 15430 + }, + { + "epoch": 0.39, + "learning_rate": 0.002418134311484059, + "loss": 0.1331, + "step": 15440 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024177574554681805, + "loss": 0.1373, + "step": 15450 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024173805994523027, + "loss": 0.1377, + "step": 15460 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024170037434364244, + "loss": 0.1359, + "step": 15470 + }, + { + "epoch": 0.39, + "learning_rate": 0.002416626887420546, + "loss": 0.1315, + "step": 15480 + }, + { + "epoch": 0.39, + "learning_rate": 0.002416250031404668, + "loss": 0.1301, + "step": 15490 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024158731753887897, + "loss": 0.1362, + "step": 15500 + }, + { + "epoch": 0.39, + "eval_cer": 0.6669188313610108, + "eval_loss": 0.10428140312433243, + "eval_runtime": 90.5923, + "eval_samples_per_second": 110.374, + "eval_steps_per_second": 6.899, + "step": 15500 + }, + { + "epoch": 0.39, + "learning_rate": 0.002415496319372912, + "loss": 0.1352, + "step": 15510 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024151194633570336, + "loss": 0.1348, + "step": 15520 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024147426073411553, + "loss": 0.1319, + "step": 15530 + }, + { + "epoch": 0.39, + "learning_rate": 0.002414365751325277, + "loss": 0.1349, + "step": 15540 + }, + { + "epoch": 0.39, + "learning_rate": 0.002413988895309399, + "loss": 0.1315, + "step": 15550 + }, + { + "epoch": 0.39, + "learning_rate": 0.002413612039293521, + "loss": 0.1331, + "step": 15560 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024132351832776423, + "loss": 0.1334, + "step": 15570 + }, + { + "epoch": 0.39, + "learning_rate": 0.002412858327261764, + "loss": 0.1362, + "step": 15580 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024124814712458862, + "loss": 0.1359, + "step": 15590 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024121046152300075, + "loss": 0.1322, + "step": 15600 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024117277592141297, + "loss": 0.1318, + "step": 15610 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024113509031982515, + "loss": 0.1382, + "step": 15620 + }, + { + "epoch": 0.39, + "learning_rate": 0.002410974047182373, + "loss": 0.1368, + "step": 15630 + }, + { + "epoch": 0.39, + "learning_rate": 0.002410597191166495, + "loss": 0.1303, + "step": 15640 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024102203351506167, + "loss": 0.1356, + "step": 15650 + }, + { + "epoch": 0.39, + "learning_rate": 0.002409843479134739, + "loss": 0.1349, + "step": 15660 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024094666231188606, + "loss": 0.1313, + "step": 15670 + }, + { + "epoch": 0.39, + "learning_rate": 0.002409089767102982, + "loss": 0.13, + "step": 15680 + }, + { + "epoch": 0.39, + "learning_rate": 0.002408712911087104, + "loss": 0.1347, + "step": 15690 + }, + { + "epoch": 0.39, + "learning_rate": 0.002408336055071226, + "loss": 0.1337, + "step": 15700 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024079591990553476, + "loss": 0.1349, + "step": 15710 + }, + { + "epoch": 0.39, + "learning_rate": 0.0024075823430394694, + "loss": 0.132, + "step": 15720 + }, + { + "epoch": 0.4, + "learning_rate": 0.002407205487023591, + "loss": 0.1344, + "step": 15730 + }, + { + "epoch": 0.4, + "learning_rate": 0.0024068286310077133, + "loss": 0.1321, + "step": 15740 + }, + { + "epoch": 0.4, + "learning_rate": 0.002406451774991835, + "loss": 0.1306, + "step": 15750 + }, + { + "epoch": 0.4, + "learning_rate": 0.0024060749189759563, + "loss": 0.1325, + "step": 15760 + }, + { + "epoch": 0.4, + "learning_rate": 0.0024056980629600785, + "loss": 0.1307, + "step": 15770 + }, + { + "epoch": 0.4, + "learning_rate": 0.0024053212069442003, + "loss": 0.1312, + "step": 15780 + }, + { + "epoch": 0.4, + "learning_rate": 0.002404944350928322, + "loss": 0.133, + "step": 15790 + }, + { + "epoch": 0.4, + "learning_rate": 0.0024045674949124437, + "loss": 0.1328, + "step": 15800 + }, + { + "epoch": 0.4, + "learning_rate": 0.0024041906388965655, + "loss": 0.1337, + "step": 15810 + }, + { + "epoch": 0.4, + "learning_rate": 0.0024038137828806877, + "loss": 0.1288, + "step": 15820 + }, + { + "epoch": 0.4, + "learning_rate": 0.002403436926864809, + "loss": 0.1336, + "step": 15830 + }, + { + "epoch": 0.4, + "learning_rate": 0.002403060070848931, + "loss": 0.1361, + "step": 15840 + }, + { + "epoch": 0.4, + "learning_rate": 0.002402683214833053, + "loss": 0.1311, + "step": 15850 + }, + { + "epoch": 0.4, + "learning_rate": 0.0024023063588171746, + "loss": 0.1308, + "step": 15860 + }, + { + "epoch": 0.4, + "learning_rate": 0.0024019295028012964, + "loss": 0.1331, + "step": 15870 + }, + { + "epoch": 0.4, + "learning_rate": 0.002401552646785418, + "loss": 0.1337, + "step": 15880 + }, + { + "epoch": 0.4, + "learning_rate": 0.00240117579076954, + "loss": 0.1339, + "step": 15890 + }, + { + "epoch": 0.4, + "learning_rate": 0.002400798934753662, + "loss": 0.1303, + "step": 15900 + }, + { + "epoch": 0.4, + "learning_rate": 0.0024004220787377834, + "loss": 0.1286, + "step": 15910 + }, + { + "epoch": 0.4, + "learning_rate": 0.0024000452227219055, + "loss": 0.1352, + "step": 15920 + }, + { + "epoch": 0.4, + "learning_rate": 0.0023996683667060273, + "loss": 0.1322, + "step": 15930 + }, + { + "epoch": 0.4, + "learning_rate": 0.002399291510690149, + "loss": 0.1314, + "step": 15940 + }, + { + "epoch": 0.4, + "learning_rate": 0.0023989146546742708, + "loss": 0.1326, + "step": 15950 + }, + { + "epoch": 0.4, + "learning_rate": 0.0023985377986583925, + "loss": 0.1248, + "step": 15960 + }, + { + "epoch": 0.4, + "learning_rate": 0.0023981609426425147, + "loss": 0.1372, + "step": 15970 + }, + { + "epoch": 0.4, + "learning_rate": 0.0023977840866266364, + "loss": 0.1297, + "step": 15980 + }, + { + "epoch": 0.4, + "learning_rate": 0.0023974072306107578, + "loss": 0.1284, + "step": 15990 + }, + { + "epoch": 0.4, + "learning_rate": 0.00239703037459488, + "loss": 0.1375, + "step": 16000 + }, + { + "epoch": 0.4, + "eval_cer": 0.6667884179408443, + "eval_loss": 0.10115189850330353, + "eval_runtime": 90.5383, + "eval_samples_per_second": 110.439, + "eval_steps_per_second": 6.903, + "step": 16000 + }, + { + "epoch": 0.4, + "learning_rate": 0.0023966535185790017, + "loss": 0.1304, + "step": 16010 + }, + { + "epoch": 0.4, + "learning_rate": 0.0023962766625631234, + "loss": 0.1332, + "step": 16020 + }, + { + "epoch": 0.4, + "learning_rate": 0.002395899806547245, + "loss": 0.1248, + "step": 16030 + }, + { + "epoch": 0.4, + "learning_rate": 0.002395522950531367, + "loss": 0.1352, + "step": 16040 + }, + { + "epoch": 0.4, + "learning_rate": 0.002395146094515489, + "loss": 0.1351, + "step": 16050 + }, + { + "epoch": 0.4, + "learning_rate": 0.0023947692384996104, + "loss": 0.1287, + "step": 16060 + }, + { + "epoch": 0.4, + "learning_rate": 0.0023943923824837326, + "loss": 0.1347, + "step": 16070 + }, + { + "epoch": 0.4, + "learning_rate": 0.0023940155264678543, + "loss": 0.129, + "step": 16080 + }, + { + "epoch": 0.4, + "learning_rate": 0.002393638670451976, + "loss": 0.1308, + "step": 16090 + }, + { + "epoch": 0.4, + "learning_rate": 0.002393261814436098, + "loss": 0.1314, + "step": 16100 + }, + { + "epoch": 0.4, + "learning_rate": 0.0023928849584202196, + "loss": 0.1307, + "step": 16110 + }, + { + "epoch": 0.4, + "learning_rate": 0.0023925081024043413, + "loss": 0.1281, + "step": 16120 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023921312463884635, + "loss": 0.1255, + "step": 16130 + }, + { + "epoch": 0.41, + "learning_rate": 0.002391754390372585, + "loss": 0.1315, + "step": 16140 + }, + { + "epoch": 0.41, + "learning_rate": 0.002391377534356707, + "loss": 0.1308, + "step": 16150 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023910006783408287, + "loss": 0.1296, + "step": 16160 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023906238223249505, + "loss": 0.1326, + "step": 16170 + }, + { + "epoch": 0.41, + "learning_rate": 0.002390246966309072, + "loss": 0.1309, + "step": 16180 + }, + { + "epoch": 0.41, + "learning_rate": 0.002389870110293194, + "loss": 0.1344, + "step": 16190 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023894932542773157, + "loss": 0.131, + "step": 16200 + }, + { + "epoch": 0.41, + "learning_rate": 0.002389116398261438, + "loss": 0.1335, + "step": 16210 + }, + { + "epoch": 0.41, + "learning_rate": 0.002388739542245559, + "loss": 0.1325, + "step": 16220 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023883626862296814, + "loss": 0.131, + "step": 16230 + }, + { + "epoch": 0.41, + "learning_rate": 0.002387985830213803, + "loss": 0.132, + "step": 16240 + }, + { + "epoch": 0.41, + "learning_rate": 0.002387608974197925, + "loss": 0.1291, + "step": 16250 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023872321181820466, + "loss": 0.1333, + "step": 16260 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023868552621661683, + "loss": 0.1288, + "step": 16270 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023864784061502905, + "loss": 0.135, + "step": 16280 + }, + { + "epoch": 0.41, + "learning_rate": 0.002386101550134412, + "loss": 0.1296, + "step": 16290 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023857246941185336, + "loss": 0.1361, + "step": 16300 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023853478381026558, + "loss": 0.1353, + "step": 16310 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023849709820867775, + "loss": 0.1296, + "step": 16320 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023845941260708992, + "loss": 0.131, + "step": 16330 + }, + { + "epoch": 0.41, + "learning_rate": 0.002384217270055021, + "loss": 0.126, + "step": 16340 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023838404140391427, + "loss": 0.1299, + "step": 16350 + }, + { + "epoch": 0.41, + "learning_rate": 0.002383463558023265, + "loss": 0.1355, + "step": 16360 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023830867020073862, + "loss": 0.1266, + "step": 16370 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023827098459915084, + "loss": 0.129, + "step": 16380 + }, + { + "epoch": 0.41, + "learning_rate": 0.00238233298997563, + "loss": 0.1271, + "step": 16390 + }, + { + "epoch": 0.41, + "learning_rate": 0.002381956133959752, + "loss": 0.1268, + "step": 16400 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023815792779438736, + "loss": 0.1308, + "step": 16410 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023812024219279954, + "loss": 0.1335, + "step": 16420 + }, + { + "epoch": 0.41, + "learning_rate": 0.002380825565912117, + "loss": 0.13, + "step": 16430 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023804487098962393, + "loss": 0.1295, + "step": 16440 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023800718538803606, + "loss": 0.1331, + "step": 16450 + }, + { + "epoch": 0.41, + "learning_rate": 0.002379694997864483, + "loss": 0.1305, + "step": 16460 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023793181418486045, + "loss": 0.127, + "step": 16470 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023789412858327263, + "loss": 0.1286, + "step": 16480 + }, + { + "epoch": 0.41, + "learning_rate": 0.002378564429816848, + "loss": 0.1325, + "step": 16490 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023781875738009698, + "loss": 0.1325, + "step": 16500 + }, + { + "epoch": 0.41, + "eval_cer": 0.6672475116782571, + "eval_loss": 0.09959594905376434, + "eval_runtime": 90.384, + "eval_samples_per_second": 110.628, + "eval_steps_per_second": 6.915, + "step": 16500 + }, + { + "epoch": 0.41, + "learning_rate": 0.0023778107177850915, + "loss": 0.1236, + "step": 16510 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023774338617692133, + "loss": 0.1281, + "step": 16520 + }, + { + "epoch": 0.42, + "learning_rate": 0.002377057005753335, + "loss": 0.1294, + "step": 16530 + }, + { + "epoch": 0.42, + "learning_rate": 0.002376680149737457, + "loss": 0.129, + "step": 16540 + }, + { + "epoch": 0.42, + "learning_rate": 0.002376303293721579, + "loss": 0.1296, + "step": 16550 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023759264377057007, + "loss": 0.1235, + "step": 16560 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023755495816898224, + "loss": 0.132, + "step": 16570 + }, + { + "epoch": 0.42, + "learning_rate": 0.002375172725673944, + "loss": 0.1317, + "step": 16580 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023747958696580663, + "loss": 0.1299, + "step": 16590 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023744190136421876, + "loss": 0.1312, + "step": 16600 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023740421576263094, + "loss": 0.1296, + "step": 16610 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023736653016104316, + "loss": 0.1294, + "step": 16620 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023732884455945533, + "loss": 0.1285, + "step": 16630 + }, + { + "epoch": 0.42, + "learning_rate": 0.002372911589578675, + "loss": 0.1263, + "step": 16640 + }, + { + "epoch": 0.42, + "learning_rate": 0.002372534733562797, + "loss": 0.126, + "step": 16650 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023721578775469186, + "loss": 0.132, + "step": 16660 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023717810215310407, + "loss": 0.1263, + "step": 16670 + }, + { + "epoch": 0.42, + "learning_rate": 0.002371404165515162, + "loss": 0.1259, + "step": 16680 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023710273094992842, + "loss": 0.1279, + "step": 16690 + }, + { + "epoch": 0.42, + "learning_rate": 0.002370650453483406, + "loss": 0.1294, + "step": 16700 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023702735974675273, + "loss": 0.1265, + "step": 16710 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023698967414516495, + "loss": 0.1238, + "step": 16720 + }, + { + "epoch": 0.42, + "learning_rate": 0.002369519885435771, + "loss": 0.1275, + "step": 16730 + }, + { + "epoch": 0.42, + "learning_rate": 0.002369143029419893, + "loss": 0.1314, + "step": 16740 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023687661734040147, + "loss": 0.1291, + "step": 16750 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023683893173881364, + "loss": 0.1285, + "step": 16760 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023680124613722586, + "loss": 0.1266, + "step": 16770 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023676356053563804, + "loss": 0.1264, + "step": 16780 + }, + { + "epoch": 0.42, + "learning_rate": 0.002367258749340502, + "loss": 0.1287, + "step": 16790 + }, + { + "epoch": 0.42, + "learning_rate": 0.002366881893324624, + "loss": 0.1263, + "step": 16800 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023665050373087456, + "loss": 0.1273, + "step": 16810 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023661281812928678, + "loss": 0.1295, + "step": 16820 + }, + { + "epoch": 0.42, + "learning_rate": 0.002365751325276989, + "loss": 0.1266, + "step": 16830 + }, + { + "epoch": 0.42, + "learning_rate": 0.002365374469261111, + "loss": 0.1238, + "step": 16840 + }, + { + "epoch": 0.42, + "learning_rate": 0.002364997613245233, + "loss": 0.1303, + "step": 16850 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023646207572293547, + "loss": 0.1264, + "step": 16860 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023642439012134765, + "loss": 0.1264, + "step": 16870 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023638670451975982, + "loss": 0.1284, + "step": 16880 + }, + { + "epoch": 0.42, + "learning_rate": 0.00236349018918172, + "loss": 0.1287, + "step": 16890 + }, + { + "epoch": 0.42, + "learning_rate": 0.002363113333165842, + "loss": 0.1283, + "step": 16900 + }, + { + "epoch": 0.42, + "learning_rate": 0.0023627364771499635, + "loss": 0.1314, + "step": 16910 + }, + { + "epoch": 0.43, + "learning_rate": 0.002362359621134085, + "loss": 0.1295, + "step": 16920 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023619827651182074, + "loss": 0.1247, + "step": 16930 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023616059091023287, + "loss": 0.1302, + "step": 16940 + }, + { + "epoch": 0.43, + "learning_rate": 0.002361229053086451, + "loss": 0.1249, + "step": 16950 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023608521970705726, + "loss": 0.1342, + "step": 16960 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023604753410546944, + "loss": 0.1287, + "step": 16970 + }, + { + "epoch": 0.43, + "learning_rate": 0.002360098485038816, + "loss": 0.1265, + "step": 16980 + }, + { + "epoch": 0.43, + "learning_rate": 0.002359721629022938, + "loss": 0.1266, + "step": 16990 + }, + { + "epoch": 0.43, + "learning_rate": 0.00235934477300706, + "loss": 0.1277, + "step": 17000 + }, + { + "epoch": 0.43, + "eval_cer": 0.6664294201126367, + "eval_loss": 0.0992693156003952, + "eval_runtime": 89.9278, + "eval_samples_per_second": 111.189, + "eval_steps_per_second": 6.95, + "step": 17000 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023589679169911818, + "loss": 0.1268, + "step": 17010 + }, + { + "epoch": 0.43, + "learning_rate": 0.002358591060975303, + "loss": 0.1255, + "step": 17020 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023582142049594253, + "loss": 0.1296, + "step": 17030 + }, + { + "epoch": 0.43, + "learning_rate": 0.002357837348943547, + "loss": 0.1273, + "step": 17040 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023574604929276688, + "loss": 0.1304, + "step": 17050 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023570836369117905, + "loss": 0.1262, + "step": 17060 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023567067808959122, + "loss": 0.1257, + "step": 17070 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023563299248800344, + "loss": 0.1275, + "step": 17080 + }, + { + "epoch": 0.43, + "learning_rate": 0.002355953068864156, + "loss": 0.1241, + "step": 17090 + }, + { + "epoch": 0.43, + "learning_rate": 0.002355576212848278, + "loss": 0.126, + "step": 17100 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023551993568323997, + "loss": 0.1239, + "step": 17110 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023548225008165214, + "loss": 0.1276, + "step": 17120 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023544456448006436, + "loss": 0.127, + "step": 17130 + }, + { + "epoch": 0.43, + "learning_rate": 0.002354068788784765, + "loss": 0.1229, + "step": 17140 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023536919327688866, + "loss": 0.1245, + "step": 17150 + }, + { + "epoch": 0.43, + "learning_rate": 0.002353315076753009, + "loss": 0.1276, + "step": 17160 + }, + { + "epoch": 0.43, + "learning_rate": 0.00235293822073713, + "loss": 0.1289, + "step": 17170 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023525613647212523, + "loss": 0.1231, + "step": 17180 + }, + { + "epoch": 0.43, + "learning_rate": 0.002352184508705374, + "loss": 0.1289, + "step": 17190 + }, + { + "epoch": 0.43, + "learning_rate": 0.002351807652689496, + "loss": 0.1239, + "step": 17200 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023514307966736175, + "loss": 0.1276, + "step": 17210 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023510539406577393, + "loss": 0.1261, + "step": 17220 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023506770846418615, + "loss": 0.13, + "step": 17230 + }, + { + "epoch": 0.43, + "learning_rate": 0.002350300228625983, + "loss": 0.1246, + "step": 17240 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023499233726101045, + "loss": 0.1247, + "step": 17250 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023495465165942267, + "loss": 0.1258, + "step": 17260 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023491696605783484, + "loss": 0.1278, + "step": 17270 + }, + { + "epoch": 0.43, + "learning_rate": 0.00234879280456247, + "loss": 0.1273, + "step": 17280 + }, + { + "epoch": 0.43, + "learning_rate": 0.002348415948546592, + "loss": 0.1286, + "step": 17290 + }, + { + "epoch": 0.43, + "learning_rate": 0.0023480390925307137, + "loss": 0.1257, + "step": 17300 + }, + { + "epoch": 0.43, + "learning_rate": 0.002347662236514836, + "loss": 0.1244, + "step": 17310 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023472853804989576, + "loss": 0.1232, + "step": 17320 + }, + { + "epoch": 0.44, + "learning_rate": 0.002346908524483079, + "loss": 0.1284, + "step": 17330 + }, + { + "epoch": 0.44, + "learning_rate": 0.002346531668467201, + "loss": 0.1194, + "step": 17340 + }, + { + "epoch": 0.44, + "learning_rate": 0.002346154812451323, + "loss": 0.13, + "step": 17350 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023457779564354446, + "loss": 0.1288, + "step": 17360 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023454011004195663, + "loss": 0.1264, + "step": 17370 + }, + { + "epoch": 0.44, + "learning_rate": 0.002345024244403688, + "loss": 0.1265, + "step": 17380 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023446473883878102, + "loss": 0.1252, + "step": 17390 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023442705323719316, + "loss": 0.1218, + "step": 17400 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023438936763560537, + "loss": 0.1263, + "step": 17410 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023435168203401755, + "loss": 0.1277, + "step": 17420 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023431399643242972, + "loss": 0.1216, + "step": 17430 + }, + { + "epoch": 0.44, + "learning_rate": 0.002342763108308419, + "loss": 0.1234, + "step": 17440 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023423862522925407, + "loss": 0.1257, + "step": 17450 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023420093962766625, + "loss": 0.128, + "step": 17460 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023416325402607846, + "loss": 0.123, + "step": 17470 + }, + { + "epoch": 0.44, + "learning_rate": 0.002341255684244906, + "loss": 0.1204, + "step": 17480 + }, + { + "epoch": 0.44, + "learning_rate": 0.002340878828229028, + "loss": 0.1233, + "step": 17490 + }, + { + "epoch": 0.44, + "learning_rate": 0.00234050197221315, + "loss": 0.1261, + "step": 17500 + }, + { + "epoch": 0.44, + "eval_cer": 0.6667470321322305, + "eval_loss": 0.09771975874900818, + "eval_runtime": 90.5027, + "eval_samples_per_second": 110.483, + "eval_steps_per_second": 6.906, + "step": 17500 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023401251161972716, + "loss": 0.1238, + "step": 17510 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023397482601813934, + "loss": 0.1288, + "step": 17520 + }, + { + "epoch": 0.44, + "learning_rate": 0.002339371404165515, + "loss": 0.1262, + "step": 17530 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023389945481496373, + "loss": 0.1228, + "step": 17540 + }, + { + "epoch": 0.44, + "learning_rate": 0.002338617692133759, + "loss": 0.1256, + "step": 17550 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023382408361178803, + "loss": 0.1243, + "step": 17560 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023378639801020025, + "loss": 0.1237, + "step": 17570 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023374871240861243, + "loss": 0.1283, + "step": 17580 + }, + { + "epoch": 0.44, + "learning_rate": 0.002337110268070246, + "loss": 0.1226, + "step": 17590 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023367334120543677, + "loss": 0.1264, + "step": 17600 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023363565560384895, + "loss": 0.1233, + "step": 17610 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023359797000226117, + "loss": 0.128, + "step": 17620 + }, + { + "epoch": 0.44, + "learning_rate": 0.002335602844006733, + "loss": 0.1229, + "step": 17630 + }, + { + "epoch": 0.44, + "learning_rate": 0.002335225987990855, + "loss": 0.122, + "step": 17640 + }, + { + "epoch": 0.44, + "learning_rate": 0.002334849131974977, + "loss": 0.1308, + "step": 17650 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023344722759590987, + "loss": 0.1234, + "step": 17660 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023340954199432204, + "loss": 0.1256, + "step": 17670 + }, + { + "epoch": 0.44, + "learning_rate": 0.002333718563927342, + "loss": 0.1232, + "step": 17680 + }, + { + "epoch": 0.44, + "learning_rate": 0.002333341707911464, + "loss": 0.1286, + "step": 17690 + }, + { + "epoch": 0.44, + "learning_rate": 0.002332964851895586, + "loss": 0.1266, + "step": 17700 + }, + { + "epoch": 0.44, + "learning_rate": 0.0023325879958797074, + "loss": 0.1291, + "step": 17710 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023322111398638296, + "loss": 0.1222, + "step": 17720 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023318342838479513, + "loss": 0.1305, + "step": 17730 + }, + { + "epoch": 0.45, + "learning_rate": 0.002331457427832073, + "loss": 0.1229, + "step": 17740 + }, + { + "epoch": 0.45, + "learning_rate": 0.002331080571816195, + "loss": 0.1247, + "step": 17750 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023307037158003165, + "loss": 0.1236, + "step": 17760 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023303268597844383, + "loss": 0.1223, + "step": 17770 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023299500037685605, + "loss": 0.1233, + "step": 17780 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023295731477526818, + "loss": 0.1242, + "step": 17790 + }, + { + "epoch": 0.45, + "learning_rate": 0.002329196291736804, + "loss": 0.1234, + "step": 17800 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023288194357209257, + "loss": 0.125, + "step": 17810 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023284425797050474, + "loss": 0.1259, + "step": 17820 + }, + { + "epoch": 0.45, + "learning_rate": 0.002328065723689169, + "loss": 0.1273, + "step": 17830 + }, + { + "epoch": 0.45, + "learning_rate": 0.002327688867673291, + "loss": 0.1222, + "step": 17840 + }, + { + "epoch": 0.45, + "learning_rate": 0.002327312011657413, + "loss": 0.1231, + "step": 17850 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023269351556415344, + "loss": 0.127, + "step": 17860 + }, + { + "epoch": 0.45, + "learning_rate": 0.002326558299625656, + "loss": 0.1236, + "step": 17870 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023261814436097783, + "loss": 0.121, + "step": 17880 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023258045875939, + "loss": 0.1251, + "step": 17890 + }, + { + "epoch": 0.45, + "learning_rate": 0.002325427731578022, + "loss": 0.1245, + "step": 17900 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023250508755621436, + "loss": 0.123, + "step": 17910 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023246740195462653, + "loss": 0.1223, + "step": 17920 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023242971635303875, + "loss": 0.1253, + "step": 17930 + }, + { + "epoch": 0.45, + "learning_rate": 0.002323920307514509, + "loss": 0.1272, + "step": 17940 + }, + { + "epoch": 0.45, + "learning_rate": 0.002323543451498631, + "loss": 0.1252, + "step": 17950 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023231665954827527, + "loss": 0.1234, + "step": 17960 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023227897394668745, + "loss": 0.1189, + "step": 17970 + }, + { + "epoch": 0.45, + "learning_rate": 0.002322412883450996, + "loss": 0.1245, + "step": 17980 + }, + { + "epoch": 0.45, + "learning_rate": 0.002322036027435118, + "loss": 0.126, + "step": 17990 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023216591714192397, + "loss": 0.1274, + "step": 18000 + }, + { + "epoch": 0.45, + "eval_cer": 0.6665598335328033, + "eval_loss": 0.09775370359420776, + "eval_runtime": 90.7418, + "eval_samples_per_second": 110.192, + "eval_steps_per_second": 6.888, + "step": 18000 + }, + { + "epoch": 0.45, + "learning_rate": 0.002321282315403362, + "loss": 0.1237, + "step": 18010 + }, + { + "epoch": 0.45, + "learning_rate": 0.002320905459387483, + "loss": 0.1249, + "step": 18020 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023205286033716054, + "loss": 0.1234, + "step": 18030 + }, + { + "epoch": 0.45, + "learning_rate": 0.002320151747355727, + "loss": 0.1262, + "step": 18040 + }, + { + "epoch": 0.45, + "learning_rate": 0.002319774891339849, + "loss": 0.1243, + "step": 18050 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023193980353239706, + "loss": 0.1269, + "step": 18060 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023190211793080923, + "loss": 0.12, + "step": 18070 + }, + { + "epoch": 0.45, + "learning_rate": 0.002318644323292214, + "loss": 0.123, + "step": 18080 + }, + { + "epoch": 0.45, + "learning_rate": 0.002318267467276336, + "loss": 0.1257, + "step": 18090 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023178906112604576, + "loss": 0.1206, + "step": 18100 + }, + { + "epoch": 0.45, + "learning_rate": 0.0023175137552445798, + "loss": 0.1256, + "step": 18110 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023171368992287015, + "loss": 0.1233, + "step": 18120 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023167600432128233, + "loss": 0.1218, + "step": 18130 + }, + { + "epoch": 0.46, + "learning_rate": 0.002316383187196945, + "loss": 0.1226, + "step": 18140 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023160063311810667, + "loss": 0.1261, + "step": 18150 + }, + { + "epoch": 0.46, + "learning_rate": 0.002315629475165189, + "loss": 0.1266, + "step": 18160 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023152526191493102, + "loss": 0.1251, + "step": 18170 + }, + { + "epoch": 0.46, + "learning_rate": 0.002314875763133432, + "loss": 0.1207, + "step": 18180 + }, + { + "epoch": 0.46, + "learning_rate": 0.002314498907117554, + "loss": 0.1216, + "step": 18190 + }, + { + "epoch": 0.46, + "learning_rate": 0.002314122051101676, + "loss": 0.1245, + "step": 18200 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023137451950857976, + "loss": 0.1237, + "step": 18210 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023133683390699194, + "loss": 0.1242, + "step": 18220 + }, + { + "epoch": 0.46, + "learning_rate": 0.002312991483054041, + "loss": 0.1258, + "step": 18230 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023126146270381633, + "loss": 0.1235, + "step": 18240 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023122377710222846, + "loss": 0.1249, + "step": 18250 + }, + { + "epoch": 0.46, + "learning_rate": 0.002311860915006407, + "loss": 0.1215, + "step": 18260 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023114840589905285, + "loss": 0.1191, + "step": 18270 + }, + { + "epoch": 0.46, + "learning_rate": 0.00231110720297465, + "loss": 0.124, + "step": 18280 + }, + { + "epoch": 0.46, + "learning_rate": 0.002310730346958772, + "loss": 0.118, + "step": 18290 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023103534909428938, + "loss": 0.1242, + "step": 18300 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023099766349270155, + "loss": 0.1194, + "step": 18310 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023095997789111373, + "loss": 0.1201, + "step": 18320 + }, + { + "epoch": 0.46, + "learning_rate": 0.002309222922895259, + "loss": 0.124, + "step": 18330 + }, + { + "epoch": 0.46, + "learning_rate": 0.002308846066879381, + "loss": 0.1186, + "step": 18340 + }, + { + "epoch": 0.46, + "learning_rate": 0.002308469210863503, + "loss": 0.1269, + "step": 18350 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023080923548476247, + "loss": 0.1216, + "step": 18360 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023077154988317464, + "loss": 0.1281, + "step": 18370 + }, + { + "epoch": 0.46, + "learning_rate": 0.002307338642815868, + "loss": 0.1173, + "step": 18380 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023069617867999903, + "loss": 0.1263, + "step": 18390 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023065849307841117, + "loss": 0.1241, + "step": 18400 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023062080747682334, + "loss": 0.1192, + "step": 18410 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023058312187523556, + "loss": 0.1211, + "step": 18420 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023054543627364773, + "loss": 0.1245, + "step": 18430 + }, + { + "epoch": 0.46, + "learning_rate": 0.002305077506720599, + "loss": 0.1278, + "step": 18440 + }, + { + "epoch": 0.46, + "learning_rate": 0.002304700650704721, + "loss": 0.1201, + "step": 18450 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023043237946888426, + "loss": 0.1232, + "step": 18460 + }, + { + "epoch": 0.46, + "learning_rate": 0.0023039469386729643, + "loss": 0.1217, + "step": 18470 + }, + { + "epoch": 0.46, + "learning_rate": 0.002303570082657086, + "loss": 0.1234, + "step": 18480 + }, + { + "epoch": 0.46, + "learning_rate": 0.002303193226641208, + "loss": 0.1227, + "step": 18490 + }, + { + "epoch": 0.46, + "learning_rate": 0.00230281637062533, + "loss": 0.127, + "step": 18500 + }, + { + "epoch": 0.46, + "eval_cer": 0.666954442405632, + "eval_loss": 0.09521838277578354, + "eval_runtime": 90.8104, + "eval_samples_per_second": 110.108, + "eval_steps_per_second": 6.882, + "step": 18500 + }, + { + "epoch": 0.47, + "learning_rate": 0.0023024395146094513, + "loss": 0.1223, + "step": 18510 + }, + { + "epoch": 0.47, + "learning_rate": 0.0023020626585935735, + "loss": 0.1227, + "step": 18520 + }, + { + "epoch": 0.47, + "learning_rate": 0.002301685802577695, + "loss": 0.125, + "step": 18530 + }, + { + "epoch": 0.47, + "learning_rate": 0.002301308946561817, + "loss": 0.1247, + "step": 18540 + }, + { + "epoch": 0.47, + "learning_rate": 0.0023009320905459387, + "loss": 0.123, + "step": 18550 + }, + { + "epoch": 0.47, + "learning_rate": 0.0023005552345300604, + "loss": 0.1183, + "step": 18560 + }, + { + "epoch": 0.47, + "learning_rate": 0.0023001783785141826, + "loss": 0.1241, + "step": 18570 + }, + { + "epoch": 0.47, + "learning_rate": 0.0022998015224983044, + "loss": 0.1171, + "step": 18580 + }, + { + "epoch": 0.47, + "learning_rate": 0.0022994246664824257, + "loss": 0.1219, + "step": 18590 + }, + { + "epoch": 0.47, + "learning_rate": 0.002299047810466548, + "loss": 0.1205, + "step": 18600 + }, + { + "epoch": 0.47, + "learning_rate": 0.0022986709544506696, + "loss": 0.1256, + "step": 18610 + }, + { + "epoch": 0.47, + "learning_rate": 0.0022982940984347913, + "loss": 0.1216, + "step": 18620 + }, + { + "epoch": 0.47, + "learning_rate": 0.002297917242418913, + "loss": 0.1178, + "step": 18630 + }, + { + "epoch": 0.47, + "learning_rate": 0.002297540386403035, + "loss": 0.1251, + "step": 18640 + }, + { + "epoch": 0.47, + "learning_rate": 0.002297163530387157, + "loss": 0.1244, + "step": 18650 + }, + { + "epoch": 0.47, + "learning_rate": 0.0022967866743712788, + "loss": 0.1232, + "step": 18660 + }, + { + "epoch": 0.47, + "learning_rate": 0.0022964098183554005, + "loss": 0.122, + "step": 18670 + }, + { + "epoch": 0.47, + "learning_rate": 0.0022960329623395222, + "loss": 0.1202, + "step": 18680 + }, + { + "epoch": 0.47, + "learning_rate": 0.002295656106323644, + "loss": 0.121, + "step": 18690 + }, + { + "epoch": 0.47, + "learning_rate": 0.0022952792503077657, + "loss": 0.1192, + "step": 18700 + }, + { + "epoch": 0.47, + "learning_rate": 0.0022949023942918875, + "loss": 0.1214, + "step": 18710 + }, + { + "epoch": 0.47, + "learning_rate": 0.0022945255382760092, + "loss": 0.1244, + "step": 18720 + }, + { + "epoch": 0.47, + "learning_rate": 0.0022941486822601314, + "loss": 0.1192, + "step": 18730 + }, + { + "epoch": 0.47, + "learning_rate": 0.0022937718262442527, + "loss": 0.1202, + "step": 18740 + }, + { + "epoch": 0.47, + "learning_rate": 0.002293394970228375, + "loss": 0.1208, + "step": 18750 + }, + { + "epoch": 0.47, + "learning_rate": 0.0022930181142124966, + "loss": 0.1224, + "step": 18760 + }, + { + "epoch": 0.47, + "learning_rate": 0.0022926412581966184, + "loss": 0.1217, + "step": 18770 + }, + { + "epoch": 0.47, + "learning_rate": 0.00229226440218074, + "loss": 0.1192, + "step": 18780 + }, + { + "epoch": 0.47, + "learning_rate": 0.002291887546164862, + "loss": 0.1227, + "step": 18790 + }, + { + "epoch": 0.47, + "learning_rate": 0.002291510690148984, + "loss": 0.1202, + "step": 18800 + }, + { + "epoch": 0.47, + "learning_rate": 0.002291133834133106, + "loss": 0.1191, + "step": 18810 + }, + { + "epoch": 0.47, + "learning_rate": 0.002290756978117227, + "loss": 0.1211, + "step": 18820 + }, + { + "epoch": 0.47, + "learning_rate": 0.0022903801221013493, + "loss": 0.1165, + "step": 18830 + }, + { + "epoch": 0.47, + "learning_rate": 0.002290003266085471, + "loss": 0.1223, + "step": 18840 + }, + { + "epoch": 0.47, + "learning_rate": 0.0022896264100695928, + "loss": 0.1191, + "step": 18850 + }, + { + "epoch": 0.47, + "learning_rate": 0.0022892495540537145, + "loss": 0.1233, + "step": 18860 + }, + { + "epoch": 0.47, + "learning_rate": 0.0022888726980378363, + "loss": 0.1229, + "step": 18870 + }, + { + "epoch": 0.47, + "learning_rate": 0.0022884958420219584, + "loss": 0.1229, + "step": 18880 + }, + { + "epoch": 0.47, + "learning_rate": 0.00228811898600608, + "loss": 0.1148, + "step": 18890 + }, + { + "epoch": 0.47, + "learning_rate": 0.0022877421299902015, + "loss": 0.122, + "step": 18900 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022873652739743237, + "loss": 0.1173, + "step": 18910 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022869884179584454, + "loss": 0.1202, + "step": 18920 + }, + { + "epoch": 0.48, + "learning_rate": 0.002286611561942567, + "loss": 0.1187, + "step": 18930 + }, + { + "epoch": 0.48, + "learning_rate": 0.002286234705926689, + "loss": 0.1185, + "step": 18940 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022858578499108106, + "loss": 0.1197, + "step": 18950 + }, + { + "epoch": 0.48, + "learning_rate": 0.002285480993894933, + "loss": 0.1194, + "step": 18960 + }, + { + "epoch": 0.48, + "learning_rate": 0.002285104137879054, + "loss": 0.1173, + "step": 18970 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022847272818631763, + "loss": 0.1204, + "step": 18980 + }, + { + "epoch": 0.48, + "learning_rate": 0.002284350425847298, + "loss": 0.122, + "step": 18990 + }, + { + "epoch": 0.48, + "learning_rate": 0.00228397356983142, + "loss": 0.1218, + "step": 19000 + }, + { + "epoch": 0.48, + "eval_cer": 0.6666175811727294, + "eval_loss": 0.09327735006809235, + "eval_runtime": 90.7107, + "eval_samples_per_second": 110.23, + "eval_steps_per_second": 6.89, + "step": 19000 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022835967138155415, + "loss": 0.1221, + "step": 19010 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022832198577996633, + "loss": 0.116, + "step": 19020 + }, + { + "epoch": 0.48, + "learning_rate": 0.002282843001783785, + "loss": 0.1177, + "step": 19030 + }, + { + "epoch": 0.48, + "learning_rate": 0.002282466145767907, + "loss": 0.1163, + "step": 19040 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022820892897520285, + "loss": 0.1187, + "step": 19050 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022817124337361507, + "loss": 0.1194, + "step": 19060 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022813355777202724, + "loss": 0.1258, + "step": 19070 + }, + { + "epoch": 0.48, + "learning_rate": 0.002280958721704394, + "loss": 0.1166, + "step": 19080 + }, + { + "epoch": 0.48, + "learning_rate": 0.002280581865688516, + "loss": 0.1228, + "step": 19090 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022802050096726377, + "loss": 0.1203, + "step": 19100 + }, + { + "epoch": 0.48, + "learning_rate": 0.00227982815365676, + "loss": 0.1189, + "step": 19110 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022794512976408816, + "loss": 0.122, + "step": 19120 + }, + { + "epoch": 0.48, + "learning_rate": 0.002279074441625003, + "loss": 0.124, + "step": 19130 + }, + { + "epoch": 0.48, + "learning_rate": 0.002278697585609125, + "loss": 0.1167, + "step": 19140 + }, + { + "epoch": 0.48, + "learning_rate": 0.002278320729593247, + "loss": 0.1135, + "step": 19150 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022779438735773686, + "loss": 0.1167, + "step": 19160 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022775670175614903, + "loss": 0.1166, + "step": 19170 + }, + { + "epoch": 0.48, + "learning_rate": 0.002277190161545612, + "loss": 0.121, + "step": 19180 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022768133055297343, + "loss": 0.1165, + "step": 19190 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022764364495138556, + "loss": 0.1173, + "step": 19200 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022760595934979777, + "loss": 0.1213, + "step": 19210 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022756827374820995, + "loss": 0.1188, + "step": 19220 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022753058814662212, + "loss": 0.1217, + "step": 19230 + }, + { + "epoch": 0.48, + "learning_rate": 0.002274929025450343, + "loss": 0.1161, + "step": 19240 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022745521694344647, + "loss": 0.1178, + "step": 19250 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022741753134185865, + "loss": 0.1174, + "step": 19260 + }, + { + "epoch": 0.48, + "learning_rate": 0.0022737984574027086, + "loss": 0.1216, + "step": 19270 + }, + { + "epoch": 0.48, + "learning_rate": 0.00227342160138683, + "loss": 0.1221, + "step": 19280 + }, + { + "epoch": 0.48, + "learning_rate": 0.002273044745370952, + "loss": 0.1164, + "step": 19290 + }, + { + "epoch": 0.48, + "learning_rate": 0.002272667889355074, + "loss": 0.1192, + "step": 19300 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022722910333391956, + "loss": 0.1179, + "step": 19310 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022719141773233174, + "loss": 0.1218, + "step": 19320 + }, + { + "epoch": 0.49, + "learning_rate": 0.002271537321307439, + "loss": 0.1203, + "step": 19330 + }, + { + "epoch": 0.49, + "learning_rate": 0.002271160465291561, + "loss": 0.1147, + "step": 19340 + }, + { + "epoch": 0.49, + "learning_rate": 0.002270783609275683, + "loss": 0.1206, + "step": 19350 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022704067532598043, + "loss": 0.1198, + "step": 19360 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022700298972439265, + "loss": 0.1178, + "step": 19370 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022696530412280483, + "loss": 0.1152, + "step": 19380 + }, + { + "epoch": 0.49, + "learning_rate": 0.00226927618521217, + "loss": 0.1182, + "step": 19390 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022688993291962918, + "loss": 0.1174, + "step": 19400 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022685224731804135, + "loss": 0.1188, + "step": 19410 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022681456171645357, + "loss": 0.1168, + "step": 19420 + }, + { + "epoch": 0.49, + "learning_rate": 0.002267768761148657, + "loss": 0.1203, + "step": 19430 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022673919051327787, + "loss": 0.1236, + "step": 19440 + }, + { + "epoch": 0.49, + "learning_rate": 0.002267015049116901, + "loss": 0.1227, + "step": 19450 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022666381931010227, + "loss": 0.1164, + "step": 19460 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022662613370851444, + "loss": 0.117, + "step": 19470 + }, + { + "epoch": 0.49, + "learning_rate": 0.002265884481069266, + "loss": 0.117, + "step": 19480 + }, + { + "epoch": 0.49, + "learning_rate": 0.002265507625053388, + "loss": 0.1143, + "step": 19490 + }, + { + "epoch": 0.49, + "learning_rate": 0.00226513076903751, + "loss": 0.1196, + "step": 19500 + }, + { + "epoch": 0.49, + "eval_cer": 0.6669568485572955, + "eval_loss": 0.09227263927459717, + "eval_runtime": 90.7185, + "eval_samples_per_second": 110.22, + "eval_steps_per_second": 6.889, + "step": 19500 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022647539130216314, + "loss": 0.1182, + "step": 19510 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022643770570057536, + "loss": 0.1229, + "step": 19520 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022640002009898753, + "loss": 0.119, + "step": 19530 + }, + { + "epoch": 0.49, + "learning_rate": 0.002263623344973997, + "loss": 0.1206, + "step": 19540 + }, + { + "epoch": 0.49, + "learning_rate": 0.002263246488958119, + "loss": 0.1215, + "step": 19550 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022628696329422405, + "loss": 0.1164, + "step": 19560 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022624927769263623, + "loss": 0.1196, + "step": 19570 + }, + { + "epoch": 0.49, + "learning_rate": 0.002262115920910484, + "loss": 0.1197, + "step": 19580 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022617390648946058, + "loss": 0.1172, + "step": 19590 + }, + { + "epoch": 0.49, + "learning_rate": 0.002261362208878728, + "loss": 0.12, + "step": 19600 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022609853528628497, + "loss": 0.1218, + "step": 19610 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022606084968469714, + "loss": 0.1144, + "step": 19620 + }, + { + "epoch": 0.49, + "learning_rate": 0.002260231640831093, + "loss": 0.1146, + "step": 19630 + }, + { + "epoch": 0.49, + "learning_rate": 0.002259854784815215, + "loss": 0.1174, + "step": 19640 + }, + { + "epoch": 0.49, + "learning_rate": 0.002259477928799337, + "loss": 0.1192, + "step": 19650 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022591010727834584, + "loss": 0.1187, + "step": 19660 + }, + { + "epoch": 0.49, + "learning_rate": 0.00225872421676758, + "loss": 0.1168, + "step": 19670 + }, + { + "epoch": 0.49, + "learning_rate": 0.0022583473607517023, + "loss": 0.1135, + "step": 19680 + }, + { + "epoch": 0.49, + "learning_rate": 0.002257970504735824, + "loss": 0.1226, + "step": 19690 + }, + { + "epoch": 0.49, + "learning_rate": 0.002257593648719946, + "loss": 0.1168, + "step": 19700 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022572167927040676, + "loss": 0.1186, + "step": 19710 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022568399366881893, + "loss": 0.1157, + "step": 19720 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022564630806723115, + "loss": 0.12, + "step": 19730 + }, + { + "epoch": 0.5, + "learning_rate": 0.002256086224656433, + "loss": 0.1199, + "step": 19740 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022557093686405546, + "loss": 0.1184, + "step": 19750 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022553325126246767, + "loss": 0.1196, + "step": 19760 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022549556566087985, + "loss": 0.1181, + "step": 19770 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022545788005929202, + "loss": 0.12, + "step": 19780 + }, + { + "epoch": 0.5, + "learning_rate": 0.002254201944577042, + "loss": 0.1205, + "step": 19790 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022538250885611637, + "loss": 0.1222, + "step": 19800 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022534482325452855, + "loss": 0.1145, + "step": 19810 + }, + { + "epoch": 0.5, + "learning_rate": 0.002253071376529407, + "loss": 0.1165, + "step": 19820 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022526945205135294, + "loss": 0.1159, + "step": 19830 + }, + { + "epoch": 0.5, + "learning_rate": 0.002252317664497651, + "loss": 0.1232, + "step": 19840 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022519408084817724, + "loss": 0.1218, + "step": 19850 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022515639524658946, + "loss": 0.1184, + "step": 19860 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022511870964500164, + "loss": 0.122, + "step": 19870 + }, + { + "epoch": 0.5, + "learning_rate": 0.002250810240434138, + "loss": 0.1124, + "step": 19880 + }, + { + "epoch": 0.5, + "learning_rate": 0.00225043338441826, + "loss": 0.1178, + "step": 19890 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022500565284023816, + "loss": 0.1173, + "step": 19900 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022496796723865038, + "loss": 0.1223, + "step": 19910 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022493028163706255, + "loss": 0.1175, + "step": 19920 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022489259603547473, + "loss": 0.1188, + "step": 19930 + }, + { + "epoch": 0.5, + "learning_rate": 0.002248549104338869, + "loss": 0.1198, + "step": 19940 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022481722483229907, + "loss": 0.1179, + "step": 19950 + }, + { + "epoch": 0.5, + "learning_rate": 0.002247795392307113, + "loss": 0.1201, + "step": 19960 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022474185362912342, + "loss": 0.1225, + "step": 19970 + }, + { + "epoch": 0.5, + "learning_rate": 0.002247041680275356, + "loss": 0.1212, + "step": 19980 + }, + { + "epoch": 0.5, + "learning_rate": 0.002246664824259478, + "loss": 0.1194, + "step": 19990 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022462879682436, + "loss": 0.1192, + "step": 20000 + }, + { + "epoch": 0.5, + "eval_cer": 0.6664963111288845, + "eval_loss": 0.092043936252594, + "eval_runtime": 90.451, + "eval_samples_per_second": 110.546, + "eval_steps_per_second": 6.91, + "step": 20000 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022459111122277216, + "loss": 0.1115, + "step": 20010 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022455342562118434, + "loss": 0.1164, + "step": 20020 + }, + { + "epoch": 0.5, + "learning_rate": 0.002245157400195965, + "loss": 0.1172, + "step": 20030 + }, + { + "epoch": 0.5, + "learning_rate": 0.002244780544180087, + "loss": 0.1178, + "step": 20040 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022444036881642086, + "loss": 0.1159, + "step": 20050 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022440268321483304, + "loss": 0.1169, + "step": 20060 + }, + { + "epoch": 0.5, + "learning_rate": 0.0022436499761324525, + "loss": 0.1225, + "step": 20070 + }, + { + "epoch": 0.5, + "learning_rate": 0.002243273120116574, + "loss": 0.1197, + "step": 20080 + }, + { + "epoch": 0.5, + "learning_rate": 0.002242896264100696, + "loss": 0.1165, + "step": 20090 + }, + { + "epoch": 0.5, + "learning_rate": 0.002242519408084818, + "loss": 0.1179, + "step": 20100 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022421425520689395, + "loss": 0.1151, + "step": 20110 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022417656960530613, + "loss": 0.1182, + "step": 20120 + }, + { + "epoch": 0.51, + "learning_rate": 0.002241388840037183, + "loss": 0.1153, + "step": 20130 + }, + { + "epoch": 0.51, + "learning_rate": 0.002241011984021305, + "loss": 0.1169, + "step": 20140 + }, + { + "epoch": 0.51, + "learning_rate": 0.002240635128005427, + "loss": 0.1147, + "step": 20150 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022402582719895483, + "loss": 0.1198, + "step": 20160 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022398814159736704, + "loss": 0.1145, + "step": 20170 + }, + { + "epoch": 0.51, + "learning_rate": 0.002239504559957792, + "loss": 0.1199, + "step": 20180 + }, + { + "epoch": 0.51, + "learning_rate": 0.002239127703941914, + "loss": 0.1185, + "step": 20190 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022387508479260357, + "loss": 0.1161, + "step": 20200 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022383739919101574, + "loss": 0.1151, + "step": 20210 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022379971358942796, + "loss": 0.1166, + "step": 20220 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022376202798784013, + "loss": 0.1154, + "step": 20230 + }, + { + "epoch": 0.51, + "learning_rate": 0.002237243423862523, + "loss": 0.113, + "step": 20240 + }, + { + "epoch": 0.51, + "learning_rate": 0.002236866567846645, + "loss": 0.117, + "step": 20250 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022364897118307666, + "loss": 0.1133, + "step": 20260 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022361128558148883, + "loss": 0.1151, + "step": 20270 + }, + { + "epoch": 0.51, + "learning_rate": 0.00223573599979901, + "loss": 0.1179, + "step": 20280 + }, + { + "epoch": 0.51, + "learning_rate": 0.002235359143783132, + "loss": 0.1155, + "step": 20290 + }, + { + "epoch": 0.51, + "learning_rate": 0.002234982287767254, + "loss": 0.1183, + "step": 20300 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022346054317513753, + "loss": 0.1147, + "step": 20310 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022342285757354975, + "loss": 0.1121, + "step": 20320 + }, + { + "epoch": 0.51, + "learning_rate": 0.002233851719719619, + "loss": 0.1151, + "step": 20330 + }, + { + "epoch": 0.51, + "learning_rate": 0.002233474863703741, + "loss": 0.1132, + "step": 20340 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022330980076878627, + "loss": 0.112, + "step": 20350 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022327211516719844, + "loss": 0.117, + "step": 20360 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022323442956561066, + "loss": 0.1193, + "step": 20370 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022319674396402284, + "loss": 0.1169, + "step": 20380 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022315905836243497, + "loss": 0.1149, + "step": 20390 + }, + { + "epoch": 0.51, + "learning_rate": 0.002231213727608472, + "loss": 0.117, + "step": 20400 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022308368715925936, + "loss": 0.1156, + "step": 20410 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022304600155767153, + "loss": 0.1151, + "step": 20420 + }, + { + "epoch": 0.51, + "learning_rate": 0.002230083159560837, + "loss": 0.1175, + "step": 20430 + }, + { + "epoch": 0.51, + "learning_rate": 0.002229706303544959, + "loss": 0.1186, + "step": 20440 + }, + { + "epoch": 0.51, + "learning_rate": 0.002229329447529081, + "loss": 0.1189, + "step": 20450 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022289525915132028, + "loss": 0.1145, + "step": 20460 + }, + { + "epoch": 0.51, + "learning_rate": 0.002228575735497324, + "loss": 0.1116, + "step": 20470 + }, + { + "epoch": 0.51, + "learning_rate": 0.0022281988794814462, + "loss": 0.1133, + "step": 20480 + }, + { + "epoch": 0.51, + "learning_rate": 0.002227822023465568, + "loss": 0.1166, + "step": 20490 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022274451674496897, + "loss": 0.1171, + "step": 20500 + }, + { + "epoch": 0.52, + "eval_cer": 0.6664255702699751, + "eval_loss": 0.09097065031528473, + "eval_runtime": 90.5473, + "eval_samples_per_second": 110.428, + "eval_steps_per_second": 6.902, + "step": 20500 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022270683114338115, + "loss": 0.1169, + "step": 20510 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022266914554179332, + "loss": 0.1147, + "step": 20520 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022263145994020554, + "loss": 0.1185, + "step": 20530 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022259377433861767, + "loss": 0.1151, + "step": 20540 + }, + { + "epoch": 0.52, + "learning_rate": 0.002225560887370299, + "loss": 0.1262, + "step": 20550 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022251840313544206, + "loss": 0.1153, + "step": 20560 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022248071753385424, + "loss": 0.1152, + "step": 20570 + }, + { + "epoch": 0.52, + "learning_rate": 0.002224430319322664, + "loss": 0.116, + "step": 20580 + }, + { + "epoch": 0.52, + "learning_rate": 0.002224053463306786, + "loss": 0.1174, + "step": 20590 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022236766072909076, + "loss": 0.1168, + "step": 20600 + }, + { + "epoch": 0.52, + "learning_rate": 0.00222329975127503, + "loss": 0.1212, + "step": 20610 + }, + { + "epoch": 0.52, + "learning_rate": 0.002222922895259151, + "loss": 0.1179, + "step": 20620 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022225460392432733, + "loss": 0.1173, + "step": 20630 + }, + { + "epoch": 0.52, + "learning_rate": 0.002222169183227395, + "loss": 0.1177, + "step": 20640 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022217923272115168, + "loss": 0.1143, + "step": 20650 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022214154711956385, + "loss": 0.1165, + "step": 20660 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022210386151797603, + "loss": 0.1171, + "step": 20670 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022206617591638824, + "loss": 0.1179, + "step": 20680 + }, + { + "epoch": 0.52, + "learning_rate": 0.002220284903148004, + "loss": 0.1132, + "step": 20690 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022199080471321255, + "loss": 0.1157, + "step": 20700 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022195311911162477, + "loss": 0.1183, + "step": 20710 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022191543351003694, + "loss": 0.1109, + "step": 20720 + }, + { + "epoch": 0.52, + "learning_rate": 0.002218777479084491, + "loss": 0.1149, + "step": 20730 + }, + { + "epoch": 0.52, + "learning_rate": 0.002218400623068613, + "loss": 0.1176, + "step": 20740 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022180237670527347, + "loss": 0.1171, + "step": 20750 + }, + { + "epoch": 0.52, + "learning_rate": 0.002217646911036857, + "loss": 0.1141, + "step": 20760 + }, + { + "epoch": 0.52, + "learning_rate": 0.002217270055020978, + "loss": 0.1177, + "step": 20770 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022168931990051003, + "loss": 0.1168, + "step": 20780 + }, + { + "epoch": 0.52, + "learning_rate": 0.002216516342989222, + "loss": 0.1154, + "step": 20790 + }, + { + "epoch": 0.52, + "learning_rate": 0.002216139486973344, + "loss": 0.117, + "step": 20800 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022157626309574656, + "loss": 0.1117, + "step": 20810 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022153857749415873, + "loss": 0.1193, + "step": 20820 + }, + { + "epoch": 0.52, + "learning_rate": 0.002215008918925709, + "loss": 0.1155, + "step": 20830 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022146320629098312, + "loss": 0.1168, + "step": 20840 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022142552068939525, + "loss": 0.1174, + "step": 20850 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022138783508780747, + "loss": 0.1157, + "step": 20860 + }, + { + "epoch": 0.52, + "learning_rate": 0.0022135014948621965, + "loss": 0.1179, + "step": 20870 + }, + { + "epoch": 0.52, + "learning_rate": 0.002213124638846318, + "loss": 0.1193, + "step": 20880 + }, + { + "epoch": 0.52, + "learning_rate": 0.00221274778283044, + "loss": 0.1098, + "step": 20890 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022123709268145617, + "loss": 0.1113, + "step": 20900 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022119940707986834, + "loss": 0.1159, + "step": 20910 + }, + { + "epoch": 0.53, + "learning_rate": 0.002211617214782805, + "loss": 0.115, + "step": 20920 + }, + { + "epoch": 0.53, + "learning_rate": 0.002211240358766927, + "loss": 0.1144, + "step": 20930 + }, + { + "epoch": 0.53, + "learning_rate": 0.002210863502751049, + "loss": 0.1148, + "step": 20940 + }, + { + "epoch": 0.53, + "learning_rate": 0.002210486646735171, + "loss": 0.1135, + "step": 20950 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022101097907192926, + "loss": 0.1133, + "step": 20960 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022097329347034143, + "loss": 0.1146, + "step": 20970 + }, + { + "epoch": 0.53, + "learning_rate": 0.002209356078687536, + "loss": 0.1112, + "step": 20980 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022089792226716583, + "loss": 0.1161, + "step": 20990 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022086023666557796, + "loss": 0.1153, + "step": 21000 + }, + { + "epoch": 0.53, + "eval_cer": 0.6667460696715651, + "eval_loss": 0.09056726843118668, + "eval_runtime": 90.5012, + "eval_samples_per_second": 110.485, + "eval_steps_per_second": 6.906, + "step": 21000 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022082255106399013, + "loss": 0.1174, + "step": 21010 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022078486546240235, + "loss": 0.1156, + "step": 21020 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022074717986081452, + "loss": 0.1146, + "step": 21030 + }, + { + "epoch": 0.53, + "learning_rate": 0.002207094942592267, + "loss": 0.1141, + "step": 21040 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022067180865763887, + "loss": 0.1204, + "step": 21050 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022063412305605105, + "loss": 0.1143, + "step": 21060 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022059643745446327, + "loss": 0.1137, + "step": 21070 + }, + { + "epoch": 0.53, + "learning_rate": 0.002205587518528754, + "loss": 0.1142, + "step": 21080 + }, + { + "epoch": 0.53, + "learning_rate": 0.002205210662512876, + "loss": 0.1162, + "step": 21090 + }, + { + "epoch": 0.53, + "learning_rate": 0.002204833806496998, + "loss": 0.1157, + "step": 21100 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022044569504811196, + "loss": 0.1174, + "step": 21110 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022040800944652414, + "loss": 0.1144, + "step": 21120 + }, + { + "epoch": 0.53, + "learning_rate": 0.002203703238449363, + "loss": 0.1112, + "step": 21130 + }, + { + "epoch": 0.53, + "learning_rate": 0.002203326382433485, + "loss": 0.1166, + "step": 21140 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022029495264176066, + "loss": 0.1152, + "step": 21150 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022025726704017284, + "loss": 0.1105, + "step": 21160 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022021958143858505, + "loss": 0.1146, + "step": 21170 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022018189583699723, + "loss": 0.1094, + "step": 21180 + }, + { + "epoch": 0.53, + "learning_rate": 0.002201442102354094, + "loss": 0.1152, + "step": 21190 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022010652463382158, + "loss": 0.1148, + "step": 21200 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022006883903223375, + "loss": 0.1176, + "step": 21210 + }, + { + "epoch": 0.53, + "learning_rate": 0.0022003115343064597, + "loss": 0.115, + "step": 21220 + }, + { + "epoch": 0.53, + "learning_rate": 0.002199934678290581, + "loss": 0.1175, + "step": 21230 + }, + { + "epoch": 0.53, + "learning_rate": 0.0021995578222747027, + "loss": 0.1085, + "step": 21240 + }, + { + "epoch": 0.53, + "learning_rate": 0.002199180966258825, + "loss": 0.119, + "step": 21250 + }, + { + "epoch": 0.53, + "learning_rate": 0.0021988041102429467, + "loss": 0.1126, + "step": 21260 + }, + { + "epoch": 0.53, + "learning_rate": 0.0021984272542270684, + "loss": 0.1117, + "step": 21270 + }, + { + "epoch": 0.53, + "learning_rate": 0.00219805039821119, + "loss": 0.1146, + "step": 21280 + }, + { + "epoch": 0.53, + "learning_rate": 0.002197673542195312, + "loss": 0.1172, + "step": 21290 + }, + { + "epoch": 0.54, + "learning_rate": 0.002197296686179434, + "loss": 0.1111, + "step": 21300 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021969198301635554, + "loss": 0.113, + "step": 21310 + }, + { + "epoch": 0.54, + "learning_rate": 0.002196542974147677, + "loss": 0.1072, + "step": 21320 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021961661181317993, + "loss": 0.1112, + "step": 21330 + }, + { + "epoch": 0.54, + "learning_rate": 0.002195789262115921, + "loss": 0.1138, + "step": 21340 + }, + { + "epoch": 0.54, + "learning_rate": 0.002195412406100043, + "loss": 0.1179, + "step": 21350 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021950355500841645, + "loss": 0.1125, + "step": 21360 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021946586940682863, + "loss": 0.116, + "step": 21370 + }, + { + "epoch": 0.54, + "learning_rate": 0.002194281838052408, + "loss": 0.1137, + "step": 21380 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021939049820365298, + "loss": 0.1113, + "step": 21390 + }, + { + "epoch": 0.54, + "learning_rate": 0.002193528126020652, + "loss": 0.1131, + "step": 21400 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021931512700047737, + "loss": 0.1159, + "step": 21410 + }, + { + "epoch": 0.54, + "learning_rate": 0.002192774413988895, + "loss": 0.1164, + "step": 21420 + }, + { + "epoch": 0.54, + "learning_rate": 0.002192397557973017, + "loss": 0.1153, + "step": 21430 + }, + { + "epoch": 0.54, + "learning_rate": 0.002192020701957139, + "loss": 0.1154, + "step": 21440 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021916438459412607, + "loss": 0.1124, + "step": 21450 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021912669899253824, + "loss": 0.1153, + "step": 21460 + }, + { + "epoch": 0.54, + "learning_rate": 0.002190890133909504, + "loss": 0.116, + "step": 21470 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021905132778936263, + "loss": 0.1127, + "step": 21480 + }, + { + "epoch": 0.54, + "learning_rate": 0.002190136421877748, + "loss": 0.1138, + "step": 21490 + }, + { + "epoch": 0.54, + "learning_rate": 0.00218975956586187, + "loss": 0.1102, + "step": 21500 + }, + { + "epoch": 0.54, + "eval_cer": 0.6668567526480902, + "eval_loss": 0.08902458846569061, + "eval_runtime": 90.6566, + "eval_samples_per_second": 110.295, + "eval_steps_per_second": 6.894, + "step": 21500 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021893827098459916, + "loss": 0.1131, + "step": 21510 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021890058538301133, + "loss": 0.1157, + "step": 21520 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021886289978142355, + "loss": 0.1149, + "step": 21530 + }, + { + "epoch": 0.54, + "learning_rate": 0.002188252141798357, + "loss": 0.1186, + "step": 21540 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021878752857824786, + "loss": 0.1136, + "step": 21550 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021874984297666007, + "loss": 0.1118, + "step": 21560 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021871215737507225, + "loss": 0.1162, + "step": 21570 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021867447177348442, + "loss": 0.1141, + "step": 21580 + }, + { + "epoch": 0.54, + "learning_rate": 0.002186367861718966, + "loss": 0.1146, + "step": 21590 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021859910057030877, + "loss": 0.1196, + "step": 21600 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021856141496872095, + "loss": 0.114, + "step": 21610 + }, + { + "epoch": 0.54, + "learning_rate": 0.002185237293671331, + "loss": 0.1138, + "step": 21620 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021848604376554534, + "loss": 0.1109, + "step": 21630 + }, + { + "epoch": 0.54, + "learning_rate": 0.002184483581639575, + "loss": 0.109, + "step": 21640 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021841067256236964, + "loss": 0.1119, + "step": 21650 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021837298696078186, + "loss": 0.1158, + "step": 21660 + }, + { + "epoch": 0.54, + "learning_rate": 0.0021833530135919404, + "loss": 0.1173, + "step": 21670 + }, + { + "epoch": 0.54, + "learning_rate": 0.002182976157576062, + "loss": 0.1134, + "step": 21680 + }, + { + "epoch": 0.54, + "learning_rate": 0.002182599301560184, + "loss": 0.114, + "step": 21690 + }, + { + "epoch": 0.55, + "learning_rate": 0.0021822224455443056, + "loss": 0.1112, + "step": 21700 + }, + { + "epoch": 0.55, + "learning_rate": 0.0021818455895284278, + "loss": 0.1179, + "step": 21710 + }, + { + "epoch": 0.55, + "learning_rate": 0.0021814687335125495, + "loss": 0.1152, + "step": 21720 + }, + { + "epoch": 0.55, + "learning_rate": 0.002181091877496671, + "loss": 0.1151, + "step": 21730 + }, + { + "epoch": 0.55, + "learning_rate": 0.002180715021480793, + "loss": 0.1141, + "step": 21740 + }, + { + "epoch": 0.55, + "learning_rate": 0.0021803381654649148, + "loss": 0.109, + "step": 21750 + }, + { + "epoch": 0.55, + "learning_rate": 0.0021799613094490365, + "loss": 0.1111, + "step": 21760 + }, + { + "epoch": 0.55, + "learning_rate": 0.0021795844534331582, + "loss": 0.1145, + "step": 21770 + }, + { + "epoch": 0.55, + "learning_rate": 0.00217920759741728, + "loss": 0.1118, + "step": 21780 + }, + { + "epoch": 0.55, + "learning_rate": 0.002178830741401402, + "loss": 0.1116, + "step": 21790 + }, + { + "epoch": 0.55, + "learning_rate": 0.002178453885385524, + "loss": 0.1155, + "step": 21800 + }, + { + "epoch": 0.55, + "learning_rate": 0.0021780770293696457, + "loss": 0.1132, + "step": 21810 + }, + { + "epoch": 0.55, + "learning_rate": 0.0021777001733537674, + "loss": 0.1149, + "step": 21820 + }, + { + "epoch": 0.55, + "learning_rate": 0.002177323317337889, + "loss": 0.1104, + "step": 21830 + }, + { + "epoch": 0.55, + "learning_rate": 0.002176946461322011, + "loss": 0.1162, + "step": 21840 + }, + { + "epoch": 0.55, + "learning_rate": 0.0021765696053061326, + "loss": 0.1115, + "step": 21850 + }, + { + "epoch": 0.55, + "learning_rate": 0.0021761927492902544, + "loss": 0.1138, + "step": 21860 + }, + { + "epoch": 0.55, + "learning_rate": 0.0021758158932743766, + "loss": 0.1107, + "step": 21870 + }, + { + "epoch": 0.55, + "learning_rate": 0.002175439037258498, + "loss": 0.1108, + "step": 21880 + }, + { + "epoch": 0.55, + "learning_rate": 0.00217506218124262, + "loss": 0.1127, + "step": 21890 + }, + { + "epoch": 0.55, + "learning_rate": 0.002174685325226742, + "loss": 0.1157, + "step": 21900 + }, + { + "epoch": 0.55, + "learning_rate": 0.0021743084692108635, + "loss": 0.1102, + "step": 21910 + }, + { + "epoch": 0.55, + "learning_rate": 0.0021739316131949853, + "loss": 0.1119, + "step": 21920 + }, + { + "epoch": 0.55, + "learning_rate": 0.002173554757179107, + "loss": 0.1193, + "step": 21930 + }, + { + "epoch": 0.55, + "learning_rate": 0.002173177901163229, + "loss": 0.1146, + "step": 21940 + }, + { + "epoch": 0.55, + "learning_rate": 0.002172801045147351, + "loss": 0.1112, + "step": 21950 + }, + { + "epoch": 0.55, + "learning_rate": 0.0021724241891314723, + "loss": 0.1088, + "step": 21960 + }, + { + "epoch": 0.55, + "learning_rate": 0.0021720473331155944, + "loss": 0.1114, + "step": 21970 + }, + { + "epoch": 0.55, + "learning_rate": 0.002171670477099716, + "loss": 0.1147, + "step": 21980 + }, + { + "epoch": 0.55, + "learning_rate": 0.002171293621083838, + "loss": 0.1102, + "step": 21990 + }, + { + "epoch": 0.55, + "learning_rate": 0.0021709167650679597, + "loss": 0.1147, + "step": 22000 + }, + { + "epoch": 0.55, + "eval_cer": 0.666688322031639, + "eval_loss": 0.08858127146959305, + "eval_runtime": 90.7851, + "eval_samples_per_second": 110.139, + "eval_steps_per_second": 6.884, + "step": 22000 + }, + { + "epoch": 0.55, + "learning_rate": 0.0021705399090520814, + "loss": 0.1154, + "step": 22010 + }, + { + "epoch": 0.55, + "learning_rate": 0.0021701630530362036, + "loss": 0.1173, + "step": 22020 + }, + { + "epoch": 0.55, + "learning_rate": 0.002169786197020325, + "loss": 0.1106, + "step": 22030 + }, + { + "epoch": 0.55, + "learning_rate": 0.002169409341004447, + "loss": 0.1111, + "step": 22040 + }, + { + "epoch": 0.55, + "learning_rate": 0.002169032484988569, + "loss": 0.1086, + "step": 22050 + }, + { + "epoch": 0.55, + "learning_rate": 0.0021686556289726906, + "loss": 0.1112, + "step": 22060 + }, + { + "epoch": 0.55, + "learning_rate": 0.0021682787729568123, + "loss": 0.1127, + "step": 22070 + }, + { + "epoch": 0.55, + "learning_rate": 0.002167901916940934, + "loss": 0.1103, + "step": 22080 + }, + { + "epoch": 0.55, + "learning_rate": 0.002167525060925056, + "loss": 0.1123, + "step": 22090 + }, + { + "epoch": 0.56, + "learning_rate": 0.002167148204909178, + "loss": 0.1105, + "step": 22100 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021667713488932993, + "loss": 0.1101, + "step": 22110 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021663944928774215, + "loss": 0.1088, + "step": 22120 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021660176368615432, + "loss": 0.1128, + "step": 22130 + }, + { + "epoch": 0.56, + "learning_rate": 0.002165640780845665, + "loss": 0.1125, + "step": 22140 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021652639248297867, + "loss": 0.1112, + "step": 22150 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021648870688139085, + "loss": 0.1094, + "step": 22160 + }, + { + "epoch": 0.56, + "learning_rate": 0.00216451021279803, + "loss": 0.1132, + "step": 22170 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021641333567821524, + "loss": 0.1107, + "step": 22180 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021637565007662737, + "loss": 0.1138, + "step": 22190 + }, + { + "epoch": 0.56, + "learning_rate": 0.002163379644750396, + "loss": 0.1144, + "step": 22200 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021630027887345176, + "loss": 0.1129, + "step": 22210 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021626259327186394, + "loss": 0.1146, + "step": 22220 + }, + { + "epoch": 0.56, + "learning_rate": 0.002162249076702761, + "loss": 0.1131, + "step": 22230 + }, + { + "epoch": 0.56, + "learning_rate": 0.002161872220686883, + "loss": 0.1155, + "step": 22240 + }, + { + "epoch": 0.56, + "learning_rate": 0.002161495364671005, + "loss": 0.108, + "step": 22250 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021611185086551263, + "loss": 0.1088, + "step": 22260 + }, + { + "epoch": 0.56, + "learning_rate": 0.002160741652639248, + "loss": 0.1103, + "step": 22270 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021603647966233703, + "loss": 0.1099, + "step": 22280 + }, + { + "epoch": 0.56, + "learning_rate": 0.002159987940607492, + "loss": 0.1122, + "step": 22290 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021596110845916137, + "loss": 0.1144, + "step": 22300 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021592342285757355, + "loss": 0.1127, + "step": 22310 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021588573725598572, + "loss": 0.1123, + "step": 22320 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021584805165439794, + "loss": 0.1154, + "step": 22330 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021581036605281007, + "loss": 0.1109, + "step": 22340 + }, + { + "epoch": 0.56, + "learning_rate": 0.002157726804512223, + "loss": 0.1111, + "step": 22350 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021573499484963446, + "loss": 0.1085, + "step": 22360 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021569730924804664, + "loss": 0.1093, + "step": 22370 + }, + { + "epoch": 0.56, + "learning_rate": 0.002156596236464588, + "loss": 0.1126, + "step": 22380 + }, + { + "epoch": 0.56, + "learning_rate": 0.00215621938044871, + "loss": 0.1108, + "step": 22390 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021558425244328316, + "loss": 0.1084, + "step": 22400 + }, + { + "epoch": 0.56, + "learning_rate": 0.002155465668416954, + "loss": 0.1128, + "step": 22410 + }, + { + "epoch": 0.56, + "learning_rate": 0.002155088812401075, + "loss": 0.1128, + "step": 22420 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021547119563851973, + "loss": 0.112, + "step": 22430 + }, + { + "epoch": 0.56, + "learning_rate": 0.002154335100369319, + "loss": 0.1103, + "step": 22440 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021539582443534408, + "loss": 0.1099, + "step": 22450 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021535813883375625, + "loss": 0.11, + "step": 22460 + }, + { + "epoch": 0.56, + "learning_rate": 0.0021532045323216843, + "loss": 0.1126, + "step": 22470 + }, + { + "epoch": 0.56, + "learning_rate": 0.002152827676305806, + "loss": 0.1111, + "step": 22480 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021524508202899278, + "loss": 0.1072, + "step": 22490 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021520739642740495, + "loss": 0.1144, + "step": 22500 + }, + { + "epoch": 0.57, + "eval_cer": 0.6664390447192912, + "eval_loss": 0.08680952340364456, + "eval_runtime": 90.6322, + "eval_samples_per_second": 110.325, + "eval_steps_per_second": 6.896, + "step": 22500 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021516971082581717, + "loss": 0.1108, + "step": 22510 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021513202522422934, + "loss": 0.1112, + "step": 22520 + }, + { + "epoch": 0.57, + "learning_rate": 0.002150943396226415, + "loss": 0.11, + "step": 22530 + }, + { + "epoch": 0.57, + "learning_rate": 0.002150566540210537, + "loss": 0.1124, + "step": 22540 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021501896841946587, + "loss": 0.1131, + "step": 22550 + }, + { + "epoch": 0.57, + "learning_rate": 0.002149812828178781, + "loss": 0.1093, + "step": 22560 + }, + { + "epoch": 0.57, + "learning_rate": 0.002149435972162902, + "loss": 0.1166, + "step": 22570 + }, + { + "epoch": 0.57, + "learning_rate": 0.002149059116147024, + "loss": 0.1096, + "step": 22580 + }, + { + "epoch": 0.57, + "learning_rate": 0.002148682260131146, + "loss": 0.1121, + "step": 22590 + }, + { + "epoch": 0.57, + "learning_rate": 0.002148305404115268, + "loss": 0.1122, + "step": 22600 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021479285480993896, + "loss": 0.1071, + "step": 22610 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021475516920835113, + "loss": 0.1089, + "step": 22620 + }, + { + "epoch": 0.57, + "learning_rate": 0.002147174836067633, + "loss": 0.1123, + "step": 22630 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021467979800517552, + "loss": 0.1092, + "step": 22640 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021464211240358765, + "loss": 0.1076, + "step": 22650 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021460442680199987, + "loss": 0.1095, + "step": 22660 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021456674120041205, + "loss": 0.1107, + "step": 22670 + }, + { + "epoch": 0.57, + "learning_rate": 0.002145290555988242, + "loss": 0.1099, + "step": 22680 + }, + { + "epoch": 0.57, + "learning_rate": 0.002144913699972364, + "loss": 0.1103, + "step": 22690 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021445368439564857, + "loss": 0.1155, + "step": 22700 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021441599879406074, + "loss": 0.1082, + "step": 22710 + }, + { + "epoch": 0.57, + "learning_rate": 0.002143783131924729, + "loss": 0.1117, + "step": 22720 + }, + { + "epoch": 0.57, + "learning_rate": 0.002143406275908851, + "loss": 0.1089, + "step": 22730 + }, + { + "epoch": 0.57, + "learning_rate": 0.002143029419892973, + "loss": 0.1121, + "step": 22740 + }, + { + "epoch": 0.57, + "learning_rate": 0.002142652563877095, + "loss": 0.1062, + "step": 22750 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021422757078612166, + "loss": 0.1118, + "step": 22760 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021418988518453383, + "loss": 0.1112, + "step": 22770 + }, + { + "epoch": 0.57, + "learning_rate": 0.00214152199582946, + "loss": 0.1119, + "step": 22780 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021411451398135823, + "loss": 0.1151, + "step": 22790 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021407682837977036, + "loss": 0.1126, + "step": 22800 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021403914277818253, + "loss": 0.1119, + "step": 22810 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021400145717659475, + "loss": 0.1179, + "step": 22820 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021396377157500692, + "loss": 0.1097, + "step": 22830 + }, + { + "epoch": 0.57, + "learning_rate": 0.002139260859734191, + "loss": 0.111, + "step": 22840 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021388840037183127, + "loss": 0.1081, + "step": 22850 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021385071477024345, + "loss": 0.1145, + "step": 22860 + }, + { + "epoch": 0.57, + "learning_rate": 0.0021381302916865567, + "loss": 0.1128, + "step": 22870 + }, + { + "epoch": 0.57, + "learning_rate": 0.002137753435670678, + "loss": 0.1095, + "step": 22880 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021373765796547997, + "loss": 0.1125, + "step": 22890 + }, + { + "epoch": 0.58, + "learning_rate": 0.002136999723638922, + "loss": 0.1108, + "step": 22900 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021366228676230436, + "loss": 0.1148, + "step": 22910 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021362460116071654, + "loss": 0.1093, + "step": 22920 + }, + { + "epoch": 0.58, + "learning_rate": 0.002135869155591287, + "loss": 0.11, + "step": 22930 + }, + { + "epoch": 0.58, + "learning_rate": 0.002135492299575409, + "loss": 0.1082, + "step": 22940 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021351154435595306, + "loss": 0.1119, + "step": 22950 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021347385875436524, + "loss": 0.1127, + "step": 22960 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021343617315277745, + "loss": 0.1118, + "step": 22970 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021339848755118963, + "loss": 0.1102, + "step": 22980 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021336080194960176, + "loss": 0.111, + "step": 22990 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021332311634801398, + "loss": 0.1132, + "step": 23000 + }, + { + "epoch": 0.58, + "eval_cer": 0.6665848575101047, + "eval_loss": 0.08576372265815735, + "eval_runtime": 90.6462, + "eval_samples_per_second": 110.308, + "eval_steps_per_second": 6.895, + "step": 23000 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021328543074642615, + "loss": 0.1111, + "step": 23010 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021324774514483833, + "loss": 0.109, + "step": 23020 + }, + { + "epoch": 0.58, + "learning_rate": 0.002132100595432505, + "loss": 0.109, + "step": 23030 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021317237394166267, + "loss": 0.1102, + "step": 23040 + }, + { + "epoch": 0.58, + "learning_rate": 0.002131346883400749, + "loss": 0.1135, + "step": 23050 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021309700273848707, + "loss": 0.1128, + "step": 23060 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021305931713689924, + "loss": 0.1107, + "step": 23070 + }, + { + "epoch": 0.58, + "learning_rate": 0.002130216315353114, + "loss": 0.1085, + "step": 23080 + }, + { + "epoch": 0.58, + "learning_rate": 0.002129839459337236, + "loss": 0.1109, + "step": 23090 + }, + { + "epoch": 0.58, + "learning_rate": 0.002129462603321358, + "loss": 0.1117, + "step": 23100 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021290857473054794, + "loss": 0.1074, + "step": 23110 + }, + { + "epoch": 0.58, + "learning_rate": 0.002128708891289601, + "loss": 0.1093, + "step": 23120 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021283320352737233, + "loss": 0.1067, + "step": 23130 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021279551792578446, + "loss": 0.1132, + "step": 23140 + }, + { + "epoch": 0.58, + "learning_rate": 0.002127578323241967, + "loss": 0.1059, + "step": 23150 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021272014672260886, + "loss": 0.1103, + "step": 23160 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021268246112102103, + "loss": 0.1079, + "step": 23170 + }, + { + "epoch": 0.58, + "learning_rate": 0.002126447755194332, + "loss": 0.1082, + "step": 23180 + }, + { + "epoch": 0.58, + "learning_rate": 0.002126070899178454, + "loss": 0.1061, + "step": 23190 + }, + { + "epoch": 0.58, + "learning_rate": 0.002125694043162576, + "loss": 0.1124, + "step": 23200 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021253171871466977, + "loss": 0.1113, + "step": 23210 + }, + { + "epoch": 0.58, + "learning_rate": 0.002124940331130819, + "loss": 0.1055, + "step": 23220 + }, + { + "epoch": 0.58, + "learning_rate": 0.002124563475114941, + "loss": 0.1137, + "step": 23230 + }, + { + "epoch": 0.58, + "learning_rate": 0.002124186619099063, + "loss": 0.112, + "step": 23240 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021238097630831847, + "loss": 0.1043, + "step": 23250 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021234329070673064, + "loss": 0.1094, + "step": 23260 + }, + { + "epoch": 0.58, + "learning_rate": 0.002123056051051428, + "loss": 0.1123, + "step": 23270 + }, + { + "epoch": 0.58, + "learning_rate": 0.0021226791950355504, + "loss": 0.1087, + "step": 23280 + }, + { + "epoch": 0.59, + "learning_rate": 0.002122302339019672, + "loss": 0.1161, + "step": 23290 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021219254830037934, + "loss": 0.1083, + "step": 23300 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021215486269879156, + "loss": 0.1095, + "step": 23310 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021211717709720373, + "loss": 0.1109, + "step": 23320 + }, + { + "epoch": 0.59, + "learning_rate": 0.002120794914956159, + "loss": 0.1116, + "step": 23330 + }, + { + "epoch": 0.59, + "learning_rate": 0.002120418058940281, + "loss": 0.1127, + "step": 23340 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021200412029244026, + "loss": 0.109, + "step": 23350 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021196643469085247, + "loss": 0.1046, + "step": 23360 + }, + { + "epoch": 0.59, + "learning_rate": 0.002119287490892646, + "loss": 0.1071, + "step": 23370 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021189106348767682, + "loss": 0.1146, + "step": 23380 + }, + { + "epoch": 0.59, + "learning_rate": 0.00211853377886089, + "loss": 0.1081, + "step": 23390 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021181569228450117, + "loss": 0.109, + "step": 23400 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021177800668291335, + "loss": 0.1042, + "step": 23410 + }, + { + "epoch": 0.59, + "learning_rate": 0.002117403210813255, + "loss": 0.109, + "step": 23420 + }, + { + "epoch": 0.59, + "learning_rate": 0.002117026354797377, + "loss": 0.1113, + "step": 23430 + }, + { + "epoch": 0.59, + "learning_rate": 0.002116649498781499, + "loss": 0.1092, + "step": 23440 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021162726427656204, + "loss": 0.1081, + "step": 23450 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021158957867497426, + "loss": 0.1092, + "step": 23460 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021155189307338644, + "loss": 0.1102, + "step": 23470 + }, + { + "epoch": 0.59, + "learning_rate": 0.002115142074717986, + "loss": 0.1068, + "step": 23480 + }, + { + "epoch": 0.59, + "learning_rate": 0.002114765218702108, + "loss": 0.1131, + "step": 23490 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021143883626862296, + "loss": 0.1073, + "step": 23500 + }, + { + "epoch": 0.59, + "eval_cer": 0.6666681103576648, + "eval_loss": 0.08526523411273956, + "eval_runtime": 90.7857, + "eval_samples_per_second": 110.138, + "eval_steps_per_second": 6.884, + "step": 23500 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021140115066703518, + "loss": 0.1107, + "step": 23510 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021136346506544735, + "loss": 0.1094, + "step": 23520 + }, + { + "epoch": 0.59, + "learning_rate": 0.002113257794638595, + "loss": 0.1098, + "step": 23530 + }, + { + "epoch": 0.59, + "learning_rate": 0.002112880938622717, + "loss": 0.1093, + "step": 23540 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021125040826068388, + "loss": 0.1112, + "step": 23550 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021121272265909605, + "loss": 0.1123, + "step": 23560 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021117503705750823, + "loss": 0.1089, + "step": 23570 + }, + { + "epoch": 0.59, + "learning_rate": 0.002111373514559204, + "loss": 0.1085, + "step": 23580 + }, + { + "epoch": 0.59, + "learning_rate": 0.002110996658543326, + "loss": 0.1095, + "step": 23590 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021106198025274475, + "loss": 0.1061, + "step": 23600 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021102429465115697, + "loss": 0.1114, + "step": 23610 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021098660904956914, + "loss": 0.1127, + "step": 23620 + }, + { + "epoch": 0.59, + "learning_rate": 0.002109489234479813, + "loss": 0.1056, + "step": 23630 + }, + { + "epoch": 0.59, + "learning_rate": 0.002109112378463935, + "loss": 0.1092, + "step": 23640 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021087355224480566, + "loss": 0.111, + "step": 23650 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021083586664321784, + "loss": 0.1074, + "step": 23660 + }, + { + "epoch": 0.59, + "learning_rate": 0.0021079818104163006, + "loss": 0.1045, + "step": 23670 + }, + { + "epoch": 0.59, + "learning_rate": 0.002107604954400422, + "loss": 0.1101, + "step": 23680 + }, + { + "epoch": 0.6, + "learning_rate": 0.002107228098384544, + "loss": 0.1071, + "step": 23690 + }, + { + "epoch": 0.6, + "learning_rate": 0.002106851242368666, + "loss": 0.1107, + "step": 23700 + }, + { + "epoch": 0.6, + "learning_rate": 0.0021064743863527875, + "loss": 0.1095, + "step": 23710 + }, + { + "epoch": 0.6, + "learning_rate": 0.0021060975303369093, + "loss": 0.1113, + "step": 23720 + }, + { + "epoch": 0.6, + "learning_rate": 0.002105720674321031, + "loss": 0.108, + "step": 23730 + }, + { + "epoch": 0.6, + "learning_rate": 0.0021053438183051528, + "loss": 0.1056, + "step": 23740 + }, + { + "epoch": 0.6, + "learning_rate": 0.002104966962289275, + "loss": 0.1141, + "step": 23750 + }, + { + "epoch": 0.6, + "learning_rate": 0.0021045901062733963, + "loss": 0.1052, + "step": 23760 + }, + { + "epoch": 0.6, + "learning_rate": 0.0021042132502575184, + "loss": 0.1061, + "step": 23770 + }, + { + "epoch": 0.6, + "learning_rate": 0.00210383639424164, + "loss": 0.1064, + "step": 23780 + }, + { + "epoch": 0.6, + "learning_rate": 0.002103459538225762, + "loss": 0.1076, + "step": 23790 + }, + { + "epoch": 0.6, + "learning_rate": 0.0021030826822098837, + "loss": 0.1076, + "step": 23800 + }, + { + "epoch": 0.6, + "learning_rate": 0.0021027058261940054, + "loss": 0.1113, + "step": 23810 + }, + { + "epoch": 0.6, + "learning_rate": 0.0021023289701781276, + "loss": 0.1066, + "step": 23820 + }, + { + "epoch": 0.6, + "learning_rate": 0.002101952114162249, + "loss": 0.1064, + "step": 23830 + }, + { + "epoch": 0.6, + "learning_rate": 0.0021015752581463707, + "loss": 0.1085, + "step": 23840 + }, + { + "epoch": 0.6, + "learning_rate": 0.002101198402130493, + "loss": 0.1094, + "step": 23850 + }, + { + "epoch": 0.6, + "learning_rate": 0.0021008215461146146, + "loss": 0.1076, + "step": 23860 + }, + { + "epoch": 0.6, + "learning_rate": 0.0021004446900987363, + "loss": 0.1085, + "step": 23870 + }, + { + "epoch": 0.6, + "learning_rate": 0.002100067834082858, + "loss": 0.1075, + "step": 23880 + }, + { + "epoch": 0.6, + "learning_rate": 0.00209969097806698, + "loss": 0.1099, + "step": 23890 + }, + { + "epoch": 0.6, + "learning_rate": 0.002099314122051102, + "loss": 0.1092, + "step": 23900 + }, + { + "epoch": 0.6, + "learning_rate": 0.0020989372660352233, + "loss": 0.1071, + "step": 23910 + }, + { + "epoch": 0.6, + "learning_rate": 0.0020985604100193455, + "loss": 0.1099, + "step": 23920 + }, + { + "epoch": 0.6, + "learning_rate": 0.0020981835540034672, + "loss": 0.1094, + "step": 23930 + }, + { + "epoch": 0.6, + "learning_rate": 0.002097806697987589, + "loss": 0.1079, + "step": 23940 + }, + { + "epoch": 0.6, + "learning_rate": 0.0020974298419717107, + "loss": 0.1082, + "step": 23950 + }, + { + "epoch": 0.6, + "learning_rate": 0.0020970529859558325, + "loss": 0.1109, + "step": 23960 + }, + { + "epoch": 0.6, + "learning_rate": 0.002096676129939954, + "loss": 0.1072, + "step": 23970 + }, + { + "epoch": 0.6, + "learning_rate": 0.0020962992739240764, + "loss": 0.108, + "step": 23980 + }, + { + "epoch": 0.6, + "learning_rate": 0.0020959224179081977, + "loss": 0.1085, + "step": 23990 + }, + { + "epoch": 0.6, + "learning_rate": 0.00209554556189232, + "loss": 0.109, + "step": 24000 + }, + { + "epoch": 0.6, + "eval_cer": 0.6662922694678122, + "eval_loss": 0.08452539891004562, + "eval_runtime": 90.7194, + "eval_samples_per_second": 110.219, + "eval_steps_per_second": 6.889, + "step": 24000 + }, + { + "epoch": 0.6, + "learning_rate": 0.0020951687058764416, + "loss": 0.1087, + "step": 24010 + }, + { + "epoch": 0.6, + "learning_rate": 0.0020947918498605634, + "loss": 0.111, + "step": 24020 + }, + { + "epoch": 0.6, + "learning_rate": 0.002094414993844685, + "loss": 0.1099, + "step": 24030 + }, + { + "epoch": 0.6, + "learning_rate": 0.002094038137828807, + "loss": 0.1096, + "step": 24040 + }, + { + "epoch": 0.6, + "learning_rate": 0.0020936612818129286, + "loss": 0.1041, + "step": 24050 + }, + { + "epoch": 0.6, + "learning_rate": 0.0020932844257970503, + "loss": 0.1044, + "step": 24060 + }, + { + "epoch": 0.6, + "learning_rate": 0.002092907569781172, + "loss": 0.1058, + "step": 24070 + }, + { + "epoch": 0.6, + "learning_rate": 0.0020925307137652943, + "loss": 0.106, + "step": 24080 + }, + { + "epoch": 0.61, + "learning_rate": 0.002092153857749416, + "loss": 0.1091, + "step": 24090 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020917770017335378, + "loss": 0.1052, + "step": 24100 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020914001457176595, + "loss": 0.1083, + "step": 24110 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020910232897017812, + "loss": 0.1049, + "step": 24120 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020906464336859034, + "loss": 0.1098, + "step": 24130 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020902695776700247, + "loss": 0.1041, + "step": 24140 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020898927216541465, + "loss": 0.1064, + "step": 24150 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020895158656382687, + "loss": 0.1094, + "step": 24160 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020891390096223904, + "loss": 0.1075, + "step": 24170 + }, + { + "epoch": 0.61, + "learning_rate": 0.002088762153606512, + "loss": 0.1095, + "step": 24180 + }, + { + "epoch": 0.61, + "learning_rate": 0.002088385297590634, + "loss": 0.1089, + "step": 24190 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020880084415747556, + "loss": 0.1085, + "step": 24200 + }, + { + "epoch": 0.61, + "learning_rate": 0.002087631585558878, + "loss": 0.1145, + "step": 24210 + }, + { + "epoch": 0.61, + "learning_rate": 0.002087254729542999, + "loss": 0.1065, + "step": 24220 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020868778735271213, + "loss": 0.1084, + "step": 24230 + }, + { + "epoch": 0.61, + "learning_rate": 0.002086501017511243, + "loss": 0.1005, + "step": 24240 + }, + { + "epoch": 0.61, + "learning_rate": 0.002086124161495365, + "loss": 0.108, + "step": 24250 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020857473054794865, + "loss": 0.103, + "step": 24260 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020853704494636083, + "loss": 0.1106, + "step": 24270 + }, + { + "epoch": 0.61, + "learning_rate": 0.00208499359344773, + "loss": 0.1071, + "step": 24280 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020846167374318518, + "loss": 0.1054, + "step": 24290 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020842398814159735, + "loss": 0.1085, + "step": 24300 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020838630254000957, + "loss": 0.1067, + "step": 24310 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020834861693842174, + "loss": 0.1058, + "step": 24320 + }, + { + "epoch": 0.61, + "learning_rate": 0.002083109313368339, + "loss": 0.1079, + "step": 24330 + }, + { + "epoch": 0.61, + "learning_rate": 0.002082732457352461, + "loss": 0.1084, + "step": 24340 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020823556013365827, + "loss": 0.1096, + "step": 24350 + }, + { + "epoch": 0.61, + "learning_rate": 0.002081978745320705, + "loss": 0.1084, + "step": 24360 + }, + { + "epoch": 0.61, + "learning_rate": 0.002081601889304826, + "loss": 0.1093, + "step": 24370 + }, + { + "epoch": 0.61, + "learning_rate": 0.002081225033288948, + "loss": 0.106, + "step": 24380 + }, + { + "epoch": 0.61, + "learning_rate": 0.00208084817727307, + "loss": 0.1097, + "step": 24390 + }, + { + "epoch": 0.61, + "learning_rate": 0.002080471321257192, + "loss": 0.1105, + "step": 24400 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020800944652413136, + "loss": 0.1031, + "step": 24410 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020797176092254353, + "loss": 0.1092, + "step": 24420 + }, + { + "epoch": 0.61, + "learning_rate": 0.002079340753209557, + "loss": 0.1081, + "step": 24430 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020789638971936792, + "loss": 0.1044, + "step": 24440 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020785870411778005, + "loss": 0.1106, + "step": 24450 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020782101851619223, + "loss": 0.1071, + "step": 24460 + }, + { + "epoch": 0.61, + "learning_rate": 0.0020778333291460445, + "loss": 0.1115, + "step": 24470 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020774564731301658, + "loss": 0.1085, + "step": 24480 + }, + { + "epoch": 0.62, + "learning_rate": 0.002077079617114288, + "loss": 0.1038, + "step": 24490 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020767027610984097, + "loss": 0.1073, + "step": 24500 + }, + { + "epoch": 0.62, + "eval_cer": 0.6662446276648731, + "eval_loss": 0.0842297375202179, + "eval_runtime": 90.7825, + "eval_samples_per_second": 110.142, + "eval_steps_per_second": 6.885, + "step": 24500 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020763259050825314, + "loss": 0.1039, + "step": 24510 + }, + { + "epoch": 0.62, + "learning_rate": 0.002075949049066653, + "loss": 0.1047, + "step": 24520 + }, + { + "epoch": 0.62, + "learning_rate": 0.002075572193050775, + "loss": 0.1053, + "step": 24530 + }, + { + "epoch": 0.62, + "learning_rate": 0.002075195337034897, + "loss": 0.1017, + "step": 24540 + }, + { + "epoch": 0.62, + "learning_rate": 0.002074818481019019, + "loss": 0.1053, + "step": 24550 + }, + { + "epoch": 0.62, + "learning_rate": 0.00207444162500314, + "loss": 0.1045, + "step": 24560 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020740647689872624, + "loss": 0.1002, + "step": 24570 + }, + { + "epoch": 0.62, + "learning_rate": 0.002073687912971384, + "loss": 0.1062, + "step": 24580 + }, + { + "epoch": 0.62, + "learning_rate": 0.002073311056955506, + "loss": 0.1074, + "step": 24590 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020729342009396276, + "loss": 0.1043, + "step": 24600 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020725573449237493, + "loss": 0.1087, + "step": 24610 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020721804889078715, + "loss": 0.1081, + "step": 24620 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020718036328919933, + "loss": 0.1067, + "step": 24630 + }, + { + "epoch": 0.62, + "learning_rate": 0.002071426776876115, + "loss": 0.1084, + "step": 24640 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020710499208602367, + "loss": 0.1083, + "step": 24650 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020706730648443585, + "loss": 0.1072, + "step": 24660 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020702962088284807, + "loss": 0.1063, + "step": 24670 + }, + { + "epoch": 0.62, + "learning_rate": 0.002069919352812602, + "loss": 0.1022, + "step": 24680 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020695424967967237, + "loss": 0.1075, + "step": 24690 + }, + { + "epoch": 0.62, + "learning_rate": 0.002069165640780846, + "loss": 0.1082, + "step": 24700 + }, + { + "epoch": 0.62, + "learning_rate": 0.002068788784764967, + "loss": 0.1053, + "step": 24710 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020684119287490894, + "loss": 0.1078, + "step": 24720 + }, + { + "epoch": 0.62, + "learning_rate": 0.002068035072733211, + "loss": 0.1086, + "step": 24730 + }, + { + "epoch": 0.62, + "learning_rate": 0.002067658216717333, + "loss": 0.1062, + "step": 24740 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020672813607014546, + "loss": 0.1093, + "step": 24750 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020669045046855764, + "loss": 0.1075, + "step": 24760 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020665276486696985, + "loss": 0.104, + "step": 24770 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020661507926538203, + "loss": 0.1061, + "step": 24780 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020657739366379416, + "loss": 0.1052, + "step": 24790 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020653970806220638, + "loss": 0.1068, + "step": 24800 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020650202246061855, + "loss": 0.1067, + "step": 24810 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020646433685903073, + "loss": 0.1059, + "step": 24820 + }, + { + "epoch": 0.62, + "learning_rate": 0.002064266512574429, + "loss": 0.1069, + "step": 24830 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020638896565585508, + "loss": 0.1024, + "step": 24840 + }, + { + "epoch": 0.62, + "learning_rate": 0.002063512800542673, + "loss": 0.1061, + "step": 24850 + }, + { + "epoch": 0.62, + "learning_rate": 0.0020631359445267947, + "loss": 0.1087, + "step": 24860 + }, + { + "epoch": 0.62, + "learning_rate": 0.002062759088510916, + "loss": 0.1065, + "step": 24870 + }, + { + "epoch": 0.63, + "learning_rate": 0.002062382232495038, + "loss": 0.1048, + "step": 24880 + }, + { + "epoch": 0.63, + "learning_rate": 0.00206200537647916, + "loss": 0.1081, + "step": 24890 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020616285204632817, + "loss": 0.1052, + "step": 24900 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020612516644474034, + "loss": 0.1043, + "step": 24910 + }, + { + "epoch": 0.63, + "learning_rate": 0.002060874808431525, + "loss": 0.1082, + "step": 24920 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020604979524156473, + "loss": 0.1031, + "step": 24930 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020601210963997686, + "loss": 0.1079, + "step": 24940 + }, + { + "epoch": 0.63, + "learning_rate": 0.002059744240383891, + "loss": 0.1063, + "step": 24950 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020593673843680126, + "loss": 0.1017, + "step": 24960 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020589905283521343, + "loss": 0.1105, + "step": 24970 + }, + { + "epoch": 0.63, + "learning_rate": 0.002058613672336256, + "loss": 0.1095, + "step": 24980 + }, + { + "epoch": 0.63, + "learning_rate": 0.002058236816320378, + "loss": 0.1111, + "step": 24990 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020578599603044995, + "loss": 0.1062, + "step": 25000 + }, + { + "epoch": 0.63, + "eval_cer": 0.6662200849179045, + "eval_loss": 0.0830809623003006, + "eval_runtime": 90.7235, + "eval_samples_per_second": 110.214, + "eval_steps_per_second": 6.889, + "step": 25000 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020574831042886217, + "loss": 0.1057, + "step": 25010 + }, + { + "epoch": 0.63, + "learning_rate": 0.002057106248272743, + "loss": 0.107, + "step": 25020 + }, + { + "epoch": 0.63, + "learning_rate": 0.002056729392256865, + "loss": 0.107, + "step": 25030 + }, + { + "epoch": 0.63, + "learning_rate": 0.002056352536240987, + "loss": 0.109, + "step": 25040 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020559756802251087, + "loss": 0.1029, + "step": 25050 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020555988242092304, + "loss": 0.1044, + "step": 25060 + }, + { + "epoch": 0.63, + "learning_rate": 0.002055221968193352, + "loss": 0.1039, + "step": 25070 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020548451121774744, + "loss": 0.1063, + "step": 25080 + }, + { + "epoch": 0.63, + "learning_rate": 0.002054468256161596, + "loss": 0.1064, + "step": 25090 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020540914001457174, + "loss": 0.1046, + "step": 25100 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020537145441298396, + "loss": 0.1034, + "step": 25110 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020533376881139613, + "loss": 0.1062, + "step": 25120 + }, + { + "epoch": 0.63, + "learning_rate": 0.002052960832098083, + "loss": 0.1068, + "step": 25130 + }, + { + "epoch": 0.63, + "learning_rate": 0.002052583976082205, + "loss": 0.1041, + "step": 25140 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020522071200663266, + "loss": 0.1065, + "step": 25150 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020518302640504488, + "loss": 0.1041, + "step": 25160 + }, + { + "epoch": 0.63, + "learning_rate": 0.00205145340803457, + "loss": 0.1073, + "step": 25170 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020510765520186922, + "loss": 0.1049, + "step": 25180 + }, + { + "epoch": 0.63, + "learning_rate": 0.002050699696002814, + "loss": 0.1037, + "step": 25190 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020503228399869357, + "loss": 0.1044, + "step": 25200 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020499459839710575, + "loss": 0.1079, + "step": 25210 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020495691279551792, + "loss": 0.103, + "step": 25220 + }, + { + "epoch": 0.63, + "learning_rate": 0.002049192271939301, + "loss": 0.1066, + "step": 25230 + }, + { + "epoch": 0.63, + "learning_rate": 0.002048815415923423, + "loss": 0.1085, + "step": 25240 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020484385599075445, + "loss": 0.1048, + "step": 25250 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020480617038916666, + "loss": 0.1102, + "step": 25260 + }, + { + "epoch": 0.63, + "learning_rate": 0.0020476848478757884, + "loss": 0.1088, + "step": 25270 + }, + { + "epoch": 0.64, + "learning_rate": 0.00204730799185991, + "loss": 0.1043, + "step": 25280 + }, + { + "epoch": 0.64, + "learning_rate": 0.002046931135844032, + "loss": 0.1093, + "step": 25290 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020465542798281536, + "loss": 0.1037, + "step": 25300 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020461774238122754, + "loss": 0.1057, + "step": 25310 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020458005677963975, + "loss": 0.1083, + "step": 25320 + }, + { + "epoch": 0.64, + "learning_rate": 0.002045423711780519, + "loss": 0.1039, + "step": 25330 + }, + { + "epoch": 0.64, + "learning_rate": 0.002045046855764641, + "loss": 0.1075, + "step": 25340 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020446699997487628, + "loss": 0.1023, + "step": 25350 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020442931437328845, + "loss": 0.1043, + "step": 25360 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020439162877170063, + "loss": 0.1027, + "step": 25370 + }, + { + "epoch": 0.64, + "learning_rate": 0.002043539431701128, + "loss": 0.106, + "step": 25380 + }, + { + "epoch": 0.64, + "learning_rate": 0.00204316257568525, + "loss": 0.1073, + "step": 25390 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020427857196693715, + "loss": 0.1105, + "step": 25400 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020424088636534932, + "loss": 0.1081, + "step": 25410 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020420320076376154, + "loss": 0.104, + "step": 25420 + }, + { + "epoch": 0.64, + "learning_rate": 0.002041655151621737, + "loss": 0.104, + "step": 25430 + }, + { + "epoch": 0.64, + "learning_rate": 0.002041278295605859, + "loss": 0.1032, + "step": 25440 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020409014395899806, + "loss": 0.1035, + "step": 25450 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020405245835741024, + "loss": 0.1042, + "step": 25460 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020401477275582246, + "loss": 0.1058, + "step": 25470 + }, + { + "epoch": 0.64, + "learning_rate": 0.002039770871542346, + "loss": 0.1043, + "step": 25480 + }, + { + "epoch": 0.64, + "learning_rate": 0.002039394015526468, + "loss": 0.1057, + "step": 25490 + }, + { + "epoch": 0.64, + "learning_rate": 0.00203901715951059, + "loss": 0.1018, + "step": 25500 + }, + { + "epoch": 0.64, + "eval_cer": 0.6662013169349286, + "eval_loss": 0.08301563560962677, + "eval_runtime": 90.6697, + "eval_samples_per_second": 110.279, + "eval_steps_per_second": 6.893, + "step": 25500 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020386403034947116, + "loss": 0.104, + "step": 25510 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020382634474788333, + "loss": 0.1074, + "step": 25520 + }, + { + "epoch": 0.64, + "learning_rate": 0.002037886591462955, + "loss": 0.1081, + "step": 25530 + }, + { + "epoch": 0.64, + "learning_rate": 0.002037509735447077, + "loss": 0.104, + "step": 25540 + }, + { + "epoch": 0.64, + "learning_rate": 0.002037132879431199, + "loss": 0.1028, + "step": 25550 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020367560234153203, + "loss": 0.1061, + "step": 25560 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020363791673994425, + "loss": 0.1077, + "step": 25570 + }, + { + "epoch": 0.64, + "learning_rate": 0.002036002311383564, + "loss": 0.1092, + "step": 25580 + }, + { + "epoch": 0.64, + "learning_rate": 0.002035625455367686, + "loss": 0.1062, + "step": 25590 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020352485993518077, + "loss": 0.1037, + "step": 25600 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020348717433359294, + "loss": 0.1011, + "step": 25610 + }, + { + "epoch": 0.64, + "learning_rate": 0.002034494887320051, + "loss": 0.1059, + "step": 25620 + }, + { + "epoch": 0.64, + "learning_rate": 0.002034118031304173, + "loss": 0.1126, + "step": 25630 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020337411752882947, + "loss": 0.105, + "step": 25640 + }, + { + "epoch": 0.64, + "learning_rate": 0.002033364319272417, + "loss": 0.1067, + "step": 25650 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020329874632565386, + "loss": 0.1051, + "step": 25660 + }, + { + "epoch": 0.64, + "learning_rate": 0.0020326106072406603, + "loss": 0.102, + "step": 25670 + }, + { + "epoch": 0.65, + "learning_rate": 0.002032233751224782, + "loss": 0.1073, + "step": 25680 + }, + { + "epoch": 0.65, + "learning_rate": 0.002031856895208904, + "loss": 0.105, + "step": 25690 + }, + { + "epoch": 0.65, + "learning_rate": 0.002031480039193026, + "loss": 0.105, + "step": 25700 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020311031831771473, + "loss": 0.106, + "step": 25710 + }, + { + "epoch": 0.65, + "learning_rate": 0.002030726327161269, + "loss": 0.1013, + "step": 25720 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020303494711453912, + "loss": 0.1043, + "step": 25730 + }, + { + "epoch": 0.65, + "learning_rate": 0.002029972615129513, + "loss": 0.1061, + "step": 25740 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020295957591136347, + "loss": 0.1047, + "step": 25750 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020292189030977565, + "loss": 0.104, + "step": 25760 + }, + { + "epoch": 0.65, + "learning_rate": 0.002028842047081878, + "loss": 0.1056, + "step": 25770 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020284651910660004, + "loss": 0.106, + "step": 25780 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020280883350501217, + "loss": 0.105, + "step": 25790 + }, + { + "epoch": 0.65, + "learning_rate": 0.002027711479034244, + "loss": 0.1049, + "step": 25800 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020273346230183656, + "loss": 0.1061, + "step": 25810 + }, + { + "epoch": 0.65, + "learning_rate": 0.002026957767002487, + "loss": 0.1009, + "step": 25820 + }, + { + "epoch": 0.65, + "learning_rate": 0.002026580910986609, + "loss": 0.1066, + "step": 25830 + }, + { + "epoch": 0.65, + "learning_rate": 0.002026204054970731, + "loss": 0.108, + "step": 25840 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020258271989548526, + "loss": 0.102, + "step": 25850 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020254503429389743, + "loss": 0.1052, + "step": 25860 + }, + { + "epoch": 0.65, + "learning_rate": 0.002025073486923096, + "loss": 0.1013, + "step": 25870 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020246966309072183, + "loss": 0.1034, + "step": 25880 + }, + { + "epoch": 0.65, + "learning_rate": 0.00202431977489134, + "loss": 0.1061, + "step": 25890 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020239429188754618, + "loss": 0.1032, + "step": 25900 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020235660628595835, + "loss": 0.1068, + "step": 25910 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020231892068437052, + "loss": 0.1042, + "step": 25920 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020228123508278274, + "loss": 0.106, + "step": 25930 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020224354948119487, + "loss": 0.1053, + "step": 25940 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020220586387960705, + "loss": 0.1049, + "step": 25950 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020216817827801927, + "loss": 0.1066, + "step": 25960 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020213049267643144, + "loss": 0.1051, + "step": 25970 + }, + { + "epoch": 0.65, + "learning_rate": 0.002020928070748436, + "loss": 0.1068, + "step": 25980 + }, + { + "epoch": 0.65, + "learning_rate": 0.002020551214732558, + "loss": 0.1025, + "step": 25990 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020201743587166796, + "loss": 0.1052, + "step": 26000 + }, + { + "epoch": 0.65, + "eval_cer": 0.6666334617737092, + "eval_loss": 0.08180632442235947, + "eval_runtime": 90.778, + "eval_samples_per_second": 110.148, + "eval_steps_per_second": 6.885, + "step": 26000 + }, + { + "epoch": 0.65, + "learning_rate": 0.002019797502700802, + "loss": 0.108, + "step": 26010 + }, + { + "epoch": 0.65, + "learning_rate": 0.002019420646684923, + "loss": 0.1042, + "step": 26020 + }, + { + "epoch": 0.65, + "learning_rate": 0.002019043790669045, + "loss": 0.1014, + "step": 26030 + }, + { + "epoch": 0.65, + "learning_rate": 0.002018666934653167, + "loss": 0.1059, + "step": 26040 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020182900786372884, + "loss": 0.1055, + "step": 26050 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020179132226214105, + "loss": 0.1078, + "step": 26060 + }, + { + "epoch": 0.65, + "learning_rate": 0.0020175363666055323, + "loss": 0.1042, + "step": 26070 + }, + { + "epoch": 0.66, + "learning_rate": 0.002017159510589654, + "loss": 0.104, + "step": 26080 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020167826545737758, + "loss": 0.1017, + "step": 26090 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020164057985578975, + "loss": 0.1055, + "step": 26100 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020160289425420197, + "loss": 0.0993, + "step": 26110 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020156520865261414, + "loss": 0.1057, + "step": 26120 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020152752305102628, + "loss": 0.1031, + "step": 26130 + }, + { + "epoch": 0.66, + "learning_rate": 0.002014898374494385, + "loss": 0.1055, + "step": 26140 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020145215184785067, + "loss": 0.1061, + "step": 26150 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020141446624626284, + "loss": 0.0989, + "step": 26160 + }, + { + "epoch": 0.66, + "learning_rate": 0.00201376780644675, + "loss": 0.1023, + "step": 26170 + }, + { + "epoch": 0.66, + "learning_rate": 0.002013390950430872, + "loss": 0.1088, + "step": 26180 + }, + { + "epoch": 0.66, + "learning_rate": 0.002013014094414994, + "loss": 0.1023, + "step": 26190 + }, + { + "epoch": 0.66, + "learning_rate": 0.002012637238399116, + "loss": 0.1028, + "step": 26200 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020122603823832376, + "loss": 0.1036, + "step": 26210 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020118835263673593, + "loss": 0.1035, + "step": 26220 + }, + { + "epoch": 0.66, + "learning_rate": 0.002011506670351481, + "loss": 0.1043, + "step": 26230 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020111298143356032, + "loss": 0.1044, + "step": 26240 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020107529583197246, + "loss": 0.1008, + "step": 26250 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020103761023038463, + "loss": 0.1013, + "step": 26260 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020099992462879685, + "loss": 0.1047, + "step": 26270 + }, + { + "epoch": 0.66, + "learning_rate": 0.00200962239027209, + "loss": 0.1028, + "step": 26280 + }, + { + "epoch": 0.66, + "learning_rate": 0.002009245534256212, + "loss": 0.1029, + "step": 26290 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020088686782403337, + "loss": 0.1066, + "step": 26300 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020084918222244555, + "loss": 0.1083, + "step": 26310 + }, + { + "epoch": 0.66, + "learning_rate": 0.002008114966208577, + "loss": 0.1057, + "step": 26320 + }, + { + "epoch": 0.66, + "learning_rate": 0.002007738110192699, + "loss": 0.1027, + "step": 26330 + }, + { + "epoch": 0.66, + "learning_rate": 0.002007361254176821, + "loss": 0.1038, + "step": 26340 + }, + { + "epoch": 0.66, + "learning_rate": 0.002006984398160943, + "loss": 0.101, + "step": 26350 + }, + { + "epoch": 0.66, + "learning_rate": 0.002006607542145064, + "loss": 0.1049, + "step": 26360 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020062306861291864, + "loss": 0.1054, + "step": 26370 + }, + { + "epoch": 0.66, + "learning_rate": 0.002005853830113308, + "loss": 0.1023, + "step": 26380 + }, + { + "epoch": 0.66, + "learning_rate": 0.00200547697409743, + "loss": 0.109, + "step": 26390 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020051001180815516, + "loss": 0.1058, + "step": 26400 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020047232620656733, + "loss": 0.1033, + "step": 26410 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020043464060497955, + "loss": 0.1067, + "step": 26420 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020039695500339173, + "loss": 0.1058, + "step": 26430 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020035926940180386, + "loss": 0.1033, + "step": 26440 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020032158380021607, + "loss": 0.1034, + "step": 26450 + }, + { + "epoch": 0.66, + "learning_rate": 0.0020028389819862825, + "loss": 0.1055, + "step": 26460 + }, + { + "epoch": 0.67, + "learning_rate": 0.0020024621259704042, + "loss": 0.0989, + "step": 26470 + }, + { + "epoch": 0.67, + "learning_rate": 0.002002085269954526, + "loss": 0.1056, + "step": 26480 + }, + { + "epoch": 0.67, + "learning_rate": 0.0020017084139386477, + "loss": 0.0971, + "step": 26490 + }, + { + "epoch": 0.67, + "learning_rate": 0.00200133155792277, + "loss": 0.1072, + "step": 26500 + }, + { + "epoch": 0.67, + "eval_cer": 0.6662273033728953, + "eval_loss": 0.08107112348079681, + "eval_runtime": 90.712, + "eval_samples_per_second": 110.228, + "eval_steps_per_second": 6.89, + "step": 26500 + }, + { + "epoch": 0.67, + "learning_rate": 0.0020009547019068912, + "loss": 0.1071, + "step": 26510 + }, + { + "epoch": 0.67, + "learning_rate": 0.0020005778458910134, + "loss": 0.1079, + "step": 26520 + }, + { + "epoch": 0.67, + "learning_rate": 0.002000200989875135, + "loss": 0.1031, + "step": 26530 + }, + { + "epoch": 0.67, + "learning_rate": 0.001999824133859257, + "loss": 0.1041, + "step": 26540 + }, + { + "epoch": 0.67, + "learning_rate": 0.0019994472778433786, + "loss": 0.1062, + "step": 26550 + }, + { + "epoch": 0.67, + "learning_rate": 0.0019990704218275004, + "loss": 0.104, + "step": 26560 + }, + { + "epoch": 0.67, + "learning_rate": 0.001998693565811622, + "loss": 0.1036, + "step": 26570 + }, + { + "epoch": 0.67, + "learning_rate": 0.0019983167097957443, + "loss": 0.105, + "step": 26580 + }, + { + "epoch": 0.67, + "learning_rate": 0.0019979398537798656, + "loss": 0.1017, + "step": 26590 + }, + { + "epoch": 0.67, + "learning_rate": 0.001997562997763988, + "loss": 0.0991, + "step": 26600 + }, + { + "epoch": 0.67, + "learning_rate": 0.0019971861417481095, + "loss": 0.1046, + "step": 26610 + }, + { + "epoch": 0.67, + "learning_rate": 0.0019968092857322313, + "loss": 0.1014, + "step": 26620 + }, + { + "epoch": 0.67, + "learning_rate": 0.001996432429716353, + "loss": 0.1016, + "step": 26630 + }, + { + "epoch": 0.67, + "learning_rate": 0.0019960555737004748, + "loss": 0.1029, + "step": 26640 + }, + { + "epoch": 0.67, + "learning_rate": 0.001995678717684597, + "loss": 0.103, + "step": 26650 + }, + { + "epoch": 0.67, + "learning_rate": 0.0019953018616687187, + "loss": 0.1085, + "step": 26660 + }, + { + "epoch": 0.67, + "learning_rate": 0.00199492500565284, + "loss": 0.1062, + "step": 26670 + }, + { + "epoch": 0.67, + "learning_rate": 0.001994548149636962, + "loss": 0.1033, + "step": 26680 + }, + { + "epoch": 0.67, + "learning_rate": 0.001994171293621084, + "loss": 0.1044, + "step": 26690 + }, + { + "epoch": 0.67, + "learning_rate": 0.0019937944376052057, + "loss": 0.1017, + "step": 26700 + }, + { + "epoch": 0.67, + "learning_rate": 0.0019934175815893274, + "loss": 0.1029, + "step": 26710 + }, + { + "epoch": 0.67, + "learning_rate": 0.001993040725573449, + "loss": 0.1026, + "step": 26720 + }, + { + "epoch": 0.67, + "learning_rate": 0.0019926638695575713, + "loss": 0.1004, + "step": 26730 + }, + { + "epoch": 0.67, + "learning_rate": 0.0019922870135416926, + "loss": 0.1052, + "step": 26740 + }, + { + "epoch": 0.67, + "learning_rate": 0.001991910157525815, + "loss": 0.1053, + "step": 26750 + }, + { + "epoch": 0.67, + "learning_rate": 0.0019915333015099366, + "loss": 0.1025, + "step": 26760 + }, + { + "epoch": 0.67, + "learning_rate": 0.0019911564454940583, + "loss": 0.1065, + "step": 26770 + }, + { + "epoch": 0.67, + "learning_rate": 0.00199077958947818, + "loss": 0.1026, + "step": 26780 + }, + { + "epoch": 0.67, + "learning_rate": 0.001990402733462302, + "loss": 0.1062, + "step": 26790 + }, + { + "epoch": 0.67, + "learning_rate": 0.0019900258774464235, + "loss": 0.1052, + "step": 26800 + }, + { + "epoch": 0.67, + "learning_rate": 0.0019896490214305457, + "loss": 0.1018, + "step": 26810 + }, + { + "epoch": 0.67, + "learning_rate": 0.001989272165414667, + "loss": 0.104, + "step": 26820 + }, + { + "epoch": 0.67, + "learning_rate": 0.001988895309398789, + "loss": 0.0998, + "step": 26830 + }, + { + "epoch": 0.67, + "learning_rate": 0.001988518453382911, + "loss": 0.1007, + "step": 26840 + }, + { + "epoch": 0.67, + "learning_rate": 0.0019881415973670327, + "loss": 0.1004, + "step": 26850 + }, + { + "epoch": 0.67, + "learning_rate": 0.0019877647413511544, + "loss": 0.1022, + "step": 26860 + }, + { + "epoch": 0.68, + "learning_rate": 0.001987387885335276, + "loss": 0.1041, + "step": 26870 + }, + { + "epoch": 0.68, + "learning_rate": 0.001987011029319398, + "loss": 0.1023, + "step": 26880 + }, + { + "epoch": 0.68, + "learning_rate": 0.00198663417330352, + "loss": 0.1026, + "step": 26890 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019862573172876414, + "loss": 0.1058, + "step": 26900 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019858804612717636, + "loss": 0.1013, + "step": 26910 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019855036052558853, + "loss": 0.1025, + "step": 26920 + }, + { + "epoch": 0.68, + "learning_rate": 0.001985126749240007, + "loss": 0.1068, + "step": 26930 + }, + { + "epoch": 0.68, + "learning_rate": 0.001984749893224129, + "loss": 0.1007, + "step": 26940 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019843730372082506, + "loss": 0.1057, + "step": 26950 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019839961811923728, + "loss": 0.1009, + "step": 26960 + }, + { + "epoch": 0.68, + "learning_rate": 0.001983619325176494, + "loss": 0.1003, + "step": 26970 + }, + { + "epoch": 0.68, + "learning_rate": 0.001983242469160616, + "loss": 0.1051, + "step": 26980 + }, + { + "epoch": 0.68, + "learning_rate": 0.001982865613144738, + "loss": 0.1025, + "step": 26990 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019824887571288597, + "loss": 0.1023, + "step": 27000 + }, + { + "epoch": 0.68, + "eval_cer": 0.6660819718124145, + "eval_loss": 0.08071926981210709, + "eval_runtime": 90.7266, + "eval_samples_per_second": 110.21, + "eval_steps_per_second": 6.889, + "step": 27000 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019821119011129815, + "loss": 0.0987, + "step": 27010 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019817350450971032, + "loss": 0.1022, + "step": 27020 + }, + { + "epoch": 0.68, + "learning_rate": 0.001981358189081225, + "loss": 0.0997, + "step": 27030 + }, + { + "epoch": 0.68, + "learning_rate": 0.001980981333065347, + "loss": 0.1049, + "step": 27040 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019806044770494685, + "loss": 0.1034, + "step": 27050 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019802276210335906, + "loss": 0.1, + "step": 27060 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019798507650177124, + "loss": 0.0994, + "step": 27070 + }, + { + "epoch": 0.68, + "learning_rate": 0.001979473909001834, + "loss": 0.1041, + "step": 27080 + }, + { + "epoch": 0.68, + "learning_rate": 0.001979097052985956, + "loss": 0.1018, + "step": 27090 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019787201969700776, + "loss": 0.1014, + "step": 27100 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019783433409541994, + "loss": 0.1062, + "step": 27110 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019779664849383215, + "loss": 0.1003, + "step": 27120 + }, + { + "epoch": 0.68, + "learning_rate": 0.001977589628922443, + "loss": 0.1022, + "step": 27130 + }, + { + "epoch": 0.68, + "learning_rate": 0.001977212772906565, + "loss": 0.1028, + "step": 27140 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019768359168906868, + "loss": 0.0999, + "step": 27150 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019764590608748085, + "loss": 0.1009, + "step": 27160 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019760822048589303, + "loss": 0.0997, + "step": 27170 + }, + { + "epoch": 0.68, + "learning_rate": 0.001975705348843052, + "loss": 0.1038, + "step": 27180 + }, + { + "epoch": 0.68, + "learning_rate": 0.001975328492827174, + "loss": 0.1025, + "step": 27190 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019749516368112955, + "loss": 0.1024, + "step": 27200 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019745747807954172, + "loss": 0.1022, + "step": 27210 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019741979247795394, + "loss": 0.0983, + "step": 27220 + }, + { + "epoch": 0.68, + "learning_rate": 0.001973821068763661, + "loss": 0.1008, + "step": 27230 + }, + { + "epoch": 0.68, + "learning_rate": 0.001973444212747783, + "loss": 0.1035, + "step": 27240 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019730673567319047, + "loss": 0.1023, + "step": 27250 + }, + { + "epoch": 0.68, + "learning_rate": 0.0019726905007160264, + "loss": 0.1032, + "step": 27260 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019723136447001486, + "loss": 0.0987, + "step": 27270 + }, + { + "epoch": 0.69, + "learning_rate": 0.00197193678868427, + "loss": 0.101, + "step": 27280 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019715599326683916, + "loss": 0.0983, + "step": 27290 + }, + { + "epoch": 0.69, + "learning_rate": 0.001971183076652514, + "loss": 0.0978, + "step": 27300 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019708062206366356, + "loss": 0.1028, + "step": 27310 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019704293646207573, + "loss": 0.1008, + "step": 27320 + }, + { + "epoch": 0.69, + "learning_rate": 0.001970052508604879, + "loss": 0.1033, + "step": 27330 + }, + { + "epoch": 0.69, + "learning_rate": 0.001969675652589001, + "loss": 0.1035, + "step": 27340 + }, + { + "epoch": 0.69, + "learning_rate": 0.001969298796573123, + "loss": 0.1016, + "step": 27350 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019689219405572443, + "loss": 0.1005, + "step": 27360 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019685450845413665, + "loss": 0.1041, + "step": 27370 + }, + { + "epoch": 0.69, + "learning_rate": 0.001968168228525488, + "loss": 0.1032, + "step": 27380 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019677913725096095, + "loss": 0.0945, + "step": 27390 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019674145164937317, + "loss": 0.1027, + "step": 27400 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019670376604778534, + "loss": 0.1041, + "step": 27410 + }, + { + "epoch": 0.69, + "learning_rate": 0.001966660804461975, + "loss": 0.1044, + "step": 27420 + }, + { + "epoch": 0.69, + "learning_rate": 0.001966283948446097, + "loss": 0.1061, + "step": 27430 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019659070924302187, + "loss": 0.1008, + "step": 27440 + }, + { + "epoch": 0.69, + "learning_rate": 0.001965530236414341, + "loss": 0.1006, + "step": 27450 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019651533803984626, + "loss": 0.0987, + "step": 27460 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019647765243825843, + "loss": 0.1013, + "step": 27470 + }, + { + "epoch": 0.69, + "learning_rate": 0.001964399668366706, + "loss": 0.0994, + "step": 27480 + }, + { + "epoch": 0.69, + "learning_rate": 0.001964022812350828, + "loss": 0.1045, + "step": 27490 + }, + { + "epoch": 0.69, + "learning_rate": 0.00196364595633495, + "loss": 0.1013, + "step": 27500 + }, + { + "epoch": 0.69, + "eval_cer": 0.6664063210566663, + "eval_loss": 0.08010150492191315, + "eval_runtime": 90.5425, + "eval_samples_per_second": 110.434, + "eval_steps_per_second": 6.903, + "step": 27500 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019632691003190713, + "loss": 0.1035, + "step": 27510 + }, + { + "epoch": 0.69, + "learning_rate": 0.001962892244303193, + "loss": 0.1013, + "step": 27520 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019625153882873152, + "loss": 0.1041, + "step": 27530 + }, + { + "epoch": 0.69, + "learning_rate": 0.001962138532271437, + "loss": 0.1011, + "step": 27540 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019617616762555587, + "loss": 0.1012, + "step": 27550 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019613848202396805, + "loss": 0.1019, + "step": 27560 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019610079642238022, + "loss": 0.0998, + "step": 27570 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019606311082079244, + "loss": 0.0991, + "step": 27580 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019602542521920457, + "loss": 0.1025, + "step": 27590 + }, + { + "epoch": 0.69, + "learning_rate": 0.001959877396176168, + "loss": 0.0997, + "step": 27600 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019595005401602896, + "loss": 0.104, + "step": 27610 + }, + { + "epoch": 0.69, + "learning_rate": 0.001959123684144411, + "loss": 0.1013, + "step": 27620 + }, + { + "epoch": 0.69, + "learning_rate": 0.001958746828128533, + "loss": 0.1012, + "step": 27630 + }, + { + "epoch": 0.69, + "learning_rate": 0.001958369972112655, + "loss": 0.1017, + "step": 27640 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019579931160967766, + "loss": 0.1034, + "step": 27650 + }, + { + "epoch": 0.69, + "learning_rate": 0.0019576162600808984, + "loss": 0.1005, + "step": 27660 + }, + { + "epoch": 0.7, + "learning_rate": 0.00195723940406502, + "loss": 0.1005, + "step": 27670 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019568625480491423, + "loss": 0.1019, + "step": 27680 + }, + { + "epoch": 0.7, + "learning_rate": 0.001956485692033264, + "loss": 0.1018, + "step": 27690 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019561088360173853, + "loss": 0.1023, + "step": 27700 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019557319800015075, + "loss": 0.1031, + "step": 27710 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019553551239856293, + "loss": 0.1028, + "step": 27720 + }, + { + "epoch": 0.7, + "learning_rate": 0.001954978267969751, + "loss": 0.0986, + "step": 27730 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019546014119538727, + "loss": 0.1046, + "step": 27740 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019542245559379945, + "loss": 0.101, + "step": 27750 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019538476999221167, + "loss": 0.1045, + "step": 27760 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019534708439062384, + "loss": 0.103, + "step": 27770 + }, + { + "epoch": 0.7, + "learning_rate": 0.00195309398789036, + "loss": 0.1023, + "step": 27780 + }, + { + "epoch": 0.7, + "learning_rate": 0.001952717131874482, + "loss": 0.1007, + "step": 27790 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019523402758586036, + "loss": 0.1021, + "step": 27800 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019519634198427256, + "loss": 0.1061, + "step": 27810 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019515865638268471, + "loss": 0.1013, + "step": 27820 + }, + { + "epoch": 0.7, + "learning_rate": 0.001951209707810969, + "loss": 0.1039, + "step": 27830 + }, + { + "epoch": 0.7, + "learning_rate": 0.001950832851795091, + "loss": 0.1005, + "step": 27840 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019504559957792126, + "loss": 0.1013, + "step": 27850 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019500791397633343, + "loss": 0.1003, + "step": 27860 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019497022837474563, + "loss": 0.099, + "step": 27870 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019493254277315783, + "loss": 0.1027, + "step": 27880 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019489485717156998, + "loss": 0.0979, + "step": 27890 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019485717156998215, + "loss": 0.1025, + "step": 27900 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019481948596839435, + "loss": 0.0973, + "step": 27910 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019478180036680654, + "loss": 0.1003, + "step": 27920 + }, + { + "epoch": 0.7, + "learning_rate": 0.001947441147652187, + "loss": 0.1009, + "step": 27930 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019470642916363087, + "loss": 0.0995, + "step": 27940 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019466874356204307, + "loss": 0.0998, + "step": 27950 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019463105796045526, + "loss": 0.0988, + "step": 27960 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019459337235886742, + "loss": 0.1018, + "step": 27970 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019455568675727961, + "loss": 0.1023, + "step": 27980 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019451800115569179, + "loss": 0.099, + "step": 27990 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019448031555410398, + "loss": 0.0986, + "step": 28000 + }, + { + "epoch": 0.7, + "eval_cer": 0.6663938090680156, + "eval_loss": 0.07968434691429138, + "eval_runtime": 90.6337, + "eval_samples_per_second": 110.323, + "eval_steps_per_second": 6.896, + "step": 28000 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019444262995251614, + "loss": 0.1032, + "step": 28010 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019440494435092833, + "loss": 0.0981, + "step": 28020 + }, + { + "epoch": 0.7, + "learning_rate": 0.001943672587493405, + "loss": 0.1021, + "step": 28030 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019432957314775266, + "loss": 0.0998, + "step": 28040 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019429188754616486, + "loss": 0.1031, + "step": 28050 + }, + { + "epoch": 0.7, + "learning_rate": 0.0019425420194457705, + "loss": 0.1053, + "step": 28060 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019421651634298923, + "loss": 0.1035, + "step": 28070 + }, + { + "epoch": 0.71, + "learning_rate": 0.001941788307414014, + "loss": 0.101, + "step": 28080 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019414114513981358, + "loss": 0.1014, + "step": 28090 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019410345953822577, + "loss": 0.0977, + "step": 28100 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019406577393663795, + "loss": 0.0996, + "step": 28110 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019402808833505012, + "loss": 0.0977, + "step": 28120 + }, + { + "epoch": 0.71, + "learning_rate": 0.001939904027334623, + "loss": 0.1009, + "step": 28130 + }, + { + "epoch": 0.71, + "learning_rate": 0.001939527171318745, + "loss": 0.1008, + "step": 28140 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019391503153028669, + "loss": 0.1033, + "step": 28150 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019387734592869884, + "loss": 0.1008, + "step": 28160 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019383966032711101, + "loss": 0.1006, + "step": 28170 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019380197472552321, + "loss": 0.1, + "step": 28180 + }, + { + "epoch": 0.71, + "learning_rate": 0.001937642891239354, + "loss": 0.1031, + "step": 28190 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019372660352234756, + "loss": 0.1011, + "step": 28200 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019368891792075973, + "loss": 0.1005, + "step": 28210 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019365123231917193, + "loss": 0.0974, + "step": 28220 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019361354671758413, + "loss": 0.1, + "step": 28230 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019357586111599628, + "loss": 0.0995, + "step": 28240 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019353817551440848, + "loss": 0.0999, + "step": 28250 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019350048991282065, + "loss": 0.0997, + "step": 28260 + }, + { + "epoch": 0.71, + "learning_rate": 0.001934628043112328, + "loss": 0.0988, + "step": 28270 + }, + { + "epoch": 0.71, + "learning_rate": 0.00193425118709645, + "loss": 0.1054, + "step": 28280 + }, + { + "epoch": 0.71, + "learning_rate": 0.001933874331080572, + "loss": 0.0984, + "step": 28290 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019334974750646937, + "loss": 0.0963, + "step": 28300 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019331206190488152, + "loss": 0.0975, + "step": 28310 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019327437630329372, + "loss": 0.0986, + "step": 28320 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019323669070170591, + "loss": 0.103, + "step": 28330 + }, + { + "epoch": 0.71, + "learning_rate": 0.001931990051001181, + "loss": 0.0999, + "step": 28340 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019316131949853024, + "loss": 0.1017, + "step": 28350 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019312363389694244, + "loss": 0.1024, + "step": 28360 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019308594829535463, + "loss": 0.0984, + "step": 28370 + }, + { + "epoch": 0.71, + "learning_rate": 0.001930482626937668, + "loss": 0.0992, + "step": 28380 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019301057709217898, + "loss": 0.1043, + "step": 28390 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019297289149059116, + "loss": 0.1006, + "step": 28400 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019293520588900335, + "loss": 0.1026, + "step": 28410 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019289752028741555, + "loss": 0.1009, + "step": 28420 + }, + { + "epoch": 0.71, + "learning_rate": 0.001928598346858277, + "loss": 0.1028, + "step": 28430 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019282214908423988, + "loss": 0.1039, + "step": 28440 + }, + { + "epoch": 0.71, + "learning_rate": 0.0019278446348265207, + "loss": 0.0983, + "step": 28450 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019274677788106427, + "loss": 0.0987, + "step": 28460 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019270909227947642, + "loss": 0.0997, + "step": 28470 + }, + { + "epoch": 0.72, + "learning_rate": 0.001926714066778886, + "loss": 0.1033, + "step": 28480 + }, + { + "epoch": 0.72, + "learning_rate": 0.001926337210763008, + "loss": 0.1025, + "step": 28490 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019259603547471295, + "loss": 0.1022, + "step": 28500 + }, + { + "epoch": 0.72, + "eval_cer": 0.6661753304969618, + "eval_loss": 0.07863720506429672, + "eval_runtime": 90.541, + "eval_samples_per_second": 110.436, + "eval_steps_per_second": 6.903, + "step": 28500 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019255834987312514, + "loss": 0.1002, + "step": 28510 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019252066427153732, + "loss": 0.0997, + "step": 28520 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019248297866994951, + "loss": 0.1005, + "step": 28530 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019244529306836167, + "loss": 0.099, + "step": 28540 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019240760746677386, + "loss": 0.1016, + "step": 28550 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019236992186518606, + "loss": 0.1033, + "step": 28560 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019233223626359823, + "loss": 0.099, + "step": 28570 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019229455066201038, + "loss": 0.0997, + "step": 28580 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019225686506042258, + "loss": 0.0981, + "step": 28590 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019221917945883478, + "loss": 0.0975, + "step": 28600 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019218149385724695, + "loss": 0.1016, + "step": 28610 + }, + { + "epoch": 0.72, + "learning_rate": 0.001921438082556591, + "loss": 0.0965, + "step": 28620 + }, + { + "epoch": 0.72, + "learning_rate": 0.001921061226540713, + "loss": 0.1033, + "step": 28630 + }, + { + "epoch": 0.72, + "learning_rate": 0.001920684370524835, + "loss": 0.1017, + "step": 28640 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019203075145089567, + "loss": 0.1016, + "step": 28650 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019199306584930785, + "loss": 0.1009, + "step": 28660 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019195538024772002, + "loss": 0.1024, + "step": 28670 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019191769464613222, + "loss": 0.0999, + "step": 28680 + }, + { + "epoch": 0.72, + "learning_rate": 0.001918800090445444, + "loss": 0.1023, + "step": 28690 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019184232344295657, + "loss": 0.1016, + "step": 28700 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019180463784136874, + "loss": 0.1027, + "step": 28710 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019176695223978094, + "loss": 0.1039, + "step": 28720 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019172926663819309, + "loss": 0.0976, + "step": 28730 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019169158103660528, + "loss": 0.0989, + "step": 28740 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019165389543501746, + "loss": 0.0977, + "step": 28750 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019161620983342966, + "loss": 0.0974, + "step": 28760 + }, + { + "epoch": 0.72, + "learning_rate": 0.001915785242318418, + "loss": 0.1004, + "step": 28770 + }, + { + "epoch": 0.72, + "learning_rate": 0.00191540838630254, + "loss": 0.0977, + "step": 28780 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019150315302866618, + "loss": 0.1007, + "step": 28790 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019146546742707837, + "loss": 0.0981, + "step": 28800 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019142778182549053, + "loss": 0.1005, + "step": 28810 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019139009622390272, + "loss": 0.099, + "step": 28820 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019135241062231492, + "loss": 0.0974, + "step": 28830 + }, + { + "epoch": 0.72, + "learning_rate": 0.001913147250207271, + "loss": 0.097, + "step": 28840 + }, + { + "epoch": 0.72, + "learning_rate": 0.0019127703941913925, + "loss": 0.0989, + "step": 28850 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019123935381755144, + "loss": 0.0987, + "step": 28860 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019120166821596364, + "loss": 0.0988, + "step": 28870 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019116398261437581, + "loss": 0.0983, + "step": 28880 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019112629701278797, + "loss": 0.1038, + "step": 28890 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019108861141120016, + "loss": 0.0969, + "step": 28900 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019105092580961236, + "loss": 0.1002, + "step": 28910 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019101324020802453, + "loss": 0.0995, + "step": 28920 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019097555460643669, + "loss": 0.0996, + "step": 28930 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019093786900484888, + "loss": 0.0971, + "step": 28940 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019090018340326108, + "loss": 0.101, + "step": 28950 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019086249780167323, + "loss": 0.0991, + "step": 28960 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019082481220008543, + "loss": 0.1009, + "step": 28970 + }, + { + "epoch": 0.73, + "learning_rate": 0.001907871265984976, + "loss": 0.0994, + "step": 28980 + }, + { + "epoch": 0.73, + "learning_rate": 0.001907494409969098, + "loss": 0.0986, + "step": 28990 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019071175539532195, + "loss": 0.0984, + "step": 29000 + }, + { + "epoch": 0.73, + "eval_cer": 0.6658707116963514, + "eval_loss": 0.07814398407936096, + "eval_runtime": 90.6335, + "eval_samples_per_second": 110.323, + "eval_steps_per_second": 6.896, + "step": 29000 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019067406979373415, + "loss": 0.1015, + "step": 29010 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019063638419214632, + "loss": 0.1036, + "step": 29020 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019059869859055852, + "loss": 0.096, + "step": 29030 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019056101298897067, + "loss": 0.0991, + "step": 29040 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019052332738738287, + "loss": 0.0942, + "step": 29050 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019048564178579504, + "loss": 0.1032, + "step": 29060 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019044795618420724, + "loss": 0.099, + "step": 29070 + }, + { + "epoch": 0.73, + "learning_rate": 0.001904102705826194, + "loss": 0.1025, + "step": 29080 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019037258498103159, + "loss": 0.0979, + "step": 29090 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019033489937944376, + "loss": 0.097, + "step": 29100 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019029721377785596, + "loss": 0.0972, + "step": 29110 + }, + { + "epoch": 0.73, + "learning_rate": 0.001902595281762681, + "loss": 0.0996, + "step": 29120 + }, + { + "epoch": 0.73, + "learning_rate": 0.001902218425746803, + "loss": 0.0989, + "step": 29130 + }, + { + "epoch": 0.73, + "learning_rate": 0.001901841569730925, + "loss": 0.1029, + "step": 29140 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019014647137150465, + "loss": 0.0997, + "step": 29150 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019010878576991683, + "loss": 0.0979, + "step": 29160 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019007110016832902, + "loss": 0.0987, + "step": 29170 + }, + { + "epoch": 0.73, + "learning_rate": 0.0019003341456674122, + "loss": 0.1012, + "step": 29180 + }, + { + "epoch": 0.73, + "learning_rate": 0.0018999572896515337, + "loss": 0.0981, + "step": 29190 + }, + { + "epoch": 0.73, + "learning_rate": 0.0018995804336356555, + "loss": 0.1002, + "step": 29200 + }, + { + "epoch": 0.73, + "learning_rate": 0.0018992035776197774, + "loss": 0.0982, + "step": 29210 + }, + { + "epoch": 0.73, + "learning_rate": 0.0018988267216038994, + "loss": 0.0995, + "step": 29220 + }, + { + "epoch": 0.73, + "learning_rate": 0.001898449865588021, + "loss": 0.0998, + "step": 29230 + }, + { + "epoch": 0.73, + "learning_rate": 0.001898073009572143, + "loss": 0.0971, + "step": 29240 + }, + { + "epoch": 0.73, + "learning_rate": 0.0018976961535562646, + "loss": 0.1025, + "step": 29250 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018973192975403866, + "loss": 0.0967, + "step": 29260 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018969424415245081, + "loss": 0.0998, + "step": 29270 + }, + { + "epoch": 0.74, + "learning_rate": 0.00189656558550863, + "loss": 0.0982, + "step": 29280 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018961887294927518, + "loss": 0.1012, + "step": 29290 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018958118734768738, + "loss": 0.0985, + "step": 29300 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018954350174609953, + "loss": 0.0973, + "step": 29310 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018950581614451173, + "loss": 0.096, + "step": 29320 + }, + { + "epoch": 0.74, + "learning_rate": 0.001894681305429239, + "loss": 0.0981, + "step": 29330 + }, + { + "epoch": 0.74, + "learning_rate": 0.001894304449413361, + "loss": 0.1002, + "step": 29340 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018939275933974825, + "loss": 0.0987, + "step": 29350 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018935507373816045, + "loss": 0.0973, + "step": 29360 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018931738813657262, + "loss": 0.1002, + "step": 29370 + }, + { + "epoch": 0.74, + "learning_rate": 0.001892797025349848, + "loss": 0.0955, + "step": 29380 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018924201693339697, + "loss": 0.0967, + "step": 29390 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018920433133180917, + "loss": 0.1002, + "step": 29400 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018916664573022136, + "loss": 0.0958, + "step": 29410 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018912896012863352, + "loss": 0.0999, + "step": 29420 + }, + { + "epoch": 0.74, + "learning_rate": 0.001890912745270457, + "loss": 0.0973, + "step": 29430 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018905358892545789, + "loss": 0.0988, + "step": 29440 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018901590332387008, + "loss": 0.0957, + "step": 29450 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018897821772228224, + "loss": 0.0978, + "step": 29460 + }, + { + "epoch": 0.74, + "learning_rate": 0.001889405321206944, + "loss": 0.1017, + "step": 29470 + }, + { + "epoch": 0.74, + "learning_rate": 0.001889028465191066, + "loss": 0.0977, + "step": 29480 + }, + { + "epoch": 0.74, + "learning_rate": 0.001888651609175188, + "loss": 0.0997, + "step": 29490 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018882747531593096, + "loss": 0.0971, + "step": 29500 + }, + { + "epoch": 0.74, + "eval_cer": 0.6662253784515644, + "eval_loss": 0.077802374958992, + "eval_runtime": 90.7555, + "eval_samples_per_second": 110.175, + "eval_steps_per_second": 6.887, + "step": 29500 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018878978971434313, + "loss": 0.0972, + "step": 29510 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018875210411275533, + "loss": 0.0957, + "step": 29520 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018871441851116752, + "loss": 0.097, + "step": 29530 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018867673290957968, + "loss": 0.0929, + "step": 29540 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018863904730799187, + "loss": 0.0968, + "step": 29550 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018860136170640405, + "loss": 0.0981, + "step": 29560 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018856367610481624, + "loss": 0.0977, + "step": 29570 + }, + { + "epoch": 0.74, + "learning_rate": 0.001885259905032284, + "loss": 0.0952, + "step": 29580 + }, + { + "epoch": 0.74, + "learning_rate": 0.001884883049016406, + "loss": 0.097, + "step": 29590 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018845061930005277, + "loss": 0.0973, + "step": 29600 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018841293369846492, + "loss": 0.1026, + "step": 29610 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018837524809687711, + "loss": 0.0981, + "step": 29620 + }, + { + "epoch": 0.74, + "learning_rate": 0.001883375624952893, + "loss": 0.0977, + "step": 29630 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018829987689370148, + "loss": 0.0956, + "step": 29640 + }, + { + "epoch": 0.74, + "learning_rate": 0.0018826219129211366, + "loss": 0.0967, + "step": 29650 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018822450569052583, + "loss": 0.0986, + "step": 29660 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018818682008893803, + "loss": 0.0916, + "step": 29670 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018814913448735023, + "loss": 0.1046, + "step": 29680 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018811144888576238, + "loss": 0.0966, + "step": 29690 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018807376328417455, + "loss": 0.0959, + "step": 29700 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018803607768258675, + "loss": 0.099, + "step": 29710 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018799839208099895, + "loss": 0.0978, + "step": 29720 + }, + { + "epoch": 0.75, + "learning_rate": 0.001879607064794111, + "loss": 0.0946, + "step": 29730 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018792302087782327, + "loss": 0.0966, + "step": 29740 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018788533527623547, + "loss": 0.0984, + "step": 29750 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018784764967464767, + "loss": 0.1024, + "step": 29760 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018780996407305982, + "loss": 0.0986, + "step": 29770 + }, + { + "epoch": 0.75, + "learning_rate": 0.00187772278471472, + "loss": 0.0995, + "step": 29780 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018773459286988419, + "loss": 0.0969, + "step": 29790 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018769690726829638, + "loss": 0.1, + "step": 29800 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018765922166670854, + "loss": 0.1014, + "step": 29810 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018762153606512073, + "loss": 0.0982, + "step": 29820 + }, + { + "epoch": 0.75, + "learning_rate": 0.001875838504635329, + "loss": 0.0963, + "step": 29830 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018754616486194506, + "loss": 0.0949, + "step": 29840 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018750847926035726, + "loss": 0.1005, + "step": 29850 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018747079365876945, + "loss": 0.0978, + "step": 29860 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018743310805718163, + "loss": 0.0981, + "step": 29870 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018739542245559378, + "loss": 0.0951, + "step": 29880 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018735773685400598, + "loss": 0.0977, + "step": 29890 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018732005125241817, + "loss": 0.0988, + "step": 29900 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018728236565083035, + "loss": 0.1009, + "step": 29910 + }, + { + "epoch": 0.75, + "learning_rate": 0.001872446800492425, + "loss": 0.0997, + "step": 29920 + }, + { + "epoch": 0.75, + "learning_rate": 0.001872069944476547, + "loss": 0.0971, + "step": 29930 + }, + { + "epoch": 0.75, + "learning_rate": 0.001871693088460669, + "loss": 0.1, + "step": 29940 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018713162324447907, + "loss": 0.0997, + "step": 29950 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018709393764289124, + "loss": 0.1002, + "step": 29960 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018705625204130342, + "loss": 0.0974, + "step": 29970 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018701856643971561, + "loss": 0.0967, + "step": 29980 + }, + { + "epoch": 0.75, + "learning_rate": 0.001869808808381278, + "loss": 0.0904, + "step": 29990 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018694319523653996, + "loss": 0.0963, + "step": 30000 + }, + { + "epoch": 0.75, + "eval_cer": 0.6659708076055567, + "eval_loss": 0.07728173583745956, + "eval_runtime": 90.6693, + "eval_samples_per_second": 110.28, + "eval_steps_per_second": 6.893, + "step": 30000 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018690550963495214, + "loss": 0.1015, + "step": 30010 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018686782403336433, + "loss": 0.0994, + "step": 30020 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018683013843177653, + "loss": 0.1013, + "step": 30030 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018679245283018868, + "loss": 0.0995, + "step": 30040 + }, + { + "epoch": 0.75, + "learning_rate": 0.0018675476722860085, + "loss": 0.0963, + "step": 30050 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018671708162701305, + "loss": 0.0978, + "step": 30060 + }, + { + "epoch": 0.76, + "learning_rate": 0.001866793960254252, + "loss": 0.0989, + "step": 30070 + }, + { + "epoch": 0.76, + "learning_rate": 0.001866417104238374, + "loss": 0.0997, + "step": 30080 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018660402482224957, + "loss": 0.0986, + "step": 30090 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018656633922066177, + "loss": 0.0961, + "step": 30100 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018652865361907392, + "loss": 0.0952, + "step": 30110 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018649096801748612, + "loss": 0.0959, + "step": 30120 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018645328241589832, + "loss": 0.0975, + "step": 30130 + }, + { + "epoch": 0.76, + "learning_rate": 0.001864155968143105, + "loss": 0.0911, + "step": 30140 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018637791121272264, + "loss": 0.0977, + "step": 30150 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018634022561113484, + "loss": 0.0958, + "step": 30160 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018630254000954704, + "loss": 0.0987, + "step": 30170 + }, + { + "epoch": 0.76, + "learning_rate": 0.001862648544079592, + "loss": 0.0973, + "step": 30180 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018622716880637136, + "loss": 0.0995, + "step": 30190 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018618948320478356, + "loss": 0.0998, + "step": 30200 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018615179760319575, + "loss": 0.0989, + "step": 30210 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018611411200160793, + "loss": 0.1, + "step": 30220 + }, + { + "epoch": 0.76, + "learning_rate": 0.001860764264000201, + "loss": 0.0991, + "step": 30230 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018603874079843228, + "loss": 0.1011, + "step": 30240 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018600105519684447, + "loss": 0.0989, + "step": 30250 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018596336959525663, + "loss": 0.095, + "step": 30260 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018592568399366882, + "loss": 0.0968, + "step": 30270 + }, + { + "epoch": 0.76, + "learning_rate": 0.00185887998392081, + "loss": 0.0936, + "step": 30280 + }, + { + "epoch": 0.76, + "learning_rate": 0.001858503127904932, + "loss": 0.1002, + "step": 30290 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018581262718890535, + "loss": 0.0974, + "step": 30300 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018577494158731754, + "loss": 0.0954, + "step": 30310 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018573725598572972, + "loss": 0.0954, + "step": 30320 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018569957038414191, + "loss": 0.0983, + "step": 30330 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018566188478255407, + "loss": 0.0978, + "step": 30340 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018562419918096626, + "loss": 0.0994, + "step": 30350 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018558651357937844, + "loss": 0.0974, + "step": 30360 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018554882797779063, + "loss": 0.0952, + "step": 30370 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018551114237620279, + "loss": 0.0938, + "step": 30380 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018547345677461498, + "loss": 0.0971, + "step": 30390 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018543577117302718, + "loss": 0.0995, + "step": 30400 + }, + { + "epoch": 0.76, + "learning_rate": 0.0018539808557143935, + "loss": 0.0957, + "step": 30410 + }, + { + "epoch": 0.76, + "learning_rate": 0.001853603999698515, + "loss": 0.0985, + "step": 30420 + }, + { + "epoch": 0.76, + "learning_rate": 0.001853227143682637, + "loss": 0.0944, + "step": 30430 + }, + { + "epoch": 0.76, + "learning_rate": 0.001852850287666759, + "loss": 0.0984, + "step": 30440 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018524734316508807, + "loss": 0.102, + "step": 30450 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018520965756350022, + "loss": 0.1017, + "step": 30460 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018517197196191242, + "loss": 0.0997, + "step": 30470 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018513428636032462, + "loss": 0.101, + "step": 30480 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018509660075873677, + "loss": 0.098, + "step": 30490 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018505891515714894, + "loss": 0.0958, + "step": 30500 + }, + { + "epoch": 0.77, + "eval_cer": 0.6662455901255385, + "eval_loss": 0.07596764713525772, + "eval_runtime": 90.6663, + "eval_samples_per_second": 110.283, + "eval_steps_per_second": 6.893, + "step": 30500 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018502122955556114, + "loss": 0.0934, + "step": 30510 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018498354395397334, + "loss": 0.0951, + "step": 30520 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018494585835238549, + "loss": 0.0959, + "step": 30530 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018490817275079769, + "loss": 0.1019, + "step": 30540 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018487048714920986, + "loss": 0.0972, + "step": 30550 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018483280154762206, + "loss": 0.0984, + "step": 30560 + }, + { + "epoch": 0.77, + "learning_rate": 0.001847951159460342, + "loss": 0.0973, + "step": 30570 + }, + { + "epoch": 0.77, + "learning_rate": 0.001847574303444464, + "loss": 0.0956, + "step": 30580 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018471974474285858, + "loss": 0.0991, + "step": 30590 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018468205914127078, + "loss": 0.0969, + "step": 30600 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018464437353968293, + "loss": 0.0965, + "step": 30610 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018460668793809512, + "loss": 0.0959, + "step": 30620 + }, + { + "epoch": 0.77, + "learning_rate": 0.001845690023365073, + "loss": 0.0971, + "step": 30630 + }, + { + "epoch": 0.77, + "learning_rate": 0.001845313167349195, + "loss": 0.0962, + "step": 30640 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018449363113333165, + "loss": 0.0977, + "step": 30650 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018445594553174384, + "loss": 0.0941, + "step": 30660 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018441825993015604, + "loss": 0.0981, + "step": 30670 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018438057432856821, + "loss": 0.0967, + "step": 30680 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018434288872698037, + "loss": 0.0981, + "step": 30690 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018430520312539256, + "loss": 0.0969, + "step": 30700 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018426751752380476, + "loss": 0.0967, + "step": 30710 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018422983192221691, + "loss": 0.0952, + "step": 30720 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018419214632062909, + "loss": 0.0993, + "step": 30730 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018415446071904128, + "loss": 0.0953, + "step": 30740 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018411677511745348, + "loss": 0.0968, + "step": 30750 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018407908951586563, + "loss": 0.093, + "step": 30760 + }, + { + "epoch": 0.77, + "learning_rate": 0.001840414039142778, + "loss": 0.0961, + "step": 30770 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018400371831269, + "loss": 0.0961, + "step": 30780 + }, + { + "epoch": 0.77, + "learning_rate": 0.001839660327111022, + "loss": 0.096, + "step": 30790 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018392834710951435, + "loss": 0.0985, + "step": 30800 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018389066150792655, + "loss": 0.0962, + "step": 30810 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018385297590633872, + "loss": 0.0965, + "step": 30820 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018381529030475092, + "loss": 0.0997, + "step": 30830 + }, + { + "epoch": 0.77, + "learning_rate": 0.0018377760470316307, + "loss": 0.1014, + "step": 30840 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018373991910157527, + "loss": 0.0963, + "step": 30850 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018370223349998744, + "loss": 0.096, + "step": 30860 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018366454789839964, + "loss": 0.0979, + "step": 30870 + }, + { + "epoch": 0.78, + "learning_rate": 0.001836268622968118, + "loss": 0.094, + "step": 30880 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018358917669522399, + "loss": 0.095, + "step": 30890 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018355149109363616, + "loss": 0.0946, + "step": 30900 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018351380549204836, + "loss": 0.0967, + "step": 30910 + }, + { + "epoch": 0.78, + "learning_rate": 0.001834761198904605, + "loss": 0.0981, + "step": 30920 + }, + { + "epoch": 0.78, + "learning_rate": 0.001834384342888727, + "loss": 0.0968, + "step": 30930 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018340074868728488, + "loss": 0.0945, + "step": 30940 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018336306308569706, + "loss": 0.0951, + "step": 30950 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018332537748410923, + "loss": 0.0931, + "step": 30960 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018328769188252143, + "loss": 0.0999, + "step": 30970 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018325000628093362, + "loss": 0.0918, + "step": 30980 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018321232067934577, + "loss": 0.0927, + "step": 30990 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018317463507775795, + "loss": 0.0999, + "step": 31000 + }, + { + "epoch": 0.78, + "eval_cer": 0.6661349071490135, + "eval_loss": 0.07599937915802002, + "eval_runtime": 90.6874, + "eval_samples_per_second": 110.258, + "eval_steps_per_second": 6.892, + "step": 31000 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018313694947617015, + "loss": 0.0963, + "step": 31010 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018309926387458234, + "loss": 0.0964, + "step": 31020 + }, + { + "epoch": 0.78, + "learning_rate": 0.001830615782729945, + "loss": 0.0985, + "step": 31030 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018302389267140667, + "loss": 0.0956, + "step": 31040 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018298620706981886, + "loss": 0.0983, + "step": 31050 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018294852146823106, + "loss": 0.0927, + "step": 31060 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018291083586664321, + "loss": 0.0913, + "step": 31070 + }, + { + "epoch": 0.78, + "learning_rate": 0.001828731502650554, + "loss": 0.0932, + "step": 31080 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018283546466346758, + "loss": 0.0954, + "step": 31090 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018279777906187978, + "loss": 0.0978, + "step": 31100 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018276009346029193, + "loss": 0.0953, + "step": 31110 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018272240785870413, + "loss": 0.0969, + "step": 31120 + }, + { + "epoch": 0.78, + "learning_rate": 0.001826847222571163, + "loss": 0.1006, + "step": 31130 + }, + { + "epoch": 0.78, + "learning_rate": 0.001826470366555285, + "loss": 0.0923, + "step": 31140 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018260935105394065, + "loss": 0.0949, + "step": 31150 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018257166545235285, + "loss": 0.0972, + "step": 31160 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018253397985076502, + "loss": 0.0916, + "step": 31170 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018249629424917718, + "loss": 0.0975, + "step": 31180 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018245860864758937, + "loss": 0.0962, + "step": 31190 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018242092304600157, + "loss": 0.0968, + "step": 31200 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018238323744441374, + "loss": 0.097, + "step": 31210 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018234555184282592, + "loss": 0.0965, + "step": 31220 + }, + { + "epoch": 0.78, + "learning_rate": 0.001823078662412381, + "loss": 0.0948, + "step": 31230 + }, + { + "epoch": 0.78, + "learning_rate": 0.0018227018063965029, + "loss": 0.0927, + "step": 31240 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018223249503806248, + "loss": 0.0938, + "step": 31250 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018219480943647464, + "loss": 0.0976, + "step": 31260 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018215712383488681, + "loss": 0.093, + "step": 31270 + }, + { + "epoch": 0.79, + "learning_rate": 0.00182119438233299, + "loss": 0.0961, + "step": 31280 + }, + { + "epoch": 0.79, + "learning_rate": 0.001820817526317112, + "loss": 0.0948, + "step": 31290 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018204406703012336, + "loss": 0.0974, + "step": 31300 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018200638142853553, + "loss": 0.0915, + "step": 31310 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018196869582694773, + "loss": 0.0956, + "step": 31320 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018193101022535992, + "loss": 0.0971, + "step": 31330 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018189332462377208, + "loss": 0.0941, + "step": 31340 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018185563902218425, + "loss": 0.0949, + "step": 31350 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018181795342059645, + "loss": 0.0934, + "step": 31360 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018178026781900864, + "loss": 0.0957, + "step": 31370 + }, + { + "epoch": 0.79, + "learning_rate": 0.001817425822174208, + "loss": 0.0958, + "step": 31380 + }, + { + "epoch": 0.79, + "learning_rate": 0.00181704896615833, + "loss": 0.0965, + "step": 31390 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018166721101424517, + "loss": 0.0956, + "step": 31400 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018162952541265732, + "loss": 0.0972, + "step": 31410 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018159183981106952, + "loss": 0.0995, + "step": 31420 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018155415420948171, + "loss": 0.0925, + "step": 31430 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018151646860789389, + "loss": 0.0944, + "step": 31440 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018147878300630604, + "loss": 0.0914, + "step": 31450 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018144109740471823, + "loss": 0.0953, + "step": 31460 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018140341180313043, + "loss": 0.094, + "step": 31470 + }, + { + "epoch": 0.79, + "learning_rate": 0.001813657262015426, + "loss": 0.0964, + "step": 31480 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018132804059995478, + "loss": 0.0949, + "step": 31490 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018129035499836695, + "loss": 0.0953, + "step": 31500 + }, + { + "epoch": 0.79, + "eval_cer": 0.6660814905820818, + "eval_loss": 0.07518129050731659, + "eval_runtime": 90.6489, + "eval_samples_per_second": 110.305, + "eval_steps_per_second": 6.895, + "step": 31500 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018125266939677915, + "loss": 0.0923, + "step": 31510 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018121498379519132, + "loss": 0.1015, + "step": 31520 + }, + { + "epoch": 0.79, + "learning_rate": 0.001811772981936035, + "loss": 0.0961, + "step": 31530 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018113961259201567, + "loss": 0.0955, + "step": 31540 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018110192699042787, + "loss": 0.0983, + "step": 31550 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018106424138884007, + "loss": 0.0977, + "step": 31560 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018102655578725222, + "loss": 0.0982, + "step": 31570 + }, + { + "epoch": 0.79, + "learning_rate": 0.001809888701856644, + "loss": 0.0937, + "step": 31580 + }, + { + "epoch": 0.79, + "learning_rate": 0.001809511845840766, + "loss": 0.0956, + "step": 31590 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018091349898248874, + "loss": 0.0955, + "step": 31600 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018087581338090094, + "loss": 0.0926, + "step": 31610 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018083812777931311, + "loss": 0.0961, + "step": 31620 + }, + { + "epoch": 0.79, + "learning_rate": 0.001808004421777253, + "loss": 0.0952, + "step": 31630 + }, + { + "epoch": 0.79, + "learning_rate": 0.0018076275657613746, + "loss": 0.0969, + "step": 31640 + }, + { + "epoch": 0.8, + "learning_rate": 0.0018072507097454966, + "loss": 0.0995, + "step": 31650 + }, + { + "epoch": 0.8, + "learning_rate": 0.0018068738537296185, + "loss": 0.0956, + "step": 31660 + }, + { + "epoch": 0.8, + "learning_rate": 0.0018064969977137403, + "loss": 0.0951, + "step": 31670 + }, + { + "epoch": 0.8, + "learning_rate": 0.0018061201416978618, + "loss": 0.099, + "step": 31680 + }, + { + "epoch": 0.8, + "learning_rate": 0.0018057432856819838, + "loss": 0.0959, + "step": 31690 + }, + { + "epoch": 0.8, + "learning_rate": 0.0018053664296661057, + "loss": 0.0974, + "step": 31700 + }, + { + "epoch": 0.8, + "learning_rate": 0.0018049895736502275, + "loss": 0.0936, + "step": 31710 + }, + { + "epoch": 0.8, + "learning_rate": 0.001804612717634349, + "loss": 0.0978, + "step": 31720 + }, + { + "epoch": 0.8, + "learning_rate": 0.001804235861618471, + "loss": 0.096, + "step": 31730 + }, + { + "epoch": 0.8, + "learning_rate": 0.001803859005602593, + "loss": 0.0995, + "step": 31740 + }, + { + "epoch": 0.8, + "learning_rate": 0.0018034821495867147, + "loss": 0.0954, + "step": 31750 + }, + { + "epoch": 0.8, + "learning_rate": 0.0018031052935708362, + "loss": 0.0929, + "step": 31760 + }, + { + "epoch": 0.8, + "learning_rate": 0.0018027284375549582, + "loss": 0.093, + "step": 31770 + }, + { + "epoch": 0.8, + "learning_rate": 0.0018023515815390801, + "loss": 0.0933, + "step": 31780 + }, + { + "epoch": 0.8, + "learning_rate": 0.0018019747255232019, + "loss": 0.0939, + "step": 31790 + }, + { + "epoch": 0.8, + "learning_rate": 0.0018015978695073236, + "loss": 0.0916, + "step": 31800 + }, + { + "epoch": 0.8, + "learning_rate": 0.0018012210134914454, + "loss": 0.0982, + "step": 31810 + }, + { + "epoch": 0.8, + "learning_rate": 0.0018008441574755673, + "loss": 0.093, + "step": 31820 + }, + { + "epoch": 0.8, + "learning_rate": 0.0018004673014596888, + "loss": 0.0967, + "step": 31830 + }, + { + "epoch": 0.8, + "learning_rate": 0.0018000904454438108, + "loss": 0.0949, + "step": 31840 + }, + { + "epoch": 0.8, + "learning_rate": 0.0017997135894279326, + "loss": 0.0948, + "step": 31850 + }, + { + "epoch": 0.8, + "learning_rate": 0.0017993367334120545, + "loss": 0.0965, + "step": 31860 + }, + { + "epoch": 0.8, + "learning_rate": 0.001798959877396176, + "loss": 0.0951, + "step": 31870 + }, + { + "epoch": 0.8, + "learning_rate": 0.001798583021380298, + "loss": 0.1012, + "step": 31880 + }, + { + "epoch": 0.8, + "learning_rate": 0.0017982061653644198, + "loss": 0.0969, + "step": 31890 + }, + { + "epoch": 0.8, + "learning_rate": 0.0017978293093485417, + "loss": 0.095, + "step": 31900 + }, + { + "epoch": 0.8, + "learning_rate": 0.0017974524533326632, + "loss": 0.0935, + "step": 31910 + }, + { + "epoch": 0.8, + "learning_rate": 0.0017970755973167852, + "loss": 0.0951, + "step": 31920 + }, + { + "epoch": 0.8, + "learning_rate": 0.001796698741300907, + "loss": 0.0974, + "step": 31930 + }, + { + "epoch": 0.8, + "learning_rate": 0.001796321885285029, + "loss": 0.0941, + "step": 31940 + }, + { + "epoch": 0.8, + "learning_rate": 0.0017959450292691504, + "loss": 0.0965, + "step": 31950 + }, + { + "epoch": 0.8, + "learning_rate": 0.0017955681732532724, + "loss": 0.0939, + "step": 31960 + }, + { + "epoch": 0.8, + "learning_rate": 0.0017951913172373944, + "loss": 0.0975, + "step": 31970 + }, + { + "epoch": 0.8, + "learning_rate": 0.001794814461221516, + "loss": 0.0947, + "step": 31980 + }, + { + "epoch": 0.8, + "learning_rate": 0.0017944376052056376, + "loss": 0.0963, + "step": 31990 + }, + { + "epoch": 0.8, + "learning_rate": 0.0017940607491897596, + "loss": 0.095, + "step": 32000 + }, + { + "epoch": 0.8, + "eval_cer": 0.6662220098392354, + "eval_loss": 0.07489816099405289, + "eval_runtime": 90.5954, + "eval_samples_per_second": 110.37, + "eval_steps_per_second": 6.899, + "step": 32000 + }, + { + "epoch": 0.8, + "learning_rate": 0.0017936838931738816, + "loss": 0.0966, + "step": 32010 + }, + { + "epoch": 0.8, + "learning_rate": 0.0017933070371580033, + "loss": 0.096, + "step": 32020 + }, + { + "epoch": 0.8, + "learning_rate": 0.0017929301811421248, + "loss": 0.0933, + "step": 32030 + }, + { + "epoch": 0.8, + "learning_rate": 0.0017925533251262468, + "loss": 0.0946, + "step": 32040 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017921764691103687, + "loss": 0.0965, + "step": 32050 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017917996130944903, + "loss": 0.0956, + "step": 32060 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017914227570786122, + "loss": 0.0931, + "step": 32070 + }, + { + "epoch": 0.81, + "learning_rate": 0.001791045901062734, + "loss": 0.0952, + "step": 32080 + }, + { + "epoch": 0.81, + "learning_rate": 0.001790669045046856, + "loss": 0.0952, + "step": 32090 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017902921890309775, + "loss": 0.0916, + "step": 32100 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017899153330150994, + "loss": 0.0926, + "step": 32110 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017895384769992212, + "loss": 0.1009, + "step": 32120 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017891616209833431, + "loss": 0.0927, + "step": 32130 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017887847649674647, + "loss": 0.0993, + "step": 32140 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017884079089515866, + "loss": 0.0974, + "step": 32150 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017880310529357084, + "loss": 0.0937, + "step": 32160 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017876541969198303, + "loss": 0.0957, + "step": 32170 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017872773409039519, + "loss": 0.095, + "step": 32180 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017869004848880738, + "loss": 0.095, + "step": 32190 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017865236288721956, + "loss": 0.0979, + "step": 32200 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017861467728563175, + "loss": 0.0903, + "step": 32210 + }, + { + "epoch": 0.81, + "learning_rate": 0.001785769916840439, + "loss": 0.0944, + "step": 32220 + }, + { + "epoch": 0.81, + "learning_rate": 0.001785393060824561, + "loss": 0.0943, + "step": 32230 + }, + { + "epoch": 0.81, + "learning_rate": 0.001785016204808683, + "loss": 0.0986, + "step": 32240 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017846393487928047, + "loss": 0.0931, + "step": 32250 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017842624927769263, + "loss": 0.0915, + "step": 32260 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017838856367610482, + "loss": 0.0935, + "step": 32270 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017835087807451702, + "loss": 0.0938, + "step": 32280 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017831319247292917, + "loss": 0.0942, + "step": 32290 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017827550687134134, + "loss": 0.0977, + "step": 32300 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017823782126975354, + "loss": 0.0938, + "step": 32310 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017820013566816574, + "loss": 0.0961, + "step": 32320 + }, + { + "epoch": 0.81, + "learning_rate": 0.001781624500665779, + "loss": 0.0929, + "step": 32330 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017812476446499006, + "loss": 0.0904, + "step": 32340 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017808707886340226, + "loss": 0.0981, + "step": 32350 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017804939326181446, + "loss": 0.0945, + "step": 32360 + }, + { + "epoch": 0.81, + "learning_rate": 0.001780117076602266, + "loss": 0.0971, + "step": 32370 + }, + { + "epoch": 0.81, + "learning_rate": 0.001779740220586388, + "loss": 0.0965, + "step": 32380 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017793633645705098, + "loss": 0.0958, + "step": 32390 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017789865085546318, + "loss": 0.099, + "step": 32400 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017786096525387533, + "loss": 0.0947, + "step": 32410 + }, + { + "epoch": 0.81, + "learning_rate": 0.0017782327965228753, + "loss": 0.0964, + "step": 32420 + }, + { + "epoch": 0.81, + "learning_rate": 0.001777855940506997, + "loss": 0.103, + "step": 32430 + }, + { + "epoch": 0.82, + "learning_rate": 0.001777479084491119, + "loss": 0.0953, + "step": 32440 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017771022284752405, + "loss": 0.0934, + "step": 32450 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017767253724593624, + "loss": 0.0963, + "step": 32460 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017763485164434842, + "loss": 0.0929, + "step": 32470 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017759716604276062, + "loss": 0.0949, + "step": 32480 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017755948044117277, + "loss": 0.0952, + "step": 32490 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017752179483958496, + "loss": 0.09, + "step": 32500 + }, + { + "epoch": 0.82, + "eval_cer": 0.6662576208838565, + "eval_loss": 0.07475540041923523, + "eval_runtime": 90.7185, + "eval_samples_per_second": 110.22, + "eval_steps_per_second": 6.889, + "step": 32500 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017748410923799714, + "loss": 0.0996, + "step": 32510 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017744642363640931, + "loss": 0.0974, + "step": 32520 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017740873803482149, + "loss": 0.0936, + "step": 32530 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017737105243323368, + "loss": 0.0976, + "step": 32540 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017733336683164588, + "loss": 0.0948, + "step": 32550 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017729568123005803, + "loss": 0.0954, + "step": 32560 + }, + { + "epoch": 0.82, + "learning_rate": 0.001772579956284702, + "loss": 0.0959, + "step": 32570 + }, + { + "epoch": 0.82, + "learning_rate": 0.001772203100268824, + "loss": 0.0974, + "step": 32580 + }, + { + "epoch": 0.82, + "learning_rate": 0.001771826244252946, + "loss": 0.0967, + "step": 32590 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017714493882370675, + "loss": 0.0929, + "step": 32600 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017710725322211893, + "loss": 0.0947, + "step": 32610 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017706956762053112, + "loss": 0.0964, + "step": 32620 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017703188201894332, + "loss": 0.0929, + "step": 32630 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017699419641735547, + "loss": 0.091, + "step": 32640 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017695651081576767, + "loss": 0.0927, + "step": 32650 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017691882521417984, + "loss": 0.0942, + "step": 32660 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017688113961259204, + "loss": 0.0924, + "step": 32670 + }, + { + "epoch": 0.82, + "learning_rate": 0.001768434540110042, + "loss": 0.0967, + "step": 32680 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017680576840941639, + "loss": 0.0936, + "step": 32690 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017676808280782856, + "loss": 0.0964, + "step": 32700 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017673039720624071, + "loss": 0.0944, + "step": 32710 + }, + { + "epoch": 0.82, + "learning_rate": 0.001766927116046529, + "loss": 0.0932, + "step": 32720 + }, + { + "epoch": 0.82, + "learning_rate": 0.001766550260030651, + "loss": 0.0894, + "step": 32730 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017661734040147728, + "loss": 0.0946, + "step": 32740 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017657965479988943, + "loss": 0.0945, + "step": 32750 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017654196919830163, + "loss": 0.0966, + "step": 32760 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017650428359671383, + "loss": 0.0972, + "step": 32770 + }, + { + "epoch": 0.82, + "learning_rate": 0.00176466597995126, + "loss": 0.0925, + "step": 32780 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017642891239353818, + "loss": 0.097, + "step": 32790 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017639122679195035, + "loss": 0.0931, + "step": 32800 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017635354119036255, + "loss": 0.0914, + "step": 32810 + }, + { + "epoch": 0.82, + "learning_rate": 0.0017631585558877474, + "loss": 0.0939, + "step": 32820 + }, + { + "epoch": 0.82, + "learning_rate": 0.001762781699871869, + "loss": 0.0944, + "step": 32830 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017624048438559907, + "loss": 0.0913, + "step": 32840 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017620279878401127, + "loss": 0.0939, + "step": 32850 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017616511318242346, + "loss": 0.0938, + "step": 32860 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017612742758083561, + "loss": 0.0922, + "step": 32870 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017608974197924779, + "loss": 0.097, + "step": 32880 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017605205637765999, + "loss": 0.0948, + "step": 32890 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017601437077607218, + "loss": 0.0952, + "step": 32900 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017597668517448433, + "loss": 0.0958, + "step": 32910 + }, + { + "epoch": 0.83, + "learning_rate": 0.001759389995728965, + "loss": 0.0936, + "step": 32920 + }, + { + "epoch": 0.83, + "learning_rate": 0.001759013139713087, + "loss": 0.0942, + "step": 32930 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017586362836972086, + "loss": 0.0982, + "step": 32940 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017582594276813305, + "loss": 0.0943, + "step": 32950 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017578825716654525, + "loss": 0.0946, + "step": 32960 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017575057156495742, + "loss": 0.095, + "step": 32970 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017571288596336958, + "loss": 0.093, + "step": 32980 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017567520036178177, + "loss": 0.0948, + "step": 32990 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017563751476019397, + "loss": 0.0927, + "step": 33000 + }, + { + "epoch": 0.83, + "eval_cer": 0.6656248029963325, + "eval_loss": 0.07400975376367569, + "eval_runtime": 90.819, + "eval_samples_per_second": 110.098, + "eval_steps_per_second": 6.882, + "step": 33000 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017559982915860614, + "loss": 0.0909, + "step": 33010 + }, + { + "epoch": 0.83, + "learning_rate": 0.001755621435570183, + "loss": 0.0924, + "step": 33020 + }, + { + "epoch": 0.83, + "learning_rate": 0.001755244579554305, + "loss": 0.0877, + "step": 33030 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017548677235384269, + "loss": 0.0936, + "step": 33040 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017544908675225486, + "loss": 0.0929, + "step": 33050 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017541140115066704, + "loss": 0.0943, + "step": 33060 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017537371554907921, + "loss": 0.0924, + "step": 33070 + }, + { + "epoch": 0.83, + "learning_rate": 0.001753360299474914, + "loss": 0.0967, + "step": 33080 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017529834434590358, + "loss": 0.0918, + "step": 33090 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017526065874431576, + "loss": 0.094, + "step": 33100 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017522297314272793, + "loss": 0.0924, + "step": 33110 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017518528754114013, + "loss": 0.0933, + "step": 33120 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017514760193955232, + "loss": 0.0937, + "step": 33130 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017510991633796448, + "loss": 0.0909, + "step": 33140 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017507223073637665, + "loss": 0.0945, + "step": 33150 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017503454513478885, + "loss": 0.0906, + "step": 33160 + }, + { + "epoch": 0.83, + "learning_rate": 0.00174996859533201, + "loss": 0.0962, + "step": 33170 + }, + { + "epoch": 0.83, + "learning_rate": 0.001749591739316132, + "loss": 0.091, + "step": 33180 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017492148833002537, + "loss": 0.0924, + "step": 33190 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017488380272843757, + "loss": 0.0909, + "step": 33200 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017484611712684972, + "loss": 0.0921, + "step": 33210 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017480843152526192, + "loss": 0.09, + "step": 33220 + }, + { + "epoch": 0.83, + "learning_rate": 0.0017477074592367411, + "loss": 0.0988, + "step": 33230 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017473306032208629, + "loss": 0.0931, + "step": 33240 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017469537472049844, + "loss": 0.0974, + "step": 33250 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017465768911891064, + "loss": 0.0907, + "step": 33260 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017462000351732283, + "loss": 0.0921, + "step": 33270 + }, + { + "epoch": 0.84, + "learning_rate": 0.00174582317915735, + "loss": 0.094, + "step": 33280 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017454463231414716, + "loss": 0.091, + "step": 33290 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017450694671255935, + "loss": 0.0906, + "step": 33300 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017446926111097155, + "loss": 0.0884, + "step": 33310 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017443157550938373, + "loss": 0.0916, + "step": 33320 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017439388990779588, + "loss": 0.0951, + "step": 33330 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017435620430620807, + "loss": 0.0937, + "step": 33340 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017431851870462027, + "loss": 0.0922, + "step": 33350 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017428083310303245, + "loss": 0.0923, + "step": 33360 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017424314750144462, + "loss": 0.0941, + "step": 33370 + }, + { + "epoch": 0.84, + "learning_rate": 0.001742054618998568, + "loss": 0.0932, + "step": 33380 + }, + { + "epoch": 0.84, + "learning_rate": 0.00174167776298269, + "loss": 0.0934, + "step": 33390 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017413009069668114, + "loss": 0.095, + "step": 33400 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017409240509509334, + "loss": 0.0925, + "step": 33410 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017405471949350551, + "loss": 0.0933, + "step": 33420 + }, + { + "epoch": 0.84, + "learning_rate": 0.001740170338919177, + "loss": 0.0931, + "step": 33430 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017397934829032986, + "loss": 0.0936, + "step": 33440 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017394166268874206, + "loss": 0.0896, + "step": 33450 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017390397708715423, + "loss": 0.0935, + "step": 33460 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017386629148556643, + "loss": 0.0955, + "step": 33470 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017382860588397858, + "loss": 0.0952, + "step": 33480 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017379092028239078, + "loss": 0.0954, + "step": 33490 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017375323468080295, + "loss": 0.0914, + "step": 33500 + }, + { + "epoch": 0.84, + "eval_cer": 0.6662003544742631, + "eval_loss": 0.07387839257717133, + "eval_runtime": 90.756, + "eval_samples_per_second": 110.175, + "eval_steps_per_second": 6.887, + "step": 33500 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017371554907921515, + "loss": 0.094, + "step": 33510 + }, + { + "epoch": 0.84, + "learning_rate": 0.001736778634776273, + "loss": 0.091, + "step": 33520 + }, + { + "epoch": 0.84, + "learning_rate": 0.001736401778760395, + "loss": 0.09, + "step": 33530 + }, + { + "epoch": 0.84, + "learning_rate": 0.001736024922744517, + "loss": 0.0934, + "step": 33540 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017356480667286387, + "loss": 0.0958, + "step": 33550 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017352712107127602, + "loss": 0.0926, + "step": 33560 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017348943546968822, + "loss": 0.0905, + "step": 33570 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017345174986810041, + "loss": 0.0919, + "step": 33580 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017341406426651259, + "loss": 0.0964, + "step": 33590 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017337637866492474, + "loss": 0.0949, + "step": 33600 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017333869306333694, + "loss": 0.09, + "step": 33610 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017330100746174913, + "loss": 0.091, + "step": 33620 + }, + { + "epoch": 0.84, + "learning_rate": 0.0017326332186016129, + "loss": 0.0972, + "step": 33630 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017322563625857348, + "loss": 0.0954, + "step": 33640 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017318795065698566, + "loss": 0.095, + "step": 33650 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017315026505539785, + "loss": 0.0931, + "step": 33660 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017311257945381, + "loss": 0.0932, + "step": 33670 + }, + { + "epoch": 0.85, + "learning_rate": 0.001730748938522222, + "loss": 0.0919, + "step": 33680 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017303720825063438, + "loss": 0.089, + "step": 33690 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017299952264904657, + "loss": 0.0972, + "step": 33700 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017296183704745872, + "loss": 0.0916, + "step": 33710 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017292415144587092, + "loss": 0.0878, + "step": 33720 + }, + { + "epoch": 0.85, + "learning_rate": 0.001728864658442831, + "loss": 0.0971, + "step": 33730 + }, + { + "epoch": 0.85, + "learning_rate": 0.001728487802426953, + "loss": 0.0936, + "step": 33740 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017281109464110744, + "loss": 0.0936, + "step": 33750 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017277340903951964, + "loss": 0.0947, + "step": 33760 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017273572343793181, + "loss": 0.0947, + "step": 33770 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017269803783634401, + "loss": 0.091, + "step": 33780 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017266035223475616, + "loss": 0.0943, + "step": 33790 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017262266663316836, + "loss": 0.0911, + "step": 33800 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017258498103158056, + "loss": 0.0921, + "step": 33810 + }, + { + "epoch": 0.85, + "learning_rate": 0.001725472954299927, + "loss": 0.0895, + "step": 33820 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017250960982840488, + "loss": 0.093, + "step": 33830 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017247192422681708, + "loss": 0.0933, + "step": 33840 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017243423862522928, + "loss": 0.0962, + "step": 33850 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017239655302364143, + "loss": 0.095, + "step": 33860 + }, + { + "epoch": 0.85, + "learning_rate": 0.001723588674220536, + "loss": 0.0909, + "step": 33870 + }, + { + "epoch": 0.85, + "learning_rate": 0.001723211818204658, + "loss": 0.0924, + "step": 33880 + }, + { + "epoch": 0.85, + "learning_rate": 0.00172283496218878, + "loss": 0.0895, + "step": 33890 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017224581061729015, + "loss": 0.0909, + "step": 33900 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017220812501570232, + "loss": 0.0938, + "step": 33910 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017217043941411452, + "loss": 0.0934, + "step": 33920 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017213275381252671, + "loss": 0.0947, + "step": 33930 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017209506821093887, + "loss": 0.0933, + "step": 33940 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017205738260935106, + "loss": 0.0956, + "step": 33950 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017201969700776324, + "loss": 0.0919, + "step": 33960 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017198201140617543, + "loss": 0.0962, + "step": 33970 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017194432580458759, + "loss": 0.0935, + "step": 33980 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017190664020299978, + "loss": 0.0932, + "step": 33990 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017186895460141196, + "loss": 0.0889, + "step": 34000 + }, + { + "epoch": 0.85, + "eval_cer": 0.665936159021601, + "eval_loss": 0.07373498380184174, + "eval_runtime": 90.8685, + "eval_samples_per_second": 110.038, + "eval_steps_per_second": 6.878, + "step": 34000 + }, + { + "epoch": 0.85, + "learning_rate": 0.0017183126899982415, + "loss": 0.0922, + "step": 34010 + }, + { + "epoch": 0.85, + "learning_rate": 0.001717935833982363, + "loss": 0.0928, + "step": 34020 + }, + { + "epoch": 0.85, + "learning_rate": 0.001717558977966485, + "loss": 0.0973, + "step": 34030 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017171821219506068, + "loss": 0.092, + "step": 34040 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017168052659347285, + "loss": 0.0924, + "step": 34050 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017164284099188503, + "loss": 0.0968, + "step": 34060 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017160515539029722, + "loss": 0.095, + "step": 34070 + }, + { + "epoch": 0.86, + "learning_rate": 0.001715674697887094, + "loss": 0.0928, + "step": 34080 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017152978418712157, + "loss": 0.0945, + "step": 34090 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017149209858553375, + "loss": 0.0929, + "step": 34100 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017145441298394594, + "loss": 0.0899, + "step": 34110 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017141672738235814, + "loss": 0.0887, + "step": 34120 + }, + { + "epoch": 0.86, + "learning_rate": 0.001713790417807703, + "loss": 0.0915, + "step": 34130 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017134135617918247, + "loss": 0.0945, + "step": 34140 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017130367057759466, + "loss": 0.0913, + "step": 34150 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017126598497600686, + "loss": 0.0915, + "step": 34160 + }, + { + "epoch": 0.86, + "learning_rate": 0.00171228299374419, + "loss": 0.0951, + "step": 34170 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017119061377283118, + "loss": 0.0959, + "step": 34180 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017115292817124338, + "loss": 0.0957, + "step": 34190 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017111524256965558, + "loss": 0.0911, + "step": 34200 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017107755696806773, + "loss": 0.0934, + "step": 34210 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017103987136647993, + "loss": 0.0918, + "step": 34220 + }, + { + "epoch": 0.86, + "learning_rate": 0.001710021857648921, + "loss": 0.0925, + "step": 34230 + }, + { + "epoch": 0.86, + "learning_rate": 0.001709645001633043, + "loss": 0.0916, + "step": 34240 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017092681456171645, + "loss": 0.0907, + "step": 34250 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017088912896012865, + "loss": 0.0905, + "step": 34260 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017085144335854082, + "loss": 0.0933, + "step": 34270 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017081375775695297, + "loss": 0.0923, + "step": 34280 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017077607215536517, + "loss": 0.0953, + "step": 34290 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017073838655377736, + "loss": 0.0925, + "step": 34300 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017070070095218954, + "loss": 0.092, + "step": 34310 + }, + { + "epoch": 0.86, + "learning_rate": 0.001706630153506017, + "loss": 0.094, + "step": 34320 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017062532974901389, + "loss": 0.0938, + "step": 34330 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017058764414742608, + "loss": 0.0876, + "step": 34340 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017054995854583826, + "loss": 0.0927, + "step": 34350 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017051227294425043, + "loss": 0.0946, + "step": 34360 + }, + { + "epoch": 0.86, + "learning_rate": 0.001704745873426626, + "loss": 0.0934, + "step": 34370 + }, + { + "epoch": 0.86, + "learning_rate": 0.001704369017410748, + "loss": 0.0908, + "step": 34380 + }, + { + "epoch": 0.86, + "learning_rate": 0.00170399216139487, + "loss": 0.0909, + "step": 34390 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017036153053789915, + "loss": 0.0901, + "step": 34400 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017032384493631133, + "loss": 0.0888, + "step": 34410 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017028615933472352, + "loss": 0.0895, + "step": 34420 + }, + { + "epoch": 0.86, + "learning_rate": 0.0017024847373313572, + "loss": 0.0867, + "step": 34430 + }, + { + "epoch": 0.87, + "learning_rate": 0.0017021078813154787, + "loss": 0.0912, + "step": 34440 + }, + { + "epoch": 0.87, + "learning_rate": 0.0017017310252996005, + "loss": 0.0906, + "step": 34450 + }, + { + "epoch": 0.87, + "learning_rate": 0.0017013541692837224, + "loss": 0.0943, + "step": 34460 + }, + { + "epoch": 0.87, + "learning_rate": 0.0017009773132678444, + "loss": 0.0911, + "step": 34470 + }, + { + "epoch": 0.87, + "learning_rate": 0.001700600457251966, + "loss": 0.0914, + "step": 34480 + }, + { + "epoch": 0.87, + "learning_rate": 0.0017002236012360877, + "loss": 0.0936, + "step": 34490 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016998467452202096, + "loss": 0.0924, + "step": 34500 + }, + { + "epoch": 0.87, + "eval_cer": 0.6659621454595678, + "eval_loss": 0.0725727379322052, + "eval_runtime": 90.8863, + "eval_samples_per_second": 110.017, + "eval_steps_per_second": 6.877, + "step": 34500 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016994698892043312, + "loss": 0.0938, + "step": 34510 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016990930331884531, + "loss": 0.0948, + "step": 34520 + }, + { + "epoch": 0.87, + "learning_rate": 0.001698716177172575, + "loss": 0.0885, + "step": 34530 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016983393211566968, + "loss": 0.0896, + "step": 34540 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016979624651408183, + "loss": 0.0916, + "step": 34550 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016975856091249403, + "loss": 0.0926, + "step": 34560 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016972087531090623, + "loss": 0.0942, + "step": 34570 + }, + { + "epoch": 0.87, + "learning_rate": 0.001696831897093184, + "loss": 0.0939, + "step": 34580 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016964550410773055, + "loss": 0.0919, + "step": 34590 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016960781850614275, + "loss": 0.0903, + "step": 34600 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016957013290455495, + "loss": 0.0898, + "step": 34610 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016953244730296712, + "loss": 0.0906, + "step": 34620 + }, + { + "epoch": 0.87, + "learning_rate": 0.001694947617013793, + "loss": 0.0888, + "step": 34630 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016945707609979147, + "loss": 0.094, + "step": 34640 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016941939049820367, + "loss": 0.0922, + "step": 34650 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016938170489661584, + "loss": 0.0935, + "step": 34660 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016934401929502802, + "loss": 0.0926, + "step": 34670 + }, + { + "epoch": 0.87, + "learning_rate": 0.001693063336934402, + "loss": 0.0905, + "step": 34680 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016926864809185239, + "loss": 0.0906, + "step": 34690 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016923096249026458, + "loss": 0.0912, + "step": 34700 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016919327688867673, + "loss": 0.092, + "step": 34710 + }, + { + "epoch": 0.87, + "learning_rate": 0.001691555912870889, + "loss": 0.0925, + "step": 34720 + }, + { + "epoch": 0.87, + "learning_rate": 0.001691179056855011, + "loss": 0.0932, + "step": 34730 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016908022008391326, + "loss": 0.0904, + "step": 34740 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016904253448232545, + "loss": 0.0923, + "step": 34750 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016900484888073763, + "loss": 0.0913, + "step": 34760 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016896716327914982, + "loss": 0.0921, + "step": 34770 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016892947767756198, + "loss": 0.0904, + "step": 34780 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016889179207597417, + "loss": 0.0906, + "step": 34790 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016885410647438637, + "loss": 0.0885, + "step": 34800 + }, + { + "epoch": 0.87, + "learning_rate": 0.0016881642087279854, + "loss": 0.0935, + "step": 34810 + }, + { + "epoch": 0.87, + "learning_rate": 0.001687787352712107, + "loss": 0.0912, + "step": 34820 + }, + { + "epoch": 0.88, + "learning_rate": 0.001687410496696229, + "loss": 0.0919, + "step": 34830 + }, + { + "epoch": 0.88, + "learning_rate": 0.001687033640680351, + "loss": 0.0929, + "step": 34840 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016866567846644726, + "loss": 0.0913, + "step": 34850 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016862799286485942, + "loss": 0.0885, + "step": 34860 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016859030726327161, + "loss": 0.0882, + "step": 34870 + }, + { + "epoch": 0.88, + "learning_rate": 0.001685526216616838, + "loss": 0.0944, + "step": 34880 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016851493606009598, + "loss": 0.0919, + "step": 34890 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016847725045850814, + "loss": 0.0915, + "step": 34900 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016843956485692033, + "loss": 0.094, + "step": 34910 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016840187925533253, + "loss": 0.0897, + "step": 34920 + }, + { + "epoch": 0.88, + "learning_rate": 0.001683641936537447, + "loss": 0.0963, + "step": 34930 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016832650805215688, + "loss": 0.0902, + "step": 34940 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016828882245056905, + "loss": 0.0966, + "step": 34950 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016825113684898125, + "loss": 0.0971, + "step": 34960 + }, + { + "epoch": 0.88, + "learning_rate": 0.001682134512473934, + "loss": 0.0928, + "step": 34970 + }, + { + "epoch": 0.88, + "learning_rate": 0.001681757656458056, + "loss": 0.0926, + "step": 34980 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016813808004421777, + "loss": 0.0901, + "step": 34990 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016810039444262997, + "loss": 0.0898, + "step": 35000 + }, + { + "epoch": 0.88, + "eval_cer": 0.6658870735276637, + "eval_loss": 0.07192695885896683, + "eval_runtime": 90.571, + "eval_samples_per_second": 110.4, + "eval_steps_per_second": 6.901, + "step": 35000 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016806270884104212, + "loss": 0.0918, + "step": 35010 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016802502323945432, + "loss": 0.0892, + "step": 35020 + }, + { + "epoch": 0.88, + "learning_rate": 0.001679873376378665, + "loss": 0.0907, + "step": 35030 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016794965203627869, + "loss": 0.0915, + "step": 35040 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016791196643469084, + "loss": 0.0957, + "step": 35050 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016787428083310304, + "loss": 0.0924, + "step": 35060 + }, + { + "epoch": 0.88, + "learning_rate": 0.001678365952315152, + "loss": 0.0896, + "step": 35070 + }, + { + "epoch": 0.88, + "learning_rate": 0.001677989096299274, + "loss": 0.0887, + "step": 35080 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016776122402833956, + "loss": 0.0921, + "step": 35090 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016772353842675176, + "loss": 0.0917, + "step": 35100 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016768585282516395, + "loss": 0.0942, + "step": 35110 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016764816722357613, + "loss": 0.0933, + "step": 35120 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016761048162198828, + "loss": 0.0892, + "step": 35130 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016757279602040048, + "loss": 0.0919, + "step": 35140 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016753511041881267, + "loss": 0.0971, + "step": 35150 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016749742481722482, + "loss": 0.0943, + "step": 35160 + }, + { + "epoch": 0.88, + "learning_rate": 0.00167459739215637, + "loss": 0.0885, + "step": 35170 + }, + { + "epoch": 0.88, + "learning_rate": 0.001674220536140492, + "loss": 0.0894, + "step": 35180 + }, + { + "epoch": 0.88, + "learning_rate": 0.001673843680124614, + "loss": 0.0895, + "step": 35190 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016734668241087354, + "loss": 0.0913, + "step": 35200 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016730899680928574, + "loss": 0.0927, + "step": 35210 + }, + { + "epoch": 0.88, + "learning_rate": 0.0016727131120769791, + "loss": 0.0922, + "step": 35220 + }, + { + "epoch": 0.89, + "learning_rate": 0.001672336256061101, + "loss": 0.0918, + "step": 35230 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016719594000452226, + "loss": 0.0933, + "step": 35240 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016715825440293446, + "loss": 0.0957, + "step": 35250 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016712056880134663, + "loss": 0.0941, + "step": 35260 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016708288319975883, + "loss": 0.0917, + "step": 35270 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016704519759817098, + "loss": 0.0904, + "step": 35280 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016700751199658318, + "loss": 0.09, + "step": 35290 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016696982639499535, + "loss": 0.0926, + "step": 35300 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016693214079340755, + "loss": 0.0889, + "step": 35310 + }, + { + "epoch": 0.89, + "learning_rate": 0.001668944551918197, + "loss": 0.0899, + "step": 35320 + }, + { + "epoch": 0.89, + "learning_rate": 0.001668567695902319, + "loss": 0.0892, + "step": 35330 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016681908398864407, + "loss": 0.0924, + "step": 35340 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016678139838705627, + "loss": 0.0907, + "step": 35350 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016674371278546842, + "loss": 0.0906, + "step": 35360 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016670602718388062, + "loss": 0.0928, + "step": 35370 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016666834158229281, + "loss": 0.0898, + "step": 35380 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016663065598070497, + "loss": 0.0908, + "step": 35390 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016659297037911714, + "loss": 0.0911, + "step": 35400 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016655528477752934, + "loss": 0.0916, + "step": 35410 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016651759917594153, + "loss": 0.0887, + "step": 35420 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016647991357435369, + "loss": 0.091, + "step": 35430 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016644222797276586, + "loss": 0.0907, + "step": 35440 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016640454237117806, + "loss": 0.0908, + "step": 35450 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016636685676959025, + "loss": 0.0903, + "step": 35460 + }, + { + "epoch": 0.89, + "learning_rate": 0.001663291711680024, + "loss": 0.089, + "step": 35470 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016629148556641458, + "loss": 0.0887, + "step": 35480 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016625379996482678, + "loss": 0.0898, + "step": 35490 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016621611436323897, + "loss": 0.0913, + "step": 35500 + }, + { + "epoch": 0.89, + "eval_cer": 0.6657017998495673, + "eval_loss": 0.07208002358675003, + "eval_runtime": 90.5347, + "eval_samples_per_second": 110.444, + "eval_steps_per_second": 6.903, + "step": 35500 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016617842876165113, + "loss": 0.0886, + "step": 35510 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016614074316006332, + "loss": 0.0912, + "step": 35520 + }, + { + "epoch": 0.89, + "learning_rate": 0.001661030575584755, + "loss": 0.0922, + "step": 35530 + }, + { + "epoch": 0.89, + "learning_rate": 0.001660653719568877, + "loss": 0.0907, + "step": 35540 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016602768635529984, + "loss": 0.0882, + "step": 35550 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016599000075371204, + "loss": 0.0863, + "step": 35560 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016595231515212422, + "loss": 0.0889, + "step": 35570 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016591462955053641, + "loss": 0.0906, + "step": 35580 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016587694394894856, + "loss": 0.0917, + "step": 35590 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016583925834736076, + "loss": 0.0931, + "step": 35600 + }, + { + "epoch": 0.89, + "learning_rate": 0.0016580157274577294, + "loss": 0.0898, + "step": 35610 + }, + { + "epoch": 0.89, + "learning_rate": 0.001657638871441851, + "loss": 0.0894, + "step": 35620 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016572620154259728, + "loss": 0.0849, + "step": 35630 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016568851594100948, + "loss": 0.0883, + "step": 35640 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016565083033942165, + "loss": 0.0911, + "step": 35650 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016561314473783383, + "loss": 0.0902, + "step": 35660 + }, + { + "epoch": 0.9, + "learning_rate": 0.00165575459136246, + "loss": 0.0947, + "step": 35670 + }, + { + "epoch": 0.9, + "learning_rate": 0.001655377735346582, + "loss": 0.0884, + "step": 35680 + }, + { + "epoch": 0.9, + "learning_rate": 0.001655000879330704, + "loss": 0.0922, + "step": 35690 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016546240233148255, + "loss": 0.0874, + "step": 35700 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016542471672989472, + "loss": 0.0905, + "step": 35710 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016538703112830692, + "loss": 0.0903, + "step": 35720 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016534934552671912, + "loss": 0.0913, + "step": 35730 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016531165992513127, + "loss": 0.0874, + "step": 35740 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016527397432354344, + "loss": 0.0951, + "step": 35750 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016523628872195564, + "loss": 0.0942, + "step": 35760 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016519860312036783, + "loss": 0.0907, + "step": 35770 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016516091751877999, + "loss": 0.0912, + "step": 35780 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016512323191719218, + "loss": 0.0907, + "step": 35790 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016508554631560436, + "loss": 0.0879, + "step": 35800 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016504786071401655, + "loss": 0.0927, + "step": 35810 + }, + { + "epoch": 0.9, + "learning_rate": 0.001650101751124287, + "loss": 0.0902, + "step": 35820 + }, + { + "epoch": 0.9, + "learning_rate": 0.001649724895108409, + "loss": 0.0913, + "step": 35830 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016493480390925308, + "loss": 0.0917, + "step": 35840 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016489711830766523, + "loss": 0.0927, + "step": 35850 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016485943270607743, + "loss": 0.0917, + "step": 35860 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016482174710448962, + "loss": 0.0922, + "step": 35870 + }, + { + "epoch": 0.9, + "learning_rate": 0.001647840615029018, + "loss": 0.0907, + "step": 35880 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016474637590131395, + "loss": 0.0894, + "step": 35890 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016470869029972615, + "loss": 0.0886, + "step": 35900 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016467100469813834, + "loss": 0.0892, + "step": 35910 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016463331909655052, + "loss": 0.0902, + "step": 35920 + }, + { + "epoch": 0.9, + "learning_rate": 0.001645956334949627, + "loss": 0.0916, + "step": 35930 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016455794789337487, + "loss": 0.0907, + "step": 35940 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016452026229178706, + "loss": 0.0938, + "step": 35950 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016448257669019926, + "loss": 0.0909, + "step": 35960 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016444489108861141, + "loss": 0.0877, + "step": 35970 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016440720548702359, + "loss": 0.0888, + "step": 35980 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016436951988543578, + "loss": 0.0899, + "step": 35990 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016433183428384798, + "loss": 0.0897, + "step": 36000 + }, + { + "epoch": 0.9, + "eval_cer": 0.6657489604221738, + "eval_loss": 0.07150072604417801, + "eval_runtime": 90.8705, + "eval_samples_per_second": 110.036, + "eval_steps_per_second": 6.878, + "step": 36000 + }, + { + "epoch": 0.9, + "learning_rate": 0.0016429414868226013, + "loss": 0.0934, + "step": 36010 + }, + { + "epoch": 0.9, + "learning_rate": 0.001642564630806723, + "loss": 0.0884, + "step": 36020 + }, + { + "epoch": 0.91, + "learning_rate": 0.001642187774790845, + "loss": 0.0897, + "step": 36030 + }, + { + "epoch": 0.91, + "learning_rate": 0.001641810918774967, + "loss": 0.0865, + "step": 36040 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016414340627590885, + "loss": 0.0889, + "step": 36050 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016410572067432102, + "loss": 0.0876, + "step": 36060 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016406803507273322, + "loss": 0.0912, + "step": 36070 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016403034947114537, + "loss": 0.0868, + "step": 36080 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016399266386955757, + "loss": 0.0901, + "step": 36090 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016395497826796977, + "loss": 0.0909, + "step": 36100 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016391729266638194, + "loss": 0.0894, + "step": 36110 + }, + { + "epoch": 0.91, + "learning_rate": 0.001638796070647941, + "loss": 0.0941, + "step": 36120 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016384192146320629, + "loss": 0.0872, + "step": 36130 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016380423586161849, + "loss": 0.0949, + "step": 36140 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016376655026003066, + "loss": 0.0929, + "step": 36150 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016372886465844281, + "loss": 0.0884, + "step": 36160 + }, + { + "epoch": 0.91, + "learning_rate": 0.00163691179056855, + "loss": 0.0931, + "step": 36170 + }, + { + "epoch": 0.91, + "learning_rate": 0.001636534934552672, + "loss": 0.0909, + "step": 36180 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016361580785367938, + "loss": 0.0944, + "step": 36190 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016357812225209155, + "loss": 0.0893, + "step": 36200 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016354043665050373, + "loss": 0.0883, + "step": 36210 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016350275104891592, + "loss": 0.0904, + "step": 36220 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016346506544732812, + "loss": 0.0939, + "step": 36230 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016342737984574027, + "loss": 0.0903, + "step": 36240 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016338969424415245, + "loss": 0.0889, + "step": 36250 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016335200864256464, + "loss": 0.0876, + "step": 36260 + }, + { + "epoch": 0.91, + "learning_rate": 0.001633143230409768, + "loss": 0.0943, + "step": 36270 + }, + { + "epoch": 0.91, + "learning_rate": 0.00163276637439389, + "loss": 0.0916, + "step": 36280 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016323895183780117, + "loss": 0.0893, + "step": 36290 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016320126623621336, + "loss": 0.0915, + "step": 36300 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016316358063462552, + "loss": 0.0883, + "step": 36310 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016312589503303771, + "loss": 0.0879, + "step": 36320 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016308820943144989, + "loss": 0.0872, + "step": 36330 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016305052382986208, + "loss": 0.0907, + "step": 36340 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016301283822827424, + "loss": 0.0913, + "step": 36350 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016297515262668643, + "loss": 0.0866, + "step": 36360 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016293746702509863, + "loss": 0.0929, + "step": 36370 + }, + { + "epoch": 0.91, + "learning_rate": 0.001628997814235108, + "loss": 0.091, + "step": 36380 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016286209582192296, + "loss": 0.0866, + "step": 36390 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016282441022033515, + "loss": 0.0895, + "step": 36400 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016278672461874735, + "loss": 0.088, + "step": 36410 + }, + { + "epoch": 0.91, + "learning_rate": 0.0016274903901715952, + "loss": 0.0907, + "step": 36420 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016271135341557167, + "loss": 0.0956, + "step": 36430 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016267366781398387, + "loss": 0.0899, + "step": 36440 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016263598221239607, + "loss": 0.0883, + "step": 36450 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016259829661080824, + "loss": 0.09, + "step": 36460 + }, + { + "epoch": 0.92, + "learning_rate": 0.001625606110092204, + "loss": 0.0912, + "step": 36470 + }, + { + "epoch": 0.92, + "learning_rate": 0.001625229254076326, + "loss": 0.0923, + "step": 36480 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016248523980604479, + "loss": 0.0876, + "step": 36490 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016244755420445694, + "loss": 0.0887, + "step": 36500 + }, + { + "epoch": 0.92, + "eval_cer": 0.6658702304660187, + "eval_loss": 0.07075611501932144, + "eval_runtime": 90.7034, + "eval_samples_per_second": 110.238, + "eval_steps_per_second": 6.891, + "step": 36500 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016240986860286914, + "loss": 0.089, + "step": 36510 + }, + { + "epoch": 0.92, + "learning_rate": 0.001623721830012813, + "loss": 0.0892, + "step": 36520 + }, + { + "epoch": 0.92, + "learning_rate": 0.001623344973996935, + "loss": 0.094, + "step": 36530 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016229681179810566, + "loss": 0.0915, + "step": 36540 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016225912619651785, + "loss": 0.0863, + "step": 36550 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016222144059493003, + "loss": 0.0909, + "step": 36560 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016218375499334223, + "loss": 0.0877, + "step": 36570 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016214606939175438, + "loss": 0.0923, + "step": 36580 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016210838379016657, + "loss": 0.0893, + "step": 36590 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016207069818857875, + "loss": 0.0924, + "step": 36600 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016203301258699095, + "loss": 0.0908, + "step": 36610 + }, + { + "epoch": 0.92, + "learning_rate": 0.001619953269854031, + "loss": 0.0874, + "step": 36620 + }, + { + "epoch": 0.92, + "learning_rate": 0.001619576413838153, + "loss": 0.0859, + "step": 36630 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016191995578222747, + "loss": 0.0923, + "step": 36640 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016188227018063966, + "loss": 0.091, + "step": 36650 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016184458457905182, + "loss": 0.0898, + "step": 36660 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016180689897746401, + "loss": 0.0874, + "step": 36670 + }, + { + "epoch": 0.92, + "learning_rate": 0.001617692133758762, + "loss": 0.0881, + "step": 36680 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016173152777428838, + "loss": 0.0915, + "step": 36690 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016169384217270054, + "loss": 0.0905, + "step": 36700 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016165615657111273, + "loss": 0.091, + "step": 36710 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016161847096952493, + "loss": 0.09, + "step": 36720 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016158078536793708, + "loss": 0.0872, + "step": 36730 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016154309976634926, + "loss": 0.0867, + "step": 36740 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016150541416476145, + "loss": 0.0875, + "step": 36750 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016146772856317365, + "loss": 0.0902, + "step": 36760 + }, + { + "epoch": 0.92, + "learning_rate": 0.001614300429615858, + "loss": 0.0915, + "step": 36770 + }, + { + "epoch": 0.92, + "learning_rate": 0.00161392357359998, + "loss": 0.089, + "step": 36780 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016135467175841017, + "loss": 0.0867, + "step": 36790 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016131698615682237, + "loss": 0.0884, + "step": 36800 + }, + { + "epoch": 0.92, + "learning_rate": 0.0016127930055523452, + "loss": 0.0907, + "step": 36810 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016124161495364672, + "loss": 0.0911, + "step": 36820 + }, + { + "epoch": 0.93, + "learning_rate": 0.001612039293520589, + "loss": 0.0903, + "step": 36830 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016116624375047109, + "loss": 0.0893, + "step": 36840 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016112855814888324, + "loss": 0.0912, + "step": 36850 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016109087254729544, + "loss": 0.0902, + "step": 36860 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016105318694570761, + "loss": 0.0936, + "step": 36870 + }, + { + "epoch": 0.93, + "learning_rate": 0.001610155013441198, + "loss": 0.0901, + "step": 36880 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016097781574253196, + "loss": 0.0864, + "step": 36890 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016094013014094416, + "loss": 0.0862, + "step": 36900 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016090244453935633, + "loss": 0.089, + "step": 36910 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016086475893776853, + "loss": 0.089, + "step": 36920 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016082707333618068, + "loss": 0.088, + "step": 36930 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016078938773459288, + "loss": 0.0889, + "step": 36940 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016075170213300507, + "loss": 0.0884, + "step": 36950 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016071401653141722, + "loss": 0.0884, + "step": 36960 + }, + { + "epoch": 0.93, + "learning_rate": 0.001606763309298294, + "loss": 0.086, + "step": 36970 + }, + { + "epoch": 0.93, + "learning_rate": 0.001606386453282416, + "loss": 0.091, + "step": 36980 + }, + { + "epoch": 0.93, + "learning_rate": 0.001606009597266538, + "loss": 0.0906, + "step": 36990 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016056327412506594, + "loss": 0.0922, + "step": 37000 + }, + { + "epoch": 0.93, + "eval_cer": 0.6653331774147055, + "eval_loss": 0.07120376080274582, + "eval_runtime": 90.8589, + "eval_samples_per_second": 110.05, + "eval_steps_per_second": 6.879, + "step": 37000 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016052558852347812, + "loss": 0.0909, + "step": 37010 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016048790292189031, + "loss": 0.0879, + "step": 37020 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016045021732030251, + "loss": 0.0878, + "step": 37030 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016041253171871466, + "loss": 0.0872, + "step": 37040 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016037484611712684, + "loss": 0.0867, + "step": 37050 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016033716051553903, + "loss": 0.0886, + "step": 37060 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016029947491395123, + "loss": 0.0873, + "step": 37070 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016026178931236338, + "loss": 0.0892, + "step": 37080 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016022410371077558, + "loss": 0.0889, + "step": 37090 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016018641810918775, + "loss": 0.0872, + "step": 37100 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016014873250759995, + "loss": 0.0892, + "step": 37110 + }, + { + "epoch": 0.93, + "learning_rate": 0.001601110469060121, + "loss": 0.0914, + "step": 37120 + }, + { + "epoch": 0.93, + "learning_rate": 0.001600733613044243, + "loss": 0.09, + "step": 37130 + }, + { + "epoch": 0.93, + "learning_rate": 0.0016003567570283647, + "loss": 0.0882, + "step": 37140 + }, + { + "epoch": 0.93, + "learning_rate": 0.0015999799010124867, + "loss": 0.0852, + "step": 37150 + }, + { + "epoch": 0.93, + "learning_rate": 0.0015996030449966082, + "loss": 0.0871, + "step": 37160 + }, + { + "epoch": 0.93, + "learning_rate": 0.0015992261889807302, + "loss": 0.0884, + "step": 37170 + }, + { + "epoch": 0.93, + "learning_rate": 0.001598849332964852, + "loss": 0.092, + "step": 37180 + }, + { + "epoch": 0.93, + "learning_rate": 0.0015984724769489737, + "loss": 0.0903, + "step": 37190 + }, + { + "epoch": 0.93, + "learning_rate": 0.0015980956209330954, + "loss": 0.0893, + "step": 37200 + }, + { + "epoch": 0.93, + "learning_rate": 0.0015977187649172174, + "loss": 0.0898, + "step": 37210 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015973419089013393, + "loss": 0.0907, + "step": 37220 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015969650528854609, + "loss": 0.0897, + "step": 37230 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015965881968695826, + "loss": 0.0923, + "step": 37240 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015962113408537046, + "loss": 0.0909, + "step": 37250 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015958344848378265, + "loss": 0.0909, + "step": 37260 + }, + { + "epoch": 0.94, + "learning_rate": 0.001595457628821948, + "loss": 0.0874, + "step": 37270 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015950807728060698, + "loss": 0.0862, + "step": 37280 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015947039167901918, + "loss": 0.089, + "step": 37290 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015943270607743137, + "loss": 0.0852, + "step": 37300 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015939502047584353, + "loss": 0.0898, + "step": 37310 + }, + { + "epoch": 0.94, + "learning_rate": 0.001593573348742557, + "loss": 0.0906, + "step": 37320 + }, + { + "epoch": 0.94, + "learning_rate": 0.001593196492726679, + "loss": 0.0905, + "step": 37330 + }, + { + "epoch": 0.94, + "learning_rate": 0.001592819636710801, + "loss": 0.0873, + "step": 37340 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015924427806949225, + "loss": 0.0883, + "step": 37350 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015920659246790444, + "loss": 0.087, + "step": 37360 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015916890686631662, + "loss": 0.0909, + "step": 37370 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015913122126472877, + "loss": 0.0908, + "step": 37380 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015909353566314097, + "loss": 0.0917, + "step": 37390 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015905585006155316, + "loss": 0.0889, + "step": 37400 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015901816445996534, + "loss": 0.0891, + "step": 37410 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015898047885837749, + "loss": 0.0904, + "step": 37420 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015894279325678968, + "loss": 0.0897, + "step": 37430 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015890510765520188, + "loss": 0.0869, + "step": 37440 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015886742205361406, + "loss": 0.0849, + "step": 37450 + }, + { + "epoch": 0.94, + "learning_rate": 0.001588297364520262, + "loss": 0.0891, + "step": 37460 + }, + { + "epoch": 0.94, + "learning_rate": 0.001587920508504384, + "loss": 0.0919, + "step": 37470 + }, + { + "epoch": 0.94, + "learning_rate": 0.001587543652488506, + "loss": 0.0893, + "step": 37480 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015871667964726277, + "loss": 0.0892, + "step": 37490 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015867899404567495, + "loss": 0.0905, + "step": 37500 + }, + { + "epoch": 0.94, + "eval_cer": 0.6659635891505659, + "eval_loss": 0.07065676897764206, + "eval_runtime": 90.5606, + "eval_samples_per_second": 110.412, + "eval_steps_per_second": 6.901, + "step": 37500 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015864130844408712, + "loss": 0.0874, + "step": 37510 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015860362284249932, + "loss": 0.0857, + "step": 37520 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015856593724091152, + "loss": 0.0874, + "step": 37530 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015852825163932367, + "loss": 0.0898, + "step": 37540 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015849056603773584, + "loss": 0.0887, + "step": 37550 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015845288043614804, + "loss": 0.0885, + "step": 37560 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015841519483456024, + "loss": 0.0867, + "step": 37570 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015837750923297239, + "loss": 0.089, + "step": 37580 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015833982363138456, + "loss": 0.0883, + "step": 37590 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015830213802979676, + "loss": 0.0857, + "step": 37600 + }, + { + "epoch": 0.94, + "learning_rate": 0.0015826445242820891, + "loss": 0.0898, + "step": 37610 + }, + { + "epoch": 0.95, + "learning_rate": 0.001582267668266211, + "loss": 0.0881, + "step": 37620 + }, + { + "epoch": 0.95, + "learning_rate": 0.001581890812250333, + "loss": 0.0901, + "step": 37630 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015815139562344548, + "loss": 0.0857, + "step": 37640 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015811371002185763, + "loss": 0.0888, + "step": 37650 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015807602442026983, + "loss": 0.093, + "step": 37660 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015803833881868202, + "loss": 0.0835, + "step": 37670 + }, + { + "epoch": 0.95, + "learning_rate": 0.001580006532170942, + "loss": 0.0839, + "step": 37680 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015796296761550635, + "loss": 0.0881, + "step": 37690 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015792528201391855, + "loss": 0.0925, + "step": 37700 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015788759641233074, + "loss": 0.0915, + "step": 37710 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015784991081074292, + "loss": 0.0862, + "step": 37720 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015781222520915507, + "loss": 0.0904, + "step": 37730 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015777453960756727, + "loss": 0.0922, + "step": 37740 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015773685400597946, + "loss": 0.0893, + "step": 37750 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015769916840439164, + "loss": 0.0925, + "step": 37760 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015766148280280381, + "loss": 0.0914, + "step": 37770 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015762379720121599, + "loss": 0.0861, + "step": 37780 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015758611159962818, + "loss": 0.09, + "step": 37790 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015754842599804038, + "loss": 0.0869, + "step": 37800 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015751074039645253, + "loss": 0.0865, + "step": 37810 + }, + { + "epoch": 0.95, + "learning_rate": 0.001574730547948647, + "loss": 0.0893, + "step": 37820 + }, + { + "epoch": 0.95, + "learning_rate": 0.001574353691932769, + "loss": 0.0851, + "step": 37830 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015739768359168905, + "loss": 0.0882, + "step": 37840 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015735999799010125, + "loss": 0.0886, + "step": 37850 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015732231238851343, + "loss": 0.0908, + "step": 37860 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015728462678692562, + "loss": 0.0871, + "step": 37870 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015724694118533777, + "loss": 0.0869, + "step": 37880 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015720925558374997, + "loss": 0.0918, + "step": 37890 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015717156998216214, + "loss": 0.0886, + "step": 37900 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015713388438057434, + "loss": 0.0904, + "step": 37910 + }, + { + "epoch": 0.95, + "learning_rate": 0.001570961987789865, + "loss": 0.0907, + "step": 37920 + }, + { + "epoch": 0.95, + "learning_rate": 0.001570585131773987, + "loss": 0.0886, + "step": 37930 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015702082757581089, + "loss": 0.0878, + "step": 37940 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015698314197422306, + "loss": 0.0868, + "step": 37950 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015694545637263521, + "loss": 0.0882, + "step": 37960 + }, + { + "epoch": 0.95, + "learning_rate": 0.001569077707710474, + "loss": 0.0859, + "step": 37970 + }, + { + "epoch": 0.95, + "learning_rate": 0.001568700851694596, + "loss": 0.0885, + "step": 37980 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015683239956787178, + "loss": 0.0905, + "step": 37990 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015679471396628393, + "loss": 0.0881, + "step": 38000 + }, + { + "epoch": 0.95, + "eval_cer": 0.6658206637417488, + "eval_loss": 0.07003695517778397, + "eval_runtime": 90.6769, + "eval_samples_per_second": 110.271, + "eval_steps_per_second": 6.893, + "step": 38000 + }, + { + "epoch": 0.95, + "learning_rate": 0.0015675702836469613, + "loss": 0.0887, + "step": 38010 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015671934276310832, + "loss": 0.0889, + "step": 38020 + }, + { + "epoch": 0.96, + "learning_rate": 0.001566816571615205, + "loss": 0.0903, + "step": 38030 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015664397155993267, + "loss": 0.0895, + "step": 38040 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015660628595834485, + "loss": 0.0887, + "step": 38050 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015656860035675704, + "loss": 0.0874, + "step": 38060 + }, + { + "epoch": 0.96, + "learning_rate": 0.001565309147551692, + "loss": 0.0902, + "step": 38070 + }, + { + "epoch": 0.96, + "learning_rate": 0.001564932291535814, + "loss": 0.0883, + "step": 38080 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015645554355199357, + "loss": 0.0902, + "step": 38090 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015641785795040576, + "loss": 0.0919, + "step": 38100 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015638017234881792, + "loss": 0.0886, + "step": 38110 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015634248674723011, + "loss": 0.089, + "step": 38120 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015630480114564229, + "loss": 0.0936, + "step": 38130 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015626711554405448, + "loss": 0.0878, + "step": 38140 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015622942994246664, + "loss": 0.0909, + "step": 38150 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015619174434087883, + "loss": 0.0903, + "step": 38160 + }, + { + "epoch": 0.96, + "learning_rate": 0.00156154058739291, + "loss": 0.084, + "step": 38170 + }, + { + "epoch": 0.96, + "learning_rate": 0.001561163731377032, + "loss": 0.0861, + "step": 38180 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015607868753611536, + "loss": 0.0859, + "step": 38190 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015604100193452755, + "loss": 0.0859, + "step": 38200 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015600331633293975, + "loss": 0.0887, + "step": 38210 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015596563073135192, + "loss": 0.0907, + "step": 38220 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015592794512976408, + "loss": 0.0895, + "step": 38230 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015589025952817627, + "loss": 0.0889, + "step": 38240 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015585257392658847, + "loss": 0.0867, + "step": 38250 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015581488832500064, + "loss": 0.0874, + "step": 38260 + }, + { + "epoch": 0.96, + "learning_rate": 0.001557772027234128, + "loss": 0.0905, + "step": 38270 + }, + { + "epoch": 0.96, + "learning_rate": 0.00155739517121825, + "loss": 0.0847, + "step": 38280 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015570183152023719, + "loss": 0.0872, + "step": 38290 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015566414591864934, + "loss": 0.0881, + "step": 38300 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015562646031706151, + "loss": 0.0879, + "step": 38310 + }, + { + "epoch": 0.96, + "learning_rate": 0.001555887747154737, + "loss": 0.0908, + "step": 38320 + }, + { + "epoch": 0.96, + "learning_rate": 0.001555510891138859, + "loss": 0.0904, + "step": 38330 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015551340351229806, + "loss": 0.0863, + "step": 38340 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015547571791071026, + "loss": 0.0832, + "step": 38350 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015543803230912243, + "loss": 0.0862, + "step": 38360 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015540034670753463, + "loss": 0.0832, + "step": 38370 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015536266110594678, + "loss": 0.0855, + "step": 38380 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015532497550435898, + "loss": 0.0871, + "step": 38390 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015528728990277115, + "loss": 0.0921, + "step": 38400 + }, + { + "epoch": 0.96, + "learning_rate": 0.0015524960430118335, + "loss": 0.0882, + "step": 38410 + }, + { + "epoch": 0.97, + "learning_rate": 0.001552119186995955, + "loss": 0.0872, + "step": 38420 + }, + { + "epoch": 0.97, + "learning_rate": 0.001551742330980077, + "loss": 0.0829, + "step": 38430 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015513654749641987, + "loss": 0.0887, + "step": 38440 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015509886189483207, + "loss": 0.0885, + "step": 38450 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015506117629324422, + "loss": 0.088, + "step": 38460 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015502349069165641, + "loss": 0.0894, + "step": 38470 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015498580509006859, + "loss": 0.0892, + "step": 38480 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015494811948848078, + "loss": 0.0859, + "step": 38490 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015491043388689294, + "loss": 0.0858, + "step": 38500 + }, + { + "epoch": 0.97, + "eval_cer": 0.6658187388204179, + "eval_loss": 0.0693318322300911, + "eval_runtime": 90.5702, + "eval_samples_per_second": 110.401, + "eval_steps_per_second": 6.901, + "step": 38500 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015487274828530513, + "loss": 0.088, + "step": 38510 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015483506268371733, + "loss": 0.0885, + "step": 38520 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015479737708212948, + "loss": 0.0879, + "step": 38530 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015475969148054166, + "loss": 0.0867, + "step": 38540 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015472200587895385, + "loss": 0.0869, + "step": 38550 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015468432027736605, + "loss": 0.0877, + "step": 38560 + }, + { + "epoch": 0.97, + "learning_rate": 0.001546466346757782, + "loss": 0.0886, + "step": 38570 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015460894907419038, + "loss": 0.0855, + "step": 38580 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015457126347260257, + "loss": 0.0903, + "step": 38590 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015453357787101477, + "loss": 0.0868, + "step": 38600 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015449589226942692, + "loss": 0.0871, + "step": 38610 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015445820666783912, + "loss": 0.0901, + "step": 38620 + }, + { + "epoch": 0.97, + "learning_rate": 0.001544205210662513, + "loss": 0.0852, + "step": 38630 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015438283546466349, + "loss": 0.0877, + "step": 38640 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015434514986307564, + "loss": 0.0863, + "step": 38650 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015430746426148784, + "loss": 0.0878, + "step": 38660 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015426977865990001, + "loss": 0.0883, + "step": 38670 + }, + { + "epoch": 0.97, + "learning_rate": 0.001542320930583122, + "loss": 0.0878, + "step": 38680 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015419440745672436, + "loss": 0.0835, + "step": 38690 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015415672185513656, + "loss": 0.09, + "step": 38700 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015411903625354873, + "loss": 0.087, + "step": 38710 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015408135065196088, + "loss": 0.0869, + "step": 38720 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015404366505037308, + "loss": 0.0866, + "step": 38730 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015400597944878528, + "loss": 0.0861, + "step": 38740 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015396829384719745, + "loss": 0.0859, + "step": 38750 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015393060824560963, + "loss": 0.0833, + "step": 38760 + }, + { + "epoch": 0.97, + "learning_rate": 0.001538929226440218, + "loss": 0.0875, + "step": 38770 + }, + { + "epoch": 0.97, + "learning_rate": 0.00153855237042434, + "loss": 0.094, + "step": 38780 + }, + { + "epoch": 0.97, + "learning_rate": 0.001538175514408462, + "loss": 0.0892, + "step": 38790 + }, + { + "epoch": 0.97, + "learning_rate": 0.0015377986583925835, + "loss": 0.0866, + "step": 38800 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015374218023767052, + "loss": 0.0841, + "step": 38810 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015370449463608272, + "loss": 0.086, + "step": 38820 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015366680903449491, + "loss": 0.0915, + "step": 38830 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015362912343290706, + "loss": 0.0834, + "step": 38840 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015359143783131924, + "loss": 0.0863, + "step": 38850 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015355375222973144, + "loss": 0.0908, + "step": 38860 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015351606662814363, + "loss": 0.0893, + "step": 38870 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015347838102655578, + "loss": 0.0884, + "step": 38880 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015344069542496796, + "loss": 0.091, + "step": 38890 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015340300982338015, + "loss": 0.0845, + "step": 38900 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015336532422179235, + "loss": 0.0864, + "step": 38910 + }, + { + "epoch": 0.98, + "learning_rate": 0.001533276386202045, + "loss": 0.0837, + "step": 38920 + }, + { + "epoch": 0.98, + "learning_rate": 0.001532899530186167, + "loss": 0.0895, + "step": 38930 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015325226741702887, + "loss": 0.0854, + "step": 38940 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015321458181544103, + "loss": 0.0863, + "step": 38950 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015317689621385322, + "loss": 0.087, + "step": 38960 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015313921061226542, + "loss": 0.0855, + "step": 38970 + }, + { + "epoch": 0.98, + "learning_rate": 0.001531015250106776, + "loss": 0.087, + "step": 38980 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015306383940908975, + "loss": 0.0867, + "step": 38990 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015302615380750194, + "loss": 0.0882, + "step": 39000 + }, + { + "epoch": 0.98, + "eval_cer": 0.6656575266589574, + "eval_loss": 0.06897370517253876, + "eval_runtime": 90.71, + "eval_samples_per_second": 110.23, + "eval_steps_per_second": 6.89, + "step": 39000 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015298846820591414, + "loss": 0.0879, + "step": 39010 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015295078260432631, + "loss": 0.0867, + "step": 39020 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015291309700273849, + "loss": 0.0872, + "step": 39030 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015287541140115066, + "loss": 0.087, + "step": 39040 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015283772579956286, + "loss": 0.0864, + "step": 39050 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015280004019797503, + "loss": 0.089, + "step": 39060 + }, + { + "epoch": 0.98, + "learning_rate": 0.001527623545963872, + "loss": 0.0869, + "step": 39070 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015272466899479938, + "loss": 0.0884, + "step": 39080 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015268698339321158, + "loss": 0.0859, + "step": 39090 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015264929779162377, + "loss": 0.0887, + "step": 39100 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015261161219003593, + "loss": 0.0884, + "step": 39110 + }, + { + "epoch": 0.98, + "learning_rate": 0.001525739265884481, + "loss": 0.0872, + "step": 39120 + }, + { + "epoch": 0.98, + "learning_rate": 0.001525362409868603, + "loss": 0.0873, + "step": 39130 + }, + { + "epoch": 0.98, + "learning_rate": 0.001524985553852725, + "loss": 0.0838, + "step": 39140 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015246086978368465, + "loss": 0.0855, + "step": 39150 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015242318418209682, + "loss": 0.0864, + "step": 39160 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015238549858050902, + "loss": 0.0874, + "step": 39170 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015234781297892117, + "loss": 0.0882, + "step": 39180 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015231012737733337, + "loss": 0.0869, + "step": 39190 + }, + { + "epoch": 0.98, + "learning_rate": 0.0015227244177574556, + "loss": 0.0886, + "step": 39200 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015223475617415774, + "loss": 0.0848, + "step": 39210 + }, + { + "epoch": 0.99, + "learning_rate": 0.001521970705725699, + "loss": 0.0905, + "step": 39220 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015215938497098209, + "loss": 0.0897, + "step": 39230 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015212169936939428, + "loss": 0.0887, + "step": 39240 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015208401376780646, + "loss": 0.0858, + "step": 39250 + }, + { + "epoch": 0.99, + "learning_rate": 0.001520463281662186, + "loss": 0.0861, + "step": 39260 + }, + { + "epoch": 0.99, + "learning_rate": 0.001520086425646308, + "loss": 0.0894, + "step": 39270 + }, + { + "epoch": 0.99, + "learning_rate": 0.00151970956963043, + "loss": 0.0888, + "step": 39280 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015193327136145518, + "loss": 0.0865, + "step": 39290 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015189558575986733, + "loss": 0.0905, + "step": 39300 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015185790015827952, + "loss": 0.0842, + "step": 39310 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015182021455669172, + "loss": 0.0872, + "step": 39320 + }, + { + "epoch": 0.99, + "learning_rate": 0.001517825289551039, + "loss": 0.09, + "step": 39330 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015174484335351607, + "loss": 0.0873, + "step": 39340 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015170715775192824, + "loss": 0.0859, + "step": 39350 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015166947215034044, + "loss": 0.0847, + "step": 39360 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015163178654875264, + "loss": 0.0879, + "step": 39370 + }, + { + "epoch": 0.99, + "learning_rate": 0.001515941009471648, + "loss": 0.0865, + "step": 39380 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015155641534557696, + "loss": 0.0878, + "step": 39390 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015151872974398916, + "loss": 0.0871, + "step": 39400 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015148104414240131, + "loss": 0.0842, + "step": 39410 + }, + { + "epoch": 0.99, + "learning_rate": 0.001514433585408135, + "loss": 0.0883, + "step": 39420 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015140567293922568, + "loss": 0.0833, + "step": 39430 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015136798733763788, + "loss": 0.0864, + "step": 39440 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015133030173605003, + "loss": 0.0888, + "step": 39450 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015129261613446223, + "loss": 0.0835, + "step": 39460 + }, + { + "epoch": 0.99, + "learning_rate": 0.001512549305328744, + "loss": 0.0861, + "step": 39470 + }, + { + "epoch": 0.99, + "learning_rate": 0.001512172449312866, + "loss": 0.086, + "step": 39480 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015117955932969875, + "loss": 0.085, + "step": 39490 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015114187372811095, + "loss": 0.0858, + "step": 39500 + }, + { + "epoch": 0.99, + "eval_cer": 0.6655954479460368, + "eval_loss": 0.06882914155721664, + "eval_runtime": 90.5569, + "eval_samples_per_second": 110.417, + "eval_steps_per_second": 6.902, + "step": 39500 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015110418812652314, + "loss": 0.0906, + "step": 39510 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015106650252493532, + "loss": 0.0863, + "step": 39520 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015102881692334747, + "loss": 0.0858, + "step": 39530 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015099113132175967, + "loss": 0.0859, + "step": 39540 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015095344572017186, + "loss": 0.0843, + "step": 39550 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015091576011858404, + "loss": 0.085, + "step": 39560 + }, + { + "epoch": 0.99, + "learning_rate": 0.001508780745169962, + "loss": 0.0908, + "step": 39570 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015084038891540839, + "loss": 0.0845, + "step": 39580 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015080270331382058, + "loss": 0.0847, + "step": 39590 + }, + { + "epoch": 0.99, + "learning_rate": 0.0015076501771223276, + "loss": 0.0871, + "step": 39600 + }, + { + "epoch": 1.0, + "learning_rate": 0.0015072733211064493, + "loss": 0.0857, + "step": 39610 + }, + { + "epoch": 1.0, + "learning_rate": 0.001506896465090571, + "loss": 0.0874, + "step": 39620 + }, + { + "epoch": 1.0, + "learning_rate": 0.001506519609074693, + "loss": 0.0863, + "step": 39630 + }, + { + "epoch": 1.0, + "learning_rate": 0.0015061427530588146, + "loss": 0.0854, + "step": 39640 + }, + { + "epoch": 1.0, + "learning_rate": 0.0015057658970429365, + "loss": 0.0858, + "step": 39650 + }, + { + "epoch": 1.0, + "learning_rate": 0.0015053890410270583, + "loss": 0.0907, + "step": 39660 + }, + { + "epoch": 1.0, + "learning_rate": 0.0015050121850111802, + "loss": 0.0882, + "step": 39670 + }, + { + "epoch": 1.0, + "learning_rate": 0.0015046353289953017, + "loss": 0.0859, + "step": 39680 + }, + { + "epoch": 1.0, + "learning_rate": 0.0015042584729794237, + "loss": 0.0833, + "step": 39690 + }, + { + "epoch": 1.0, + "learning_rate": 0.0015038816169635455, + "loss": 0.0846, + "step": 39700 + }, + { + "epoch": 1.0, + "learning_rate": 0.0015035047609476674, + "loss": 0.0839, + "step": 39710 + }, + { + "epoch": 1.0, + "learning_rate": 0.001503127904931789, + "loss": 0.0852, + "step": 39720 + }, + { + "epoch": 1.0, + "learning_rate": 0.001502751048915911, + "loss": 0.0892, + "step": 39730 + }, + { + "epoch": 1.0, + "learning_rate": 0.0015023741929000326, + "loss": 0.0885, + "step": 39740 + }, + { + "epoch": 1.0, + "learning_rate": 0.0015019973368841546, + "loss": 0.0857, + "step": 39750 + }, + { + "epoch": 1.0, + "learning_rate": 0.0015016204808682761, + "loss": 0.0866, + "step": 39760 + }, + { + "epoch": 1.0, + "learning_rate": 0.001501243624852398, + "loss": 0.0869, + "step": 39770 + }, + { + "epoch": 1.0, + "learning_rate": 0.00150086676883652, + "loss": 0.0851, + "step": 39780 + }, + { + "epoch": 1.0, + "learning_rate": 0.0015004899128206418, + "loss": 0.0851, + "step": 39790 + }, + { + "epoch": 1.0, + "learning_rate": 0.0015001130568047633, + "loss": 0.0856, + "step": 39800 + }, + { + "epoch": 1.0, + "learning_rate": 0.0014997362007888853, + "loss": 0.0823, + "step": 39810 + }, + { + "epoch": 1.0, + "learning_rate": 0.0014993593447730073, + "loss": 0.0843, + "step": 39820 + }, + { + "epoch": 1.0, + "learning_rate": 0.0014989824887571288, + "loss": 0.0779, + "step": 39830 + }, + { + "epoch": 1.0, + "learning_rate": 0.0014986056327412505, + "loss": 0.0803, + "step": 39840 + }, + { + "epoch": 1.0, + "learning_rate": 0.0014982287767253725, + "loss": 0.0808, + "step": 39850 + }, + { + "epoch": 1.0, + "learning_rate": 0.0014978519207094942, + "loss": 0.0836, + "step": 39860 + }, + { + "epoch": 1.0, + "learning_rate": 0.0014974750646936162, + "loss": 0.0778, + "step": 39870 + }, + { + "epoch": 1.0, + "learning_rate": 0.0014970982086777377, + "loss": 0.0786, + "step": 39880 + }, + { + "epoch": 1.0, + "learning_rate": 0.0014967213526618597, + "loss": 0.0768, + "step": 39890 + }, + { + "epoch": 1.0, + "learning_rate": 0.0014963444966459814, + "loss": 0.0819, + "step": 39900 + }, + { + "epoch": 1.0, + "learning_rate": 0.0014959676406301034, + "loss": 0.0801, + "step": 39910 + }, + { + "epoch": 1.0, + "learning_rate": 0.0014955907846142251, + "loss": 0.0788, + "step": 39920 + }, + { + "epoch": 1.0, + "learning_rate": 0.0014952139285983469, + "loss": 0.0818, + "step": 39930 + }, + { + "epoch": 1.0, + "learning_rate": 0.0014948370725824686, + "loss": 0.0809, + "step": 39940 + }, + { + "epoch": 1.0, + "learning_rate": 0.0014944602165665906, + "loss": 0.0779, + "step": 39950 + }, + { + "epoch": 1.0, + "learning_rate": 0.0014940833605507123, + "loss": 0.0791, + "step": 39960 + }, + { + "epoch": 1.0, + "learning_rate": 0.001493706504534834, + "loss": 0.0792, + "step": 39970 + }, + { + "epoch": 1.0, + "learning_rate": 0.0014933296485189558, + "loss": 0.0761, + "step": 39980 + }, + { + "epoch": 1.0, + "learning_rate": 0.0014929527925030778, + "loss": 0.0779, + "step": 39990 + }, + { + "epoch": 1.0, + "learning_rate": 0.0014925759364871995, + "loss": 0.0808, + "step": 40000 + }, + { + "epoch": 1.0, + "eval_cer": 0.665779277933135, + "eval_loss": 0.06800606101751328, + "eval_runtime": 90.8369, + "eval_samples_per_second": 110.076, + "eval_steps_per_second": 6.88, + "step": 40000 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014921990804713213, + "loss": 0.0828, + "step": 40010 + }, + { + "epoch": 1.01, + "learning_rate": 0.001491822224455443, + "loss": 0.0771, + "step": 40020 + }, + { + "epoch": 1.01, + "learning_rate": 0.001491445368439565, + "loss": 0.0794, + "step": 40030 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014910685124236867, + "loss": 0.0812, + "step": 40040 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014906916564078085, + "loss": 0.0781, + "step": 40050 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014903148003919302, + "loss": 0.0791, + "step": 40060 + }, + { + "epoch": 1.01, + "learning_rate": 0.001489937944376052, + "loss": 0.0773, + "step": 40070 + }, + { + "epoch": 1.01, + "learning_rate": 0.001489561088360174, + "loss": 0.0797, + "step": 40080 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014891842323442957, + "loss": 0.08, + "step": 40090 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014888073763284174, + "loss": 0.0774, + "step": 40100 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014884305203125392, + "loss": 0.08, + "step": 40110 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014880536642966611, + "loss": 0.0746, + "step": 40120 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014876768082807829, + "loss": 0.0809, + "step": 40130 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014872999522649048, + "loss": 0.0798, + "step": 40140 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014869230962490263, + "loss": 0.0806, + "step": 40150 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014865462402331483, + "loss": 0.079, + "step": 40160 + }, + { + "epoch": 1.01, + "learning_rate": 0.00148616938421727, + "loss": 0.076, + "step": 40170 + }, + { + "epoch": 1.01, + "learning_rate": 0.001485792528201392, + "loss": 0.0816, + "step": 40180 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014854156721855138, + "loss": 0.0786, + "step": 40190 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014850388161696355, + "loss": 0.0837, + "step": 40200 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014846619601537572, + "loss": 0.0779, + "step": 40210 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014842851041378792, + "loss": 0.0775, + "step": 40220 + }, + { + "epoch": 1.01, + "learning_rate": 0.001483908248122001, + "loss": 0.0786, + "step": 40230 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014835313921061227, + "loss": 0.0826, + "step": 40240 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014831545360902444, + "loss": 0.0794, + "step": 40250 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014827776800743664, + "loss": 0.082, + "step": 40260 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014824008240584882, + "loss": 0.0801, + "step": 40270 + }, + { + "epoch": 1.01, + "learning_rate": 0.00148202396804261, + "loss": 0.0795, + "step": 40280 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014816471120267316, + "loss": 0.0793, + "step": 40290 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014812702560108534, + "loss": 0.0812, + "step": 40300 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014808933999949753, + "loss": 0.0786, + "step": 40310 + }, + { + "epoch": 1.01, + "learning_rate": 0.001480516543979097, + "loss": 0.0835, + "step": 40320 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014801396879632188, + "loss": 0.0803, + "step": 40330 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014797628319473406, + "loss": 0.0768, + "step": 40340 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014793859759314625, + "loss": 0.0818, + "step": 40350 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014790091199155843, + "loss": 0.0765, + "step": 40360 + }, + { + "epoch": 1.01, + "learning_rate": 0.001478632263899706, + "loss": 0.0779, + "step": 40370 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014782554078838278, + "loss": 0.0835, + "step": 40380 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014778785518679497, + "loss": 0.0762, + "step": 40390 + }, + { + "epoch": 1.01, + "learning_rate": 0.0014775016958520715, + "loss": 0.079, + "step": 40400 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014771248398361934, + "loss": 0.0802, + "step": 40410 + }, + { + "epoch": 1.02, + "learning_rate": 0.001476747983820315, + "loss": 0.083, + "step": 40420 + }, + { + "epoch": 1.02, + "learning_rate": 0.001476371127804437, + "loss": 0.0782, + "step": 40430 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014759942717885587, + "loss": 0.0779, + "step": 40440 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014756174157726806, + "loss": 0.0753, + "step": 40450 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014752405597568022, + "loss": 0.0799, + "step": 40460 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014748637037409241, + "loss": 0.0807, + "step": 40470 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014744868477250459, + "loss": 0.0781, + "step": 40480 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014741099917091678, + "loss": 0.0815, + "step": 40490 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014737331356932896, + "loss": 0.0783, + "step": 40500 + }, + { + "epoch": 1.02, + "eval_cer": 0.6657051684618964, + "eval_loss": 0.06801352649927139, + "eval_runtime": 90.9119, + "eval_samples_per_second": 109.986, + "eval_steps_per_second": 6.875, + "step": 40500 + }, + { + "epoch": 1.02, + "learning_rate": 0.001473356279677411, + "loss": 0.0779, + "step": 40510 + }, + { + "epoch": 1.02, + "learning_rate": 0.001472979423661533, + "loss": 0.0833, + "step": 40520 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014726025676456548, + "loss": 0.0778, + "step": 40530 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014722257116297768, + "loss": 0.084, + "step": 40540 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014718488556138985, + "loss": 0.0814, + "step": 40550 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014714719995980203, + "loss": 0.0806, + "step": 40560 + }, + { + "epoch": 1.02, + "learning_rate": 0.001471095143582142, + "loss": 0.0788, + "step": 40570 + }, + { + "epoch": 1.02, + "learning_rate": 0.001470718287566264, + "loss": 0.0822, + "step": 40580 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014703414315503857, + "loss": 0.0778, + "step": 40590 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014699645755345075, + "loss": 0.0771, + "step": 40600 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014695877195186292, + "loss": 0.0766, + "step": 40610 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014692108635027512, + "loss": 0.078, + "step": 40620 + }, + { + "epoch": 1.02, + "learning_rate": 0.001468834007486873, + "loss": 0.0759, + "step": 40630 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014684571514709947, + "loss": 0.0787, + "step": 40640 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014680802954551164, + "loss": 0.0778, + "step": 40650 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014677034394392384, + "loss": 0.08, + "step": 40660 + }, + { + "epoch": 1.02, + "learning_rate": 0.00146732658342336, + "loss": 0.0763, + "step": 40670 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014669497274074818, + "loss": 0.0784, + "step": 40680 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014665728713916036, + "loss": 0.0786, + "step": 40690 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014661960153757256, + "loss": 0.0769, + "step": 40700 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014658191593598473, + "loss": 0.0787, + "step": 40710 + }, + { + "epoch": 1.02, + "learning_rate": 0.001465442303343969, + "loss": 0.0813, + "step": 40720 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014650654473280908, + "loss": 0.0807, + "step": 40730 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014646885913122125, + "loss": 0.0771, + "step": 40740 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014643117352963345, + "loss": 0.0796, + "step": 40750 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014639348792804562, + "loss": 0.078, + "step": 40760 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014635580232645782, + "loss": 0.0757, + "step": 40770 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014631811672486997, + "loss": 0.0785, + "step": 40780 + }, + { + "epoch": 1.02, + "learning_rate": 0.0014628043112328217, + "loss": 0.0792, + "step": 40790 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014624274552169434, + "loss": 0.0769, + "step": 40800 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014620505992010654, + "loss": 0.0819, + "step": 40810 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014616737431851871, + "loss": 0.0815, + "step": 40820 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014612968871693089, + "loss": 0.0788, + "step": 40830 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014609200311534306, + "loss": 0.0764, + "step": 40840 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014605431751375526, + "loss": 0.0775, + "step": 40850 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014601663191216743, + "loss": 0.0845, + "step": 40860 + }, + { + "epoch": 1.03, + "learning_rate": 0.001459789463105796, + "loss": 0.0789, + "step": 40870 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014594126070899178, + "loss": 0.0779, + "step": 40880 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014590357510740398, + "loss": 0.0803, + "step": 40890 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014586588950581615, + "loss": 0.0782, + "step": 40900 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014582820390422833, + "loss": 0.0785, + "step": 40910 + }, + { + "epoch": 1.03, + "learning_rate": 0.001457905183026405, + "loss": 0.075, + "step": 40920 + }, + { + "epoch": 1.03, + "learning_rate": 0.001457528327010527, + "loss": 0.0831, + "step": 40930 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014571514709946487, + "loss": 0.0776, + "step": 40940 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014567746149787705, + "loss": 0.0794, + "step": 40950 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014563977589628922, + "loss": 0.0811, + "step": 40960 + }, + { + "epoch": 1.03, + "learning_rate": 0.001456020902947014, + "loss": 0.0832, + "step": 40970 + }, + { + "epoch": 1.03, + "learning_rate": 0.001455644046931136, + "loss": 0.0818, + "step": 40980 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014552671909152577, + "loss": 0.0833, + "step": 40990 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014548903348993794, + "loss": 0.0822, + "step": 41000 + }, + { + "epoch": 1.03, + "eval_cer": 0.6657999708374418, + "eval_loss": 0.06757137924432755, + "eval_runtime": 90.6292, + "eval_samples_per_second": 110.329, + "eval_steps_per_second": 6.896, + "step": 41000 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014545134788835012, + "loss": 0.0816, + "step": 41010 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014541366228676231, + "loss": 0.0803, + "step": 41020 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014537597668517449, + "loss": 0.0761, + "step": 41030 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014533829108358666, + "loss": 0.078, + "step": 41040 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014530060548199884, + "loss": 0.0806, + "step": 41050 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014526291988041103, + "loss": 0.0779, + "step": 41060 + }, + { + "epoch": 1.03, + "learning_rate": 0.001452252342788232, + "loss": 0.079, + "step": 41070 + }, + { + "epoch": 1.03, + "learning_rate": 0.001451875486772354, + "loss": 0.0778, + "step": 41080 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014514986307564755, + "loss": 0.0755, + "step": 41090 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014511217747405975, + "loss": 0.0805, + "step": 41100 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014507449187247193, + "loss": 0.0765, + "step": 41110 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014503680627088412, + "loss": 0.0777, + "step": 41120 + }, + { + "epoch": 1.03, + "learning_rate": 0.001449991206692963, + "loss": 0.0769, + "step": 41130 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014496143506770847, + "loss": 0.0806, + "step": 41140 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014492374946612064, + "loss": 0.0801, + "step": 41150 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014488606386453284, + "loss": 0.0802, + "step": 41160 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014484837826294502, + "loss": 0.0785, + "step": 41170 + }, + { + "epoch": 1.03, + "learning_rate": 0.001448106926613572, + "loss": 0.077, + "step": 41180 + }, + { + "epoch": 1.03, + "learning_rate": 0.0014477300705976936, + "loss": 0.0786, + "step": 41190 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014473532145818154, + "loss": 0.0783, + "step": 41200 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014469763585659373, + "loss": 0.0784, + "step": 41210 + }, + { + "epoch": 1.04, + "learning_rate": 0.001446599502550059, + "loss": 0.0782, + "step": 41220 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014462226465341808, + "loss": 0.0773, + "step": 41230 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014458457905183026, + "loss": 0.0797, + "step": 41240 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014454689345024245, + "loss": 0.0812, + "step": 41250 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014450920784865463, + "loss": 0.0825, + "step": 41260 + }, + { + "epoch": 1.04, + "learning_rate": 0.001444715222470668, + "loss": 0.0816, + "step": 41270 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014443383664547898, + "loss": 0.0763, + "step": 41280 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014439615104389117, + "loss": 0.0787, + "step": 41290 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014435846544230335, + "loss": 0.0757, + "step": 41300 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014432077984071552, + "loss": 0.0786, + "step": 41310 + }, + { + "epoch": 1.04, + "learning_rate": 0.001442830942391277, + "loss": 0.0764, + "step": 41320 + }, + { + "epoch": 1.04, + "learning_rate": 0.001442454086375399, + "loss": 0.0757, + "step": 41330 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014420772303595207, + "loss": 0.0774, + "step": 41340 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014417003743436426, + "loss": 0.0795, + "step": 41350 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014413235183277642, + "loss": 0.0795, + "step": 41360 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014409466623118861, + "loss": 0.0797, + "step": 41370 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014405698062960079, + "loss": 0.0804, + "step": 41380 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014401929502801296, + "loss": 0.0768, + "step": 41390 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014398160942642516, + "loss": 0.0795, + "step": 41400 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014394392382483731, + "loss": 0.0789, + "step": 41410 + }, + { + "epoch": 1.04, + "learning_rate": 0.001439062382232495, + "loss": 0.0791, + "step": 41420 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014386855262166168, + "loss": 0.0811, + "step": 41430 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014383086702007388, + "loss": 0.0755, + "step": 41440 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014379318141848603, + "loss": 0.0772, + "step": 41450 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014375549581689823, + "loss": 0.0828, + "step": 41460 + }, + { + "epoch": 1.04, + "learning_rate": 0.001437178102153104, + "loss": 0.082, + "step": 41470 + }, + { + "epoch": 1.04, + "learning_rate": 0.001436801246137226, + "loss": 0.0757, + "step": 41480 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014364243901213477, + "loss": 0.0775, + "step": 41490 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014360475341054695, + "loss": 0.077, + "step": 41500 + }, + { + "epoch": 1.04, + "eval_cer": 0.6657475167311756, + "eval_loss": 0.0675220713019371, + "eval_runtime": 90.5271, + "eval_samples_per_second": 110.453, + "eval_steps_per_second": 6.904, + "step": 41500 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014356706780895912, + "loss": 0.0812, + "step": 41510 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014352938220737132, + "loss": 0.08, + "step": 41520 + }, + { + "epoch": 1.04, + "learning_rate": 0.001434916966057835, + "loss": 0.0765, + "step": 41530 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014345401100419567, + "loss": 0.0768, + "step": 41540 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014341632540260784, + "loss": 0.0788, + "step": 41550 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014337863980102004, + "loss": 0.0817, + "step": 41560 + }, + { + "epoch": 1.04, + "learning_rate": 0.001433409541994322, + "loss": 0.0797, + "step": 41570 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014330326859784439, + "loss": 0.0807, + "step": 41580 + }, + { + "epoch": 1.04, + "learning_rate": 0.0014326558299625656, + "loss": 0.0763, + "step": 41590 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014322789739466876, + "loss": 0.0777, + "step": 41600 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014319021179308093, + "loss": 0.0768, + "step": 41610 + }, + { + "epoch": 1.05, + "learning_rate": 0.001431525261914931, + "loss": 0.0784, + "step": 41620 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014311484058990528, + "loss": 0.0775, + "step": 41630 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014307715498831745, + "loss": 0.0798, + "step": 41640 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014303946938672965, + "loss": 0.0781, + "step": 41650 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014300178378514182, + "loss": 0.0787, + "step": 41660 + }, + { + "epoch": 1.05, + "learning_rate": 0.00142964098183554, + "loss": 0.0804, + "step": 41670 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014292641258196617, + "loss": 0.0802, + "step": 41680 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014288872698037837, + "loss": 0.0798, + "step": 41690 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014285104137879054, + "loss": 0.0786, + "step": 41700 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014281335577720274, + "loss": 0.0798, + "step": 41710 + }, + { + "epoch": 1.05, + "learning_rate": 0.001427756701756149, + "loss": 0.0793, + "step": 41720 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014273798457402709, + "loss": 0.08, + "step": 41730 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014270029897243926, + "loss": 0.0793, + "step": 41740 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014266261337085146, + "loss": 0.0795, + "step": 41750 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014262492776926363, + "loss": 0.0796, + "step": 41760 + }, + { + "epoch": 1.05, + "learning_rate": 0.001425872421676758, + "loss": 0.0833, + "step": 41770 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014254955656608798, + "loss": 0.0808, + "step": 41780 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014251187096450018, + "loss": 0.0769, + "step": 41790 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014247418536291235, + "loss": 0.0781, + "step": 41800 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014243649976132453, + "loss": 0.0753, + "step": 41810 + }, + { + "epoch": 1.05, + "learning_rate": 0.001423988141597367, + "loss": 0.0789, + "step": 41820 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014236112855814888, + "loss": 0.078, + "step": 41830 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014232344295656107, + "loss": 0.0754, + "step": 41840 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014228575735497325, + "loss": 0.0766, + "step": 41850 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014224807175338542, + "loss": 0.0749, + "step": 41860 + }, + { + "epoch": 1.05, + "learning_rate": 0.001422103861517976, + "loss": 0.0807, + "step": 41870 + }, + { + "epoch": 1.05, + "learning_rate": 0.001421727005502098, + "loss": 0.0805, + "step": 41880 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014213501494862197, + "loss": 0.0793, + "step": 41890 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014209732934703414, + "loss": 0.0769, + "step": 41900 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014205964374544632, + "loss": 0.082, + "step": 41910 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014202195814385851, + "loss": 0.0765, + "step": 41920 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014198427254227069, + "loss": 0.0783, + "step": 41930 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014194658694068286, + "loss": 0.0794, + "step": 41940 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014190890133909504, + "loss": 0.0765, + "step": 41950 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014187121573750723, + "loss": 0.0785, + "step": 41960 + }, + { + "epoch": 1.05, + "learning_rate": 0.001418335301359194, + "loss": 0.0787, + "step": 41970 + }, + { + "epoch": 1.05, + "learning_rate": 0.001417958445343316, + "loss": 0.0797, + "step": 41980 + }, + { + "epoch": 1.05, + "learning_rate": 0.0014175815893274376, + "loss": 0.0779, + "step": 41990 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014172047333115595, + "loss": 0.0788, + "step": 42000 + }, + { + "epoch": 1.06, + "eval_cer": 0.6654881335818407, + "eval_loss": 0.06726432591676712, + "eval_runtime": 90.7258, + "eval_samples_per_second": 110.211, + "eval_steps_per_second": 6.889, + "step": 42000 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014168278772956813, + "loss": 0.0801, + "step": 42010 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014164510212798032, + "loss": 0.0776, + "step": 42020 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014160741652639247, + "loss": 0.0782, + "step": 42030 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014156973092480467, + "loss": 0.0778, + "step": 42040 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014153204532321685, + "loss": 0.0781, + "step": 42050 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014149435972162902, + "loss": 0.0793, + "step": 42060 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014145667412004122, + "loss": 0.0788, + "step": 42070 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014141898851845337, + "loss": 0.0792, + "step": 42080 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014138130291686556, + "loss": 0.0779, + "step": 42090 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014134361731527774, + "loss": 0.082, + "step": 42100 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014130593171368994, + "loss": 0.0783, + "step": 42110 + }, + { + "epoch": 1.06, + "learning_rate": 0.001412682461121021, + "loss": 0.0751, + "step": 42120 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014123056051051428, + "loss": 0.0807, + "step": 42130 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014119287490892646, + "loss": 0.0753, + "step": 42140 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014115518930733865, + "loss": 0.0764, + "step": 42150 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014111750370575083, + "loss": 0.0803, + "step": 42160 + }, + { + "epoch": 1.06, + "learning_rate": 0.00141079818104163, + "loss": 0.077, + "step": 42170 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014104213250257518, + "loss": 0.0771, + "step": 42180 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014100444690098737, + "loss": 0.0804, + "step": 42190 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014096676129939955, + "loss": 0.0763, + "step": 42200 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014092907569781172, + "loss": 0.0799, + "step": 42210 + }, + { + "epoch": 1.06, + "learning_rate": 0.001408913900962239, + "loss": 0.0751, + "step": 42220 + }, + { + "epoch": 1.06, + "learning_rate": 0.001408537044946361, + "loss": 0.0793, + "step": 42230 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014081601889304827, + "loss": 0.0746, + "step": 42240 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014077833329146044, + "loss": 0.0778, + "step": 42250 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014074064768987262, + "loss": 0.0791, + "step": 42260 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014070296208828481, + "loss": 0.0787, + "step": 42270 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014066527648669699, + "loss": 0.0759, + "step": 42280 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014062759088510916, + "loss": 0.0782, + "step": 42290 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014058990528352134, + "loss": 0.0803, + "step": 42300 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014055221968193351, + "loss": 0.0776, + "step": 42310 + }, + { + "epoch": 1.06, + "learning_rate": 0.001405145340803457, + "loss": 0.0793, + "step": 42320 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014047684847875788, + "loss": 0.0783, + "step": 42330 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014043916287717008, + "loss": 0.076, + "step": 42340 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014040147727558223, + "loss": 0.0795, + "step": 42350 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014036379167399443, + "loss": 0.0742, + "step": 42360 + }, + { + "epoch": 1.06, + "learning_rate": 0.001403261060724066, + "loss": 0.0784, + "step": 42370 + }, + { + "epoch": 1.06, + "learning_rate": 0.001402884204708188, + "loss": 0.0767, + "step": 42380 + }, + { + "epoch": 1.06, + "learning_rate": 0.0014025073486923097, + "loss": 0.0789, + "step": 42390 + }, + { + "epoch": 1.07, + "learning_rate": 0.0014021304926764315, + "loss": 0.0753, + "step": 42400 + }, + { + "epoch": 1.07, + "learning_rate": 0.0014017536366605532, + "loss": 0.0762, + "step": 42410 + }, + { + "epoch": 1.07, + "learning_rate": 0.0014013767806446752, + "loss": 0.0782, + "step": 42420 + }, + { + "epoch": 1.07, + "learning_rate": 0.001400999924628797, + "loss": 0.0794, + "step": 42430 + }, + { + "epoch": 1.07, + "learning_rate": 0.0014006230686129187, + "loss": 0.0763, + "step": 42440 + }, + { + "epoch": 1.07, + "learning_rate": 0.0014002462125970404, + "loss": 0.0812, + "step": 42450 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013998693565811624, + "loss": 0.0786, + "step": 42460 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013994925005652841, + "loss": 0.0789, + "step": 42470 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013991156445494059, + "loss": 0.0781, + "step": 42480 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013987387885335276, + "loss": 0.0788, + "step": 42490 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013983619325176493, + "loss": 0.0754, + "step": 42500 + }, + { + "epoch": 1.07, + "eval_cer": 0.6660415484644662, + "eval_loss": 0.06667615473270416, + "eval_runtime": 90.6952, + "eval_samples_per_second": 110.248, + "eval_steps_per_second": 6.891, + "step": 42500 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013979850765017713, + "loss": 0.0779, + "step": 42510 + }, + { + "epoch": 1.07, + "learning_rate": 0.001397608220485893, + "loss": 0.079, + "step": 42520 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013972313644700148, + "loss": 0.0788, + "step": 42530 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013968545084541365, + "loss": 0.0782, + "step": 42540 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013964776524382585, + "loss": 0.0774, + "step": 42550 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013961007964223802, + "loss": 0.0759, + "step": 42560 + }, + { + "epoch": 1.07, + "learning_rate": 0.001395723940406502, + "loss": 0.076, + "step": 42570 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013953470843906237, + "loss": 0.082, + "step": 42580 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013949702283747457, + "loss": 0.0797, + "step": 42590 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013945933723588674, + "loss": 0.08, + "step": 42600 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013942165163429892, + "loss": 0.0797, + "step": 42610 + }, + { + "epoch": 1.07, + "learning_rate": 0.001393839660327111, + "loss": 0.0774, + "step": 42620 + }, + { + "epoch": 1.07, + "learning_rate": 0.001393462804311233, + "loss": 0.0782, + "step": 42630 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013930859482953546, + "loss": 0.0805, + "step": 42640 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013927090922794766, + "loss": 0.0779, + "step": 42650 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013923322362635981, + "loss": 0.0794, + "step": 42660 + }, + { + "epoch": 1.07, + "learning_rate": 0.00139195538024772, + "loss": 0.0783, + "step": 42670 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013915785242318418, + "loss": 0.0768, + "step": 42680 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013912016682159638, + "loss": 0.0788, + "step": 42690 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013908248122000855, + "loss": 0.0743, + "step": 42700 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013904479561842073, + "loss": 0.0781, + "step": 42710 + }, + { + "epoch": 1.07, + "learning_rate": 0.001390071100168329, + "loss": 0.078, + "step": 42720 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013896942441524508, + "loss": 0.0773, + "step": 42730 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013893173881365727, + "loss": 0.0761, + "step": 42740 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013889405321206945, + "loss": 0.0763, + "step": 42750 + }, + { + "epoch": 1.07, + "learning_rate": 0.0013885636761048162, + "loss": 0.0746, + "step": 42760 + }, + { + "epoch": 1.07, + "learning_rate": 0.001388186820088938, + "loss": 0.0826, + "step": 42770 + }, + { + "epoch": 1.07, + "learning_rate": 0.00138780996407306, + "loss": 0.0804, + "step": 42780 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013874331080571817, + "loss": 0.0782, + "step": 42790 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013870562520413034, + "loss": 0.0796, + "step": 42800 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013866793960254252, + "loss": 0.0778, + "step": 42810 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013863025400095471, + "loss": 0.0791, + "step": 42820 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013859256839936689, + "loss": 0.0778, + "step": 42830 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013855488279777906, + "loss": 0.0774, + "step": 42840 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013851719719619124, + "loss": 0.0764, + "step": 42850 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013847951159460343, + "loss": 0.0795, + "step": 42860 + }, + { + "epoch": 1.08, + "learning_rate": 0.001384418259930156, + "loss": 0.0789, + "step": 42870 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013840414039142778, + "loss": 0.0786, + "step": 42880 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013836645478983996, + "loss": 0.0779, + "step": 42890 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013832876918825215, + "loss": 0.0746, + "step": 42900 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013829108358666433, + "loss": 0.0786, + "step": 42910 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013825339798507652, + "loss": 0.0782, + "step": 42920 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013821571238348867, + "loss": 0.0765, + "step": 42930 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013817802678190087, + "loss": 0.0765, + "step": 42940 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013814034118031305, + "loss": 0.0782, + "step": 42950 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013810265557872522, + "loss": 0.0778, + "step": 42960 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013806496997713742, + "loss": 0.0795, + "step": 42970 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013802728437554957, + "loss": 0.0776, + "step": 42980 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013798959877396177, + "loss": 0.0786, + "step": 42990 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013795191317237394, + "loss": 0.0762, + "step": 43000 + }, + { + "epoch": 1.08, + "eval_cer": 0.6656464583613049, + "eval_loss": 0.06690527498722076, + "eval_runtime": 90.8509, + "eval_samples_per_second": 110.059, + "eval_steps_per_second": 6.879, + "step": 43000 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013791422757078614, + "loss": 0.0775, + "step": 43010 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013787654196919829, + "loss": 0.0783, + "step": 43020 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013783885636761048, + "loss": 0.083, + "step": 43030 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013780117076602266, + "loss": 0.0778, + "step": 43040 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013776348516443486, + "loss": 0.0799, + "step": 43050 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013772579956284703, + "loss": 0.0757, + "step": 43060 + }, + { + "epoch": 1.08, + "learning_rate": 0.001376881139612592, + "loss": 0.0781, + "step": 43070 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013765042835967138, + "loss": 0.0769, + "step": 43080 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013761274275808357, + "loss": 0.0786, + "step": 43090 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013757505715649575, + "loss": 0.0808, + "step": 43100 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013753737155490792, + "loss": 0.0775, + "step": 43110 + }, + { + "epoch": 1.08, + "learning_rate": 0.001374996859533201, + "loss": 0.0813, + "step": 43120 + }, + { + "epoch": 1.08, + "learning_rate": 0.001374620003517323, + "loss": 0.0799, + "step": 43130 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013742431475014447, + "loss": 0.0771, + "step": 43140 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013738662914855664, + "loss": 0.0771, + "step": 43150 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013734894354696882, + "loss": 0.079, + "step": 43160 + }, + { + "epoch": 1.08, + "learning_rate": 0.00137311257945381, + "loss": 0.0782, + "step": 43170 + }, + { + "epoch": 1.08, + "learning_rate": 0.0013727357234379319, + "loss": 0.0782, + "step": 43180 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013723588674220536, + "loss": 0.0799, + "step": 43190 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013719820114061754, + "loss": 0.0763, + "step": 43200 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013716051553902971, + "loss": 0.0777, + "step": 43210 + }, + { + "epoch": 1.09, + "learning_rate": 0.001371228299374419, + "loss": 0.0809, + "step": 43220 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013708514433585408, + "loss": 0.0774, + "step": 43230 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013704745873426626, + "loss": 0.077, + "step": 43240 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013700977313267843, + "loss": 0.0765, + "step": 43250 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013697208753109063, + "loss": 0.0786, + "step": 43260 + }, + { + "epoch": 1.09, + "learning_rate": 0.001369344019295028, + "loss": 0.0796, + "step": 43270 + }, + { + "epoch": 1.09, + "learning_rate": 0.00136896716327915, + "loss": 0.0771, + "step": 43280 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013685903072632715, + "loss": 0.076, + "step": 43290 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013682134512473935, + "loss": 0.0771, + "step": 43300 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013678365952315152, + "loss": 0.0796, + "step": 43310 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013674597392156372, + "loss": 0.0757, + "step": 43320 + }, + { + "epoch": 1.09, + "learning_rate": 0.001367082883199759, + "loss": 0.0752, + "step": 43330 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013667060271838807, + "loss": 0.0763, + "step": 43340 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013663291711680024, + "loss": 0.0771, + "step": 43350 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013659523151521244, + "loss": 0.0762, + "step": 43360 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013655754591362461, + "loss": 0.0792, + "step": 43370 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013651986031203679, + "loss": 0.0789, + "step": 43380 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013648217471044896, + "loss": 0.0783, + "step": 43390 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013644448910886113, + "loss": 0.0777, + "step": 43400 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013640680350727333, + "loss": 0.0761, + "step": 43410 + }, + { + "epoch": 1.09, + "learning_rate": 0.001363691179056855, + "loss": 0.0774, + "step": 43420 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013633143230409768, + "loss": 0.0757, + "step": 43430 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013629374670250985, + "loss": 0.0771, + "step": 43440 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013625606110092205, + "loss": 0.0791, + "step": 43450 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013621837549933423, + "loss": 0.0754, + "step": 43460 + }, + { + "epoch": 1.09, + "learning_rate": 0.001361806898977464, + "loss": 0.0782, + "step": 43470 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013614300429615857, + "loss": 0.0767, + "step": 43480 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013610531869457077, + "loss": 0.079, + "step": 43490 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013606763309298294, + "loss": 0.075, + "step": 43500 + }, + { + "epoch": 1.09, + "eval_cer": 0.6659833195942073, + "eval_loss": 0.06602948158979416, + "eval_runtime": 90.5861, + "eval_samples_per_second": 110.381, + "eval_steps_per_second": 6.9, + "step": 43500 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013602994749139512, + "loss": 0.0779, + "step": 43510 + }, + { + "epoch": 1.09, + "learning_rate": 0.001359922618898073, + "loss": 0.0743, + "step": 43520 + }, + { + "epoch": 1.09, + "learning_rate": 0.001359545762882195, + "loss": 0.0745, + "step": 43530 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013591689068663166, + "loss": 0.0734, + "step": 43540 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013587920508504386, + "loss": 0.0802, + "step": 43550 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013584151948345601, + "loss": 0.0774, + "step": 43560 + }, + { + "epoch": 1.09, + "learning_rate": 0.001358038338818682, + "loss": 0.0764, + "step": 43570 + }, + { + "epoch": 1.09, + "learning_rate": 0.0013576614828028038, + "loss": 0.0796, + "step": 43580 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013572846267869258, + "loss": 0.0774, + "step": 43590 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013569077707710473, + "loss": 0.0725, + "step": 43600 + }, + { + "epoch": 1.1, + "learning_rate": 0.001356530914755169, + "loss": 0.0786, + "step": 43610 + }, + { + "epoch": 1.1, + "learning_rate": 0.001356154058739291, + "loss": 0.0805, + "step": 43620 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013557772027234128, + "loss": 0.0748, + "step": 43630 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013554003467075347, + "loss": 0.077, + "step": 43640 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013550234906916563, + "loss": 0.0801, + "step": 43650 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013546466346757782, + "loss": 0.0799, + "step": 43660 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013542697786599, + "loss": 0.0758, + "step": 43670 + }, + { + "epoch": 1.1, + "learning_rate": 0.001353892922644022, + "loss": 0.0762, + "step": 43680 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013535160666281437, + "loss": 0.0767, + "step": 43690 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013531392106122654, + "loss": 0.0767, + "step": 43700 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013527623545963872, + "loss": 0.0749, + "step": 43710 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013523854985805091, + "loss": 0.0775, + "step": 43720 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013520086425646309, + "loss": 0.0767, + "step": 43730 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013516317865487526, + "loss": 0.0774, + "step": 43740 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013512549305328744, + "loss": 0.0766, + "step": 43750 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013508780745169963, + "loss": 0.0779, + "step": 43760 + }, + { + "epoch": 1.1, + "learning_rate": 0.001350501218501118, + "loss": 0.0802, + "step": 43770 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013501243624852398, + "loss": 0.0799, + "step": 43780 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013497475064693616, + "loss": 0.0845, + "step": 43790 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013493706504534835, + "loss": 0.0807, + "step": 43800 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013489937944376053, + "loss": 0.0816, + "step": 43810 + }, + { + "epoch": 1.1, + "learning_rate": 0.001348616938421727, + "loss": 0.079, + "step": 43820 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013482400824058488, + "loss": 0.0768, + "step": 43830 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013478632263899705, + "loss": 0.0753, + "step": 43840 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013474863703740925, + "loss": 0.0759, + "step": 43850 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013471095143582142, + "loss": 0.0804, + "step": 43860 + }, + { + "epoch": 1.1, + "learning_rate": 0.001346732658342336, + "loss": 0.082, + "step": 43870 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013463558023264577, + "loss": 0.0809, + "step": 43880 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013459789463105797, + "loss": 0.0835, + "step": 43890 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013456020902947014, + "loss": 0.0748, + "step": 43900 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013452252342788234, + "loss": 0.0787, + "step": 43910 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013448483782629449, + "loss": 0.0818, + "step": 43920 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013444715222470669, + "loss": 0.077, + "step": 43930 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013440946662311886, + "loss": 0.0752, + "step": 43940 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013437178102153106, + "loss": 0.074, + "step": 43950 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013433409541994323, + "loss": 0.0759, + "step": 43960 + }, + { + "epoch": 1.1, + "learning_rate": 0.001342964098183554, + "loss": 0.078, + "step": 43970 + }, + { + "epoch": 1.1, + "learning_rate": 0.0013425872421676758, + "loss": 0.0755, + "step": 43980 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013422103861517978, + "loss": 0.0779, + "step": 43990 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013418335301359195, + "loss": 0.0816, + "step": 44000 + }, + { + "epoch": 1.11, + "eval_cer": 0.6656503082039665, + "eval_loss": 0.06611749529838562, + "eval_runtime": 90.5698, + "eval_samples_per_second": 110.401, + "eval_steps_per_second": 6.901, + "step": 44000 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013414566741200412, + "loss": 0.0785, + "step": 44010 + }, + { + "epoch": 1.11, + "learning_rate": 0.001341079818104163, + "loss": 0.0781, + "step": 44020 + }, + { + "epoch": 1.11, + "learning_rate": 0.001340702962088285, + "loss": 0.0765, + "step": 44030 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013403261060724067, + "loss": 0.0816, + "step": 44040 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013399492500565284, + "loss": 0.0768, + "step": 44050 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013395723940406502, + "loss": 0.0786, + "step": 44060 + }, + { + "epoch": 1.11, + "learning_rate": 0.001339195538024772, + "loss": 0.0775, + "step": 44070 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013388186820088939, + "loss": 0.0799, + "step": 44080 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013384418259930156, + "loss": 0.0773, + "step": 44090 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013380649699771374, + "loss": 0.076, + "step": 44100 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013376881139612591, + "loss": 0.0775, + "step": 44110 + }, + { + "epoch": 1.11, + "learning_rate": 0.001337311257945381, + "loss": 0.079, + "step": 44120 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013369344019295028, + "loss": 0.0793, + "step": 44130 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013365575459136246, + "loss": 0.0766, + "step": 44140 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013361806898977463, + "loss": 0.078, + "step": 44150 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013358038338818683, + "loss": 0.0766, + "step": 44160 + }, + { + "epoch": 1.11, + "learning_rate": 0.00133542697786599, + "loss": 0.0778, + "step": 44170 + }, + { + "epoch": 1.11, + "learning_rate": 0.001335050121850112, + "loss": 0.0754, + "step": 44180 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013346732658342335, + "loss": 0.0758, + "step": 44190 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013342964098183555, + "loss": 0.0773, + "step": 44200 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013339195538024772, + "loss": 0.0765, + "step": 44210 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013335426977865992, + "loss": 0.0818, + "step": 44220 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013331658417707207, + "loss": 0.0779, + "step": 44230 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013327889857548427, + "loss": 0.0762, + "step": 44240 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013324121297389644, + "loss": 0.0821, + "step": 44250 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013320352737230864, + "loss": 0.0795, + "step": 44260 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013316584177072081, + "loss": 0.0778, + "step": 44270 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013312815616913296, + "loss": 0.0735, + "step": 44280 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013309047056754516, + "loss": 0.0784, + "step": 44290 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013305278496595734, + "loss": 0.0766, + "step": 44300 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013301509936436953, + "loss": 0.075, + "step": 44310 + }, + { + "epoch": 1.11, + "learning_rate": 0.001329774137627817, + "loss": 0.0754, + "step": 44320 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013293972816119388, + "loss": 0.0773, + "step": 44330 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013290204255960605, + "loss": 0.0754, + "step": 44340 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013286435695801825, + "loss": 0.0759, + "step": 44350 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013282667135643043, + "loss": 0.077, + "step": 44360 + }, + { + "epoch": 1.11, + "learning_rate": 0.001327889857548426, + "loss": 0.0807, + "step": 44370 + }, + { + "epoch": 1.11, + "learning_rate": 0.0013275130015325477, + "loss": 0.0761, + "step": 44380 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013271361455166697, + "loss": 0.0758, + "step": 44390 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013267592895007914, + "loss": 0.0725, + "step": 44400 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013263824334849132, + "loss": 0.0731, + "step": 44410 + }, + { + "epoch": 1.12, + "learning_rate": 0.001326005577469035, + "loss": 0.0772, + "step": 44420 + }, + { + "epoch": 1.12, + "learning_rate": 0.001325628721453157, + "loss": 0.0792, + "step": 44430 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013252518654372786, + "loss": 0.0747, + "step": 44440 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013248750094214004, + "loss": 0.0769, + "step": 44450 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013244981534055221, + "loss": 0.0736, + "step": 44460 + }, + { + "epoch": 1.12, + "learning_rate": 0.001324121297389644, + "loss": 0.074, + "step": 44470 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013237444413737658, + "loss": 0.0762, + "step": 44480 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013233675853578878, + "loss": 0.0791, + "step": 44490 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013229907293420093, + "loss": 0.0758, + "step": 44500 + }, + { + "epoch": 1.12, + "eval_cer": 0.6656565641982919, + "eval_loss": 0.06587806344032288, + "eval_runtime": 90.6347, + "eval_samples_per_second": 110.322, + "eval_steps_per_second": 6.896, + "step": 44500 + }, + { + "epoch": 1.12, + "learning_rate": 0.001322613873326131, + "loss": 0.0772, + "step": 44510 + }, + { + "epoch": 1.12, + "learning_rate": 0.001322237017310253, + "loss": 0.08, + "step": 44520 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013218601612943748, + "loss": 0.075, + "step": 44530 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013214833052784967, + "loss": 0.0768, + "step": 44540 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013211064492626183, + "loss": 0.0809, + "step": 44550 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013207295932467402, + "loss": 0.0782, + "step": 44560 + }, + { + "epoch": 1.12, + "learning_rate": 0.001320352737230862, + "loss": 0.0751, + "step": 44570 + }, + { + "epoch": 1.12, + "learning_rate": 0.001319975881214984, + "loss": 0.0754, + "step": 44580 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013195990251991057, + "loss": 0.0765, + "step": 44590 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013192221691832274, + "loss": 0.0775, + "step": 44600 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013188453131673492, + "loss": 0.0762, + "step": 44610 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013184684571514711, + "loss": 0.0778, + "step": 44620 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013180916011355929, + "loss": 0.0807, + "step": 44630 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013177147451197146, + "loss": 0.0805, + "step": 44640 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013173378891038364, + "loss": 0.0761, + "step": 44650 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013169610330879583, + "loss": 0.0762, + "step": 44660 + }, + { + "epoch": 1.12, + "learning_rate": 0.00131658417707208, + "loss": 0.0786, + "step": 44670 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013162073210562018, + "loss": 0.0774, + "step": 44680 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013158304650403236, + "loss": 0.0764, + "step": 44690 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013154536090244455, + "loss": 0.0752, + "step": 44700 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013150767530085673, + "loss": 0.0791, + "step": 44710 + }, + { + "epoch": 1.12, + "learning_rate": 0.001314699896992689, + "loss": 0.077, + "step": 44720 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013143230409768108, + "loss": 0.0777, + "step": 44730 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013139461849609325, + "loss": 0.0777, + "step": 44740 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013135693289450545, + "loss": 0.0753, + "step": 44750 + }, + { + "epoch": 1.12, + "learning_rate": 0.0013131924729291762, + "loss": 0.0751, + "step": 44760 + }, + { + "epoch": 1.12, + "learning_rate": 0.001312815616913298, + "loss": 0.078, + "step": 44770 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013124387608974197, + "loss": 0.0778, + "step": 44780 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013120619048815417, + "loss": 0.0753, + "step": 44790 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013116850488656634, + "loss": 0.0761, + "step": 44800 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013113081928497851, + "loss": 0.0741, + "step": 44810 + }, + { + "epoch": 1.13, + "learning_rate": 0.001310931336833907, + "loss": 0.0784, + "step": 44820 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013105544808180289, + "loss": 0.0736, + "step": 44830 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013101776248021506, + "loss": 0.0766, + "step": 44840 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013098007687862726, + "loss": 0.0757, + "step": 44850 + }, + { + "epoch": 1.13, + "learning_rate": 0.001309423912770394, + "loss": 0.0776, + "step": 44860 + }, + { + "epoch": 1.13, + "learning_rate": 0.001309047056754516, + "loss": 0.078, + "step": 44870 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013086702007386378, + "loss": 0.0772, + "step": 44880 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013082933447227598, + "loss": 0.0765, + "step": 44890 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013079164887068815, + "loss": 0.0778, + "step": 44900 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013075396326910032, + "loss": 0.0754, + "step": 44910 + }, + { + "epoch": 1.13, + "learning_rate": 0.001307162776675125, + "loss": 0.0739, + "step": 44920 + }, + { + "epoch": 1.13, + "learning_rate": 0.001306785920659247, + "loss": 0.0745, + "step": 44930 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013064090646433687, + "loss": 0.0804, + "step": 44940 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013060322086274904, + "loss": 0.0756, + "step": 44950 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013056553526116122, + "loss": 0.0743, + "step": 44960 + }, + { + "epoch": 1.13, + "learning_rate": 0.001305278496595734, + "loss": 0.0764, + "step": 44970 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013049016405798559, + "loss": 0.0746, + "step": 44980 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013045247845639776, + "loss": 0.073, + "step": 44990 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013041479285480994, + "loss": 0.0767, + "step": 45000 + }, + { + "epoch": 1.13, + "eval_cer": 0.6657903462307875, + "eval_loss": 0.06532227247953415, + "eval_runtime": 90.6615, + "eval_samples_per_second": 110.289, + "eval_steps_per_second": 6.894, + "step": 45000 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013037710725322211, + "loss": 0.0783, + "step": 45010 + }, + { + "epoch": 1.13, + "learning_rate": 0.001303394216516343, + "loss": 0.075, + "step": 45020 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013030173605004648, + "loss": 0.0787, + "step": 45030 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013026405044845866, + "loss": 0.078, + "step": 45040 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013022636484687083, + "loss": 0.0798, + "step": 45050 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013018867924528303, + "loss": 0.0757, + "step": 45060 + }, + { + "epoch": 1.13, + "learning_rate": 0.001301509936436952, + "loss": 0.0786, + "step": 45070 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013011330804210738, + "loss": 0.0777, + "step": 45080 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013007562244051955, + "loss": 0.0785, + "step": 45090 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013003793683893175, + "loss": 0.0769, + "step": 45100 + }, + { + "epoch": 1.13, + "learning_rate": 0.0013000025123734392, + "loss": 0.0773, + "step": 45110 + }, + { + "epoch": 1.13, + "learning_rate": 0.0012996256563575612, + "loss": 0.0759, + "step": 45120 + }, + { + "epoch": 1.13, + "learning_rate": 0.0012992488003416827, + "loss": 0.0736, + "step": 45130 + }, + { + "epoch": 1.13, + "learning_rate": 0.0012988719443258047, + "loss": 0.0748, + "step": 45140 + }, + { + "epoch": 1.13, + "learning_rate": 0.0012984950883099264, + "loss": 0.0784, + "step": 45150 + }, + { + "epoch": 1.13, + "learning_rate": 0.0012981182322940484, + "loss": 0.0771, + "step": 45160 + }, + { + "epoch": 1.13, + "learning_rate": 0.0012977413762781701, + "loss": 0.0777, + "step": 45170 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012973645202622917, + "loss": 0.0752, + "step": 45180 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012969876642464136, + "loss": 0.0799, + "step": 45190 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012966108082305354, + "loss": 0.0744, + "step": 45200 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012962339522146573, + "loss": 0.0783, + "step": 45210 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012958570961987788, + "loss": 0.0738, + "step": 45220 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012954802401829008, + "loss": 0.0774, + "step": 45230 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012951033841670226, + "loss": 0.0768, + "step": 45240 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012947265281511445, + "loss": 0.0775, + "step": 45250 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012943496721352663, + "loss": 0.0775, + "step": 45260 + }, + { + "epoch": 1.14, + "learning_rate": 0.001293972816119388, + "loss": 0.0772, + "step": 45270 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012935959601035097, + "loss": 0.0772, + "step": 45280 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012932191040876317, + "loss": 0.0748, + "step": 45290 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012928422480717535, + "loss": 0.0769, + "step": 45300 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012924653920558752, + "loss": 0.0765, + "step": 45310 + }, + { + "epoch": 1.14, + "learning_rate": 0.001292088536039997, + "loss": 0.0774, + "step": 45320 + }, + { + "epoch": 1.14, + "learning_rate": 0.001291711680024119, + "loss": 0.0758, + "step": 45330 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012913348240082406, + "loss": 0.0754, + "step": 45340 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012909579679923624, + "loss": 0.0751, + "step": 45350 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012905811119764841, + "loss": 0.0809, + "step": 45360 + }, + { + "epoch": 1.14, + "learning_rate": 0.001290204255960606, + "loss": 0.0726, + "step": 45370 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012898273999447278, + "loss": 0.0749, + "step": 45380 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012894505439288496, + "loss": 0.0784, + "step": 45390 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012890736879129713, + "loss": 0.0771, + "step": 45400 + }, + { + "epoch": 1.14, + "learning_rate": 0.001288696831897093, + "loss": 0.0773, + "step": 45410 + }, + { + "epoch": 1.14, + "learning_rate": 0.001288319975881215, + "loss": 0.0773, + "step": 45420 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012879431198653368, + "loss": 0.0764, + "step": 45430 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012875662638494585, + "loss": 0.0747, + "step": 45440 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012871894078335803, + "loss": 0.0773, + "step": 45450 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012868125518177022, + "loss": 0.0784, + "step": 45460 + }, + { + "epoch": 1.14, + "learning_rate": 0.001286435695801824, + "loss": 0.0732, + "step": 45470 + }, + { + "epoch": 1.14, + "learning_rate": 0.001286058839785946, + "loss": 0.0737, + "step": 45480 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012856819837700675, + "loss": 0.0778, + "step": 45490 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012853051277541894, + "loss": 0.076, + "step": 45500 + }, + { + "epoch": 1.14, + "eval_cer": 0.6656166220806763, + "eval_loss": 0.06491339206695557, + "eval_runtime": 90.6455, + "eval_samples_per_second": 110.309, + "eval_steps_per_second": 6.895, + "step": 45500 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012849282717383112, + "loss": 0.0753, + "step": 45510 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012845514157224331, + "loss": 0.0766, + "step": 45520 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012841745597065549, + "loss": 0.0741, + "step": 45530 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012837977036906766, + "loss": 0.077, + "step": 45540 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012834208476747984, + "loss": 0.0744, + "step": 45550 + }, + { + "epoch": 1.14, + "learning_rate": 0.0012830439916589203, + "loss": 0.079, + "step": 45560 + }, + { + "epoch": 1.14, + "learning_rate": 0.001282667135643042, + "loss": 0.0796, + "step": 45570 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012822902796271638, + "loss": 0.0769, + "step": 45580 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012819134236112856, + "loss": 0.0753, + "step": 45590 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012815365675954075, + "loss": 0.0754, + "step": 45600 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012811597115795293, + "loss": 0.0769, + "step": 45610 + }, + { + "epoch": 1.15, + "learning_rate": 0.001280782855563651, + "loss": 0.0733, + "step": 45620 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012804059995477728, + "loss": 0.0752, + "step": 45630 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012800291435318945, + "loss": 0.0773, + "step": 45640 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012796522875160165, + "loss": 0.0754, + "step": 45650 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012792754315001382, + "loss": 0.08, + "step": 45660 + }, + { + "epoch": 1.15, + "learning_rate": 0.00127889857548426, + "loss": 0.0804, + "step": 45670 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012785217194683817, + "loss": 0.0743, + "step": 45680 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012781448634525037, + "loss": 0.0785, + "step": 45690 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012777680074366254, + "loss": 0.0746, + "step": 45700 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012773911514207472, + "loss": 0.0781, + "step": 45710 + }, + { + "epoch": 1.15, + "learning_rate": 0.001277014295404869, + "loss": 0.0751, + "step": 45720 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012766374393889909, + "loss": 0.0732, + "step": 45730 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012762605833731126, + "loss": 0.078, + "step": 45740 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012758837273572346, + "loss": 0.0755, + "step": 45750 + }, + { + "epoch": 1.15, + "learning_rate": 0.001275506871341356, + "loss": 0.0738, + "step": 45760 + }, + { + "epoch": 1.15, + "learning_rate": 0.001275130015325478, + "loss": 0.0758, + "step": 45770 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012747531593095998, + "loss": 0.0788, + "step": 45780 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012743763032937218, + "loss": 0.0747, + "step": 45790 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012739994472778433, + "loss": 0.0738, + "step": 45800 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012736225912619652, + "loss": 0.0766, + "step": 45810 + }, + { + "epoch": 1.15, + "learning_rate": 0.001273245735246087, + "loss": 0.0775, + "step": 45820 + }, + { + "epoch": 1.15, + "learning_rate": 0.001272868879230209, + "loss": 0.0764, + "step": 45830 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012724920232143307, + "loss": 0.0763, + "step": 45840 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012721151671984522, + "loss": 0.0764, + "step": 45850 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012717383111825742, + "loss": 0.0783, + "step": 45860 + }, + { + "epoch": 1.15, + "learning_rate": 0.001271361455166696, + "loss": 0.0761, + "step": 45870 + }, + { + "epoch": 1.15, + "learning_rate": 0.001270984599150818, + "loss": 0.0754, + "step": 45880 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012706077431349396, + "loss": 0.0747, + "step": 45890 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012702308871190614, + "loss": 0.0734, + "step": 45900 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012698540311031831, + "loss": 0.0731, + "step": 45910 + }, + { + "epoch": 1.15, + "learning_rate": 0.001269477175087305, + "loss": 0.0764, + "step": 45920 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012691003190714268, + "loss": 0.0768, + "step": 45930 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012687234630555486, + "loss": 0.0753, + "step": 45940 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012683466070396703, + "loss": 0.077, + "step": 45950 + }, + { + "epoch": 1.15, + "learning_rate": 0.0012679697510237923, + "loss": 0.0747, + "step": 45960 + }, + { + "epoch": 1.15, + "learning_rate": 0.001267592895007914, + "loss": 0.0733, + "step": 45970 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012672160389920358, + "loss": 0.0791, + "step": 45980 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012668391829761575, + "loss": 0.0772, + "step": 45990 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012664623269602795, + "loss": 0.0727, + "step": 46000 + }, + { + "epoch": 1.16, + "eval_cer": 0.6655747550417299, + "eval_loss": 0.06513096392154694, + "eval_runtime": 90.5203, + "eval_samples_per_second": 110.461, + "eval_steps_per_second": 6.905, + "step": 46000 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012660854709444012, + "loss": 0.0725, + "step": 46010 + }, + { + "epoch": 1.16, + "learning_rate": 0.001265708614928523, + "loss": 0.0729, + "step": 46020 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012653317589126447, + "loss": 0.0771, + "step": 46030 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012649549028967667, + "loss": 0.0748, + "step": 46040 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012645780468808884, + "loss": 0.0758, + "step": 46050 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012642011908650102, + "loss": 0.0764, + "step": 46060 + }, + { + "epoch": 1.16, + "learning_rate": 0.001263824334849132, + "loss": 0.0768, + "step": 46070 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012634474788332537, + "loss": 0.074, + "step": 46080 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012630706228173756, + "loss": 0.0755, + "step": 46090 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012626937668014974, + "loss": 0.0783, + "step": 46100 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012623169107856193, + "loss": 0.0742, + "step": 46110 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012619400547697408, + "loss": 0.0756, + "step": 46120 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012615631987538628, + "loss": 0.0765, + "step": 46130 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012611863427379846, + "loss": 0.0752, + "step": 46140 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012608094867221065, + "loss": 0.077, + "step": 46150 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012604326307062283, + "loss": 0.0764, + "step": 46160 + }, + { + "epoch": 1.16, + "learning_rate": 0.00126005577469035, + "loss": 0.0756, + "step": 46170 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012596789186744718, + "loss": 0.0721, + "step": 46180 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012593020626585937, + "loss": 0.0757, + "step": 46190 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012589252066427155, + "loss": 0.0774, + "step": 46200 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012585483506268372, + "loss": 0.078, + "step": 46210 + }, + { + "epoch": 1.16, + "learning_rate": 0.001258171494610959, + "loss": 0.0778, + "step": 46220 + }, + { + "epoch": 1.16, + "learning_rate": 0.001257794638595081, + "loss": 0.0741, + "step": 46230 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012574177825792027, + "loss": 0.0783, + "step": 46240 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012570409265633244, + "loss": 0.0737, + "step": 46250 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012566640705474461, + "loss": 0.0769, + "step": 46260 + }, + { + "epoch": 1.16, + "learning_rate": 0.001256287214531568, + "loss": 0.076, + "step": 46270 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012559103585156898, + "loss": 0.0752, + "step": 46280 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012555335024998116, + "loss": 0.0792, + "step": 46290 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012551566464839333, + "loss": 0.0733, + "step": 46300 + }, + { + "epoch": 1.16, + "learning_rate": 0.001254779790468055, + "loss": 0.0786, + "step": 46310 + }, + { + "epoch": 1.16, + "learning_rate": 0.001254402934452177, + "loss": 0.0757, + "step": 46320 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012540260784362988, + "loss": 0.0768, + "step": 46330 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012536492224204205, + "loss": 0.0742, + "step": 46340 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012532723664045423, + "loss": 0.0765, + "step": 46350 + }, + { + "epoch": 1.16, + "learning_rate": 0.0012528955103886642, + "loss": 0.0782, + "step": 46360 + }, + { + "epoch": 1.16, + "learning_rate": 0.001252518654372786, + "loss": 0.0715, + "step": 46370 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012521417983569077, + "loss": 0.074, + "step": 46380 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012517649423410295, + "loss": 0.0776, + "step": 46390 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012513880863251514, + "loss": 0.0741, + "step": 46400 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012510112303092732, + "loss": 0.076, + "step": 46410 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012506343742933951, + "loss": 0.0759, + "step": 46420 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012502575182775167, + "loss": 0.0745, + "step": 46430 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012498806622616386, + "loss": 0.0732, + "step": 46440 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012495038062457604, + "loss": 0.0764, + "step": 46450 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012491269502298823, + "loss": 0.0717, + "step": 46460 + }, + { + "epoch": 1.17, + "learning_rate": 0.001248750094214004, + "loss": 0.0757, + "step": 46470 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012483732381981258, + "loss": 0.0775, + "step": 46480 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012479963821822476, + "loss": 0.0779, + "step": 46490 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012476195261663693, + "loss": 0.0768, + "step": 46500 + }, + { + "epoch": 1.17, + "eval_cer": 0.6655930417943732, + "eval_loss": 0.06406976282596588, + "eval_runtime": 90.5517, + "eval_samples_per_second": 110.423, + "eval_steps_per_second": 6.902, + "step": 46500 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012472426701504913, + "loss": 0.0776, + "step": 46510 + }, + { + "epoch": 1.17, + "learning_rate": 0.001246865814134613, + "loss": 0.0767, + "step": 46520 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012464889581187348, + "loss": 0.0754, + "step": 46530 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012461121021028565, + "loss": 0.0757, + "step": 46540 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012457352460869785, + "loss": 0.0754, + "step": 46550 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012453583900711002, + "loss": 0.0723, + "step": 46560 + }, + { + "epoch": 1.17, + "learning_rate": 0.001244981534055222, + "loss": 0.0809, + "step": 46570 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012446046780393437, + "loss": 0.0741, + "step": 46580 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012442278220234657, + "loss": 0.0764, + "step": 46590 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012438509660075874, + "loss": 0.0733, + "step": 46600 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012434741099917092, + "loss": 0.0768, + "step": 46610 + }, + { + "epoch": 1.17, + "learning_rate": 0.001243097253975831, + "loss": 0.077, + "step": 46620 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012427203979599529, + "loss": 0.0778, + "step": 46630 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012423435419440746, + "loss": 0.0734, + "step": 46640 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012419666859281964, + "loss": 0.08, + "step": 46650 + }, + { + "epoch": 1.17, + "learning_rate": 0.001241589829912318, + "loss": 0.0748, + "step": 46660 + }, + { + "epoch": 1.17, + "learning_rate": 0.00124121297389644, + "loss": 0.0786, + "step": 46670 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012408361178805618, + "loss": 0.075, + "step": 46680 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012404592618646838, + "loss": 0.0733, + "step": 46690 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012400824058488053, + "loss": 0.0762, + "step": 46700 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012397055498329273, + "loss": 0.0772, + "step": 46710 + }, + { + "epoch": 1.17, + "learning_rate": 0.001239328693817049, + "loss": 0.075, + "step": 46720 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012389518378011707, + "loss": 0.0785, + "step": 46730 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012385749817852927, + "loss": 0.0727, + "step": 46740 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012381981257694142, + "loss": 0.0744, + "step": 46750 + }, + { + "epoch": 1.17, + "learning_rate": 0.0012378212697535362, + "loss": 0.0724, + "step": 46760 + }, + { + "epoch": 1.18, + "learning_rate": 0.001237444413737658, + "loss": 0.0806, + "step": 46770 + }, + { + "epoch": 1.18, + "learning_rate": 0.00123706755772178, + "loss": 0.0719, + "step": 46780 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012366907017059014, + "loss": 0.0752, + "step": 46790 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012363138456900234, + "loss": 0.0737, + "step": 46800 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012359369896741451, + "loss": 0.0777, + "step": 46810 + }, + { + "epoch": 1.18, + "learning_rate": 0.001235560133658267, + "loss": 0.0728, + "step": 46820 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012351832776423888, + "loss": 0.0768, + "step": 46830 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012348064216265106, + "loss": 0.0739, + "step": 46840 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012344295656106323, + "loss": 0.0794, + "step": 46850 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012340527095947543, + "loss": 0.075, + "step": 46860 + }, + { + "epoch": 1.18, + "learning_rate": 0.001233675853578876, + "loss": 0.0712, + "step": 46870 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012332989975629978, + "loss": 0.072, + "step": 46880 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012329221415471195, + "loss": 0.0762, + "step": 46890 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012325452855312415, + "loss": 0.0749, + "step": 46900 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012321684295153632, + "loss": 0.0781, + "step": 46910 + }, + { + "epoch": 1.18, + "learning_rate": 0.001231791573499485, + "loss": 0.0743, + "step": 46920 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012314147174836067, + "loss": 0.0784, + "step": 46930 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012310378614677287, + "loss": 0.0747, + "step": 46940 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012306610054518504, + "loss": 0.0766, + "step": 46950 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012302841494359722, + "loss": 0.0786, + "step": 46960 + }, + { + "epoch": 1.18, + "learning_rate": 0.001229907293420094, + "loss": 0.0787, + "step": 46970 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012295304374042157, + "loss": 0.0791, + "step": 46980 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012291535813883376, + "loss": 0.0738, + "step": 46990 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012287767253724594, + "loss": 0.0722, + "step": 47000 + }, + { + "epoch": 1.18, + "eval_cer": 0.665535294154447, + "eval_loss": 0.06398055702447891, + "eval_runtime": 90.575, + "eval_samples_per_second": 110.395, + "eval_steps_per_second": 6.9, + "step": 47000 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012283998693565811, + "loss": 0.0727, + "step": 47010 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012280230133407029, + "loss": 0.0755, + "step": 47020 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012276461573248248, + "loss": 0.0754, + "step": 47030 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012272693013089466, + "loss": 0.0733, + "step": 47040 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012268924452930685, + "loss": 0.0773, + "step": 47050 + }, + { + "epoch": 1.18, + "learning_rate": 0.00122651558927719, + "loss": 0.0756, + "step": 47060 + }, + { + "epoch": 1.18, + "learning_rate": 0.001226138733261312, + "loss": 0.0774, + "step": 47070 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012257618772454338, + "loss": 0.0743, + "step": 47080 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012253850212295557, + "loss": 0.0749, + "step": 47090 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012250081652136775, + "loss": 0.0756, + "step": 47100 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012246313091977992, + "loss": 0.0776, + "step": 47110 + }, + { + "epoch": 1.18, + "learning_rate": 0.001224254453181921, + "loss": 0.076, + "step": 47120 + }, + { + "epoch": 1.18, + "learning_rate": 0.001223877597166043, + "loss": 0.0736, + "step": 47130 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012235007411501647, + "loss": 0.0775, + "step": 47140 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012231238851342864, + "loss": 0.0731, + "step": 47150 + }, + { + "epoch": 1.18, + "learning_rate": 0.0012227470291184081, + "loss": 0.0761, + "step": 47160 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012223701731025299, + "loss": 0.076, + "step": 47170 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012219933170866519, + "loss": 0.0743, + "step": 47180 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012216164610707736, + "loss": 0.0743, + "step": 47190 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012212396050548953, + "loss": 0.0728, + "step": 47200 + }, + { + "epoch": 1.19, + "learning_rate": 0.001220862749039017, + "loss": 0.0735, + "step": 47210 + }, + { + "epoch": 1.19, + "learning_rate": 0.001220485893023139, + "loss": 0.0717, + "step": 47220 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012201090370072608, + "loss": 0.0785, + "step": 47230 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012197321809913825, + "loss": 0.0783, + "step": 47240 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012193553249755043, + "loss": 0.0704, + "step": 47250 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012189784689596262, + "loss": 0.0791, + "step": 47260 + }, + { + "epoch": 1.19, + "learning_rate": 0.001218601612943748, + "loss": 0.074, + "step": 47270 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012182247569278697, + "loss": 0.0769, + "step": 47280 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012178479009119915, + "loss": 0.0742, + "step": 47290 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012174710448961134, + "loss": 0.0785, + "step": 47300 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012170941888802352, + "loss": 0.0742, + "step": 47310 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012167173328643571, + "loss": 0.0744, + "step": 47320 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012163404768484787, + "loss": 0.0743, + "step": 47330 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012159636208326006, + "loss": 0.0762, + "step": 47340 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012155867648167224, + "loss": 0.0755, + "step": 47350 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012152099088008443, + "loss": 0.0765, + "step": 47360 + }, + { + "epoch": 1.19, + "learning_rate": 0.001214833052784966, + "loss": 0.0749, + "step": 47370 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012144561967690878, + "loss": 0.0751, + "step": 47380 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012140793407532096, + "loss": 0.0754, + "step": 47390 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012137024847373313, + "loss": 0.0717, + "step": 47400 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012133256287214533, + "loss": 0.0781, + "step": 47410 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012129487727055748, + "loss": 0.077, + "step": 47420 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012125719166896968, + "loss": 0.0773, + "step": 47430 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012121950606738185, + "loss": 0.0764, + "step": 47440 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012118182046579405, + "loss": 0.0756, + "step": 47450 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012114413486420622, + "loss": 0.0723, + "step": 47460 + }, + { + "epoch": 1.19, + "learning_rate": 0.001211064492626184, + "loss": 0.0778, + "step": 47470 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012106876366103057, + "loss": 0.0765, + "step": 47480 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012103107805944277, + "loss": 0.0763, + "step": 47490 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012099339245785494, + "loss": 0.0763, + "step": 47500 + }, + { + "epoch": 1.19, + "eval_cer": 0.6654433791608979, + "eval_loss": 0.06456325203180313, + "eval_runtime": 90.7603, + "eval_samples_per_second": 110.169, + "eval_steps_per_second": 6.886, + "step": 47500 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012095570685626712, + "loss": 0.0749, + "step": 47510 + }, + { + "epoch": 1.19, + "learning_rate": 0.001209180212546793, + "loss": 0.0746, + "step": 47520 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012088033565309149, + "loss": 0.0762, + "step": 47530 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012084265005150366, + "loss": 0.0732, + "step": 47540 + }, + { + "epoch": 1.19, + "learning_rate": 0.0012080496444991584, + "loss": 0.079, + "step": 47550 + }, + { + "epoch": 1.19, + "learning_rate": 0.00120767278848328, + "loss": 0.0731, + "step": 47560 + }, + { + "epoch": 1.2, + "learning_rate": 0.001207295932467402, + "loss": 0.0733, + "step": 47570 + }, + { + "epoch": 1.2, + "learning_rate": 0.0012069190764515238, + "loss": 0.0763, + "step": 47580 + }, + { + "epoch": 1.2, + "learning_rate": 0.0012065422204356455, + "loss": 0.0736, + "step": 47590 + }, + { + "epoch": 1.2, + "learning_rate": 0.0012061653644197673, + "loss": 0.0765, + "step": 47600 + }, + { + "epoch": 1.2, + "learning_rate": 0.0012057885084038893, + "loss": 0.0718, + "step": 47610 + }, + { + "epoch": 1.2, + "learning_rate": 0.001205411652388011, + "loss": 0.0769, + "step": 47620 + }, + { + "epoch": 1.2, + "learning_rate": 0.0012050347963721327, + "loss": 0.0729, + "step": 47630 + }, + { + "epoch": 1.2, + "learning_rate": 0.0012046579403562545, + "loss": 0.0775, + "step": 47640 + }, + { + "epoch": 1.2, + "learning_rate": 0.0012042810843403762, + "loss": 0.0743, + "step": 47650 + }, + { + "epoch": 1.2, + "learning_rate": 0.0012039042283244982, + "loss": 0.0771, + "step": 47660 + }, + { + "epoch": 1.2, + "learning_rate": 0.00120352737230862, + "loss": 0.0741, + "step": 47670 + }, + { + "epoch": 1.2, + "learning_rate": 0.001203150516292742, + "loss": 0.0712, + "step": 47680 + }, + { + "epoch": 1.2, + "learning_rate": 0.0012027736602768634, + "loss": 0.0784, + "step": 47690 + }, + { + "epoch": 1.2, + "learning_rate": 0.0012023968042609854, + "loss": 0.0789, + "step": 47700 + }, + { + "epoch": 1.2, + "learning_rate": 0.0012020199482451071, + "loss": 0.0745, + "step": 47710 + }, + { + "epoch": 1.2, + "learning_rate": 0.001201643092229229, + "loss": 0.0761, + "step": 47720 + }, + { + "epoch": 1.2, + "learning_rate": 0.0012012662362133508, + "loss": 0.0758, + "step": 47730 + }, + { + "epoch": 1.2, + "learning_rate": 0.0012008893801974726, + "loss": 0.0718, + "step": 47740 + }, + { + "epoch": 1.2, + "learning_rate": 0.0012005125241815943, + "loss": 0.0712, + "step": 47750 + }, + { + "epoch": 1.2, + "learning_rate": 0.0012001356681657163, + "loss": 0.0782, + "step": 47760 + }, + { + "epoch": 1.2, + "learning_rate": 0.001199758812149838, + "loss": 0.0786, + "step": 47770 + }, + { + "epoch": 1.2, + "learning_rate": 0.0011993819561339598, + "loss": 0.0755, + "step": 47780 + }, + { + "epoch": 1.2, + "learning_rate": 0.0011990051001180815, + "loss": 0.0767, + "step": 47790 + }, + { + "epoch": 1.2, + "learning_rate": 0.0011986282441022035, + "loss": 0.0734, + "step": 47800 + }, + { + "epoch": 1.2, + "learning_rate": 0.0011982513880863252, + "loss": 0.0749, + "step": 47810 + }, + { + "epoch": 1.2, + "learning_rate": 0.001197874532070447, + "loss": 0.0722, + "step": 47820 + }, + { + "epoch": 1.2, + "learning_rate": 0.0011974976760545687, + "loss": 0.0763, + "step": 47830 + }, + { + "epoch": 1.2, + "learning_rate": 0.0011971208200386905, + "loss": 0.0744, + "step": 47840 + }, + { + "epoch": 1.2, + "learning_rate": 0.0011967439640228124, + "loss": 0.0742, + "step": 47850 + }, + { + "epoch": 1.2, + "learning_rate": 0.0011963671080069342, + "loss": 0.0758, + "step": 47860 + }, + { + "epoch": 1.2, + "learning_rate": 0.001195990251991056, + "loss": 0.0728, + "step": 47870 + }, + { + "epoch": 1.2, + "learning_rate": 0.0011956133959751777, + "loss": 0.0753, + "step": 47880 + }, + { + "epoch": 1.2, + "learning_rate": 0.0011952365399592996, + "loss": 0.0746, + "step": 47890 + }, + { + "epoch": 1.2, + "learning_rate": 0.0011948596839434214, + "loss": 0.0771, + "step": 47900 + }, + { + "epoch": 1.2, + "learning_rate": 0.0011944828279275431, + "loss": 0.0751, + "step": 47910 + }, + { + "epoch": 1.2, + "learning_rate": 0.0011941059719116649, + "loss": 0.0762, + "step": 47920 + }, + { + "epoch": 1.2, + "learning_rate": 0.0011937291158957868, + "loss": 0.0777, + "step": 47930 + }, + { + "epoch": 1.2, + "learning_rate": 0.0011933522598799086, + "loss": 0.0739, + "step": 47940 + }, + { + "epoch": 1.2, + "learning_rate": 0.0011929754038640305, + "loss": 0.0722, + "step": 47950 + }, + { + "epoch": 1.2, + "learning_rate": 0.001192598547848152, + "loss": 0.0783, + "step": 47960 + }, + { + "epoch": 1.21, + "learning_rate": 0.001192221691832274, + "loss": 0.0764, + "step": 47970 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011918448358163958, + "loss": 0.0771, + "step": 47980 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011914679798005177, + "loss": 0.0754, + "step": 47990 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011910911237846392, + "loss": 0.0766, + "step": 48000 + }, + { + "epoch": 1.21, + "eval_cer": 0.6658129640564252, + "eval_loss": 0.06356838345527649, + "eval_runtime": 90.7662, + "eval_samples_per_second": 110.162, + "eval_steps_per_second": 6.886, + "step": 48000 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011907142677687612, + "loss": 0.076, + "step": 48010 + }, + { + "epoch": 1.21, + "learning_rate": 0.001190337411752883, + "loss": 0.0752, + "step": 48020 + }, + { + "epoch": 1.21, + "learning_rate": 0.001189960555737005, + "loss": 0.0744, + "step": 48030 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011895836997211267, + "loss": 0.0683, + "step": 48040 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011892068437052484, + "loss": 0.0783, + "step": 48050 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011888299876893701, + "loss": 0.0759, + "step": 48060 + }, + { + "epoch": 1.21, + "learning_rate": 0.001188453131673492, + "loss": 0.0764, + "step": 48070 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011880762756576139, + "loss": 0.073, + "step": 48080 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011876994196417356, + "loss": 0.0721, + "step": 48090 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011873225636258573, + "loss": 0.073, + "step": 48100 + }, + { + "epoch": 1.21, + "learning_rate": 0.001186945707609979, + "loss": 0.0765, + "step": 48110 + }, + { + "epoch": 1.21, + "learning_rate": 0.001186568851594101, + "loss": 0.0761, + "step": 48120 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011861919955782228, + "loss": 0.0743, + "step": 48130 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011858151395623445, + "loss": 0.0775, + "step": 48140 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011854382835464663, + "loss": 0.0735, + "step": 48150 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011850614275305882, + "loss": 0.0763, + "step": 48160 + }, + { + "epoch": 1.21, + "learning_rate": 0.00118468457151471, + "loss": 0.0743, + "step": 48170 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011843077154988317, + "loss": 0.0745, + "step": 48180 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011839308594829535, + "loss": 0.0743, + "step": 48190 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011835540034670754, + "loss": 0.0788, + "step": 48200 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011831771474511972, + "loss": 0.0773, + "step": 48210 + }, + { + "epoch": 1.21, + "learning_rate": 0.001182800291435319, + "loss": 0.075, + "step": 48220 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011824234354194407, + "loss": 0.0726, + "step": 48230 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011820465794035626, + "loss": 0.0738, + "step": 48240 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011816697233876844, + "loss": 0.073, + "step": 48250 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011812928673718063, + "loss": 0.0726, + "step": 48260 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011809160113559279, + "loss": 0.0748, + "step": 48270 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011805391553400496, + "loss": 0.0738, + "step": 48280 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011801622993241716, + "loss": 0.0741, + "step": 48290 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011797854433082933, + "loss": 0.076, + "step": 48300 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011794085872924153, + "loss": 0.0777, + "step": 48310 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011790317312765368, + "loss": 0.0754, + "step": 48320 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011786548752606588, + "loss": 0.0725, + "step": 48330 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011782780192447805, + "loss": 0.0726, + "step": 48340 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011779011632289025, + "loss": 0.0746, + "step": 48350 + }, + { + "epoch": 1.21, + "learning_rate": 0.0011775243072130242, + "loss": 0.0734, + "step": 48360 + }, + { + "epoch": 1.22, + "learning_rate": 0.001177147451197146, + "loss": 0.076, + "step": 48370 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011767705951812677, + "loss": 0.0757, + "step": 48380 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011763937391653897, + "loss": 0.0746, + "step": 48390 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011760168831495114, + "loss": 0.0745, + "step": 48400 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011756400271336332, + "loss": 0.0709, + "step": 48410 + }, + { + "epoch": 1.22, + "learning_rate": 0.001175263171117755, + "loss": 0.0751, + "step": 48420 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011748863151018769, + "loss": 0.0737, + "step": 48430 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011745094590859986, + "loss": 0.0743, + "step": 48440 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011741326030701204, + "loss": 0.074, + "step": 48450 + }, + { + "epoch": 1.22, + "learning_rate": 0.001173755747054242, + "loss": 0.0747, + "step": 48460 + }, + { + "epoch": 1.22, + "learning_rate": 0.001173378891038364, + "loss": 0.0754, + "step": 48470 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011730020350224858, + "loss": 0.0741, + "step": 48480 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011726251790066076, + "loss": 0.0728, + "step": 48490 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011722483229907293, + "loss": 0.0774, + "step": 48500 + }, + { + "epoch": 1.22, + "eval_cer": 0.6654024745826169, + "eval_loss": 0.06362287700176239, + "eval_runtime": 90.7928, + "eval_samples_per_second": 110.13, + "eval_steps_per_second": 6.884, + "step": 48500 + }, + { + "epoch": 1.22, + "learning_rate": 0.001171871466974851, + "loss": 0.0727, + "step": 48510 + }, + { + "epoch": 1.22, + "learning_rate": 0.001171494610958973, + "loss": 0.0757, + "step": 48520 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011711177549430947, + "loss": 0.0747, + "step": 48530 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011707408989272165, + "loss": 0.0717, + "step": 48540 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011703640429113382, + "loss": 0.0726, + "step": 48550 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011699871868954602, + "loss": 0.0759, + "step": 48560 + }, + { + "epoch": 1.22, + "learning_rate": 0.001169610330879582, + "loss": 0.0735, + "step": 48570 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011692334748637037, + "loss": 0.0753, + "step": 48580 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011688566188478254, + "loss": 0.0756, + "step": 48590 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011684797628319474, + "loss": 0.077, + "step": 48600 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011681029068160691, + "loss": 0.0771, + "step": 48610 + }, + { + "epoch": 1.22, + "learning_rate": 0.001167726050800191, + "loss": 0.0744, + "step": 48620 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011673491947843126, + "loss": 0.0755, + "step": 48630 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011669723387684346, + "loss": 0.0741, + "step": 48640 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011665954827525563, + "loss": 0.0739, + "step": 48650 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011662186267366783, + "loss": 0.0797, + "step": 48660 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011658417707208, + "loss": 0.0767, + "step": 48670 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011654649147049218, + "loss": 0.0716, + "step": 48680 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011650880586890435, + "loss": 0.074, + "step": 48690 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011647112026731655, + "loss": 0.0739, + "step": 48700 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011643343466572872, + "loss": 0.0761, + "step": 48710 + }, + { + "epoch": 1.22, + "learning_rate": 0.001163957490641409, + "loss": 0.0747, + "step": 48720 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011635806346255307, + "loss": 0.0743, + "step": 48730 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011632037786096525, + "loss": 0.077, + "step": 48740 + }, + { + "epoch": 1.22, + "learning_rate": 0.0011628269225937744, + "loss": 0.0733, + "step": 48750 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011624500665778962, + "loss": 0.0738, + "step": 48760 + }, + { + "epoch": 1.23, + "learning_rate": 0.001162073210562018, + "loss": 0.0743, + "step": 48770 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011616963545461397, + "loss": 0.0693, + "step": 48780 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011613194985302616, + "loss": 0.0751, + "step": 48790 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011609426425143834, + "loss": 0.0763, + "step": 48800 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011605657864985051, + "loss": 0.0735, + "step": 48810 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011601889304826269, + "loss": 0.072, + "step": 48820 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011598120744667488, + "loss": 0.0746, + "step": 48830 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011594352184508706, + "loss": 0.0719, + "step": 48840 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011590583624349923, + "loss": 0.0727, + "step": 48850 + }, + { + "epoch": 1.23, + "learning_rate": 0.001158681506419114, + "loss": 0.0714, + "step": 48860 + }, + { + "epoch": 1.23, + "learning_rate": 0.001158304650403236, + "loss": 0.0733, + "step": 48870 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011579277943873578, + "loss": 0.0756, + "step": 48880 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011575509383714797, + "loss": 0.0751, + "step": 48890 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011571740823556013, + "loss": 0.0766, + "step": 48900 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011567972263397232, + "loss": 0.0733, + "step": 48910 + }, + { + "epoch": 1.23, + "learning_rate": 0.001156420370323845, + "loss": 0.0753, + "step": 48920 + }, + { + "epoch": 1.23, + "learning_rate": 0.001156043514307967, + "loss": 0.0745, + "step": 48930 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011556666582920887, + "loss": 0.0714, + "step": 48940 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011552898022762102, + "loss": 0.0719, + "step": 48950 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011549129462603322, + "loss": 0.0776, + "step": 48960 + }, + { + "epoch": 1.23, + "learning_rate": 0.001154536090244454, + "loss": 0.0732, + "step": 48970 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011541592342285759, + "loss": 0.073, + "step": 48980 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011537823782126974, + "loss": 0.0719, + "step": 48990 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011534055221968193, + "loss": 0.0759, + "step": 49000 + }, + { + "epoch": 1.23, + "eval_cer": 0.6653995872006206, + "eval_loss": 0.06333644688129425, + "eval_runtime": 90.5934, + "eval_samples_per_second": 110.372, + "eval_steps_per_second": 6.899, + "step": 49000 + }, + { + "epoch": 1.23, + "learning_rate": 0.001153028666180941, + "loss": 0.0753, + "step": 49010 + }, + { + "epoch": 1.23, + "learning_rate": 0.001152651810165063, + "loss": 0.0756, + "step": 49020 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011522749541491848, + "loss": 0.075, + "step": 49030 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011518980981333065, + "loss": 0.0776, + "step": 49040 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011515212421174283, + "loss": 0.0742, + "step": 49050 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011511443861015502, + "loss": 0.0702, + "step": 49060 + }, + { + "epoch": 1.23, + "learning_rate": 0.001150767530085672, + "loss": 0.0716, + "step": 49070 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011503906740697937, + "loss": 0.0765, + "step": 49080 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011500138180539155, + "loss": 0.0757, + "step": 49090 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011496369620380374, + "loss": 0.0748, + "step": 49100 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011492601060221592, + "loss": 0.0748, + "step": 49110 + }, + { + "epoch": 1.23, + "learning_rate": 0.001148883250006281, + "loss": 0.074, + "step": 49120 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011485063939904027, + "loss": 0.0707, + "step": 49130 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011481295379745246, + "loss": 0.0753, + "step": 49140 + }, + { + "epoch": 1.23, + "learning_rate": 0.0011477526819586464, + "loss": 0.0722, + "step": 49150 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011473758259427681, + "loss": 0.0706, + "step": 49160 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011469989699268899, + "loss": 0.0758, + "step": 49170 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011466221139110116, + "loss": 0.0752, + "step": 49180 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011462452578951336, + "loss": 0.0752, + "step": 49190 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011458684018792553, + "loss": 0.0733, + "step": 49200 + }, + { + "epoch": 1.24, + "learning_rate": 0.001145491545863377, + "loss": 0.0745, + "step": 49210 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011451146898474988, + "loss": 0.0728, + "step": 49220 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011447378338316208, + "loss": 0.0768, + "step": 49230 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011443609778157425, + "loss": 0.0731, + "step": 49240 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011439841217998645, + "loss": 0.0727, + "step": 49250 + }, + { + "epoch": 1.24, + "learning_rate": 0.001143607265783986, + "loss": 0.0718, + "step": 49260 + }, + { + "epoch": 1.24, + "learning_rate": 0.001143230409768108, + "loss": 0.076, + "step": 49270 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011428535537522297, + "loss": 0.0717, + "step": 49280 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011424766977363517, + "loss": 0.0729, + "step": 49290 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011420998417204734, + "loss": 0.0742, + "step": 49300 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011417229857045952, + "loss": 0.0748, + "step": 49310 + }, + { + "epoch": 1.24, + "learning_rate": 0.001141346129688717, + "loss": 0.0772, + "step": 49320 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011409692736728389, + "loss": 0.075, + "step": 49330 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011405924176569606, + "loss": 0.074, + "step": 49340 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011402155616410824, + "loss": 0.0742, + "step": 49350 + }, + { + "epoch": 1.24, + "learning_rate": 0.001139838705625204, + "loss": 0.0732, + "step": 49360 + }, + { + "epoch": 1.24, + "learning_rate": 0.001139461849609326, + "loss": 0.0739, + "step": 49370 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011390849935934478, + "loss": 0.0716, + "step": 49380 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011387081375775696, + "loss": 0.0743, + "step": 49390 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011383312815616913, + "loss": 0.0735, + "step": 49400 + }, + { + "epoch": 1.24, + "learning_rate": 0.001137954425545813, + "loss": 0.074, + "step": 49410 + }, + { + "epoch": 1.24, + "learning_rate": 0.001137577569529935, + "loss": 0.0767, + "step": 49420 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011372007135140568, + "loss": 0.0734, + "step": 49430 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011368238574981785, + "loss": 0.0748, + "step": 49440 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011364470014823002, + "loss": 0.0728, + "step": 49450 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011360701454664222, + "loss": 0.0757, + "step": 49460 + }, + { + "epoch": 1.24, + "learning_rate": 0.001135693289450544, + "loss": 0.0732, + "step": 49470 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011353164334346657, + "loss": 0.0748, + "step": 49480 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011349395774187874, + "loss": 0.0749, + "step": 49490 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011345627214029094, + "loss": 0.0779, + "step": 49500 + }, + { + "epoch": 1.24, + "eval_cer": 0.6658298071180704, + "eval_loss": 0.06252450495958328, + "eval_runtime": 90.8892, + "eval_samples_per_second": 110.013, + "eval_steps_per_second": 6.877, + "step": 49500 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011341858653870311, + "loss": 0.0753, + "step": 49510 + }, + { + "epoch": 1.24, + "learning_rate": 0.001133809009371153, + "loss": 0.0728, + "step": 49520 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011334321533552746, + "loss": 0.0729, + "step": 49530 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011330552973393966, + "loss": 0.0739, + "step": 49540 + }, + { + "epoch": 1.24, + "learning_rate": 0.0011326784413235183, + "loss": 0.0728, + "step": 49550 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011323015853076403, + "loss": 0.0718, + "step": 49560 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011319247292917618, + "loss": 0.0732, + "step": 49570 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011315478732758838, + "loss": 0.07, + "step": 49580 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011311710172600055, + "loss": 0.0729, + "step": 49590 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011307941612441275, + "loss": 0.0758, + "step": 49600 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011304173052282492, + "loss": 0.0699, + "step": 49610 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011300404492123708, + "loss": 0.0747, + "step": 49620 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011296635931964927, + "loss": 0.0734, + "step": 49630 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011292867371806145, + "loss": 0.0766, + "step": 49640 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011289098811647364, + "loss": 0.07, + "step": 49650 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011285330251488582, + "loss": 0.0743, + "step": 49660 + }, + { + "epoch": 1.25, + "learning_rate": 0.00112815616913298, + "loss": 0.0731, + "step": 49670 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011277793131171017, + "loss": 0.0761, + "step": 49680 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011274024571012236, + "loss": 0.0764, + "step": 49690 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011270256010853454, + "loss": 0.0761, + "step": 49700 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011266487450694671, + "loss": 0.0736, + "step": 49710 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011262718890535889, + "loss": 0.0747, + "step": 49720 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011258950330377108, + "loss": 0.075, + "step": 49730 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011255181770218326, + "loss": 0.0718, + "step": 49740 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011251413210059543, + "loss": 0.0731, + "step": 49750 + }, + { + "epoch": 1.25, + "learning_rate": 0.001124764464990076, + "loss": 0.0732, + "step": 49760 + }, + { + "epoch": 1.25, + "learning_rate": 0.001124387608974198, + "loss": 0.0723, + "step": 49770 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011240107529583198, + "loss": 0.0742, + "step": 49780 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011236338969424415, + "loss": 0.0738, + "step": 49790 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011232570409265633, + "loss": 0.0736, + "step": 49800 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011228801849106852, + "loss": 0.0723, + "step": 49810 + }, + { + "epoch": 1.25, + "learning_rate": 0.001122503328894807, + "loss": 0.0717, + "step": 49820 + }, + { + "epoch": 1.25, + "learning_rate": 0.001122126472878929, + "loss": 0.0742, + "step": 49830 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011217496168630505, + "loss": 0.0732, + "step": 49840 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011213727608471722, + "loss": 0.0749, + "step": 49850 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011209959048312942, + "loss": 0.0745, + "step": 49860 + }, + { + "epoch": 1.25, + "learning_rate": 0.001120619048815416, + "loss": 0.0701, + "step": 49870 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011202421927995379, + "loss": 0.0746, + "step": 49880 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011198653367836594, + "loss": 0.0732, + "step": 49890 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011194884807677814, + "loss": 0.0706, + "step": 49900 + }, + { + "epoch": 1.25, + "learning_rate": 0.001119111624751903, + "loss": 0.0709, + "step": 49910 + }, + { + "epoch": 1.25, + "learning_rate": 0.001118734768736025, + "loss": 0.0755, + "step": 49920 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011183579127201468, + "loss": 0.0707, + "step": 49930 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011179810567042685, + "loss": 0.0744, + "step": 49940 + }, + { + "epoch": 1.25, + "learning_rate": 0.0011176042006883903, + "loss": 0.0713, + "step": 49950 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011172273446725123, + "loss": 0.0766, + "step": 49960 + }, + { + "epoch": 1.26, + "learning_rate": 0.001116850488656634, + "loss": 0.0723, + "step": 49970 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011164736326407557, + "loss": 0.0761, + "step": 49980 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011160967766248775, + "loss": 0.0763, + "step": 49990 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011157199206089994, + "loss": 0.074, + "step": 50000 + }, + { + "epoch": 1.26, + "eval_cer": 0.6653543515493451, + "eval_loss": 0.06283344328403473, + "eval_runtime": 90.7413, + "eval_samples_per_second": 110.192, + "eval_steps_per_second": 6.888, + "step": 50000 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011153430645931212, + "loss": 0.0736, + "step": 50010 + }, + { + "epoch": 1.26, + "learning_rate": 0.001114966208577243, + "loss": 0.0729, + "step": 50020 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011145893525613647, + "loss": 0.0761, + "step": 50030 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011142124965454866, + "loss": 0.0715, + "step": 50040 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011138356405296084, + "loss": 0.07, + "step": 50050 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011134587845137301, + "loss": 0.076, + "step": 50060 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011130819284978519, + "loss": 0.0735, + "step": 50070 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011127050724819736, + "loss": 0.0744, + "step": 50080 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011123282164660956, + "loss": 0.0741, + "step": 50090 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011119513604502173, + "loss": 0.0733, + "step": 50100 + }, + { + "epoch": 1.26, + "learning_rate": 0.001111574504434339, + "loss": 0.0721, + "step": 50110 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011111976484184608, + "loss": 0.0716, + "step": 50120 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011108207924025828, + "loss": 0.0744, + "step": 50130 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011104439363867045, + "loss": 0.0752, + "step": 50140 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011100670803708263, + "loss": 0.0764, + "step": 50150 + }, + { + "epoch": 1.26, + "learning_rate": 0.001109690224354948, + "loss": 0.0725, + "step": 50160 + }, + { + "epoch": 1.26, + "learning_rate": 0.00110931336833907, + "loss": 0.0721, + "step": 50170 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011089365123231917, + "loss": 0.0712, + "step": 50180 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011085596563073137, + "loss": 0.0699, + "step": 50190 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011081828002914352, + "loss": 0.0734, + "step": 50200 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011078059442755572, + "loss": 0.0749, + "step": 50210 + }, + { + "epoch": 1.26, + "learning_rate": 0.001107429088259679, + "loss": 0.0726, + "step": 50220 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011070522322438009, + "loss": 0.0707, + "step": 50230 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011066753762279226, + "loss": 0.076, + "step": 50240 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011062985202120444, + "loss": 0.0771, + "step": 50250 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011059216641961661, + "loss": 0.0719, + "step": 50260 + }, + { + "epoch": 1.26, + "learning_rate": 0.001105544808180288, + "loss": 0.0722, + "step": 50270 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011051679521644098, + "loss": 0.0743, + "step": 50280 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011047910961485316, + "loss": 0.0727, + "step": 50290 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011044142401326533, + "loss": 0.0727, + "step": 50300 + }, + { + "epoch": 1.26, + "learning_rate": 0.001104037384116775, + "loss": 0.0709, + "step": 50310 + }, + { + "epoch": 1.26, + "learning_rate": 0.001103660528100897, + "loss": 0.076, + "step": 50320 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011032836720850188, + "loss": 0.0754, + "step": 50330 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011029068160691405, + "loss": 0.0709, + "step": 50340 + }, + { + "epoch": 1.26, + "learning_rate": 0.0011025299600532622, + "loss": 0.0722, + "step": 50350 + }, + { + "epoch": 1.27, + "learning_rate": 0.0011021531040373842, + "loss": 0.072, + "step": 50360 + }, + { + "epoch": 1.27, + "learning_rate": 0.001101776248021506, + "loss": 0.0725, + "step": 50370 + }, + { + "epoch": 1.27, + "learning_rate": 0.0011013993920056277, + "loss": 0.0738, + "step": 50380 + }, + { + "epoch": 1.27, + "learning_rate": 0.0011010225359897494, + "loss": 0.0783, + "step": 50390 + }, + { + "epoch": 1.27, + "learning_rate": 0.0011006456799738714, + "loss": 0.0732, + "step": 50400 + }, + { + "epoch": 1.27, + "learning_rate": 0.0011002688239579931, + "loss": 0.0703, + "step": 50410 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010998919679421149, + "loss": 0.0755, + "step": 50420 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010995151119262366, + "loss": 0.0727, + "step": 50430 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010991382559103586, + "loss": 0.0755, + "step": 50440 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010987613998944803, + "loss": 0.0723, + "step": 50450 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010983845438786023, + "loss": 0.0739, + "step": 50460 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010980076878627238, + "loss": 0.0737, + "step": 50470 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010976308318468458, + "loss": 0.0738, + "step": 50480 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010972539758309675, + "loss": 0.0722, + "step": 50490 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010968771198150895, + "loss": 0.0761, + "step": 50500 + }, + { + "epoch": 1.27, + "eval_cer": 0.665603628861693, + "eval_loss": 0.062332626432180405, + "eval_runtime": 90.8939, + "eval_samples_per_second": 110.007, + "eval_steps_per_second": 6.876, + "step": 50500 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010965002637992112, + "loss": 0.0728, + "step": 50510 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010961234077833328, + "loss": 0.0722, + "step": 50520 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010957465517674547, + "loss": 0.075, + "step": 50530 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010953696957515765, + "loss": 0.0712, + "step": 50540 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010949928397356984, + "loss": 0.0712, + "step": 50550 + }, + { + "epoch": 1.27, + "learning_rate": 0.00109461598371982, + "loss": 0.0739, + "step": 50560 + }, + { + "epoch": 1.27, + "learning_rate": 0.001094239127703942, + "loss": 0.0758, + "step": 50570 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010938622716880637, + "loss": 0.0721, + "step": 50580 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010934854156721856, + "loss": 0.0738, + "step": 50590 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010931085596563074, + "loss": 0.0707, + "step": 50600 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010927317036404291, + "loss": 0.0731, + "step": 50610 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010923548476245509, + "loss": 0.073, + "step": 50620 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010919779916086728, + "loss": 0.0762, + "step": 50630 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010916011355927946, + "loss": 0.0744, + "step": 50640 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010912242795769163, + "loss": 0.0736, + "step": 50650 + }, + { + "epoch": 1.27, + "learning_rate": 0.001090847423561038, + "loss": 0.0742, + "step": 50660 + }, + { + "epoch": 1.27, + "learning_rate": 0.00109047056754516, + "loss": 0.0778, + "step": 50670 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010900937115292818, + "loss": 0.0742, + "step": 50680 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010897168555134035, + "loss": 0.0732, + "step": 50690 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010893399994975253, + "loss": 0.0738, + "step": 50700 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010889631434816472, + "loss": 0.0721, + "step": 50710 + }, + { + "epoch": 1.27, + "learning_rate": 0.001088586287465769, + "loss": 0.0775, + "step": 50720 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010882094314498907, + "loss": 0.0732, + "step": 50730 + }, + { + "epoch": 1.27, + "learning_rate": 0.0010878325754340125, + "loss": 0.0718, + "step": 50740 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010874557194181342, + "loss": 0.0709, + "step": 50750 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010870788634022562, + "loss": 0.0746, + "step": 50760 + }, + { + "epoch": 1.28, + "learning_rate": 0.001086702007386378, + "loss": 0.0775, + "step": 50770 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010863251513704996, + "loss": 0.0724, + "step": 50780 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010859482953546214, + "loss": 0.0755, + "step": 50790 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010855714393387434, + "loss": 0.0748, + "step": 50800 + }, + { + "epoch": 1.28, + "learning_rate": 0.001085194583322865, + "loss": 0.0774, + "step": 50810 + }, + { + "epoch": 1.28, + "learning_rate": 0.001084817727306987, + "loss": 0.0721, + "step": 50820 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010844408712911086, + "loss": 0.075, + "step": 50830 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010840640152752306, + "loss": 0.0717, + "step": 50840 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010836871592593523, + "loss": 0.072, + "step": 50850 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010833103032434743, + "loss": 0.072, + "step": 50860 + }, + { + "epoch": 1.28, + "learning_rate": 0.001082933447227596, + "loss": 0.0769, + "step": 50870 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010825565912117177, + "loss": 0.0747, + "step": 50880 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010821797351958395, + "loss": 0.0706, + "step": 50890 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010818028791799615, + "loss": 0.0691, + "step": 50900 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010814260231640832, + "loss": 0.0739, + "step": 50910 + }, + { + "epoch": 1.28, + "learning_rate": 0.001081049167148205, + "loss": 0.0745, + "step": 50920 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010806723111323267, + "loss": 0.0725, + "step": 50930 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010802954551164486, + "loss": 0.0748, + "step": 50940 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010799185991005704, + "loss": 0.0718, + "step": 50950 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010795417430846921, + "loss": 0.0747, + "step": 50960 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010791648870688139, + "loss": 0.0689, + "step": 50970 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010787880310529356, + "loss": 0.0724, + "step": 50980 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010784111750370576, + "loss": 0.0725, + "step": 50990 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010780343190211793, + "loss": 0.0763, + "step": 51000 + }, + { + "epoch": 1.28, + "eval_cer": 0.6655237446264618, + "eval_loss": 0.06174508482217789, + "eval_runtime": 90.7553, + "eval_samples_per_second": 110.175, + "eval_steps_per_second": 6.887, + "step": 51000 + }, + { + "epoch": 1.28, + "learning_rate": 0.001077657463005301, + "loss": 0.0719, + "step": 51010 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010772806069894228, + "loss": 0.0751, + "step": 51020 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010769037509735448, + "loss": 0.0737, + "step": 51030 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010765268949576665, + "loss": 0.0771, + "step": 51040 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010761500389417883, + "loss": 0.0735, + "step": 51050 + }, + { + "epoch": 1.28, + "learning_rate": 0.00107577318292591, + "loss": 0.0738, + "step": 51060 + }, + { + "epoch": 1.28, + "learning_rate": 0.001075396326910032, + "loss": 0.0769, + "step": 51070 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010750194708941537, + "loss": 0.0739, + "step": 51080 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010746426148782757, + "loss": 0.073, + "step": 51090 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010742657588623972, + "loss": 0.0721, + "step": 51100 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010738889028465192, + "loss": 0.0745, + "step": 51110 + }, + { + "epoch": 1.28, + "learning_rate": 0.001073512046830641, + "loss": 0.0729, + "step": 51120 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010731351908147629, + "loss": 0.0725, + "step": 51130 + }, + { + "epoch": 1.28, + "learning_rate": 0.0010727583347988846, + "loss": 0.0733, + "step": 51140 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010723814787830064, + "loss": 0.0735, + "step": 51150 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010720046227671281, + "loss": 0.074, + "step": 51160 + }, + { + "epoch": 1.29, + "learning_rate": 0.00107162776675125, + "loss": 0.0746, + "step": 51170 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010712509107353718, + "loss": 0.0718, + "step": 51180 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010708740547194933, + "loss": 0.0727, + "step": 51190 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010704971987036153, + "loss": 0.0713, + "step": 51200 + }, + { + "epoch": 1.29, + "learning_rate": 0.001070120342687737, + "loss": 0.0702, + "step": 51210 + }, + { + "epoch": 1.29, + "learning_rate": 0.001069743486671859, + "loss": 0.0692, + "step": 51220 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010693666306559808, + "loss": 0.074, + "step": 51230 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010689897746401025, + "loss": 0.0725, + "step": 51240 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010686129186242242, + "loss": 0.076, + "step": 51250 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010682360626083462, + "loss": 0.072, + "step": 51260 + }, + { + "epoch": 1.29, + "learning_rate": 0.001067859206592468, + "loss": 0.0713, + "step": 51270 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010674823505765897, + "loss": 0.0726, + "step": 51280 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010671054945607114, + "loss": 0.0728, + "step": 51290 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010667286385448334, + "loss": 0.0729, + "step": 51300 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010663517825289552, + "loss": 0.0732, + "step": 51310 + }, + { + "epoch": 1.29, + "learning_rate": 0.001065974926513077, + "loss": 0.0726, + "step": 51320 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010655980704971986, + "loss": 0.0739, + "step": 51330 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010652212144813206, + "loss": 0.0724, + "step": 51340 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010648443584654423, + "loss": 0.075, + "step": 51350 + }, + { + "epoch": 1.29, + "learning_rate": 0.001064467502449564, + "loss": 0.0707, + "step": 51360 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010640906464336858, + "loss": 0.0743, + "step": 51370 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010637137904178078, + "loss": 0.0726, + "step": 51380 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010633369344019295, + "loss": 0.0736, + "step": 51390 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010629600783860513, + "loss": 0.0706, + "step": 51400 + }, + { + "epoch": 1.29, + "learning_rate": 0.001062583222370173, + "loss": 0.0744, + "step": 51410 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010622063663542948, + "loss": 0.0723, + "step": 51420 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010618295103384167, + "loss": 0.075, + "step": 51430 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010614526543225385, + "loss": 0.0715, + "step": 51440 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010610757983066604, + "loss": 0.0701, + "step": 51450 + }, + { + "epoch": 1.29, + "learning_rate": 0.001060698942290782, + "loss": 0.0711, + "step": 51460 + }, + { + "epoch": 1.29, + "learning_rate": 0.001060322086274904, + "loss": 0.0731, + "step": 51470 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010599452302590257, + "loss": 0.0721, + "step": 51480 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010595683742431476, + "loss": 0.0705, + "step": 51490 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010591915182272694, + "loss": 0.072, + "step": 51500 + }, + { + "epoch": 1.29, + "eval_cer": 0.6655559870587539, + "eval_loss": 0.0616888590157032, + "eval_runtime": 91.034, + "eval_samples_per_second": 109.838, + "eval_steps_per_second": 6.866, + "step": 51500 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010588146622113911, + "loss": 0.0705, + "step": 51510 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010584378061955129, + "loss": 0.0754, + "step": 51520 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010580609501796348, + "loss": 0.0735, + "step": 51530 + }, + { + "epoch": 1.29, + "learning_rate": 0.0010576840941637566, + "loss": 0.0748, + "step": 51540 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010573072381478783, + "loss": 0.0736, + "step": 51550 + }, + { + "epoch": 1.3, + "learning_rate": 0.001056930382132, + "loss": 0.0704, + "step": 51560 + }, + { + "epoch": 1.3, + "learning_rate": 0.001056553526116122, + "loss": 0.0718, + "step": 51570 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010561766701002438, + "loss": 0.0751, + "step": 51580 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010557998140843655, + "loss": 0.069, + "step": 51590 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010554229580684873, + "loss": 0.0723, + "step": 51600 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010550461020526092, + "loss": 0.0691, + "step": 51610 + }, + { + "epoch": 1.3, + "learning_rate": 0.001054669246036731, + "loss": 0.0721, + "step": 51620 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010542923900208527, + "loss": 0.0717, + "step": 51630 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010539155340049745, + "loss": 0.0694, + "step": 51640 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010535386779890962, + "loss": 0.0756, + "step": 51650 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010531618219732182, + "loss": 0.0726, + "step": 51660 + }, + { + "epoch": 1.3, + "learning_rate": 0.00105278496595734, + "loss": 0.0762, + "step": 51670 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010524081099414617, + "loss": 0.0737, + "step": 51680 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010520312539255834, + "loss": 0.0721, + "step": 51690 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010516543979097054, + "loss": 0.0731, + "step": 51700 + }, + { + "epoch": 1.3, + "learning_rate": 0.001051277541893827, + "loss": 0.0707, + "step": 51710 + }, + { + "epoch": 1.3, + "learning_rate": 0.001050900685877949, + "loss": 0.0745, + "step": 51720 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010505238298620706, + "loss": 0.07, + "step": 51730 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010501469738461926, + "loss": 0.0709, + "step": 51740 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010497701178303143, + "loss": 0.0716, + "step": 51750 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010493932618144363, + "loss": 0.0748, + "step": 51760 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010490164057985578, + "loss": 0.0731, + "step": 51770 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010486395497826797, + "loss": 0.0765, + "step": 51780 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010482626937668015, + "loss": 0.0749, + "step": 51790 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010478858377509235, + "loss": 0.0731, + "step": 51800 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010475089817350452, + "loss": 0.0739, + "step": 51810 + }, + { + "epoch": 1.3, + "learning_rate": 0.001047132125719167, + "loss": 0.0741, + "step": 51820 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010467552697032887, + "loss": 0.0737, + "step": 51830 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010463784136874104, + "loss": 0.0737, + "step": 51840 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010460015576715324, + "loss": 0.0729, + "step": 51850 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010456247016556541, + "loss": 0.071, + "step": 51860 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010452478456397759, + "loss": 0.072, + "step": 51870 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010448709896238976, + "loss": 0.0693, + "step": 51880 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010444941336080196, + "loss": 0.0739, + "step": 51890 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010441172775921413, + "loss": 0.0753, + "step": 51900 + }, + { + "epoch": 1.3, + "learning_rate": 0.001043740421576263, + "loss": 0.0736, + "step": 51910 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010433635655603848, + "loss": 0.0729, + "step": 51920 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010429867095445068, + "loss": 0.0731, + "step": 51930 + }, + { + "epoch": 1.3, + "learning_rate": 0.0010426098535286285, + "loss": 0.0704, + "step": 51940 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010422329975127503, + "loss": 0.0721, + "step": 51950 + }, + { + "epoch": 1.31, + "learning_rate": 0.001041856141496872, + "loss": 0.0716, + "step": 51960 + }, + { + "epoch": 1.31, + "learning_rate": 0.001041479285480994, + "loss": 0.0714, + "step": 51970 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010411024294651157, + "loss": 0.0706, + "step": 51980 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010407255734492375, + "loss": 0.0709, + "step": 51990 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010403487174333592, + "loss": 0.0718, + "step": 52000 + }, + { + "epoch": 1.31, + "eval_cer": 0.6653235528080512, + "eval_loss": 0.06183711811900139, + "eval_runtime": 91.0284, + "eval_samples_per_second": 109.845, + "eval_steps_per_second": 6.866, + "step": 52000 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010399718614174812, + "loss": 0.0703, + "step": 52010 + }, + { + "epoch": 1.31, + "learning_rate": 0.001039595005401603, + "loss": 0.0703, + "step": 52020 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010392181493857249, + "loss": 0.0732, + "step": 52030 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010388412933698464, + "loss": 0.0729, + "step": 52040 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010384644373539684, + "loss": 0.0738, + "step": 52050 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010380875813380901, + "loss": 0.0747, + "step": 52060 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010377107253222119, + "loss": 0.0749, + "step": 52070 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010373338693063338, + "loss": 0.0732, + "step": 52080 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010369570132904554, + "loss": 0.075, + "step": 52090 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010365801572745773, + "loss": 0.0721, + "step": 52100 + }, + { + "epoch": 1.31, + "learning_rate": 0.001036203301258699, + "loss": 0.0716, + "step": 52110 + }, + { + "epoch": 1.31, + "learning_rate": 0.001035826445242821, + "loss": 0.0721, + "step": 52120 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010354495892269428, + "loss": 0.075, + "step": 52130 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010350727332110645, + "loss": 0.0739, + "step": 52140 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010346958771951863, + "loss": 0.071, + "step": 52150 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010343190211793082, + "loss": 0.0702, + "step": 52160 + }, + { + "epoch": 1.31, + "learning_rate": 0.00103394216516343, + "loss": 0.0759, + "step": 52170 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010335653091475517, + "loss": 0.0765, + "step": 52180 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010331884531316734, + "loss": 0.0735, + "step": 52190 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010328115971157954, + "loss": 0.0722, + "step": 52200 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010324347410999172, + "loss": 0.0718, + "step": 52210 + }, + { + "epoch": 1.31, + "learning_rate": 0.001032057885084039, + "loss": 0.0712, + "step": 52220 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010316810290681606, + "loss": 0.0741, + "step": 52230 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010313041730522826, + "loss": 0.071, + "step": 52240 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010309273170364043, + "loss": 0.0719, + "step": 52250 + }, + { + "epoch": 1.31, + "learning_rate": 0.001030550461020526, + "loss": 0.07, + "step": 52260 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010301736050046478, + "loss": 0.0736, + "step": 52270 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010297967489887698, + "loss": 0.0734, + "step": 52280 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010294198929728915, + "loss": 0.0736, + "step": 52290 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010290430369570133, + "loss": 0.0706, + "step": 52300 + }, + { + "epoch": 1.31, + "learning_rate": 0.001028666180941135, + "loss": 0.0719, + "step": 52310 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010282893249252568, + "loss": 0.0728, + "step": 52320 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010279124689093787, + "loss": 0.0694, + "step": 52330 + }, + { + "epoch": 1.31, + "learning_rate": 0.0010275356128935005, + "loss": 0.0718, + "step": 52340 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010271587568776222, + "loss": 0.0706, + "step": 52350 + }, + { + "epoch": 1.32, + "learning_rate": 0.001026781900861744, + "loss": 0.0725, + "step": 52360 + }, + { + "epoch": 1.32, + "learning_rate": 0.001026405044845866, + "loss": 0.072, + "step": 52370 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010260281888299877, + "loss": 0.0752, + "step": 52380 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010256513328141096, + "loss": 0.0722, + "step": 52390 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010252744767982312, + "loss": 0.0748, + "step": 52400 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010248976207823531, + "loss": 0.073, + "step": 52410 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010245207647664749, + "loss": 0.07, + "step": 52420 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010241439087505968, + "loss": 0.0692, + "step": 52430 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010237670527347186, + "loss": 0.0743, + "step": 52440 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010233901967188403, + "loss": 0.077, + "step": 52450 + }, + { + "epoch": 1.32, + "learning_rate": 0.001023013340702962, + "loss": 0.0756, + "step": 52460 + }, + { + "epoch": 1.32, + "learning_rate": 0.001022636484687084, + "loss": 0.073, + "step": 52470 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010222596286712058, + "loss": 0.0715, + "step": 52480 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010218827726553275, + "loss": 0.0715, + "step": 52490 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010215059166394493, + "loss": 0.0703, + "step": 52500 + }, + { + "epoch": 1.32, + "eval_cer": 0.6654621471438739, + "eval_loss": 0.06106410175561905, + "eval_runtime": 90.7505, + "eval_samples_per_second": 110.181, + "eval_steps_per_second": 6.887, + "step": 52500 + }, + { + "epoch": 1.32, + "learning_rate": 0.001021129060623571, + "loss": 0.0698, + "step": 52510 + }, + { + "epoch": 1.32, + "learning_rate": 0.001020752204607693, + "loss": 0.0719, + "step": 52520 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010203753485918147, + "loss": 0.073, + "step": 52530 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010199984925759365, + "loss": 0.0707, + "step": 52540 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010196216365600582, + "loss": 0.072, + "step": 52550 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010192447805441802, + "loss": 0.0704, + "step": 52560 + }, + { + "epoch": 1.32, + "learning_rate": 0.001018867924528302, + "loss": 0.0717, + "step": 52570 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010184910685124237, + "loss": 0.0709, + "step": 52580 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010181142124965454, + "loss": 0.0738, + "step": 52590 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010177373564806674, + "loss": 0.067, + "step": 52600 + }, + { + "epoch": 1.32, + "learning_rate": 0.001017360500464789, + "loss": 0.07, + "step": 52610 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010169836444489109, + "loss": 0.072, + "step": 52620 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010166067884330326, + "loss": 0.0748, + "step": 52630 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010162299324171546, + "loss": 0.0709, + "step": 52640 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010158530764012763, + "loss": 0.0732, + "step": 52650 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010154762203853983, + "loss": 0.0708, + "step": 52660 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010150993643695198, + "loss": 0.0752, + "step": 52670 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010147225083536418, + "loss": 0.0717, + "step": 52680 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010143456523377635, + "loss": 0.073, + "step": 52690 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010139687963218855, + "loss": 0.071, + "step": 52700 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010135919403060072, + "loss": 0.07, + "step": 52710 + }, + { + "epoch": 1.32, + "learning_rate": 0.001013215084290129, + "loss": 0.0735, + "step": 52720 + }, + { + "epoch": 1.32, + "learning_rate": 0.0010128382282742507, + "loss": 0.0759, + "step": 52730 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010124613722583724, + "loss": 0.0733, + "step": 52740 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010120845162424944, + "loss": 0.0738, + "step": 52750 + }, + { + "epoch": 1.33, + "learning_rate": 0.001011707660226616, + "loss": 0.071, + "step": 52760 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010113308042107379, + "loss": 0.0747, + "step": 52770 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010109539481948596, + "loss": 0.075, + "step": 52780 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010105770921789816, + "loss": 0.0727, + "step": 52790 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010102002361631033, + "loss": 0.0747, + "step": 52800 + }, + { + "epoch": 1.33, + "learning_rate": 0.001009823380147225, + "loss": 0.0732, + "step": 52810 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010094465241313468, + "loss": 0.0699, + "step": 52820 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010090696681154688, + "loss": 0.0717, + "step": 52830 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010086928120995905, + "loss": 0.0679, + "step": 52840 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010083159560837123, + "loss": 0.0713, + "step": 52850 + }, + { + "epoch": 1.33, + "learning_rate": 0.001007939100067834, + "loss": 0.0747, + "step": 52860 + }, + { + "epoch": 1.33, + "learning_rate": 0.001007562244051956, + "loss": 0.073, + "step": 52870 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010071853880360777, + "loss": 0.074, + "step": 52880 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010068085320201995, + "loss": 0.0758, + "step": 52890 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010064316760043212, + "loss": 0.0721, + "step": 52900 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010060548199884432, + "loss": 0.0704, + "step": 52910 + }, + { + "epoch": 1.33, + "learning_rate": 0.001005677963972565, + "loss": 0.074, + "step": 52920 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010053011079566867, + "loss": 0.0716, + "step": 52930 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010049242519408084, + "loss": 0.0735, + "step": 52940 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010045473959249304, + "loss": 0.0705, + "step": 52950 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010041705399090521, + "loss": 0.0727, + "step": 52960 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010037936838931739, + "loss": 0.0741, + "step": 52970 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010034168278772956, + "loss": 0.0699, + "step": 52980 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010030399718614174, + "loss": 0.071, + "step": 52990 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010026631158455393, + "loss": 0.0718, + "step": 53000 + }, + { + "epoch": 1.33, + "eval_cer": 0.6655482873734304, + "eval_loss": 0.06082231178879738, + "eval_runtime": 90.7973, + "eval_samples_per_second": 110.124, + "eval_steps_per_second": 6.883, + "step": 53000 + }, + { + "epoch": 1.33, + "learning_rate": 0.001002286259829661, + "loss": 0.072, + "step": 53010 + }, + { + "epoch": 1.33, + "learning_rate": 0.001001909403813783, + "loss": 0.0687, + "step": 53020 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010015325477979046, + "loss": 0.0701, + "step": 53030 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010011556917820265, + "loss": 0.072, + "step": 53040 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010007788357661483, + "loss": 0.0746, + "step": 53050 + }, + { + "epoch": 1.33, + "learning_rate": 0.0010004019797502702, + "loss": 0.0726, + "step": 53060 + }, + { + "epoch": 1.33, + "learning_rate": 0.001000025123734392, + "loss": 0.0694, + "step": 53070 + }, + { + "epoch": 1.33, + "learning_rate": 0.0009996482677185137, + "loss": 0.0733, + "step": 53080 + }, + { + "epoch": 1.33, + "learning_rate": 0.0009992714117026355, + "loss": 0.0767, + "step": 53090 + }, + { + "epoch": 1.33, + "learning_rate": 0.0009988945556867574, + "loss": 0.0724, + "step": 53100 + }, + { + "epoch": 1.33, + "learning_rate": 0.0009985176996708792, + "loss": 0.0753, + "step": 53110 + }, + { + "epoch": 1.33, + "learning_rate": 0.000998140843655001, + "loss": 0.0718, + "step": 53120 + }, + { + "epoch": 1.33, + "learning_rate": 0.0009977639876391226, + "loss": 0.0731, + "step": 53130 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009973871316232446, + "loss": 0.073, + "step": 53140 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009970102756073664, + "loss": 0.0725, + "step": 53150 + }, + { + "epoch": 1.34, + "learning_rate": 0.000996633419591488, + "loss": 0.0702, + "step": 53160 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009962565635756098, + "loss": 0.0718, + "step": 53170 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009958797075597316, + "loss": 0.0698, + "step": 53180 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009955028515438535, + "loss": 0.0738, + "step": 53190 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009951259955279753, + "loss": 0.0708, + "step": 53200 + }, + { + "epoch": 1.34, + "learning_rate": 0.000994749139512097, + "loss": 0.0719, + "step": 53210 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009943722834962188, + "loss": 0.0705, + "step": 53220 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009939954274803407, + "loss": 0.0735, + "step": 53230 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009936185714644625, + "loss": 0.0689, + "step": 53240 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009932417154485842, + "loss": 0.0734, + "step": 53250 + }, + { + "epoch": 1.34, + "learning_rate": 0.000992864859432706, + "loss": 0.0702, + "step": 53260 + }, + { + "epoch": 1.34, + "learning_rate": 0.000992488003416828, + "loss": 0.0728, + "step": 53270 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009921111474009497, + "loss": 0.0755, + "step": 53280 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009917342913850716, + "loss": 0.0705, + "step": 53290 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009913574353691932, + "loss": 0.0708, + "step": 53300 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009909805793533151, + "loss": 0.0678, + "step": 53310 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009906037233374369, + "loss": 0.0701, + "step": 53320 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009902268673215588, + "loss": 0.0708, + "step": 53330 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009898500113056804, + "loss": 0.0682, + "step": 53340 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009894731552898023, + "loss": 0.0692, + "step": 53350 + }, + { + "epoch": 1.34, + "learning_rate": 0.000989096299273924, + "loss": 0.0732, + "step": 53360 + }, + { + "epoch": 1.34, + "learning_rate": 0.000988719443258046, + "loss": 0.0717, + "step": 53370 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009883425872421678, + "loss": 0.0711, + "step": 53380 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009879657312262895, + "loss": 0.0732, + "step": 53390 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009875888752104113, + "loss": 0.0734, + "step": 53400 + }, + { + "epoch": 1.34, + "learning_rate": 0.000987212019194533, + "loss": 0.0754, + "step": 53410 + }, + { + "epoch": 1.34, + "learning_rate": 0.000986835163178655, + "loss": 0.0732, + "step": 53420 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009864583071627767, + "loss": 0.0717, + "step": 53430 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009860814511468985, + "loss": 0.0724, + "step": 53440 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009857045951310202, + "loss": 0.0711, + "step": 53450 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009853277391151422, + "loss": 0.0715, + "step": 53460 + }, + { + "epoch": 1.34, + "learning_rate": 0.000984950883099264, + "loss": 0.07, + "step": 53470 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009845740270833857, + "loss": 0.073, + "step": 53480 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009841971710675074, + "loss": 0.0724, + "step": 53490 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009838203150516294, + "loss": 0.0686, + "step": 53500 + }, + { + "epoch": 1.34, + "eval_cer": 0.6653375084877, + "eval_loss": 0.06101470813155174, + "eval_runtime": 90.6137, + "eval_samples_per_second": 110.348, + "eval_steps_per_second": 6.897, + "step": 53500 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009834434590357511, + "loss": 0.0681, + "step": 53510 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009830666030198729, + "loss": 0.067, + "step": 53520 + }, + { + "epoch": 1.34, + "learning_rate": 0.0009826897470039946, + "loss": 0.0727, + "step": 53530 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009823128909881166, + "loss": 0.0722, + "step": 53540 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009819360349722383, + "loss": 0.0716, + "step": 53550 + }, + { + "epoch": 1.35, + "learning_rate": 0.00098155917895636, + "loss": 0.0718, + "step": 53560 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009811823229404818, + "loss": 0.0726, + "step": 53570 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009808054669246038, + "loss": 0.0677, + "step": 53580 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009804286109087255, + "loss": 0.0702, + "step": 53590 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009800517548928475, + "loss": 0.0701, + "step": 53600 + }, + { + "epoch": 1.35, + "learning_rate": 0.000979674898876969, + "loss": 0.072, + "step": 53610 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009792980428610907, + "loss": 0.0723, + "step": 53620 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009789211868452127, + "loss": 0.0696, + "step": 53630 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009785443308293344, + "loss": 0.0715, + "step": 53640 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009781674748134564, + "loss": 0.0733, + "step": 53650 + }, + { + "epoch": 1.35, + "learning_rate": 0.000977790618797578, + "loss": 0.0751, + "step": 53660 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009774137627817, + "loss": 0.0722, + "step": 53670 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009770369067658216, + "loss": 0.0675, + "step": 53680 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009766600507499436, + "loss": 0.068, + "step": 53690 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009762831947340652, + "loss": 0.0714, + "step": 53700 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009759063387181871, + "loss": 0.0723, + "step": 53710 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009755294827023088, + "loss": 0.073, + "step": 53720 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009751526266864307, + "loss": 0.0702, + "step": 53730 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009747757706705524, + "loss": 0.0757, + "step": 53740 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009743989146546744, + "loss": 0.0702, + "step": 53750 + }, + { + "epoch": 1.35, + "learning_rate": 0.000974022058638796, + "loss": 0.0722, + "step": 53760 + }, + { + "epoch": 1.35, + "learning_rate": 0.000973645202622918, + "loss": 0.0747, + "step": 53770 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009732683466070396, + "loss": 0.0731, + "step": 53780 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009728914905911616, + "loss": 0.0745, + "step": 53790 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009725146345752832, + "loss": 0.0717, + "step": 53800 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009721377785594052, + "loss": 0.0748, + "step": 53810 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009717609225435269, + "loss": 0.0734, + "step": 53820 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009713840665276488, + "loss": 0.0734, + "step": 53830 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009710072105117705, + "loss": 0.0695, + "step": 53840 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009706303544958922, + "loss": 0.0715, + "step": 53850 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009702534984800141, + "loss": 0.0708, + "step": 53860 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009698766424641359, + "loss": 0.07, + "step": 53870 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009694997864482577, + "loss": 0.0709, + "step": 53880 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009691229304323795, + "loss": 0.0742, + "step": 53890 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009687460744165013, + "loss": 0.0708, + "step": 53900 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009683692184006231, + "loss": 0.0711, + "step": 53910 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009679923623847449, + "loss": 0.068, + "step": 53920 + }, + { + "epoch": 1.35, + "learning_rate": 0.0009676155063688667, + "loss": 0.0715, + "step": 53930 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009672386503529885, + "loss": 0.073, + "step": 53940 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009668617943371103, + "loss": 0.0709, + "step": 53950 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009664849383212321, + "loss": 0.0699, + "step": 53960 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009661080823053539, + "loss": 0.0715, + "step": 53970 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009657312262894757, + "loss": 0.0722, + "step": 53980 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009653543702735975, + "loss": 0.0668, + "step": 53990 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009649775142577193, + "loss": 0.0688, + "step": 54000 + }, + { + "epoch": 1.36, + "eval_cer": 0.6656522331252974, + "eval_loss": 0.060397226363420486, + "eval_runtime": 90.8096, + "eval_samples_per_second": 110.11, + "eval_steps_per_second": 6.883, + "step": 54000 + }, + { + "epoch": 1.36, + "learning_rate": 0.000964600658241841, + "loss": 0.0686, + "step": 54010 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009642238022259629, + "loss": 0.0727, + "step": 54020 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009638469462100847, + "loss": 0.0683, + "step": 54030 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009634700901942066, + "loss": 0.0678, + "step": 54040 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009630932341783282, + "loss": 0.0718, + "step": 54050 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009627163781624502, + "loss": 0.0727, + "step": 54060 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009623395221465718, + "loss": 0.0712, + "step": 54070 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009619626661306936, + "loss": 0.0725, + "step": 54080 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009615858101148154, + "loss": 0.0715, + "step": 54090 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009612089540989372, + "loss": 0.0701, + "step": 54100 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009608320980830591, + "loss": 0.0725, + "step": 54110 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009604552420671808, + "loss": 0.075, + "step": 54120 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009600783860513027, + "loss": 0.0692, + "step": 54130 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009597015300354244, + "loss": 0.0724, + "step": 54140 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009593246740195463, + "loss": 0.067, + "step": 54150 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009589478180036681, + "loss": 0.0737, + "step": 54160 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009585709619877899, + "loss": 0.0668, + "step": 54170 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009581941059719117, + "loss": 0.0715, + "step": 54180 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009578172499560335, + "loss": 0.0717, + "step": 54190 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009574403939401553, + "loss": 0.0748, + "step": 54200 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009570635379242771, + "loss": 0.0702, + "step": 54210 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009566866819083989, + "loss": 0.0734, + "step": 54220 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009563098258925207, + "loss": 0.0703, + "step": 54230 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009559329698766425, + "loss": 0.0712, + "step": 54240 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009555561138607643, + "loss": 0.0733, + "step": 54250 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009551792578448861, + "loss": 0.0693, + "step": 54260 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009548024018290079, + "loss": 0.0699, + "step": 54270 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009544255458131297, + "loss": 0.0729, + "step": 54280 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009540486897972514, + "loss": 0.0699, + "step": 54290 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009536718337813733, + "loss": 0.0693, + "step": 54300 + }, + { + "epoch": 1.36, + "learning_rate": 0.000953294977765495, + "loss": 0.0734, + "step": 54310 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009529181217496169, + "loss": 0.0684, + "step": 54320 + }, + { + "epoch": 1.36, + "learning_rate": 0.0009525412657337386, + "loss": 0.0711, + "step": 54330 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009521644097178605, + "loss": 0.0725, + "step": 54340 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009517875537019822, + "loss": 0.074, + "step": 54350 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009514106976861041, + "loss": 0.0689, + "step": 54360 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009510338416702258, + "loss": 0.0725, + "step": 54370 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009506569856543477, + "loss": 0.0691, + "step": 54380 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009502801296384694, + "loss": 0.0711, + "step": 54390 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009499032736225914, + "loss": 0.0654, + "step": 54400 + }, + { + "epoch": 1.37, + "learning_rate": 0.000949526417606713, + "loss": 0.0706, + "step": 54410 + }, + { + "epoch": 1.37, + "learning_rate": 0.000949149561590835, + "loss": 0.0704, + "step": 54420 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009487727055749566, + "loss": 0.0744, + "step": 54430 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009483958495590786, + "loss": 0.0717, + "step": 54440 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009480189935432003, + "loss": 0.0697, + "step": 54450 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009476421375273222, + "loss": 0.0716, + "step": 54460 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009472652815114439, + "loss": 0.069, + "step": 54470 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009468884254955658, + "loss": 0.0711, + "step": 54480 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009465115694796875, + "loss": 0.0708, + "step": 54490 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009461347134638094, + "loss": 0.0694, + "step": 54500 + }, + { + "epoch": 1.37, + "eval_cer": 0.6656171033110091, + "eval_loss": 0.06041229888796806, + "eval_runtime": 90.7001, + "eval_samples_per_second": 110.242, + "eval_steps_per_second": 6.891, + "step": 54500 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009457578574479311, + "loss": 0.0685, + "step": 54510 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009453810014320528, + "loss": 0.071, + "step": 54520 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009450041454161747, + "loss": 0.0692, + "step": 54530 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009446272894002964, + "loss": 0.0709, + "step": 54540 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009442504333844183, + "loss": 0.077, + "step": 54550 + }, + { + "epoch": 1.37, + "learning_rate": 0.00094387357736854, + "loss": 0.0719, + "step": 54560 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009434967213526619, + "loss": 0.0736, + "step": 54570 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009431198653367836, + "loss": 0.0701, + "step": 54580 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009427430093209055, + "loss": 0.0678, + "step": 54590 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009423661533050272, + "loss": 0.072, + "step": 54600 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009419892972891491, + "loss": 0.0728, + "step": 54610 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009416124412732708, + "loss": 0.0688, + "step": 54620 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009412355852573927, + "loss": 0.0728, + "step": 54630 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009408587292415144, + "loss": 0.0724, + "step": 54640 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009404818732256363, + "loss": 0.0699, + "step": 54650 + }, + { + "epoch": 1.37, + "learning_rate": 0.000940105017209758, + "loss": 0.0712, + "step": 54660 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009397281611938799, + "loss": 0.0722, + "step": 54670 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009393513051780016, + "loss": 0.0721, + "step": 54680 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009389744491621236, + "loss": 0.0688, + "step": 54690 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009385975931462452, + "loss": 0.0696, + "step": 54700 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009382207371303672, + "loss": 0.0704, + "step": 54710 + }, + { + "epoch": 1.37, + "learning_rate": 0.0009378438811144888, + "loss": 0.0704, + "step": 54720 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009374670250986108, + "loss": 0.0748, + "step": 54730 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009370901690827325, + "loss": 0.067, + "step": 54740 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009367133130668542, + "loss": 0.0719, + "step": 54750 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009363364570509761, + "loss": 0.0705, + "step": 54760 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009359596010350978, + "loss": 0.0705, + "step": 54770 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009355827450192197, + "loss": 0.0705, + "step": 54780 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009352058890033414, + "loss": 0.0725, + "step": 54790 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009348290329874633, + "loss": 0.0699, + "step": 54800 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009344521769715851, + "loss": 0.0701, + "step": 54810 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009340753209557069, + "loss": 0.0711, + "step": 54820 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009336984649398287, + "loss": 0.0724, + "step": 54830 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009333216089239505, + "loss": 0.0732, + "step": 54840 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009329447529080723, + "loss": 0.0687, + "step": 54850 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009325678968921941, + "loss": 0.0717, + "step": 54860 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009321910408763159, + "loss": 0.0716, + "step": 54870 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009318141848604377, + "loss": 0.0712, + "step": 54880 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009314373288445595, + "loss": 0.0679, + "step": 54890 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009310604728286813, + "loss": 0.0662, + "step": 54900 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009306836168128031, + "loss": 0.0686, + "step": 54910 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009303067607969249, + "loss": 0.0679, + "step": 54920 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009299299047810467, + "loss": 0.0724, + "step": 54930 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009295530487651685, + "loss": 0.0689, + "step": 54940 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009291761927492903, + "loss": 0.0714, + "step": 54950 + }, + { + "epoch": 1.38, + "learning_rate": 0.000928799336733412, + "loss": 0.0718, + "step": 54960 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009284224807175338, + "loss": 0.0682, + "step": 54970 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009280456247016556, + "loss": 0.0673, + "step": 54980 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009276687686857774, + "loss": 0.0715, + "step": 54990 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009272919126698992, + "loss": 0.0736, + "step": 55000 + }, + { + "epoch": 1.38, + "eval_cer": 0.6655213384747982, + "eval_loss": 0.059801023453474045, + "eval_runtime": 90.8051, + "eval_samples_per_second": 110.115, + "eval_steps_per_second": 6.883, + "step": 55000 + }, + { + "epoch": 1.38, + "learning_rate": 0.000926915056654021, + "loss": 0.074, + "step": 55010 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009265382006381428, + "loss": 0.0714, + "step": 55020 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009261613446222648, + "loss": 0.0728, + "step": 55030 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009257844886063864, + "loss": 0.0733, + "step": 55040 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009254076325905083, + "loss": 0.0697, + "step": 55050 + }, + { + "epoch": 1.38, + "learning_rate": 0.00092503077657463, + "loss": 0.0711, + "step": 55060 + }, + { + "epoch": 1.38, + "learning_rate": 0.000924653920558752, + "loss": 0.0707, + "step": 55070 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009242770645428736, + "loss": 0.0692, + "step": 55080 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009239002085269955, + "loss": 0.071, + "step": 55090 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009235233525111173, + "loss": 0.0689, + "step": 55100 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009231464964952391, + "loss": 0.0699, + "step": 55110 + }, + { + "epoch": 1.38, + "learning_rate": 0.0009227696404793609, + "loss": 0.0722, + "step": 55120 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009223927844634827, + "loss": 0.0718, + "step": 55130 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009220159284476045, + "loss": 0.069, + "step": 55140 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009216390724317263, + "loss": 0.0707, + "step": 55150 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009212622164158481, + "loss": 0.0696, + "step": 55160 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009208853603999699, + "loss": 0.0671, + "step": 55170 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009205085043840917, + "loss": 0.0723, + "step": 55180 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009201316483682134, + "loss": 0.0706, + "step": 55190 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009197547923523353, + "loss": 0.0695, + "step": 55200 + }, + { + "epoch": 1.39, + "learning_rate": 0.000919377936336457, + "loss": 0.0707, + "step": 55210 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009190010803205789, + "loss": 0.0723, + "step": 55220 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009186242243047006, + "loss": 0.0666, + "step": 55230 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009182473682888225, + "loss": 0.0687, + "step": 55240 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009178705122729442, + "loss": 0.0699, + "step": 55250 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009174936562570661, + "loss": 0.0686, + "step": 55260 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009171168002411878, + "loss": 0.0704, + "step": 55270 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009167399442253097, + "loss": 0.0706, + "step": 55280 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009163630882094314, + "loss": 0.0693, + "step": 55290 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009159862321935533, + "loss": 0.0702, + "step": 55300 + }, + { + "epoch": 1.39, + "learning_rate": 0.000915609376177675, + "loss": 0.0685, + "step": 55310 + }, + { + "epoch": 1.39, + "learning_rate": 0.000915232520161797, + "loss": 0.0718, + "step": 55320 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009148556641459186, + "loss": 0.0691, + "step": 55330 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009144788081300406, + "loss": 0.0696, + "step": 55340 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009141019521141622, + "loss": 0.0705, + "step": 55350 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009137250960982842, + "loss": 0.0708, + "step": 55360 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009133482400824058, + "loss": 0.0705, + "step": 55370 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009129713840665278, + "loss": 0.0694, + "step": 55380 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009125945280506495, + "loss": 0.0729, + "step": 55390 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009122176720347711, + "loss": 0.0701, + "step": 55400 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009118408160188931, + "loss": 0.0708, + "step": 55410 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009114639600030147, + "loss": 0.0693, + "step": 55420 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009110871039871367, + "loss": 0.0724, + "step": 55430 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009107102479712584, + "loss": 0.072, + "step": 55440 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009103333919553803, + "loss": 0.0703, + "step": 55450 + }, + { + "epoch": 1.39, + "learning_rate": 0.000909956535939502, + "loss": 0.0678, + "step": 55460 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009095796799236239, + "loss": 0.0695, + "step": 55470 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009092028239077456, + "loss": 0.0668, + "step": 55480 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009088259678918675, + "loss": 0.0688, + "step": 55490 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009084491118759892, + "loss": 0.0674, + "step": 55500 + }, + { + "epoch": 1.39, + "eval_cer": 0.665315371892395, + "eval_loss": 0.059912025928497314, + "eval_runtime": 90.584, + "eval_samples_per_second": 110.384, + "eval_steps_per_second": 6.9, + "step": 55500 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009080722558601111, + "loss": 0.0715, + "step": 55510 + }, + { + "epoch": 1.39, + "learning_rate": 0.0009076953998442328, + "loss": 0.0731, + "step": 55520 + }, + { + "epoch": 1.4, + "learning_rate": 0.0009073185438283547, + "loss": 0.0715, + "step": 55530 + }, + { + "epoch": 1.4, + "learning_rate": 0.0009069416878124764, + "loss": 0.07, + "step": 55540 + }, + { + "epoch": 1.4, + "learning_rate": 0.0009065648317965983, + "loss": 0.0687, + "step": 55550 + }, + { + "epoch": 1.4, + "learning_rate": 0.00090618797578072, + "loss": 0.0687, + "step": 55560 + }, + { + "epoch": 1.4, + "learning_rate": 0.0009058111197648419, + "loss": 0.0694, + "step": 55570 + }, + { + "epoch": 1.4, + "learning_rate": 0.0009054342637489636, + "loss": 0.0672, + "step": 55580 + }, + { + "epoch": 1.4, + "learning_rate": 0.0009050574077330855, + "loss": 0.0667, + "step": 55590 + }, + { + "epoch": 1.4, + "learning_rate": 0.0009046805517172072, + "loss": 0.072, + "step": 55600 + }, + { + "epoch": 1.4, + "learning_rate": 0.0009043036957013292, + "loss": 0.0723, + "step": 55610 + }, + { + "epoch": 1.4, + "learning_rate": 0.0009039268396854508, + "loss": 0.075, + "step": 55620 + }, + { + "epoch": 1.4, + "learning_rate": 0.0009035499836695726, + "loss": 0.069, + "step": 55630 + }, + { + "epoch": 1.4, + "learning_rate": 0.0009031731276536944, + "loss": 0.0707, + "step": 55640 + }, + { + "epoch": 1.4, + "learning_rate": 0.0009027962716378162, + "loss": 0.0713, + "step": 55650 + }, + { + "epoch": 1.4, + "learning_rate": 0.0009024194156219381, + "loss": 0.0738, + "step": 55660 + }, + { + "epoch": 1.4, + "learning_rate": 0.0009020425596060598, + "loss": 0.0692, + "step": 55670 + }, + { + "epoch": 1.4, + "learning_rate": 0.0009016657035901817, + "loss": 0.0703, + "step": 55680 + }, + { + "epoch": 1.4, + "learning_rate": 0.0009012888475743034, + "loss": 0.0706, + "step": 55690 + }, + { + "epoch": 1.4, + "learning_rate": 0.0009009119915584253, + "loss": 0.0711, + "step": 55700 + }, + { + "epoch": 1.4, + "learning_rate": 0.000900535135542547, + "loss": 0.0732, + "step": 55710 + }, + { + "epoch": 1.4, + "learning_rate": 0.0009001582795266689, + "loss": 0.0699, + "step": 55720 + }, + { + "epoch": 1.4, + "learning_rate": 0.0008997814235107907, + "loss": 0.0732, + "step": 55730 + }, + { + "epoch": 1.4, + "learning_rate": 0.0008994045674949125, + "loss": 0.0711, + "step": 55740 + }, + { + "epoch": 1.4, + "learning_rate": 0.0008990277114790343, + "loss": 0.069, + "step": 55750 + }, + { + "epoch": 1.4, + "learning_rate": 0.0008986508554631561, + "loss": 0.0747, + "step": 55760 + }, + { + "epoch": 1.4, + "learning_rate": 0.0008982739994472779, + "loss": 0.0718, + "step": 55770 + }, + { + "epoch": 1.4, + "learning_rate": 0.0008978971434313997, + "loss": 0.0675, + "step": 55780 + }, + { + "epoch": 1.4, + "learning_rate": 0.0008975202874155215, + "loss": 0.0723, + "step": 55790 + }, + { + "epoch": 1.4, + "learning_rate": 0.0008971434313996433, + "loss": 0.0714, + "step": 55800 + }, + { + "epoch": 1.4, + "learning_rate": 0.0008967665753837651, + "loss": 0.0693, + "step": 55810 + }, + { + "epoch": 1.4, + "learning_rate": 0.0008963897193678869, + "loss": 0.069, + "step": 55820 + }, + { + "epoch": 1.4, + "learning_rate": 0.0008960128633520087, + "loss": 0.0718, + "step": 55830 + }, + { + "epoch": 1.4, + "learning_rate": 0.0008956360073361305, + "loss": 0.0678, + "step": 55840 + }, + { + "epoch": 1.4, + "learning_rate": 0.0008952591513202523, + "loss": 0.0672, + "step": 55850 + }, + { + "epoch": 1.4, + "learning_rate": 0.000894882295304374, + "loss": 0.0708, + "step": 55860 + }, + { + "epoch": 1.4, + "learning_rate": 0.0008945054392884959, + "loss": 0.0695, + "step": 55870 + }, + { + "epoch": 1.4, + "learning_rate": 0.0008941285832726176, + "loss": 0.0705, + "step": 55880 + }, + { + "epoch": 1.4, + "learning_rate": 0.0008937517272567395, + "loss": 0.0687, + "step": 55890 + }, + { + "epoch": 1.4, + "learning_rate": 0.0008933748712408612, + "loss": 0.0712, + "step": 55900 + }, + { + "epoch": 1.4, + "learning_rate": 0.000892998015224983, + "loss": 0.0717, + "step": 55910 + }, + { + "epoch": 1.4, + "learning_rate": 0.0008926211592091048, + "loss": 0.0693, + "step": 55920 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008922443031932266, + "loss": 0.069, + "step": 55930 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008918674471773484, + "loss": 0.0694, + "step": 55940 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008914905911614704, + "loss": 0.0716, + "step": 55950 + }, + { + "epoch": 1.41, + "learning_rate": 0.000891113735145592, + "loss": 0.0703, + "step": 55960 + }, + { + "epoch": 1.41, + "learning_rate": 0.000890736879129714, + "loss": 0.0703, + "step": 55970 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008903600231138356, + "loss": 0.0733, + "step": 55980 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008899831670979575, + "loss": 0.0722, + "step": 55990 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008896063110820792, + "loss": 0.0681, + "step": 56000 + }, + { + "epoch": 1.41, + "eval_cer": 0.6655227821657964, + "eval_loss": 0.059231605380773544, + "eval_runtime": 90.4542, + "eval_samples_per_second": 110.542, + "eval_steps_per_second": 6.91, + "step": 56000 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008892294550662011, + "loss": 0.0705, + "step": 56010 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008888525990503229, + "loss": 0.0708, + "step": 56020 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008884757430344447, + "loss": 0.0687, + "step": 56030 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008880988870185665, + "loss": 0.0679, + "step": 56040 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008877220310026883, + "loss": 0.0681, + "step": 56050 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008873451749868101, + "loss": 0.0703, + "step": 56060 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008869683189709317, + "loss": 0.0706, + "step": 56070 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008865914629550537, + "loss": 0.0731, + "step": 56080 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008862146069391754, + "loss": 0.0723, + "step": 56090 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008858377509232973, + "loss": 0.0696, + "step": 56100 + }, + { + "epoch": 1.41, + "learning_rate": 0.000885460894907419, + "loss": 0.0691, + "step": 56110 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008850840388915409, + "loss": 0.0697, + "step": 56120 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008847071828756626, + "loss": 0.0686, + "step": 56130 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008843303268597845, + "loss": 0.0689, + "step": 56140 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008839534708439062, + "loss": 0.0694, + "step": 56150 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008835766148280281, + "loss": 0.0686, + "step": 56160 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008831997588121498, + "loss": 0.0716, + "step": 56170 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008828229027962717, + "loss": 0.0738, + "step": 56180 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008824460467803934, + "loss": 0.0708, + "step": 56190 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008820691907645153, + "loss": 0.0705, + "step": 56200 + }, + { + "epoch": 1.41, + "learning_rate": 0.000881692334748637, + "loss": 0.0699, + "step": 56210 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008813154787327589, + "loss": 0.0711, + "step": 56220 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008809386227168806, + "loss": 0.0703, + "step": 56230 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008805617667010026, + "loss": 0.0686, + "step": 56240 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008801849106851242, + "loss": 0.0713, + "step": 56250 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008798080546692462, + "loss": 0.0688, + "step": 56260 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008794311986533678, + "loss": 0.0703, + "step": 56270 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008790543426374898, + "loss": 0.0685, + "step": 56280 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008786774866216114, + "loss": 0.0714, + "step": 56290 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008783006306057331, + "loss": 0.0715, + "step": 56300 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008779237745898551, + "loss": 0.0664, + "step": 56310 + }, + { + "epoch": 1.41, + "learning_rate": 0.0008775469185739767, + "loss": 0.0706, + "step": 56320 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008771700625580987, + "loss": 0.0698, + "step": 56330 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008767932065422203, + "loss": 0.0704, + "step": 56340 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008764163505263423, + "loss": 0.0672, + "step": 56350 + }, + { + "epoch": 1.42, + "learning_rate": 0.000876039494510464, + "loss": 0.0731, + "step": 56360 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008756626384945859, + "loss": 0.0681, + "step": 56370 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008752857824787076, + "loss": 0.0683, + "step": 56380 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008749089264628295, + "loss": 0.0711, + "step": 56390 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008745320704469512, + "loss": 0.0711, + "step": 56400 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008741552144310731, + "loss": 0.0723, + "step": 56410 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008737783584151948, + "loss": 0.0676, + "step": 56420 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008734015023993167, + "loss": 0.0705, + "step": 56430 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008730246463834384, + "loss": 0.0724, + "step": 56440 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008726477903675603, + "loss": 0.0676, + "step": 56450 + }, + { + "epoch": 1.42, + "learning_rate": 0.000872270934351682, + "loss": 0.0701, + "step": 56460 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008718940783358039, + "loss": 0.0708, + "step": 56470 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008715172223199256, + "loss": 0.0662, + "step": 56480 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008711403663040475, + "loss": 0.0735, + "step": 56490 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008707635102881692, + "loss": 0.07, + "step": 56500 + }, + { + "epoch": 1.42, + "eval_cer": 0.6653206654260548, + "eval_loss": 0.05919070169329643, + "eval_runtime": 90.4988, + "eval_samples_per_second": 110.488, + "eval_steps_per_second": 6.906, + "step": 56500 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008703866542722911, + "loss": 0.071, + "step": 56510 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008700097982564128, + "loss": 0.0711, + "step": 56520 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008696329422405346, + "loss": 0.0723, + "step": 56530 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008692560862246564, + "loss": 0.0702, + "step": 56540 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008688792302087782, + "loss": 0.0691, + "step": 56550 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008685023741929, + "loss": 0.0707, + "step": 56560 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008681255181770218, + "loss": 0.0702, + "step": 56570 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008677486621611436, + "loss": 0.072, + "step": 56580 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008673718061452654, + "loss": 0.0715, + "step": 56590 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008669949501293873, + "loss": 0.0694, + "step": 56600 + }, + { + "epoch": 1.42, + "learning_rate": 0.000866618094113509, + "loss": 0.0682, + "step": 56610 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008662412380976309, + "loss": 0.0685, + "step": 56620 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008658643820817526, + "loss": 0.068, + "step": 56630 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008654875260658745, + "loss": 0.066, + "step": 56640 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008651106700499963, + "loss": 0.0713, + "step": 56650 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008647338140341181, + "loss": 0.0654, + "step": 56660 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008643569580182399, + "loss": 0.0682, + "step": 56670 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008639801020023617, + "loss": 0.0673, + "step": 56680 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008636032459864835, + "loss": 0.0668, + "step": 56690 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008632263899706053, + "loss": 0.0708, + "step": 56700 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008628495339547271, + "loss": 0.0666, + "step": 56710 + }, + { + "epoch": 1.42, + "learning_rate": 0.0008624726779388489, + "loss": 0.0719, + "step": 56720 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008620958219229707, + "loss": 0.0704, + "step": 56730 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008617189659070924, + "loss": 0.0675, + "step": 56740 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008613421098912143, + "loss": 0.0689, + "step": 56750 + }, + { + "epoch": 1.43, + "learning_rate": 0.000860965253875336, + "loss": 0.0683, + "step": 56760 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008605883978594579, + "loss": 0.0668, + "step": 56770 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008602115418435796, + "loss": 0.0726, + "step": 56780 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008598346858277015, + "loss": 0.0677, + "step": 56790 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008594578298118232, + "loss": 0.0704, + "step": 56800 + }, + { + "epoch": 1.43, + "learning_rate": 0.000859080973795945, + "loss": 0.0705, + "step": 56810 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008587041177800668, + "loss": 0.0696, + "step": 56820 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008583272617641887, + "loss": 0.07, + "step": 56830 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008579504057483104, + "loss": 0.0723, + "step": 56840 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008575735497324322, + "loss": 0.0681, + "step": 56850 + }, + { + "epoch": 1.43, + "learning_rate": 0.000857196693716554, + "loss": 0.0662, + "step": 56860 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008568198377006758, + "loss": 0.0682, + "step": 56870 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008564429816847976, + "loss": 0.0712, + "step": 56880 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008560661256689196, + "loss": 0.0707, + "step": 56890 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008556892696530412, + "loss": 0.0727, + "step": 56900 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008553124136371631, + "loss": 0.0705, + "step": 56910 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008549355576212848, + "loss": 0.068, + "step": 56920 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008545587016054067, + "loss": 0.0701, + "step": 56930 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008541818455895285, + "loss": 0.0712, + "step": 56940 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008538049895736503, + "loss": 0.0691, + "step": 56950 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008534281335577721, + "loss": 0.0715, + "step": 56960 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008530512775418937, + "loss": 0.0693, + "step": 56970 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008526744215260157, + "loss": 0.0713, + "step": 56980 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008522975655101373, + "loss": 0.0708, + "step": 56990 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008519207094942593, + "loss": 0.0704, + "step": 57000 + }, + { + "epoch": 1.43, + "eval_cer": 0.6655526184464249, + "eval_loss": 0.05909842625260353, + "eval_runtime": 90.4968, + "eval_samples_per_second": 110.49, + "eval_steps_per_second": 6.906, + "step": 57000 + }, + { + "epoch": 1.43, + "learning_rate": 0.000851543853478381, + "loss": 0.0703, + "step": 57010 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008511669974625029, + "loss": 0.0675, + "step": 57020 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008507901414466246, + "loss": 0.0671, + "step": 57030 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008504132854307465, + "loss": 0.0711, + "step": 57040 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008500364294148682, + "loss": 0.0675, + "step": 57050 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008496595733989901, + "loss": 0.0713, + "step": 57060 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008492827173831118, + "loss": 0.0689, + "step": 57070 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008489058613672337, + "loss": 0.0674, + "step": 57080 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008485290053513554, + "loss": 0.0687, + "step": 57090 + }, + { + "epoch": 1.43, + "learning_rate": 0.0008481521493354773, + "loss": 0.0704, + "step": 57100 + }, + { + "epoch": 1.43, + "learning_rate": 0.000847775293319599, + "loss": 0.0711, + "step": 57110 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008473984373037209, + "loss": 0.0692, + "step": 57120 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008470215812878426, + "loss": 0.0673, + "step": 57130 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008466447252719645, + "loss": 0.0716, + "step": 57140 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008462678692560862, + "loss": 0.0707, + "step": 57150 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008458910132402081, + "loss": 0.0698, + "step": 57160 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008455141572243298, + "loss": 0.069, + "step": 57170 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008451373012084516, + "loss": 0.0683, + "step": 57180 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008447604451925734, + "loss": 0.0663, + "step": 57190 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008443835891766952, + "loss": 0.0678, + "step": 57200 + }, + { + "epoch": 1.44, + "learning_rate": 0.000844006733160817, + "loss": 0.0642, + "step": 57210 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008436298771449388, + "loss": 0.068, + "step": 57220 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008432530211290607, + "loss": 0.0674, + "step": 57230 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008428761651131823, + "loss": 0.0709, + "step": 57240 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008424993090973043, + "loss": 0.071, + "step": 57250 + }, + { + "epoch": 1.44, + "learning_rate": 0.000842122453081426, + "loss": 0.0688, + "step": 57260 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008417455970655479, + "loss": 0.0658, + "step": 57270 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008413687410496695, + "loss": 0.0731, + "step": 57280 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008409918850337915, + "loss": 0.0689, + "step": 57290 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008406150290179132, + "loss": 0.0702, + "step": 57300 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008402381730020351, + "loss": 0.0701, + "step": 57310 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008398613169861568, + "loss": 0.0686, + "step": 57320 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008394844609702787, + "loss": 0.0696, + "step": 57330 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008391076049544004, + "loss": 0.071, + "step": 57340 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008387307489385223, + "loss": 0.0677, + "step": 57350 + }, + { + "epoch": 1.44, + "learning_rate": 0.000838353892922644, + "loss": 0.0688, + "step": 57360 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008379770369067659, + "loss": 0.0669, + "step": 57370 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008376001808908876, + "loss": 0.0696, + "step": 57380 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008372233248750095, + "loss": 0.0704, + "step": 57390 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008368464688591312, + "loss": 0.0708, + "step": 57400 + }, + { + "epoch": 1.44, + "learning_rate": 0.000836469612843253, + "loss": 0.0712, + "step": 57410 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008360927568273748, + "loss": 0.0688, + "step": 57420 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008357159008114966, + "loss": 0.0688, + "step": 57430 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008353390447956184, + "loss": 0.0703, + "step": 57440 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008349621887797402, + "loss": 0.0675, + "step": 57450 + }, + { + "epoch": 1.44, + "learning_rate": 0.000834585332763862, + "loss": 0.0696, + "step": 57460 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008342084767479838, + "loss": 0.0662, + "step": 57470 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008338316207321056, + "loss": 0.0691, + "step": 57480 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008334547647162274, + "loss": 0.071, + "step": 57490 + }, + { + "epoch": 1.44, + "learning_rate": 0.0008330779087003492, + "loss": 0.0719, + "step": 57500 + }, + { + "epoch": 1.44, + "eval_cer": 0.6653355835663691, + "eval_loss": 0.058829259127378464, + "eval_runtime": 90.5112, + "eval_samples_per_second": 110.473, + "eval_steps_per_second": 6.905, + "step": 57500 + }, + { + "epoch": 1.44, + "learning_rate": 0.000832701052684471, + "loss": 0.0701, + "step": 57510 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008323241966685929, + "loss": 0.0698, + "step": 57520 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008319473406527146, + "loss": 0.0723, + "step": 57530 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008315704846368365, + "loss": 0.0698, + "step": 57540 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008311936286209582, + "loss": 0.0693, + "step": 57550 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008308167726050801, + "loss": 0.0703, + "step": 57560 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008304399165892018, + "loss": 0.0689, + "step": 57570 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008300630605733237, + "loss": 0.0676, + "step": 57580 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008296862045574455, + "loss": 0.0668, + "step": 57590 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008293093485415673, + "loss": 0.0671, + "step": 57600 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008289324925256891, + "loss": 0.0717, + "step": 57610 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008285556365098109, + "loss": 0.0691, + "step": 57620 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008281787804939327, + "loss": 0.0706, + "step": 57630 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008278019244780544, + "loss": 0.0736, + "step": 57640 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008274250684621763, + "loss": 0.0663, + "step": 57650 + }, + { + "epoch": 1.45, + "learning_rate": 0.000827048212446298, + "loss": 0.0708, + "step": 57660 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008266713564304199, + "loss": 0.0745, + "step": 57670 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008262945004145416, + "loss": 0.0712, + "step": 57680 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008259176443986635, + "loss": 0.067, + "step": 57690 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008255407883827852, + "loss": 0.0707, + "step": 57700 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008251639323669071, + "loss": 0.0684, + "step": 57710 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008247870763510288, + "loss": 0.07, + "step": 57720 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008244102203351507, + "loss": 0.0695, + "step": 57730 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008240333643192724, + "loss": 0.0666, + "step": 57740 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008236565083033943, + "loss": 0.0733, + "step": 57750 + }, + { + "epoch": 1.45, + "learning_rate": 0.000823279652287516, + "loss": 0.0692, + "step": 57760 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008229027962716378, + "loss": 0.0668, + "step": 57770 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008225259402557596, + "loss": 0.0707, + "step": 57780 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008221490842398814, + "loss": 0.0703, + "step": 57790 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008217722282240032, + "loss": 0.0685, + "step": 57800 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008213953722081252, + "loss": 0.0707, + "step": 57810 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008210185161922468, + "loss": 0.0687, + "step": 57820 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008206416601763688, + "loss": 0.0694, + "step": 57830 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008202648041604904, + "loss": 0.0684, + "step": 57840 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008198879481446121, + "loss": 0.0704, + "step": 57850 + }, + { + "epoch": 1.45, + "learning_rate": 0.000819511092128734, + "loss": 0.068, + "step": 57860 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008191342361128557, + "loss": 0.0702, + "step": 57870 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008187573800969777, + "loss": 0.0674, + "step": 57880 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008183805240810993, + "loss": 0.0683, + "step": 57890 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008180036680652213, + "loss": 0.0692, + "step": 57900 + }, + { + "epoch": 1.45, + "learning_rate": 0.0008176268120493429, + "loss": 0.0696, + "step": 57910 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008172499560334649, + "loss": 0.0678, + "step": 57920 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008168731000175866, + "loss": 0.0715, + "step": 57930 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008164962440017085, + "loss": 0.0721, + "step": 57940 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008161193879858302, + "loss": 0.0677, + "step": 57950 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008157425319699521, + "loss": 0.0688, + "step": 57960 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008153656759540738, + "loss": 0.0709, + "step": 57970 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008149888199381957, + "loss": 0.0701, + "step": 57980 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008146119639223174, + "loss": 0.0693, + "step": 57990 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008142351079064393, + "loss": 0.0667, + "step": 58000 + }, + { + "epoch": 1.46, + "eval_cer": 0.6652869793027646, + "eval_loss": 0.058723725378513336, + "eval_runtime": 90.5517, + "eval_samples_per_second": 110.423, + "eval_steps_per_second": 6.902, + "step": 58000 + }, + { + "epoch": 1.46, + "learning_rate": 0.000813858251890561, + "loss": 0.0663, + "step": 58010 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008134813958746829, + "loss": 0.0664, + "step": 58020 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008131045398588046, + "loss": 0.0718, + "step": 58030 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008127276838429265, + "loss": 0.0731, + "step": 58040 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008123508278270482, + "loss": 0.0666, + "step": 58050 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008119739718111701, + "loss": 0.0696, + "step": 58060 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008115971157952918, + "loss": 0.0671, + "step": 58070 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008112202597794136, + "loss": 0.0664, + "step": 58080 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008108434037635354, + "loss": 0.0686, + "step": 58090 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008104665477476572, + "loss": 0.0685, + "step": 58100 + }, + { + "epoch": 1.46, + "learning_rate": 0.000810089691731779, + "loss": 0.071, + "step": 58110 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008097128357159008, + "loss": 0.0643, + "step": 58120 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008093359797000226, + "loss": 0.0684, + "step": 58130 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008089591236841444, + "loss": 0.0697, + "step": 58140 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008085822676682662, + "loss": 0.0708, + "step": 58150 + }, + { + "epoch": 1.46, + "learning_rate": 0.000808205411652388, + "loss": 0.0678, + "step": 58160 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008078285556365099, + "loss": 0.0682, + "step": 58170 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008074516996206315, + "loss": 0.0681, + "step": 58180 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008070748436047535, + "loss": 0.0668, + "step": 58190 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008066979875888751, + "loss": 0.07, + "step": 58200 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008063211315729971, + "loss": 0.0689, + "step": 58210 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008059442755571189, + "loss": 0.069, + "step": 58220 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008055674195412407, + "loss": 0.0717, + "step": 58230 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008051905635253624, + "loss": 0.0697, + "step": 58240 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008048137075094843, + "loss": 0.0678, + "step": 58250 + }, + { + "epoch": 1.46, + "learning_rate": 0.000804436851493606, + "loss": 0.0652, + "step": 58260 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008040599954777279, + "loss": 0.0689, + "step": 58270 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008036831394618496, + "loss": 0.0715, + "step": 58280 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008033062834459715, + "loss": 0.0672, + "step": 58290 + }, + { + "epoch": 1.46, + "learning_rate": 0.0008029294274300932, + "loss": 0.0701, + "step": 58300 + }, + { + "epoch": 1.46, + "learning_rate": 0.000802552571414215, + "loss": 0.0684, + "step": 58310 + }, + { + "epoch": 1.47, + "learning_rate": 0.0008021757153983368, + "loss": 0.0669, + "step": 58320 + }, + { + "epoch": 1.47, + "learning_rate": 0.0008017988593824586, + "loss": 0.0674, + "step": 58330 + }, + { + "epoch": 1.47, + "learning_rate": 0.0008014220033665804, + "loss": 0.0695, + "step": 58340 + }, + { + "epoch": 1.47, + "learning_rate": 0.0008010451473507022, + "loss": 0.066, + "step": 58350 + }, + { + "epoch": 1.47, + "learning_rate": 0.000800668291334824, + "loss": 0.0672, + "step": 58360 + }, + { + "epoch": 1.47, + "learning_rate": 0.0008002914353189458, + "loss": 0.0698, + "step": 58370 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007999145793030676, + "loss": 0.0669, + "step": 58380 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007995377232871894, + "loss": 0.0664, + "step": 58390 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007991608672713112, + "loss": 0.0687, + "step": 58400 + }, + { + "epoch": 1.47, + "learning_rate": 0.000798784011255433, + "loss": 0.0633, + "step": 58410 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007984071552395548, + "loss": 0.0722, + "step": 58420 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007980302992236766, + "loss": 0.0679, + "step": 58430 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007976534432077984, + "loss": 0.07, + "step": 58440 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007972765871919202, + "loss": 0.0702, + "step": 58450 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007968997311760421, + "loss": 0.0662, + "step": 58460 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007965228751601638, + "loss": 0.0692, + "step": 58470 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007961460191442857, + "loss": 0.0649, + "step": 58480 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007957691631284074, + "loss": 0.0691, + "step": 58490 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007953923071125293, + "loss": 0.0694, + "step": 58500 + }, + { + "epoch": 1.47, + "eval_cer": 0.6653269214203802, + "eval_loss": 0.05830288305878639, + "eval_runtime": 90.732, + "eval_samples_per_second": 110.204, + "eval_steps_per_second": 6.888, + "step": 58500 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007950154510966511, + "loss": 0.0678, + "step": 58510 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007946385950807727, + "loss": 0.0685, + "step": 58520 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007942617390648947, + "loss": 0.0665, + "step": 58530 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007938848830490163, + "loss": 0.0687, + "step": 58540 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007935080270331383, + "loss": 0.0717, + "step": 58550 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007931311710172599, + "loss": 0.0654, + "step": 58560 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007927543150013819, + "loss": 0.0671, + "step": 58570 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007923774589855036, + "loss": 0.0703, + "step": 58580 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007920006029696255, + "loss": 0.0691, + "step": 58590 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007916237469537472, + "loss": 0.0692, + "step": 58600 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007912468909378691, + "loss": 0.066, + "step": 58610 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007908700349219908, + "loss": 0.0667, + "step": 58620 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007904931789061127, + "loss": 0.0678, + "step": 58630 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007901163228902344, + "loss": 0.0698, + "step": 58640 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007897394668743563, + "loss": 0.0684, + "step": 58650 + }, + { + "epoch": 1.47, + "learning_rate": 0.000789362610858478, + "loss": 0.0677, + "step": 58660 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007889857548425999, + "loss": 0.0695, + "step": 58670 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007886088988267216, + "loss": 0.0644, + "step": 58680 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007882320428108435, + "loss": 0.066, + "step": 58690 + }, + { + "epoch": 1.47, + "learning_rate": 0.0007878551867949652, + "loss": 0.068, + "step": 58700 + }, + { + "epoch": 1.47, + "learning_rate": 0.000787478330779087, + "loss": 0.0684, + "step": 58710 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007871014747632088, + "loss": 0.0709, + "step": 58720 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007867246187473308, + "loss": 0.0706, + "step": 58730 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007863477627314524, + "loss": 0.0724, + "step": 58740 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007859709067155741, + "loss": 0.0707, + "step": 58750 + }, + { + "epoch": 1.48, + "learning_rate": 0.000785594050699696, + "loss": 0.0661, + "step": 58760 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007852171946838177, + "loss": 0.0663, + "step": 58770 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007848403386679396, + "loss": 0.0678, + "step": 58780 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007844634826520613, + "loss": 0.0678, + "step": 58790 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007840866266361833, + "loss": 0.0676, + "step": 58800 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007837097706203049, + "loss": 0.0677, + "step": 58810 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007833329146044269, + "loss": 0.0691, + "step": 58820 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007829560585885485, + "loss": 0.068, + "step": 58830 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007825792025726705, + "loss": 0.0702, + "step": 58840 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007822023465567921, + "loss": 0.0686, + "step": 58850 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007818254905409141, + "loss": 0.0674, + "step": 58860 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007814486345250358, + "loss": 0.0677, + "step": 58870 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007810717785091577, + "loss": 0.0682, + "step": 58880 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007806949224932794, + "loss": 0.0694, + "step": 58890 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007803180664774013, + "loss": 0.0678, + "step": 58900 + }, + { + "epoch": 1.48, + "learning_rate": 0.000779941210461523, + "loss": 0.0662, + "step": 58910 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007795643544456449, + "loss": 0.0691, + "step": 58920 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007791874984297666, + "loss": 0.069, + "step": 58930 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007788106424138885, + "loss": 0.0671, + "step": 58940 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007784337863980102, + "loss": 0.0676, + "step": 58950 + }, + { + "epoch": 1.48, + "learning_rate": 0.000778056930382132, + "loss": 0.0716, + "step": 58960 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007776800743662538, + "loss": 0.0661, + "step": 58970 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007773032183503756, + "loss": 0.0663, + "step": 58980 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007769263623344974, + "loss": 0.0721, + "step": 58990 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007765495063186192, + "loss": 0.0709, + "step": 59000 + }, + { + "epoch": 1.48, + "eval_cer": 0.6655189323231346, + "eval_loss": 0.05791353061795235, + "eval_runtime": 90.8528, + "eval_samples_per_second": 110.057, + "eval_steps_per_second": 6.879, + "step": 59000 + }, + { + "epoch": 1.48, + "learning_rate": 0.000776172650302741, + "loss": 0.067, + "step": 59010 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007757957942868628, + "loss": 0.0698, + "step": 59020 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007754189382709846, + "loss": 0.0648, + "step": 59030 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007750420822551064, + "loss": 0.072, + "step": 59040 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007746652262392282, + "loss": 0.0671, + "step": 59050 + }, + { + "epoch": 1.48, + "learning_rate": 0.00077428837022335, + "loss": 0.0685, + "step": 59060 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007739115142074718, + "loss": 0.0673, + "step": 59070 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007735346581915936, + "loss": 0.0664, + "step": 59080 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007731578021757155, + "loss": 0.0675, + "step": 59090 + }, + { + "epoch": 1.48, + "learning_rate": 0.0007727809461598371, + "loss": 0.0644, + "step": 59100 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007724040901439591, + "loss": 0.0687, + "step": 59110 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007720272341280807, + "loss": 0.0703, + "step": 59120 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007716503781122027, + "loss": 0.0687, + "step": 59130 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007712735220963245, + "loss": 0.0705, + "step": 59140 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007708966660804463, + "loss": 0.07, + "step": 59150 + }, + { + "epoch": 1.49, + "learning_rate": 0.000770519810064568, + "loss": 0.0704, + "step": 59160 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007701429540486899, + "loss": 0.0653, + "step": 59170 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007697660980328116, + "loss": 0.0672, + "step": 59180 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007693892420169333, + "loss": 0.0728, + "step": 59190 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007690123860010552, + "loss": 0.065, + "step": 59200 + }, + { + "epoch": 1.49, + "learning_rate": 0.000768635529985177, + "loss": 0.0676, + "step": 59210 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007682586739692988, + "loss": 0.0692, + "step": 59220 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007678818179534206, + "loss": 0.068, + "step": 59230 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007675049619375424, + "loss": 0.0699, + "step": 59240 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007671281059216642, + "loss": 0.0665, + "step": 59250 + }, + { + "epoch": 1.49, + "learning_rate": 0.000766751249905786, + "loss": 0.067, + "step": 59260 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007663743938899078, + "loss": 0.0695, + "step": 59270 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007659975378740296, + "loss": 0.0686, + "step": 59280 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007656206818581514, + "loss": 0.0672, + "step": 59290 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007652438258422732, + "loss": 0.0696, + "step": 59300 + }, + { + "epoch": 1.49, + "learning_rate": 0.000764866969826395, + "loss": 0.0683, + "step": 59310 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007644901138105168, + "loss": 0.0688, + "step": 59320 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007641132577946386, + "loss": 0.0678, + "step": 59330 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007637364017787604, + "loss": 0.0669, + "step": 59340 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007633595457628822, + "loss": 0.0649, + "step": 59350 + }, + { + "epoch": 1.49, + "learning_rate": 0.000762982689747004, + "loss": 0.0686, + "step": 59360 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007626058337311258, + "loss": 0.0664, + "step": 59370 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007622289777152477, + "loss": 0.0705, + "step": 59380 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007618521216993694, + "loss": 0.0707, + "step": 59390 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007614752656834913, + "loss": 0.0661, + "step": 59400 + }, + { + "epoch": 1.49, + "learning_rate": 0.000761098409667613, + "loss": 0.0675, + "step": 59410 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007607215536517347, + "loss": 0.0721, + "step": 59420 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007603446976358567, + "loss": 0.0701, + "step": 59430 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007599678416199783, + "loss": 0.0692, + "step": 59440 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007595909856041003, + "loss": 0.0692, + "step": 59450 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007592141295882219, + "loss": 0.0671, + "step": 59460 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007588372735723439, + "loss": 0.0707, + "step": 59470 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007584604175564655, + "loss": 0.0657, + "step": 59480 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007580835615405875, + "loss": 0.0668, + "step": 59490 + }, + { + "epoch": 1.49, + "learning_rate": 0.0007577067055247092, + "loss": 0.0661, + "step": 59500 + }, + { + "epoch": 1.49, + "eval_cer": 0.6654530037675522, + "eval_loss": 0.05784814804792404, + "eval_runtime": 90.4465, + "eval_samples_per_second": 110.552, + "eval_steps_per_second": 6.91, + "step": 59500 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007573298495088311, + "loss": 0.0689, + "step": 59510 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007569529934929528, + "loss": 0.0678, + "step": 59520 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007565761374770747, + "loss": 0.0683, + "step": 59530 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007561992814611964, + "loss": 0.0712, + "step": 59540 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007558224254453183, + "loss": 0.0658, + "step": 59550 + }, + { + "epoch": 1.5, + "learning_rate": 0.00075544556942944, + "loss": 0.0672, + "step": 59560 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007550687134135619, + "loss": 0.0662, + "step": 59570 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007546918573976836, + "loss": 0.0709, + "step": 59580 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007543150013818055, + "loss": 0.0666, + "step": 59590 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007539381453659272, + "loss": 0.0676, + "step": 59600 + }, + { + "epoch": 1.5, + "learning_rate": 0.000753561289350049, + "loss": 0.0709, + "step": 59610 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007531844333341708, + "loss": 0.0698, + "step": 59620 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007528075773182925, + "loss": 0.0671, + "step": 59630 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007524307213024144, + "loss": 0.0737, + "step": 59640 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007520538652865361, + "loss": 0.0681, + "step": 59650 + }, + { + "epoch": 1.5, + "learning_rate": 0.000751677009270658, + "loss": 0.0679, + "step": 59660 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007513001532547797, + "loss": 0.0661, + "step": 59670 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007509232972389016, + "loss": 0.0725, + "step": 59680 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007505464412230233, + "loss": 0.0681, + "step": 59690 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007501695852071452, + "loss": 0.0677, + "step": 59700 + }, + { + "epoch": 1.5, + "learning_rate": 0.000749792729191267, + "loss": 0.0694, + "step": 59710 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007494158731753889, + "loss": 0.0684, + "step": 59720 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007490390171595106, + "loss": 0.0678, + "step": 59730 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007486621611436324, + "loss": 0.0685, + "step": 59740 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007482853051277541, + "loss": 0.0681, + "step": 59750 + }, + { + "epoch": 1.5, + "learning_rate": 0.000747908449111876, + "loss": 0.0665, + "step": 59760 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007475315930959977, + "loss": 0.0667, + "step": 59770 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007471547370801196, + "loss": 0.0655, + "step": 59780 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007467778810642414, + "loss": 0.0664, + "step": 59790 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007464010250483632, + "loss": 0.0687, + "step": 59800 + }, + { + "epoch": 1.5, + "learning_rate": 0.000746024169032485, + "loss": 0.0664, + "step": 59810 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007456473130166068, + "loss": 0.068, + "step": 59820 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007452704570007286, + "loss": 0.0693, + "step": 59830 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007448936009848504, + "loss": 0.0672, + "step": 59840 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007445167449689722, + "loss": 0.0705, + "step": 59850 + }, + { + "epoch": 1.5, + "learning_rate": 0.000744139888953094, + "loss": 0.0661, + "step": 59860 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007437630329372158, + "loss": 0.0674, + "step": 59870 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007433861769213376, + "loss": 0.0716, + "step": 59880 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007430093209054594, + "loss": 0.0687, + "step": 59890 + }, + { + "epoch": 1.5, + "learning_rate": 0.0007426324648895813, + "loss": 0.0663, + "step": 59900 + }, + { + "epoch": 1.51, + "learning_rate": 0.000742255608873703, + "loss": 0.0694, + "step": 59910 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007418787528578249, + "loss": 0.0667, + "step": 59920 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007415018968419466, + "loss": 0.0679, + "step": 59930 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007411250408260685, + "loss": 0.0711, + "step": 59940 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007407481848101902, + "loss": 0.0689, + "step": 59950 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007403713287943121, + "loss": 0.0662, + "step": 59960 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007399944727784338, + "loss": 0.0675, + "step": 59970 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007396176167625556, + "loss": 0.0701, + "step": 59980 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007392407607466774, + "loss": 0.0718, + "step": 59990 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007388639047307992, + "loss": 0.0682, + "step": 60000 + }, + { + "epoch": 1.51, + "eval_cer": 0.6654611846832085, + "eval_loss": 0.05754994973540306, + "eval_runtime": 90.0145, + "eval_samples_per_second": 111.082, + "eval_steps_per_second": 6.943, + "step": 60000 + }, + { + "epoch": 1.51, + "learning_rate": 0.000738487048714921, + "loss": 0.0691, + "step": 60010 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007381101926990427, + "loss": 0.0659, + "step": 60020 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007377333366831646, + "loss": 0.0685, + "step": 60030 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007373564806672863, + "loss": 0.066, + "step": 60040 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007369796246514082, + "loss": 0.07, + "step": 60050 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007366027686355299, + "loss": 0.0656, + "step": 60060 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007362259126196518, + "loss": 0.0708, + "step": 60070 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007358490566037737, + "loss": 0.0699, + "step": 60080 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007354722005878954, + "loss": 0.0696, + "step": 60090 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007350953445720172, + "loss": 0.0668, + "step": 60100 + }, + { + "epoch": 1.51, + "learning_rate": 0.000734718488556139, + "loss": 0.0668, + "step": 60110 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007343416325402608, + "loss": 0.0692, + "step": 60120 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007339647765243826, + "loss": 0.0663, + "step": 60130 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007335879205085044, + "loss": 0.0665, + "step": 60140 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007332110644926262, + "loss": 0.0671, + "step": 60150 + }, + { + "epoch": 1.51, + "learning_rate": 0.000732834208476748, + "loss": 0.0675, + "step": 60160 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007324573524608698, + "loss": 0.0667, + "step": 60170 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007320804964449916, + "loss": 0.0687, + "step": 60180 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007317036404291134, + "loss": 0.0699, + "step": 60190 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007313267844132351, + "loss": 0.0704, + "step": 60200 + }, + { + "epoch": 1.51, + "learning_rate": 0.000730949928397357, + "loss": 0.0676, + "step": 60210 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007305730723814787, + "loss": 0.0685, + "step": 60220 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007301962163656006, + "loss": 0.0681, + "step": 60230 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007298193603497223, + "loss": 0.0703, + "step": 60240 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007294425043338442, + "loss": 0.068, + "step": 60250 + }, + { + "epoch": 1.51, + "learning_rate": 0.000729065648317966, + "loss": 0.067, + "step": 60260 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007286887923020878, + "loss": 0.0683, + "step": 60270 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007283119362862096, + "loss": 0.0679, + "step": 60280 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007279350802703314, + "loss": 0.0664, + "step": 60290 + }, + { + "epoch": 1.51, + "learning_rate": 0.0007275582242544532, + "loss": 0.0672, + "step": 60300 + }, + { + "epoch": 1.52, + "learning_rate": 0.000727181368238575, + "loss": 0.0662, + "step": 60310 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007268045122226968, + "loss": 0.0686, + "step": 60320 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007264276562068186, + "loss": 0.0696, + "step": 60330 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007260508001909404, + "loss": 0.0707, + "step": 60340 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007256739441750622, + "loss": 0.0688, + "step": 60350 + }, + { + "epoch": 1.52, + "learning_rate": 0.000725297088159184, + "loss": 0.0695, + "step": 60360 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007249202321433059, + "loss": 0.065, + "step": 60370 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007245433761274276, + "loss": 0.0668, + "step": 60380 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007241665201115495, + "loss": 0.0684, + "step": 60390 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007237896640956712, + "loss": 0.0677, + "step": 60400 + }, + { + "epoch": 1.52, + "learning_rate": 0.000723412808079793, + "loss": 0.0666, + "step": 60410 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007230359520639148, + "loss": 0.0679, + "step": 60420 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007226590960480366, + "loss": 0.0676, + "step": 60430 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007222822400321584, + "loss": 0.0691, + "step": 60440 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007219053840162802, + "loss": 0.0655, + "step": 60450 + }, + { + "epoch": 1.52, + "learning_rate": 0.000721528528000402, + "loss": 0.0656, + "step": 60460 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007211516719845238, + "loss": 0.068, + "step": 60470 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007207748159686456, + "loss": 0.069, + "step": 60480 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007203979599527673, + "loss": 0.0673, + "step": 60490 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007200211039368892, + "loss": 0.0668, + "step": 60500 + }, + { + "epoch": 1.52, + "eval_cer": 0.6654361607059072, + "eval_loss": 0.057778164744377136, + "eval_runtime": 90.8472, + "eval_samples_per_second": 110.064, + "eval_steps_per_second": 6.88, + "step": 60500 + }, + { + "epoch": 1.52, + "learning_rate": 0.000719644247921011, + "loss": 0.0698, + "step": 60510 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007192673919051328, + "loss": 0.0697, + "step": 60520 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007188905358892545, + "loss": 0.0695, + "step": 60530 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007185136798733764, + "loss": 0.0689, + "step": 60540 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007181368238574983, + "loss": 0.0695, + "step": 60550 + }, + { + "epoch": 1.52, + "learning_rate": 0.00071775996784162, + "loss": 0.0681, + "step": 60560 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007173831118257418, + "loss": 0.068, + "step": 60570 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007170062558098636, + "loss": 0.0631, + "step": 60580 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007166293997939854, + "loss": 0.0691, + "step": 60590 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007162525437781072, + "loss": 0.0687, + "step": 60600 + }, + { + "epoch": 1.52, + "learning_rate": 0.000715875687762229, + "loss": 0.067, + "step": 60610 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007154988317463508, + "loss": 0.0693, + "step": 60620 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007151219757304725, + "loss": 0.0688, + "step": 60630 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007147451197145944, + "loss": 0.0675, + "step": 60640 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007143682636987161, + "loss": 0.0664, + "step": 60650 + }, + { + "epoch": 1.52, + "learning_rate": 0.000713991407682838, + "loss": 0.0664, + "step": 60660 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007136145516669597, + "loss": 0.0685, + "step": 60670 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007132376956510816, + "loss": 0.0655, + "step": 60680 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007128608396352033, + "loss": 0.0665, + "step": 60690 + }, + { + "epoch": 1.52, + "learning_rate": 0.0007124839836193252, + "loss": 0.0638, + "step": 60700 + }, + { + "epoch": 1.53, + "learning_rate": 0.000712107127603447, + "loss": 0.0678, + "step": 60710 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007117302715875688, + "loss": 0.0653, + "step": 60720 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007113534155716906, + "loss": 0.067, + "step": 60730 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007109765595558124, + "loss": 0.0661, + "step": 60740 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007105997035399342, + "loss": 0.0675, + "step": 60750 + }, + { + "epoch": 1.53, + "learning_rate": 0.000710222847524056, + "loss": 0.0693, + "step": 60760 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007098459915081778, + "loss": 0.0674, + "step": 60770 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007094691354922996, + "loss": 0.0656, + "step": 60780 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007090922794764214, + "loss": 0.0652, + "step": 60790 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007087154234605432, + "loss": 0.0667, + "step": 60800 + }, + { + "epoch": 1.53, + "learning_rate": 0.000708338567444665, + "loss": 0.0663, + "step": 60810 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007079617114287869, + "loss": 0.0697, + "step": 60820 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007075848554129086, + "loss": 0.0671, + "step": 60830 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007072079993970305, + "loss": 0.0667, + "step": 60840 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007068311433811522, + "loss": 0.068, + "step": 60850 + }, + { + "epoch": 1.53, + "learning_rate": 0.000706454287365274, + "loss": 0.0701, + "step": 60860 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007060774313493957, + "loss": 0.0699, + "step": 60870 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007057005753335176, + "loss": 0.067, + "step": 60880 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007053237193176394, + "loss": 0.0658, + "step": 60890 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007049468633017612, + "loss": 0.0675, + "step": 60900 + }, + { + "epoch": 1.53, + "learning_rate": 0.000704570007285883, + "loss": 0.0681, + "step": 60910 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007041931512700048, + "loss": 0.0667, + "step": 60920 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007038162952541266, + "loss": 0.0652, + "step": 60930 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007034394392382484, + "loss": 0.068, + "step": 60940 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007030625832223702, + "loss": 0.0657, + "step": 60950 + }, + { + "epoch": 1.53, + "learning_rate": 0.000702685727206492, + "loss": 0.0681, + "step": 60960 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007023088711906138, + "loss": 0.0685, + "step": 60970 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007019320151747355, + "loss": 0.0691, + "step": 60980 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007015551591588574, + "loss": 0.0701, + "step": 60990 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007011783031429793, + "loss": 0.0684, + "step": 61000 + }, + { + "epoch": 1.53, + "eval_cer": 0.6652614740951306, + "eval_loss": 0.05754827708005905, + "eval_runtime": 90.703, + "eval_samples_per_second": 110.239, + "eval_steps_per_second": 6.891, + "step": 61000 + }, + { + "epoch": 1.53, + "learning_rate": 0.000700801447127101, + "loss": 0.0681, + "step": 61010 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007004245911112229, + "loss": 0.0694, + "step": 61020 + }, + { + "epoch": 1.53, + "learning_rate": 0.0007000477350953446, + "loss": 0.0651, + "step": 61030 + }, + { + "epoch": 1.53, + "learning_rate": 0.0006996708790794664, + "loss": 0.0684, + "step": 61040 + }, + { + "epoch": 1.53, + "learning_rate": 0.0006992940230635882, + "loss": 0.0679, + "step": 61050 + }, + { + "epoch": 1.53, + "learning_rate": 0.00069891716704771, + "loss": 0.0683, + "step": 61060 + }, + { + "epoch": 1.53, + "learning_rate": 0.0006985403110318318, + "loss": 0.0679, + "step": 61070 + }, + { + "epoch": 1.53, + "learning_rate": 0.0006981634550159535, + "loss": 0.0656, + "step": 61080 + }, + { + "epoch": 1.53, + "learning_rate": 0.0006977865990000754, + "loss": 0.065, + "step": 61090 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006974097429841971, + "loss": 0.0667, + "step": 61100 + }, + { + "epoch": 1.54, + "learning_rate": 0.000697032886968319, + "loss": 0.067, + "step": 61110 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006966560309524407, + "loss": 0.068, + "step": 61120 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006962791749365626, + "loss": 0.0671, + "step": 61130 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006959023189206843, + "loss": 0.0662, + "step": 61140 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006955254629048062, + "loss": 0.0676, + "step": 61150 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006951486068889279, + "loss": 0.0679, + "step": 61160 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006947717508730498, + "loss": 0.0686, + "step": 61170 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006943948948571716, + "loss": 0.0684, + "step": 61180 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006940180388412934, + "loss": 0.0653, + "step": 61190 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006936411828254152, + "loss": 0.0682, + "step": 61200 + }, + { + "epoch": 1.54, + "learning_rate": 0.000693264326809537, + "loss": 0.0668, + "step": 61210 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006928874707936588, + "loss": 0.0671, + "step": 61220 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006925106147777806, + "loss": 0.065, + "step": 61230 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006921337587619024, + "loss": 0.0694, + "step": 61240 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006917569027460242, + "loss": 0.0658, + "step": 61250 + }, + { + "epoch": 1.54, + "learning_rate": 0.000691380046730146, + "loss": 0.0692, + "step": 61260 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006910031907142678, + "loss": 0.066, + "step": 61270 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006906263346983896, + "loss": 0.0656, + "step": 61280 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006902494786825115, + "loss": 0.0684, + "step": 61290 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006898726226666331, + "loss": 0.0674, + "step": 61300 + }, + { + "epoch": 1.54, + "learning_rate": 0.000689495766650755, + "loss": 0.0688, + "step": 61310 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006891189106348767, + "loss": 0.0688, + "step": 61320 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006887420546189986, + "loss": 0.0672, + "step": 61330 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006883651986031203, + "loss": 0.065, + "step": 61340 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006879883425872422, + "loss": 0.0691, + "step": 61350 + }, + { + "epoch": 1.54, + "learning_rate": 0.000687611486571364, + "loss": 0.0709, + "step": 61360 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006872346305554858, + "loss": 0.0676, + "step": 61370 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006868577745396076, + "loss": 0.0668, + "step": 61380 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006864809185237294, + "loss": 0.069, + "step": 61390 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006861040625078512, + "loss": 0.064, + "step": 61400 + }, + { + "epoch": 1.54, + "learning_rate": 0.000685727206491973, + "loss": 0.0661, + "step": 61410 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006853503504760948, + "loss": 0.0712, + "step": 61420 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006849734944602165, + "loss": 0.0652, + "step": 61430 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006845966384443384, + "loss": 0.0686, + "step": 61440 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006842197824284601, + "loss": 0.0654, + "step": 61450 + }, + { + "epoch": 1.54, + "learning_rate": 0.000683842926412582, + "loss": 0.0674, + "step": 61460 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006834660703967039, + "loss": 0.0647, + "step": 61470 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006830892143808256, + "loss": 0.0708, + "step": 61480 + }, + { + "epoch": 1.54, + "learning_rate": 0.0006827123583649474, + "loss": 0.0674, + "step": 61490 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006823355023490692, + "loss": 0.0688, + "step": 61500 + }, + { + "epoch": 1.55, + "eval_cer": 0.6651676341802506, + "eval_loss": 0.057114891707897186, + "eval_runtime": 90.5132, + "eval_samples_per_second": 110.47, + "eval_steps_per_second": 6.905, + "step": 61500 + }, + { + "epoch": 1.55, + "learning_rate": 0.000681958646333191, + "loss": 0.0684, + "step": 61510 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006815817903173128, + "loss": 0.0659, + "step": 61520 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006812049343014345, + "loss": 0.0671, + "step": 61530 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006808280782855564, + "loss": 0.0678, + "step": 61540 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006804512222696781, + "loss": 0.0649, + "step": 61550 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006800743662538, + "loss": 0.065, + "step": 61560 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006796975102379217, + "loss": 0.0647, + "step": 61570 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006793206542220436, + "loss": 0.0667, + "step": 61580 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006789437982061653, + "loss": 0.0674, + "step": 61590 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006785669421902872, + "loss": 0.0648, + "step": 61600 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006781900861744089, + "loss": 0.0641, + "step": 61610 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006778132301585308, + "loss": 0.0651, + "step": 61620 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006774363741426525, + "loss": 0.0684, + "step": 61630 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006770595181267744, + "loss": 0.0655, + "step": 61640 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006766826621108962, + "loss": 0.0677, + "step": 61650 + }, + { + "epoch": 1.55, + "learning_rate": 0.000676305806095018, + "loss": 0.068, + "step": 61660 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006759289500791398, + "loss": 0.0647, + "step": 61670 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006755520940632616, + "loss": 0.0642, + "step": 61680 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006751752380473834, + "loss": 0.0663, + "step": 61690 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006747983820315052, + "loss": 0.0642, + "step": 61700 + }, + { + "epoch": 1.55, + "learning_rate": 0.000674421526015627, + "loss": 0.0679, + "step": 61710 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006740446699997488, + "loss": 0.0702, + "step": 61720 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006736678139838706, + "loss": 0.0678, + "step": 61730 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006732909579679924, + "loss": 0.0685, + "step": 61740 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006729141019521141, + "loss": 0.0663, + "step": 61750 + }, + { + "epoch": 1.55, + "learning_rate": 0.000672537245936236, + "loss": 0.0666, + "step": 61760 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006721603899203577, + "loss": 0.0691, + "step": 61770 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006717835339044796, + "loss": 0.066, + "step": 61780 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006714066778886013, + "loss": 0.0692, + "step": 61790 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006710298218727232, + "loss": 0.0679, + "step": 61800 + }, + { + "epoch": 1.55, + "learning_rate": 0.000670652965856845, + "loss": 0.066, + "step": 61810 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006702761098409668, + "loss": 0.0687, + "step": 61820 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006698992538250886, + "loss": 0.069, + "step": 61830 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006695223978092104, + "loss": 0.0663, + "step": 61840 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006691455417933322, + "loss": 0.067, + "step": 61850 + }, + { + "epoch": 1.55, + "learning_rate": 0.000668768685777454, + "loss": 0.0697, + "step": 61860 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006683918297615758, + "loss": 0.0657, + "step": 61870 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006680149737456976, + "loss": 0.0666, + "step": 61880 + }, + { + "epoch": 1.55, + "learning_rate": 0.0006676381177298194, + "loss": 0.0674, + "step": 61890 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006672612617139411, + "loss": 0.0653, + "step": 61900 + }, + { + "epoch": 1.56, + "learning_rate": 0.000666884405698063, + "loss": 0.0667, + "step": 61910 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006665075496821847, + "loss": 0.0651, + "step": 61920 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006661306936663066, + "loss": 0.0667, + "step": 61930 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006657538376504285, + "loss": 0.065, + "step": 61940 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006653769816345502, + "loss": 0.068, + "step": 61950 + }, + { + "epoch": 1.56, + "learning_rate": 0.000665000125618672, + "loss": 0.0639, + "step": 61960 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006646232696027937, + "loss": 0.0669, + "step": 61970 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006642464135869155, + "loss": 0.0688, + "step": 61980 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006638695575710374, + "loss": 0.0689, + "step": 61990 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006634927015551591, + "loss": 0.068, + "step": 62000 + }, + { + "epoch": 1.56, + "eval_cer": 0.6652715799321176, + "eval_loss": 0.057154275476932526, + "eval_runtime": 90.7336, + "eval_samples_per_second": 110.202, + "eval_steps_per_second": 6.888, + "step": 62000 + }, + { + "epoch": 1.56, + "learning_rate": 0.000663115845539281, + "loss": 0.0659, + "step": 62010 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006627389895234027, + "loss": 0.0678, + "step": 62020 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006623621335075246, + "loss": 0.0661, + "step": 62030 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006619852774916463, + "loss": 0.0668, + "step": 62040 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006616084214757682, + "loss": 0.0666, + "step": 62050 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006612315654598899, + "loss": 0.0656, + "step": 62060 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006608547094440118, + "loss": 0.0658, + "step": 62070 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006604778534281335, + "loss": 0.0661, + "step": 62080 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006601009974122554, + "loss": 0.0676, + "step": 62090 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006597241413963772, + "loss": 0.0702, + "step": 62100 + }, + { + "epoch": 1.56, + "learning_rate": 0.000659347285380499, + "loss": 0.0653, + "step": 62110 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006589704293646208, + "loss": 0.0682, + "step": 62120 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006585935733487426, + "loss": 0.0672, + "step": 62130 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006582167173328644, + "loss": 0.0708, + "step": 62140 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006578398613169862, + "loss": 0.0669, + "step": 62150 + }, + { + "epoch": 1.56, + "learning_rate": 0.000657463005301108, + "loss": 0.0646, + "step": 62160 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006570861492852298, + "loss": 0.0681, + "step": 62170 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006567092932693516, + "loss": 0.0662, + "step": 62180 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006563324372534734, + "loss": 0.0659, + "step": 62190 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006559555812375951, + "loss": 0.0683, + "step": 62200 + }, + { + "epoch": 1.56, + "learning_rate": 0.000655578725221717, + "loss": 0.0662, + "step": 62210 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006552018692058387, + "loss": 0.0671, + "step": 62220 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006548250131899606, + "loss": 0.0654, + "step": 62230 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006544481571740823, + "loss": 0.0672, + "step": 62240 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006540713011582042, + "loss": 0.0675, + "step": 62250 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006536944451423259, + "loss": 0.0648, + "step": 62260 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006533175891264478, + "loss": 0.0667, + "step": 62270 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006529407331105696, + "loss": 0.0675, + "step": 62280 + }, + { + "epoch": 1.56, + "learning_rate": 0.0006525638770946914, + "loss": 0.069, + "step": 62290 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006521870210788132, + "loss": 0.0685, + "step": 62300 + }, + { + "epoch": 1.57, + "learning_rate": 0.000651810165062935, + "loss": 0.0672, + "step": 62310 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006514333090470568, + "loss": 0.0685, + "step": 62320 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006510564530311786, + "loss": 0.0649, + "step": 62330 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006506795970153004, + "loss": 0.0662, + "step": 62340 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006503027409994221, + "loss": 0.0644, + "step": 62350 + }, + { + "epoch": 1.57, + "learning_rate": 0.000649925884983544, + "loss": 0.0676, + "step": 62360 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006495490289676657, + "loss": 0.0633, + "step": 62370 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006491721729517876, + "loss": 0.0665, + "step": 62380 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006487953169359095, + "loss": 0.0652, + "step": 62390 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006484184609200312, + "loss": 0.0693, + "step": 62400 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006480416049041529, + "loss": 0.0653, + "step": 62410 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006476647488882747, + "loss": 0.0638, + "step": 62420 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006472878928723965, + "loss": 0.0688, + "step": 62430 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006469110368565183, + "loss": 0.0649, + "step": 62440 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006465341808406401, + "loss": 0.0673, + "step": 62450 + }, + { + "epoch": 1.57, + "learning_rate": 0.000646157324824762, + "loss": 0.0677, + "step": 62460 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006457804688088837, + "loss": 0.0645, + "step": 62470 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006454036127930056, + "loss": 0.0678, + "step": 62480 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006450267567771273, + "loss": 0.0665, + "step": 62490 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006446499007612492, + "loss": 0.0694, + "step": 62500 + }, + { + "epoch": 1.57, + "eval_cer": 0.6654116179589386, + "eval_loss": 0.056619539856910706, + "eval_runtime": 90.723, + "eval_samples_per_second": 110.215, + "eval_steps_per_second": 6.889, + "step": 62500 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006442730447453709, + "loss": 0.0661, + "step": 62510 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006438961887294928, + "loss": 0.0666, + "step": 62520 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006435193327136145, + "loss": 0.0644, + "step": 62530 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006431424766977364, + "loss": 0.0678, + "step": 62540 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006427656206818581, + "loss": 0.0662, + "step": 62550 + }, + { + "epoch": 1.57, + "learning_rate": 0.00064238876466598, + "loss": 0.0655, + "step": 62560 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006420119086501018, + "loss": 0.0678, + "step": 62570 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006416350526342236, + "loss": 0.0658, + "step": 62580 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006412581966183454, + "loss": 0.0639, + "step": 62590 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006408813406024672, + "loss": 0.0676, + "step": 62600 + }, + { + "epoch": 1.57, + "learning_rate": 0.000640504484586589, + "loss": 0.0629, + "step": 62610 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006401276285707108, + "loss": 0.0663, + "step": 62620 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006397507725548326, + "loss": 0.0672, + "step": 62630 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006393739165389544, + "loss": 0.0659, + "step": 62640 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006389970605230761, + "loss": 0.0648, + "step": 62650 + }, + { + "epoch": 1.57, + "learning_rate": 0.000638620204507198, + "loss": 0.0633, + "step": 62660 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006382433484913197, + "loss": 0.0688, + "step": 62670 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006378664924754416, + "loss": 0.0658, + "step": 62680 + }, + { + "epoch": 1.57, + "learning_rate": 0.0006374896364595633, + "loss": 0.0654, + "step": 62690 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006371127804436852, + "loss": 0.0673, + "step": 62700 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006367359244278069, + "loss": 0.0643, + "step": 62710 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006363590684119288, + "loss": 0.0677, + "step": 62720 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006359822123960505, + "loss": 0.0652, + "step": 62730 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006356053563801724, + "loss": 0.0651, + "step": 62740 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006352285003642942, + "loss": 0.0663, + "step": 62750 + }, + { + "epoch": 1.58, + "learning_rate": 0.000634851644348416, + "loss": 0.067, + "step": 62760 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006344747883325378, + "loss": 0.0712, + "step": 62770 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006340979323166596, + "loss": 0.0674, + "step": 62780 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006337210763007814, + "loss": 0.0645, + "step": 62790 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006333442202849032, + "loss": 0.0656, + "step": 62800 + }, + { + "epoch": 1.58, + "learning_rate": 0.000632967364269025, + "loss": 0.0675, + "step": 62810 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006325905082531467, + "loss": 0.0687, + "step": 62820 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006322136522372686, + "loss": 0.0671, + "step": 62830 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006318367962213903, + "loss": 0.0662, + "step": 62840 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006314599402055122, + "loss": 0.0606, + "step": 62850 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006310830841896339, + "loss": 0.0666, + "step": 62860 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006307062281737557, + "loss": 0.0664, + "step": 62870 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006303293721578775, + "loss": 0.0684, + "step": 62880 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006299525161419993, + "loss": 0.066, + "step": 62890 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006295756601261211, + "loss": 0.0689, + "step": 62900 + }, + { + "epoch": 1.58, + "learning_rate": 0.000629198804110243, + "loss": 0.0677, + "step": 62910 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006288219480943647, + "loss": 0.0666, + "step": 62920 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006284450920784866, + "loss": 0.0675, + "step": 62930 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006280682360626083, + "loss": 0.0684, + "step": 62940 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006276913800467302, + "loss": 0.0654, + "step": 62950 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006273145240308519, + "loss": 0.0703, + "step": 62960 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006269376680149738, + "loss": 0.0691, + "step": 62970 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006265608119990955, + "loss": 0.064, + "step": 62980 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006261839559832174, + "loss": 0.066, + "step": 62990 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006258070999673391, + "loss": 0.0642, + "step": 63000 + }, + { + "epoch": 1.58, + "eval_cer": 0.6652528119491417, + "eval_loss": 0.056862492114305496, + "eval_runtime": 90.801, + "eval_samples_per_second": 110.12, + "eval_steps_per_second": 6.883, + "step": 63000 + }, + { + "epoch": 1.58, + "learning_rate": 0.000625430243951461, + "loss": 0.0663, + "step": 63010 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006250533879355827, + "loss": 0.0663, + "step": 63020 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006246765319197046, + "loss": 0.0627, + "step": 63030 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006242996759038264, + "loss": 0.0667, + "step": 63040 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006239228198879482, + "loss": 0.0653, + "step": 63050 + }, + { + "epoch": 1.58, + "learning_rate": 0.00062354596387207, + "loss": 0.0663, + "step": 63060 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006231691078561918, + "loss": 0.0646, + "step": 63070 + }, + { + "epoch": 1.58, + "learning_rate": 0.0006227922518403135, + "loss": 0.0679, + "step": 63080 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006224153958244354, + "loss": 0.0661, + "step": 63090 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006220385398085571, + "loss": 0.0638, + "step": 63100 + }, + { + "epoch": 1.59, + "learning_rate": 0.000621661683792679, + "loss": 0.0663, + "step": 63110 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006212848277768007, + "loss": 0.0645, + "step": 63120 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006209079717609226, + "loss": 0.0713, + "step": 63130 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006205311157450443, + "loss": 0.0679, + "step": 63140 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006201542597291662, + "loss": 0.0675, + "step": 63150 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006197774037132879, + "loss": 0.0652, + "step": 63160 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006194005476974098, + "loss": 0.0698, + "step": 63170 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006190236916815315, + "loss": 0.066, + "step": 63180 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006186468356656534, + "loss": 0.0676, + "step": 63190 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006182699796497752, + "loss": 0.0651, + "step": 63200 + }, + { + "epoch": 1.59, + "learning_rate": 0.000617893123633897, + "loss": 0.0647, + "step": 63210 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006175162676180188, + "loss": 0.0659, + "step": 63220 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006171394116021406, + "loss": 0.0676, + "step": 63230 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006167625555862624, + "loss": 0.069, + "step": 63240 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006163856995703842, + "loss": 0.0658, + "step": 63250 + }, + { + "epoch": 1.59, + "learning_rate": 0.000616008843554506, + "loss": 0.0674, + "step": 63260 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006156319875386278, + "loss": 0.0663, + "step": 63270 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006152551315227496, + "loss": 0.0642, + "step": 63280 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006148782755068713, + "loss": 0.0672, + "step": 63290 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006145014194909931, + "loss": 0.0697, + "step": 63300 + }, + { + "epoch": 1.59, + "learning_rate": 0.000614124563475115, + "loss": 0.0687, + "step": 63310 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006137477074592367, + "loss": 0.0691, + "step": 63320 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006133708514433585, + "loss": 0.0636, + "step": 63330 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006129939954274803, + "loss": 0.0646, + "step": 63340 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006126171394116021, + "loss": 0.0679, + "step": 63350 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006122402833957239, + "loss": 0.0681, + "step": 63360 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006118634273798457, + "loss": 0.0677, + "step": 63370 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006114865713639676, + "loss": 0.069, + "step": 63380 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006111097153480893, + "loss": 0.0669, + "step": 63390 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006107328593322112, + "loss": 0.0653, + "step": 63400 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006103560033163329, + "loss": 0.0675, + "step": 63410 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006099791473004548, + "loss": 0.0661, + "step": 63420 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006096022912845765, + "loss": 0.0651, + "step": 63430 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006092254352686984, + "loss": 0.0635, + "step": 63440 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006088485792528201, + "loss": 0.0673, + "step": 63450 + }, + { + "epoch": 1.59, + "learning_rate": 0.000608471723236942, + "loss": 0.0665, + "step": 63460 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006080948672210637, + "loss": 0.0647, + "step": 63470 + }, + { + "epoch": 1.59, + "learning_rate": 0.0006077180112051856, + "loss": 0.0682, + "step": 63480 + }, + { + "epoch": 1.6, + "learning_rate": 0.0006073411551893074, + "loss": 0.0642, + "step": 63490 + }, + { + "epoch": 1.6, + "learning_rate": 0.0006069642991734292, + "loss": 0.0646, + "step": 63500 + }, + { + "epoch": 1.6, + "eval_cer": 0.6655126763288093, + "eval_loss": 0.05644620954990387, + "eval_runtime": 90.7214, + "eval_samples_per_second": 110.217, + "eval_steps_per_second": 6.889, + "step": 63500 + }, + { + "epoch": 1.6, + "learning_rate": 0.000606587443157551, + "loss": 0.0665, + "step": 63510 + }, + { + "epoch": 1.6, + "learning_rate": 0.0006062105871416728, + "loss": 0.069, + "step": 63520 + }, + { + "epoch": 1.6, + "learning_rate": 0.0006058337311257945, + "loss": 0.0634, + "step": 63530 + }, + { + "epoch": 1.6, + "learning_rate": 0.0006054568751099163, + "loss": 0.0679, + "step": 63540 + }, + { + "epoch": 1.6, + "learning_rate": 0.0006050800190940381, + "loss": 0.0672, + "step": 63550 + }, + { + "epoch": 1.6, + "learning_rate": 0.00060470316307816, + "loss": 0.0651, + "step": 63560 + }, + { + "epoch": 1.6, + "learning_rate": 0.0006043263070622817, + "loss": 0.0625, + "step": 63570 + }, + { + "epoch": 1.6, + "learning_rate": 0.0006039494510464036, + "loss": 0.0644, + "step": 63580 + }, + { + "epoch": 1.6, + "learning_rate": 0.0006035725950305253, + "loss": 0.065, + "step": 63590 + }, + { + "epoch": 1.6, + "learning_rate": 0.0006031957390146472, + "loss": 0.0662, + "step": 63600 + }, + { + "epoch": 1.6, + "learning_rate": 0.0006028188829987689, + "loss": 0.0648, + "step": 63610 + }, + { + "epoch": 1.6, + "learning_rate": 0.0006024420269828908, + "loss": 0.0689, + "step": 63620 + }, + { + "epoch": 1.6, + "learning_rate": 0.0006020651709670125, + "loss": 0.0633, + "step": 63630 + }, + { + "epoch": 1.6, + "learning_rate": 0.0006016883149511344, + "loss": 0.0662, + "step": 63640 + }, + { + "epoch": 1.6, + "learning_rate": 0.0006013114589352561, + "loss": 0.0696, + "step": 63650 + }, + { + "epoch": 1.6, + "learning_rate": 0.000600934602919378, + "loss": 0.0647, + "step": 63660 + }, + { + "epoch": 1.6, + "learning_rate": 0.0006005577469034998, + "loss": 0.0669, + "step": 63670 + }, + { + "epoch": 1.6, + "learning_rate": 0.0006001808908876216, + "loss": 0.0628, + "step": 63680 + }, + { + "epoch": 1.6, + "learning_rate": 0.0005998040348717434, + "loss": 0.0649, + "step": 63690 + }, + { + "epoch": 1.6, + "learning_rate": 0.0005994271788558652, + "loss": 0.0676, + "step": 63700 + }, + { + "epoch": 1.6, + "learning_rate": 0.000599050322839987, + "loss": 0.0674, + "step": 63710 + }, + { + "epoch": 1.6, + "learning_rate": 0.0005986734668241088, + "loss": 0.0672, + "step": 63720 + }, + { + "epoch": 1.6, + "learning_rate": 0.0005982966108082306, + "loss": 0.0637, + "step": 63730 + }, + { + "epoch": 1.6, + "learning_rate": 0.0005979197547923524, + "loss": 0.0671, + "step": 63740 + }, + { + "epoch": 1.6, + "learning_rate": 0.0005975428987764741, + "loss": 0.0642, + "step": 63750 + }, + { + "epoch": 1.6, + "learning_rate": 0.000597166042760596, + "loss": 0.0694, + "step": 63760 + }, + { + "epoch": 1.6, + "learning_rate": 0.0005967891867447177, + "loss": 0.068, + "step": 63770 + }, + { + "epoch": 1.6, + "learning_rate": 0.0005964123307288395, + "loss": 0.0648, + "step": 63780 + }, + { + "epoch": 1.6, + "learning_rate": 0.0005960354747129613, + "loss": 0.0637, + "step": 63790 + }, + { + "epoch": 1.6, + "learning_rate": 0.0005956586186970831, + "loss": 0.0667, + "step": 63800 + }, + { + "epoch": 1.6, + "learning_rate": 0.0005952817626812049, + "loss": 0.0638, + "step": 63810 + }, + { + "epoch": 1.6, + "learning_rate": 0.0005949049066653267, + "loss": 0.0678, + "step": 63820 + }, + { + "epoch": 1.6, + "learning_rate": 0.0005945280506494485, + "loss": 0.0645, + "step": 63830 + }, + { + "epoch": 1.6, + "learning_rate": 0.0005941511946335703, + "loss": 0.0645, + "step": 63840 + }, + { + "epoch": 1.6, + "learning_rate": 0.0005937743386176922, + "loss": 0.0652, + "step": 63850 + }, + { + "epoch": 1.6, + "learning_rate": 0.0005933974826018139, + "loss": 0.0653, + "step": 63860 + }, + { + "epoch": 1.6, + "learning_rate": 0.0005930206265859358, + "loss": 0.0644, + "step": 63870 + }, + { + "epoch": 1.6, + "learning_rate": 0.0005926437705700575, + "loss": 0.0653, + "step": 63880 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005922669145541794, + "loss": 0.0655, + "step": 63890 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005918900585383011, + "loss": 0.0626, + "step": 63900 + }, + { + "epoch": 1.61, + "learning_rate": 0.000591513202522423, + "loss": 0.0648, + "step": 63910 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005911363465065447, + "loss": 0.0666, + "step": 63920 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005907594904906666, + "loss": 0.064, + "step": 63930 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005903826344747883, + "loss": 0.0659, + "step": 63940 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005900057784589102, + "loss": 0.0617, + "step": 63950 + }, + { + "epoch": 1.61, + "learning_rate": 0.000589628922443032, + "loss": 0.0635, + "step": 63960 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005892520664271537, + "loss": 0.0669, + "step": 63970 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005888752104112755, + "loss": 0.0678, + "step": 63980 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005884983543953973, + "loss": 0.0632, + "step": 63990 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005881214983795191, + "loss": 0.0633, + "step": 64000 + }, + { + "epoch": 1.61, + "eval_cer": 0.6652961226790862, + "eval_loss": 0.05655200034379959, + "eval_runtime": 90.5197, + "eval_samples_per_second": 110.462, + "eval_steps_per_second": 6.905, + "step": 64000 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005877446423636409, + "loss": 0.0661, + "step": 64010 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005873677863477627, + "loss": 0.063, + "step": 64020 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005869909303318846, + "loss": 0.0653, + "step": 64030 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005866140743160063, + "loss": 0.0647, + "step": 64040 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005862372183001282, + "loss": 0.0686, + "step": 64050 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005858603622842499, + "loss": 0.0668, + "step": 64060 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005854835062683718, + "loss": 0.066, + "step": 64070 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005851066502524935, + "loss": 0.0656, + "step": 64080 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005847297942366154, + "loss": 0.0696, + "step": 64090 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005843529382207371, + "loss": 0.068, + "step": 64100 + }, + { + "epoch": 1.61, + "learning_rate": 0.000583976082204859, + "loss": 0.065, + "step": 64110 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005835992261889807, + "loss": 0.0653, + "step": 64120 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005832223701731026, + "loss": 0.0636, + "step": 64130 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005828455141572244, + "loss": 0.0648, + "step": 64140 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005824686581413462, + "loss": 0.0673, + "step": 64150 + }, + { + "epoch": 1.61, + "learning_rate": 0.000582091802125468, + "loss": 0.0669, + "step": 64160 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005817149461095898, + "loss": 0.068, + "step": 64170 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005813380900937116, + "loss": 0.0673, + "step": 64180 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005809612340778334, + "loss": 0.0646, + "step": 64190 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005805843780619551, + "loss": 0.0648, + "step": 64200 + }, + { + "epoch": 1.61, + "learning_rate": 0.000580207522046077, + "loss": 0.0657, + "step": 64210 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005798306660301987, + "loss": 0.0656, + "step": 64220 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005794538100143205, + "loss": 0.068, + "step": 64230 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005790769539984423, + "loss": 0.0678, + "step": 64240 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005787000979825641, + "loss": 0.0629, + "step": 64250 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005783232419666859, + "loss": 0.0649, + "step": 64260 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005779463859508077, + "loss": 0.0661, + "step": 64270 + }, + { + "epoch": 1.61, + "learning_rate": 0.0005775695299349295, + "loss": 0.0647, + "step": 64280 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005771926739190513, + "loss": 0.0655, + "step": 64290 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005768158179031732, + "loss": 0.0672, + "step": 64300 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005764389618872949, + "loss": 0.064, + "step": 64310 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005760621058714168, + "loss": 0.0671, + "step": 64320 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005756852498555385, + "loss": 0.0636, + "step": 64330 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005753083938396604, + "loss": 0.0665, + "step": 64340 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005749315378237821, + "loss": 0.066, + "step": 64350 + }, + { + "epoch": 1.62, + "learning_rate": 0.000574554681807904, + "loss": 0.0613, + "step": 64360 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005741778257920257, + "loss": 0.0641, + "step": 64370 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005738009697761476, + "loss": 0.0628, + "step": 64380 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005734241137602693, + "loss": 0.0681, + "step": 64390 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005730472577443912, + "loss": 0.0676, + "step": 64400 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005726704017285129, + "loss": 0.0678, + "step": 64410 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005722935457126347, + "loss": 0.0646, + "step": 64420 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005719166896967565, + "loss": 0.0644, + "step": 64430 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005715398336808783, + "loss": 0.0644, + "step": 64440 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005711629776650001, + "loss": 0.0675, + "step": 64450 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005707861216491219, + "loss": 0.0668, + "step": 64460 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005704092656332437, + "loss": 0.0619, + "step": 64470 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005700324096173656, + "loss": 0.0675, + "step": 64480 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005696555536014873, + "loss": 0.0654, + "step": 64490 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005692786975856092, + "loss": 0.0677, + "step": 64500 + }, + { + "epoch": 1.62, + "eval_cer": 0.6652701362411195, + "eval_loss": 0.05630192533135414, + "eval_runtime": 90.474, + "eval_samples_per_second": 110.518, + "eval_steps_per_second": 6.908, + "step": 64500 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005689018415697309, + "loss": 0.064, + "step": 64510 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005685249855538528, + "loss": 0.0656, + "step": 64520 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005681481295379745, + "loss": 0.0626, + "step": 64530 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005677712735220964, + "loss": 0.0626, + "step": 64540 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005673944175062181, + "loss": 0.0692, + "step": 64550 + }, + { + "epoch": 1.62, + "learning_rate": 0.00056701756149034, + "loss": 0.0661, + "step": 64560 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005666407054744617, + "loss": 0.0655, + "step": 64570 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005662638494585836, + "loss": 0.0658, + "step": 64580 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005658869934427054, + "loss": 0.0648, + "step": 64590 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005655101374268272, + "loss": 0.0638, + "step": 64600 + }, + { + "epoch": 1.62, + "learning_rate": 0.000565133281410949, + "loss": 0.0643, + "step": 64610 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005647564253950708, + "loss": 0.0643, + "step": 64620 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005643795693791926, + "loss": 0.0664, + "step": 64630 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005640027133633142, + "loss": 0.0682, + "step": 64640 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005636258573474361, + "loss": 0.0688, + "step": 64650 + }, + { + "epoch": 1.62, + "learning_rate": 0.000563249001331558, + "loss": 0.0664, + "step": 64660 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005628721453156797, + "loss": 0.0647, + "step": 64670 + }, + { + "epoch": 1.62, + "learning_rate": 0.0005624952892998015, + "loss": 0.0635, + "step": 64680 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005621184332839233, + "loss": 0.0644, + "step": 64690 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005617415772680451, + "loss": 0.0669, + "step": 64700 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005613647212521669, + "loss": 0.0636, + "step": 64710 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005609878652362887, + "loss": 0.0647, + "step": 64720 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005606110092204105, + "loss": 0.0663, + "step": 64730 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005602341532045323, + "loss": 0.0654, + "step": 64740 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005598572971886541, + "loss": 0.0649, + "step": 64750 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005594804411727759, + "loss": 0.0633, + "step": 64760 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005591035851568978, + "loss": 0.0635, + "step": 64770 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005587267291410195, + "loss": 0.0627, + "step": 64780 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005583498731251414, + "loss": 0.064, + "step": 64790 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005579730171092631, + "loss": 0.0653, + "step": 64800 + }, + { + "epoch": 1.63, + "learning_rate": 0.000557596161093385, + "loss": 0.063, + "step": 64810 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005572193050775067, + "loss": 0.0668, + "step": 64820 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005568424490616286, + "loss": 0.0655, + "step": 64830 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005564655930457503, + "loss": 0.0681, + "step": 64840 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005560887370298722, + "loss": 0.0654, + "step": 64850 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005557118810139939, + "loss": 0.0632, + "step": 64860 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005553350249981157, + "loss": 0.0668, + "step": 64870 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005549581689822375, + "loss": 0.0655, + "step": 64880 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005545813129663593, + "loss": 0.0659, + "step": 64890 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005542044569504811, + "loss": 0.0676, + "step": 64900 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005538276009346029, + "loss": 0.0656, + "step": 64910 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005534507449187247, + "loss": 0.0672, + "step": 64920 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005530738889028465, + "loss": 0.0659, + "step": 64930 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005526970328869683, + "loss": 0.0657, + "step": 64940 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005523201768710902, + "loss": 0.0641, + "step": 64950 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005519433208552119, + "loss": 0.0668, + "step": 64960 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005515664648393338, + "loss": 0.0665, + "step": 64970 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005511896088234555, + "loss": 0.067, + "step": 64980 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005508127528075774, + "loss": 0.0687, + "step": 64990 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005504358967916991, + "loss": 0.0649, + "step": 65000 + }, + { + "epoch": 1.63, + "eval_cer": 0.6651690778712488, + "eval_loss": 0.05603507161140442, + "eval_runtime": 90.44, + "eval_samples_per_second": 110.559, + "eval_steps_per_second": 6.911, + "step": 65000 + }, + { + "epoch": 1.63, + "learning_rate": 0.000550059040775821, + "loss": 0.0629, + "step": 65010 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005496821847599427, + "loss": 0.0616, + "step": 65020 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005493053287440646, + "loss": 0.0668, + "step": 65030 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005489284727281863, + "loss": 0.064, + "step": 65040 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005485516167123082, + "loss": 0.0649, + "step": 65050 + }, + { + "epoch": 1.63, + "learning_rate": 0.00054817476069643, + "loss": 0.065, + "step": 65060 + }, + { + "epoch": 1.63, + "learning_rate": 0.0005477979046805518, + "loss": 0.0659, + "step": 65070 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005474210486646735, + "loss": 0.0644, + "step": 65080 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005470441926487952, + "loss": 0.0645, + "step": 65090 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005466673366329171, + "loss": 0.0669, + "step": 65100 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005462904806170388, + "loss": 0.0662, + "step": 65110 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005459136246011607, + "loss": 0.068, + "step": 65120 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005455367685852826, + "loss": 0.0655, + "step": 65130 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005451599125694043, + "loss": 0.0704, + "step": 65140 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005447830565535261, + "loss": 0.0653, + "step": 65150 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005444062005376479, + "loss": 0.0651, + "step": 65160 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005440293445217697, + "loss": 0.0663, + "step": 65170 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005436524885058915, + "loss": 0.0675, + "step": 65180 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005432756324900133, + "loss": 0.0658, + "step": 65190 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005428987764741351, + "loss": 0.0637, + "step": 65200 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005425219204582569, + "loss": 0.0678, + "step": 65210 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005421450644423787, + "loss": 0.0674, + "step": 65220 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005417682084265005, + "loss": 0.0656, + "step": 65230 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005413913524106224, + "loss": 0.0645, + "step": 65240 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005410144963947441, + "loss": 0.0657, + "step": 65250 + }, + { + "epoch": 1.64, + "learning_rate": 0.000540637640378866, + "loss": 0.0663, + "step": 65260 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005402607843629877, + "loss": 0.0638, + "step": 65270 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005398839283471096, + "loss": 0.0677, + "step": 65280 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005395070723312313, + "loss": 0.0631, + "step": 65290 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005391302163153532, + "loss": 0.0664, + "step": 65300 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005387533602994749, + "loss": 0.0653, + "step": 65310 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005383765042835967, + "loss": 0.066, + "step": 65320 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005379996482677185, + "loss": 0.0665, + "step": 65330 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005376227922518403, + "loss": 0.0672, + "step": 65340 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005372459362359621, + "loss": 0.0644, + "step": 65350 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005368690802200839, + "loss": 0.0683, + "step": 65360 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005364922242042057, + "loss": 0.0643, + "step": 65370 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005361153681883275, + "loss": 0.066, + "step": 65380 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005357385121724493, + "loss": 0.0647, + "step": 65390 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005353616561565711, + "loss": 0.0621, + "step": 65400 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005349848001406929, + "loss": 0.0645, + "step": 65410 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005346079441248148, + "loss": 0.0677, + "step": 65420 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005342310881089365, + "loss": 0.0653, + "step": 65430 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005338542320930584, + "loss": 0.07, + "step": 65440 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005334773760771801, + "loss": 0.0645, + "step": 65450 + }, + { + "epoch": 1.64, + "learning_rate": 0.000533100520061302, + "loss": 0.0657, + "step": 65460 + }, + { + "epoch": 1.64, + "learning_rate": 0.0005327236640454237, + "loss": 0.0654, + "step": 65470 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005323468080295456, + "loss": 0.0639, + "step": 65480 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005319699520136673, + "loss": 0.0633, + "step": 65490 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005315930959977892, + "loss": 0.0654, + "step": 65500 + }, + { + "epoch": 1.65, + "eval_cer": 0.6653707133806576, + "eval_loss": 0.0557679682970047, + "eval_runtime": 90.7481, + "eval_samples_per_second": 110.184, + "eval_steps_per_second": 6.887, + "step": 65500 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005312162399819109, + "loss": 0.0639, + "step": 65510 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005308393839660328, + "loss": 0.0685, + "step": 65520 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005304625279501545, + "loss": 0.0661, + "step": 65530 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005300856719342762, + "loss": 0.066, + "step": 65540 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005297088159183981, + "loss": 0.0622, + "step": 65550 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005293319599025198, + "loss": 0.0649, + "step": 65560 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005289551038866417, + "loss": 0.0658, + "step": 65570 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005285782478707636, + "loss": 0.0627, + "step": 65580 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005282013918548853, + "loss": 0.0638, + "step": 65590 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005278245358390072, + "loss": 0.0647, + "step": 65600 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005274476798231289, + "loss": 0.0678, + "step": 65610 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005270708238072507, + "loss": 0.0658, + "step": 65620 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005266939677913725, + "loss": 0.066, + "step": 65630 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005263171117754943, + "loss": 0.0658, + "step": 65640 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005259402557596161, + "loss": 0.0644, + "step": 65650 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005255633997437379, + "loss": 0.0633, + "step": 65660 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005251865437278597, + "loss": 0.0645, + "step": 65670 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005248096877119815, + "loss": 0.0627, + "step": 65680 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005244328316961034, + "loss": 0.0643, + "step": 65690 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005240559756802251, + "loss": 0.064, + "step": 65700 + }, + { + "epoch": 1.65, + "learning_rate": 0.000523679119664347, + "loss": 0.0699, + "step": 65710 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005233022636484687, + "loss": 0.0665, + "step": 65720 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005229254076325906, + "loss": 0.0674, + "step": 65730 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005225485516167123, + "loss": 0.0638, + "step": 65740 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005221716956008341, + "loss": 0.0632, + "step": 65750 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005217948395849559, + "loss": 0.0636, + "step": 65760 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005214179835690777, + "loss": 0.066, + "step": 65770 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005210411275531995, + "loss": 0.0657, + "step": 65780 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005206642715373213, + "loss": 0.0628, + "step": 65790 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005202874155214431, + "loss": 0.0642, + "step": 65800 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005199105595055649, + "loss": 0.0656, + "step": 65810 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005195337034896867, + "loss": 0.0672, + "step": 65820 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005191568474738085, + "loss": 0.0685, + "step": 65830 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005187799914579303, + "loss": 0.0626, + "step": 65840 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005184031354420521, + "loss": 0.0654, + "step": 65850 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005180262794261739, + "loss": 0.0644, + "step": 65860 + }, + { + "epoch": 1.65, + "learning_rate": 0.0005176494234102958, + "loss": 0.0666, + "step": 65870 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005172725673944175, + "loss": 0.0637, + "step": 65880 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005168957113785394, + "loss": 0.0681, + "step": 65890 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005165188553626611, + "loss": 0.0655, + "step": 65900 + }, + { + "epoch": 1.66, + "learning_rate": 0.000516141999346783, + "loss": 0.065, + "step": 65910 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005157651433309047, + "loss": 0.0626, + "step": 65920 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005153882873150266, + "loss": 0.066, + "step": 65930 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005150114312991483, + "loss": 0.066, + "step": 65940 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005146345752832702, + "loss": 0.0675, + "step": 65950 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005142577192673919, + "loss": 0.0637, + "step": 65960 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005138808632515137, + "loss": 0.0619, + "step": 65970 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005135040072356355, + "loss": 0.0646, + "step": 65980 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005131271512197573, + "loss": 0.0666, + "step": 65990 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005127502952038791, + "loss": 0.0675, + "step": 66000 + }, + { + "epoch": 1.66, + "eval_cer": 0.6653572389313415, + "eval_loss": 0.055686622858047485, + "eval_runtime": 90.4669, + "eval_samples_per_second": 110.527, + "eval_steps_per_second": 6.909, + "step": 66000 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005123734391880008, + "loss": 0.0614, + "step": 66010 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005119965831721227, + "loss": 0.06, + "step": 66020 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005116197271562444, + "loss": 0.066, + "step": 66030 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005112428711403663, + "loss": 0.0651, + "step": 66040 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005108660151244882, + "loss": 0.0605, + "step": 66050 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005104891591086099, + "loss": 0.066, + "step": 66060 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005101123030927318, + "loss": 0.0629, + "step": 66070 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005097354470768535, + "loss": 0.0677, + "step": 66080 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005093585910609753, + "loss": 0.0661, + "step": 66090 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005089817350450971, + "loss": 0.0614, + "step": 66100 + }, + { + "epoch": 1.66, + "learning_rate": 0.000508604879029219, + "loss": 0.065, + "step": 66110 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005082280230133407, + "loss": 0.066, + "step": 66120 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005078511669974625, + "loss": 0.0661, + "step": 66130 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005074743109815843, + "loss": 0.0672, + "step": 66140 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005070974549657061, + "loss": 0.0624, + "step": 66150 + }, + { + "epoch": 1.66, + "learning_rate": 0.000506720598949828, + "loss": 0.0657, + "step": 66160 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005063437429339497, + "loss": 0.0635, + "step": 66170 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005059668869180716, + "loss": 0.0648, + "step": 66180 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005055900309021933, + "loss": 0.0635, + "step": 66190 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005052131748863151, + "loss": 0.0688, + "step": 66200 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005048363188704368, + "loss": 0.0642, + "step": 66210 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005044594628545587, + "loss": 0.0639, + "step": 66220 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005040826068386805, + "loss": 0.0654, + "step": 66230 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005037057508228023, + "loss": 0.0638, + "step": 66240 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005033288948069241, + "loss": 0.0643, + "step": 66250 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005029520387910459, + "loss": 0.0629, + "step": 66260 + }, + { + "epoch": 1.66, + "learning_rate": 0.0005025751827751677, + "loss": 0.0676, + "step": 66270 + }, + { + "epoch": 1.67, + "learning_rate": 0.0005021983267592895, + "loss": 0.0636, + "step": 66280 + }, + { + "epoch": 1.67, + "learning_rate": 0.0005018214707434113, + "loss": 0.064, + "step": 66290 + }, + { + "epoch": 1.67, + "learning_rate": 0.0005014446147275331, + "loss": 0.0663, + "step": 66300 + }, + { + "epoch": 1.67, + "learning_rate": 0.0005010677587116549, + "loss": 0.0632, + "step": 66310 + }, + { + "epoch": 1.67, + "learning_rate": 0.0005006909026957767, + "loss": 0.0647, + "step": 66320 + }, + { + "epoch": 1.67, + "learning_rate": 0.0005003140466798985, + "loss": 0.0668, + "step": 66330 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004999371906640204, + "loss": 0.063, + "step": 66340 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004995603346481421, + "loss": 0.0659, + "step": 66350 + }, + { + "epoch": 1.67, + "learning_rate": 0.000499183478632264, + "loss": 0.0625, + "step": 66360 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004988066226163857, + "loss": 0.0643, + "step": 66370 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004984297666005076, + "loss": 0.0633, + "step": 66380 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004980529105846293, + "loss": 0.0624, + "step": 66390 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004976760545687512, + "loss": 0.0631, + "step": 66400 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004972991985528729, + "loss": 0.0695, + "step": 66410 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004969223425369947, + "loss": 0.0637, + "step": 66420 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004965454865211165, + "loss": 0.0675, + "step": 66430 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004961686305052383, + "loss": 0.0655, + "step": 66440 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004957917744893601, + "loss": 0.0669, + "step": 66450 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004954149184734819, + "loss": 0.0624, + "step": 66460 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004950380624576037, + "loss": 0.0642, + "step": 66470 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004946612064417254, + "loss": 0.0632, + "step": 66480 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004942843504258473, + "loss": 0.062, + "step": 66490 + }, + { + "epoch": 1.67, + "learning_rate": 0.000493907494409969, + "loss": 0.0642, + "step": 66500 + }, + { + "epoch": 1.67, + "eval_cer": 0.6652633990164615, + "eval_loss": 0.05538139119744301, + "eval_runtime": 90.5902, + "eval_samples_per_second": 110.376, + "eval_steps_per_second": 6.899, + "step": 66500 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004935306383940909, + "loss": 0.0635, + "step": 66510 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004931537823782128, + "loss": 0.0623, + "step": 66520 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004927769263623345, + "loss": 0.0643, + "step": 66530 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004924000703464564, + "loss": 0.0654, + "step": 66540 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004920232143305781, + "loss": 0.0633, + "step": 66550 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004916463583147, + "loss": 0.0623, + "step": 66560 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004912695022988217, + "loss": 0.0653, + "step": 66570 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004908926462829435, + "loss": 0.0664, + "step": 66580 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004905157902670653, + "loss": 0.0634, + "step": 66590 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004901389342511871, + "loss": 0.0645, + "step": 66600 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004897620782353089, + "loss": 0.0648, + "step": 66610 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004893852222194307, + "loss": 0.0649, + "step": 66620 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004890083662035526, + "loss": 0.0646, + "step": 66630 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004886315101876742, + "loss": 0.0655, + "step": 66640 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004882546541717961, + "loss": 0.068, + "step": 66650 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004878777981559179, + "loss": 0.0673, + "step": 66660 + }, + { + "epoch": 1.67, + "learning_rate": 0.0004875009421400397, + "loss": 0.0641, + "step": 66670 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004871240861241615, + "loss": 0.0661, + "step": 66680 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004867472301082833, + "loss": 0.0666, + "step": 66690 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004863703740924051, + "loss": 0.0673, + "step": 66700 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004859935180765269, + "loss": 0.0659, + "step": 66710 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004856166620606487, + "loss": 0.0659, + "step": 66720 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004852398060447705, + "loss": 0.0659, + "step": 66730 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004848629500288923, + "loss": 0.0636, + "step": 66740 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004844860940130141, + "loss": 0.0669, + "step": 66750 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004841092379971359, + "loss": 0.0649, + "step": 66760 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004837323819812577, + "loss": 0.0637, + "step": 66770 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004833555259653795, + "loss": 0.0647, + "step": 66780 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004829786699495013, + "loss": 0.0651, + "step": 66790 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004826018139336231, + "loss": 0.0656, + "step": 66800 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004822249579177449, + "loss": 0.0657, + "step": 66810 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004818481019018667, + "loss": 0.0638, + "step": 66820 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004814712458859885, + "loss": 0.0625, + "step": 66830 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004810943898701103, + "loss": 0.0637, + "step": 66840 + }, + { + "epoch": 1.68, + "learning_rate": 0.00048071753385423217, + "loss": 0.0656, + "step": 66850 + }, + { + "epoch": 1.68, + "learning_rate": 0.00048034067783835386, + "loss": 0.0632, + "step": 66860 + }, + { + "epoch": 1.68, + "learning_rate": 0.00047996382182247566, + "loss": 0.0643, + "step": 66870 + }, + { + "epoch": 1.68, + "learning_rate": 0.00047958696580659746, + "loss": 0.0636, + "step": 66880 + }, + { + "epoch": 1.68, + "learning_rate": 0.00047921010979071926, + "loss": 0.0649, + "step": 66890 + }, + { + "epoch": 1.68, + "learning_rate": 0.00047883325377484105, + "loss": 0.0657, + "step": 66900 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004784563977589629, + "loss": 0.0675, + "step": 66910 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004780795417430847, + "loss": 0.0676, + "step": 66920 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004777026857272065, + "loss": 0.0649, + "step": 66930 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004773258297113283, + "loss": 0.0616, + "step": 66940 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004769489736954501, + "loss": 0.0631, + "step": 66950 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004765721176795719, + "loss": 0.0618, + "step": 66960 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004761952616636937, + "loss": 0.0641, + "step": 66970 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004758184056478155, + "loss": 0.0636, + "step": 66980 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004754415496319373, + "loss": 0.0654, + "step": 66990 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004750646936160591, + "loss": 0.0631, + "step": 67000 + }, + { + "epoch": 1.68, + "eval_cer": 0.6653168155833932, + "eval_loss": 0.055216867476701736, + "eval_runtime": 90.7608, + "eval_samples_per_second": 110.169, + "eval_steps_per_second": 6.886, + "step": 67000 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004746878376001809, + "loss": 0.0644, + "step": 67010 + }, + { + "epoch": 1.68, + "learning_rate": 0.0004743109815843027, + "loss": 0.0647, + "step": 67020 + }, + { + "epoch": 1.68, + "learning_rate": 0.00047393412556842455, + "loss": 0.0632, + "step": 67030 + }, + { + "epoch": 1.68, + "learning_rate": 0.00047355726955254635, + "loss": 0.062, + "step": 67040 + }, + { + "epoch": 1.68, + "learning_rate": 0.00047318041353666815, + "loss": 0.0641, + "step": 67050 + }, + { + "epoch": 1.68, + "learning_rate": 0.00047280355752078994, + "loss": 0.0653, + "step": 67060 + }, + { + "epoch": 1.69, + "learning_rate": 0.00047242670150491174, + "loss": 0.0645, + "step": 67070 + }, + { + "epoch": 1.69, + "learning_rate": 0.00047204984548903343, + "loss": 0.0645, + "step": 67080 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004716729894731553, + "loss": 0.0659, + "step": 67090 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004712961334572771, + "loss": 0.0632, + "step": 67100 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004709192774413989, + "loss": 0.0632, + "step": 67110 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004705424214255207, + "loss": 0.0652, + "step": 67120 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004701655654096425, + "loss": 0.0635, + "step": 67130 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004697887093937643, + "loss": 0.0662, + "step": 67140 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004694118533778861, + "loss": 0.0637, + "step": 67150 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004690349973620079, + "loss": 0.0631, + "step": 67160 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004686581413461297, + "loss": 0.0635, + "step": 67170 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004682812853302515, + "loss": 0.0649, + "step": 67180 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004679044293143733, + "loss": 0.0615, + "step": 67190 + }, + { + "epoch": 1.69, + "learning_rate": 0.00046752757329849513, + "loss": 0.0638, + "step": 67200 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004671507172826169, + "loss": 0.0635, + "step": 67210 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004667738612667387, + "loss": 0.0627, + "step": 67220 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004663970052508605, + "loss": 0.0625, + "step": 67230 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004660201492349823, + "loss": 0.065, + "step": 67240 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004656432932191041, + "loss": 0.0622, + "step": 67250 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004652664372032259, + "loss": 0.061, + "step": 67260 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004648895811873477, + "loss": 0.0652, + "step": 67270 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004645127251714695, + "loss": 0.0642, + "step": 67280 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004641358691555913, + "loss": 0.0662, + "step": 67290 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004637590131397131, + "loss": 0.0655, + "step": 67300 + }, + { + "epoch": 1.69, + "learning_rate": 0.00046338215712383486, + "loss": 0.0635, + "step": 67310 + }, + { + "epoch": 1.69, + "learning_rate": 0.00046300530110795666, + "loss": 0.0662, + "step": 67320 + }, + { + "epoch": 1.69, + "learning_rate": 0.00046262844509207846, + "loss": 0.065, + "step": 67330 + }, + { + "epoch": 1.69, + "learning_rate": 0.00046225158907620026, + "loss": 0.0637, + "step": 67340 + }, + { + "epoch": 1.69, + "learning_rate": 0.00046187473306032206, + "loss": 0.0661, + "step": 67350 + }, + { + "epoch": 1.69, + "learning_rate": 0.00046149787704444385, + "loss": 0.0652, + "step": 67360 + }, + { + "epoch": 1.69, + "learning_rate": 0.00046112102102856565, + "loss": 0.0644, + "step": 67370 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004607441650126875, + "loss": 0.0658, + "step": 67380 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004603673089968093, + "loss": 0.0686, + "step": 67390 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004599904529809311, + "loss": 0.065, + "step": 67400 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004596135969650529, + "loss": 0.0682, + "step": 67410 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004592367409491747, + "loss": 0.063, + "step": 67420 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004588598849332965, + "loss": 0.0654, + "step": 67430 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004584830289174183, + "loss": 0.0643, + "step": 67440 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004581061729015401, + "loss": 0.0652, + "step": 67450 + }, + { + "epoch": 1.69, + "learning_rate": 0.0004577293168856619, + "loss": 0.0653, + "step": 67460 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004573524608697837, + "loss": 0.0661, + "step": 67470 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004569756048539055, + "loss": 0.0639, + "step": 67480 + }, + { + "epoch": 1.7, + "learning_rate": 0.00045659874883802735, + "loss": 0.0663, + "step": 67490 + }, + { + "epoch": 1.7, + "learning_rate": 0.00045622189282214915, + "loss": 0.0628, + "step": 67500 + }, + { + "epoch": 1.7, + "eval_cer": 0.6652359688874965, + "eval_loss": 0.05516913905739784, + "eval_runtime": 90.7509, + "eval_samples_per_second": 110.181, + "eval_steps_per_second": 6.887, + "step": 67500 + }, + { + "epoch": 1.7, + "learning_rate": 0.00045584503680627095, + "loss": 0.0653, + "step": 67510 + }, + { + "epoch": 1.7, + "learning_rate": 0.00045546818079039274, + "loss": 0.0623, + "step": 67520 + }, + { + "epoch": 1.7, + "learning_rate": 0.00045509132477451443, + "loss": 0.0636, + "step": 67530 + }, + { + "epoch": 1.7, + "learning_rate": 0.00045471446875863623, + "loss": 0.0632, + "step": 67540 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004543376127427581, + "loss": 0.0632, + "step": 67550 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004539607567268799, + "loss": 0.0662, + "step": 67560 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004535839007110017, + "loss": 0.0645, + "step": 67570 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004532070446951235, + "loss": 0.0639, + "step": 67580 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004528301886792453, + "loss": 0.0679, + "step": 67590 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004524533326633671, + "loss": 0.0674, + "step": 67600 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004520764766474889, + "loss": 0.0624, + "step": 67610 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004516996206316107, + "loss": 0.0614, + "step": 67620 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004513227646157325, + "loss": 0.062, + "step": 67630 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004509459085998543, + "loss": 0.0642, + "step": 67640 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004505690525839761, + "loss": 0.0649, + "step": 67650 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004501921965680979, + "loss": 0.0637, + "step": 67660 + }, + { + "epoch": 1.7, + "learning_rate": 0.00044981534055221973, + "loss": 0.0626, + "step": 67670 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004494384845363415, + "loss": 0.0662, + "step": 67680 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004490616285204633, + "loss": 0.0695, + "step": 67690 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004486847725045851, + "loss": 0.066, + "step": 67700 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004483079164887069, + "loss": 0.0671, + "step": 67710 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004479310604728287, + "loss": 0.0642, + "step": 67720 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004475542044569505, + "loss": 0.0618, + "step": 67730 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004471773484410723, + "loss": 0.0681, + "step": 67740 + }, + { + "epoch": 1.7, + "learning_rate": 0.00044680049242519406, + "loss": 0.0649, + "step": 67750 + }, + { + "epoch": 1.7, + "learning_rate": 0.00044642363640931586, + "loss": 0.0679, + "step": 67760 + }, + { + "epoch": 1.7, + "learning_rate": 0.00044604678039343766, + "loss": 0.0629, + "step": 67770 + }, + { + "epoch": 1.7, + "learning_rate": 0.00044566992437755946, + "loss": 0.067, + "step": 67780 + }, + { + "epoch": 1.7, + "learning_rate": 0.00044529306836168126, + "loss": 0.0653, + "step": 67790 + }, + { + "epoch": 1.7, + "learning_rate": 0.00044491621234580306, + "loss": 0.0646, + "step": 67800 + }, + { + "epoch": 1.7, + "learning_rate": 0.00044453935632992486, + "loss": 0.0647, + "step": 67810 + }, + { + "epoch": 1.7, + "learning_rate": 0.00044416250031404666, + "loss": 0.0633, + "step": 67820 + }, + { + "epoch": 1.7, + "learning_rate": 0.00044378564429816845, + "loss": 0.0661, + "step": 67830 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004434087882822903, + "loss": 0.0662, + "step": 67840 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004430319322664121, + "loss": 0.063, + "step": 67850 + }, + { + "epoch": 1.7, + "learning_rate": 0.0004426550762505339, + "loss": 0.0631, + "step": 67860 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004422782202346557, + "loss": 0.0687, + "step": 67870 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004419013642187775, + "loss": 0.0646, + "step": 67880 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004415245082028993, + "loss": 0.0644, + "step": 67890 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004411476521870211, + "loss": 0.0619, + "step": 67900 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004407707961711429, + "loss": 0.0628, + "step": 67910 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004403939401552647, + "loss": 0.0617, + "step": 67920 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004400170841393865, + "loss": 0.065, + "step": 67930 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004396402281235083, + "loss": 0.0642, + "step": 67940 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004392633721076301, + "loss": 0.0633, + "step": 67950 + }, + { + "epoch": 1.71, + "learning_rate": 0.00043888651609175195, + "loss": 0.063, + "step": 67960 + }, + { + "epoch": 1.71, + "learning_rate": 0.00043850966007587364, + "loss": 0.0654, + "step": 67970 + }, + { + "epoch": 1.71, + "learning_rate": 0.00043813280405999544, + "loss": 0.0636, + "step": 67980 + }, + { + "epoch": 1.71, + "learning_rate": 0.00043775594804411724, + "loss": 0.0649, + "step": 67990 + }, + { + "epoch": 1.71, + "learning_rate": 0.00043737909202823903, + "loss": 0.0658, + "step": 68000 + }, + { + "epoch": 1.71, + "eval_cer": 0.6652422248818218, + "eval_loss": 0.05499656870961189, + "eval_runtime": 90.5701, + "eval_samples_per_second": 110.401, + "eval_steps_per_second": 6.901, + "step": 68000 + }, + { + "epoch": 1.71, + "learning_rate": 0.00043700223601236083, + "loss": 0.0656, + "step": 68010 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004366253799964827, + "loss": 0.0626, + "step": 68020 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004362485239806045, + "loss": 0.0635, + "step": 68030 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004358716679647263, + "loss": 0.0634, + "step": 68040 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004354948119488481, + "loss": 0.0625, + "step": 68050 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004351179559329699, + "loss": 0.0659, + "step": 68060 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004347410999170917, + "loss": 0.0648, + "step": 68070 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004343642439012135, + "loss": 0.0658, + "step": 68080 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004339873878853353, + "loss": 0.0642, + "step": 68090 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004336105318694571, + "loss": 0.0599, + "step": 68100 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004332336758535789, + "loss": 0.063, + "step": 68110 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004328568198377007, + "loss": 0.0649, + "step": 68120 + }, + { + "epoch": 1.71, + "learning_rate": 0.00043247996382182253, + "loss": 0.0663, + "step": 68130 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004321031078059443, + "loss": 0.0652, + "step": 68140 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004317262517900661, + "loss": 0.0635, + "step": 68150 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004313493957741879, + "loss": 0.0666, + "step": 68160 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004309725397583097, + "loss": 0.0679, + "step": 68170 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004305956837424315, + "loss": 0.0618, + "step": 68180 + }, + { + "epoch": 1.71, + "learning_rate": 0.0004302188277265533, + "loss": 0.0659, + "step": 68190 + }, + { + "epoch": 1.71, + "learning_rate": 0.00042984197171067507, + "loss": 0.0622, + "step": 68200 + }, + { + "epoch": 1.71, + "learning_rate": 0.00042946511569479686, + "loss": 0.0654, + "step": 68210 + }, + { + "epoch": 1.71, + "learning_rate": 0.00042908825967891866, + "loss": 0.0605, + "step": 68220 + }, + { + "epoch": 1.71, + "learning_rate": 0.00042871140366304046, + "loss": 0.0613, + "step": 68230 + }, + { + "epoch": 1.71, + "learning_rate": 0.00042833454764716226, + "loss": 0.0616, + "step": 68240 + }, + { + "epoch": 1.71, + "learning_rate": 0.00042795769163128406, + "loss": 0.0642, + "step": 68250 + }, + { + "epoch": 1.71, + "learning_rate": 0.00042758083561540586, + "loss": 0.0647, + "step": 68260 + }, + { + "epoch": 1.72, + "learning_rate": 0.00042720397959952766, + "loss": 0.0618, + "step": 68270 + }, + { + "epoch": 1.72, + "learning_rate": 0.00042682712358364946, + "loss": 0.0622, + "step": 68280 + }, + { + "epoch": 1.72, + "learning_rate": 0.00042645026756777125, + "loss": 0.0674, + "step": 68290 + }, + { + "epoch": 1.72, + "learning_rate": 0.00042607341155189305, + "loss": 0.0645, + "step": 68300 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004256965555360149, + "loss": 0.0643, + "step": 68310 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004253196995201367, + "loss": 0.0659, + "step": 68320 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004249428435042585, + "loss": 0.0641, + "step": 68330 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004245659874883803, + "loss": 0.0638, + "step": 68340 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004241891314725021, + "loss": 0.0638, + "step": 68350 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004238122754566239, + "loss": 0.0624, + "step": 68360 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004234354194407457, + "loss": 0.064, + "step": 68370 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004230585634248675, + "loss": 0.0614, + "step": 68380 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004226817074089893, + "loss": 0.0629, + "step": 68390 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004223048513931111, + "loss": 0.065, + "step": 68400 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004219279953772329, + "loss": 0.0652, + "step": 68410 + }, + { + "epoch": 1.72, + "learning_rate": 0.00042155113936135464, + "loss": 0.0619, + "step": 68420 + }, + { + "epoch": 1.72, + "learning_rate": 0.00042117428334547644, + "loss": 0.0639, + "step": 68430 + }, + { + "epoch": 1.72, + "learning_rate": 0.00042079742732959824, + "loss": 0.0622, + "step": 68440 + }, + { + "epoch": 1.72, + "learning_rate": 0.00042042057131372004, + "loss": 0.0649, + "step": 68450 + }, + { + "epoch": 1.72, + "learning_rate": 0.00042004371529784184, + "loss": 0.0617, + "step": 68460 + }, + { + "epoch": 1.72, + "learning_rate": 0.00041966685928196363, + "loss": 0.0616, + "step": 68470 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004192900032660855, + "loss": 0.0656, + "step": 68480 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004189131472502073, + "loss": 0.0644, + "step": 68490 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004185362912343291, + "loss": 0.0654, + "step": 68500 + }, + { + "epoch": 1.72, + "eval_cer": 0.6652802420781065, + "eval_loss": 0.05473272502422333, + "eval_runtime": 90.6389, + "eval_samples_per_second": 110.317, + "eval_steps_per_second": 6.895, + "step": 68500 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004181594352184509, + "loss": 0.0607, + "step": 68510 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004177825792025727, + "loss": 0.0648, + "step": 68520 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004174057231866945, + "loss": 0.0613, + "step": 68530 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004170288671708163, + "loss": 0.0652, + "step": 68540 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004166520111549381, + "loss": 0.0624, + "step": 68550 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004162751551390599, + "loss": 0.0648, + "step": 68560 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004158982991231817, + "loss": 0.0624, + "step": 68570 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004155214431073035, + "loss": 0.0628, + "step": 68580 + }, + { + "epoch": 1.72, + "learning_rate": 0.00041514458709142533, + "loss": 0.0655, + "step": 68590 + }, + { + "epoch": 1.72, + "learning_rate": 0.00041476773107554713, + "loss": 0.0661, + "step": 68600 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004143908750596689, + "loss": 0.0627, + "step": 68610 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004140140190437907, + "loss": 0.063, + "step": 68620 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004136371630279125, + "loss": 0.0662, + "step": 68630 + }, + { + "epoch": 1.72, + "learning_rate": 0.0004132603070120342, + "loss": 0.0645, + "step": 68640 + }, + { + "epoch": 1.72, + "learning_rate": 0.00041288345099615607, + "loss": 0.062, + "step": 68650 + }, + { + "epoch": 1.72, + "learning_rate": 0.00041250659498027787, + "loss": 0.0633, + "step": 68660 + }, + { + "epoch": 1.73, + "learning_rate": 0.00041212973896439966, + "loss": 0.0664, + "step": 68670 + }, + { + "epoch": 1.73, + "learning_rate": 0.00041175288294852146, + "loss": 0.0625, + "step": 68680 + }, + { + "epoch": 1.73, + "learning_rate": 0.00041137602693264326, + "loss": 0.0637, + "step": 68690 + }, + { + "epoch": 1.73, + "learning_rate": 0.00041099917091676506, + "loss": 0.0653, + "step": 68700 + }, + { + "epoch": 1.73, + "learning_rate": 0.00041062231490088686, + "loss": 0.0622, + "step": 68710 + }, + { + "epoch": 1.73, + "learning_rate": 0.00041024545888500866, + "loss": 0.0637, + "step": 68720 + }, + { + "epoch": 1.73, + "learning_rate": 0.00040986860286913046, + "loss": 0.0634, + "step": 68730 + }, + { + "epoch": 1.73, + "learning_rate": 0.00040949174685325226, + "loss": 0.0658, + "step": 68740 + }, + { + "epoch": 1.73, + "learning_rate": 0.00040911489083737406, + "loss": 0.0646, + "step": 68750 + }, + { + "epoch": 1.73, + "learning_rate": 0.00040873803482149585, + "loss": 0.0644, + "step": 68760 + }, + { + "epoch": 1.73, + "learning_rate": 0.0004083611788056177, + "loss": 0.064, + "step": 68770 + }, + { + "epoch": 1.73, + "learning_rate": 0.0004079843227897395, + "loss": 0.0608, + "step": 68780 + }, + { + "epoch": 1.73, + "learning_rate": 0.0004076074667738613, + "loss": 0.0658, + "step": 68790 + }, + { + "epoch": 1.73, + "learning_rate": 0.0004072306107579831, + "loss": 0.0641, + "step": 68800 + }, + { + "epoch": 1.73, + "learning_rate": 0.0004068537547421049, + "loss": 0.0634, + "step": 68810 + }, + { + "epoch": 1.73, + "learning_rate": 0.0004064768987262267, + "loss": 0.0649, + "step": 68820 + }, + { + "epoch": 1.73, + "learning_rate": 0.0004061000427103485, + "loss": 0.0632, + "step": 68830 + }, + { + "epoch": 1.73, + "learning_rate": 0.0004057231866944703, + "loss": 0.0661, + "step": 68840 + }, + { + "epoch": 1.73, + "learning_rate": 0.0004053463306785921, + "loss": 0.065, + "step": 68850 + }, + { + "epoch": 1.73, + "learning_rate": 0.00040496947466271384, + "loss": 0.0658, + "step": 68860 + }, + { + "epoch": 1.73, + "learning_rate": 0.00040459261864683564, + "loss": 0.0654, + "step": 68870 + }, + { + "epoch": 1.73, + "learning_rate": 0.00040421576263095744, + "loss": 0.0607, + "step": 68880 + }, + { + "epoch": 1.73, + "learning_rate": 0.00040383890661507924, + "loss": 0.0647, + "step": 68890 + }, + { + "epoch": 1.73, + "learning_rate": 0.00040346205059920104, + "loss": 0.0608, + "step": 68900 + }, + { + "epoch": 1.73, + "learning_rate": 0.00040308519458332284, + "loss": 0.0642, + "step": 68910 + }, + { + "epoch": 1.73, + "learning_rate": 0.00040270833856744464, + "loss": 0.0664, + "step": 68920 + }, + { + "epoch": 1.73, + "learning_rate": 0.00040233148255156643, + "loss": 0.063, + "step": 68930 + }, + { + "epoch": 1.73, + "learning_rate": 0.0004019546265356883, + "loss": 0.0614, + "step": 68940 + }, + { + "epoch": 1.73, + "learning_rate": 0.0004015777705198101, + "loss": 0.0619, + "step": 68950 + }, + { + "epoch": 1.73, + "learning_rate": 0.0004012009145039319, + "loss": 0.064, + "step": 68960 + }, + { + "epoch": 1.73, + "learning_rate": 0.0004008240584880537, + "loss": 0.061, + "step": 68970 + }, + { + "epoch": 1.73, + "learning_rate": 0.0004004472024721755, + "loss": 0.0616, + "step": 68980 + }, + { + "epoch": 1.73, + "learning_rate": 0.0004000703464562973, + "loss": 0.0635, + "step": 68990 + }, + { + "epoch": 1.73, + "learning_rate": 0.0003996934904404191, + "loss": 0.0648, + "step": 69000 + }, + { + "epoch": 1.73, + "eval_cer": 0.6652388562694929, + "eval_loss": 0.05441926792263985, + "eval_runtime": 90.7649, + "eval_samples_per_second": 110.164, + "eval_steps_per_second": 6.886, + "step": 69000 + }, + { + "epoch": 1.73, + "learning_rate": 0.0003993166344245409, + "loss": 0.0631, + "step": 69010 + }, + { + "epoch": 1.73, + "learning_rate": 0.0003989397784086627, + "loss": 0.061, + "step": 69020 + }, + { + "epoch": 1.73, + "learning_rate": 0.0003985629223927845, + "loss": 0.0661, + "step": 69030 + }, + { + "epoch": 1.73, + "learning_rate": 0.0003981860663769063, + "loss": 0.068, + "step": 69040 + }, + { + "epoch": 1.73, + "learning_rate": 0.0003978092103610281, + "loss": 0.0634, + "step": 69050 + }, + { + "epoch": 1.74, + "learning_rate": 0.00039743235434514993, + "loss": 0.0636, + "step": 69060 + }, + { + "epoch": 1.74, + "learning_rate": 0.0003970554983292717, + "loss": 0.0637, + "step": 69070 + }, + { + "epoch": 1.74, + "learning_rate": 0.0003966786423133935, + "loss": 0.0637, + "step": 69080 + }, + { + "epoch": 1.74, + "learning_rate": 0.0003963017862975152, + "loss": 0.0616, + "step": 69090 + }, + { + "epoch": 1.74, + "learning_rate": 0.000395924930281637, + "loss": 0.0616, + "step": 69100 + }, + { + "epoch": 1.74, + "learning_rate": 0.0003955480742657588, + "loss": 0.0612, + "step": 69110 + }, + { + "epoch": 1.74, + "learning_rate": 0.00039517121824988067, + "loss": 0.0644, + "step": 69120 + }, + { + "epoch": 1.74, + "learning_rate": 0.00039479436223400247, + "loss": 0.0623, + "step": 69130 + }, + { + "epoch": 1.74, + "learning_rate": 0.00039441750621812426, + "loss": 0.0671, + "step": 69140 + }, + { + "epoch": 1.74, + "learning_rate": 0.00039404065020224606, + "loss": 0.0638, + "step": 69150 + }, + { + "epoch": 1.74, + "learning_rate": 0.00039366379418636786, + "loss": 0.0653, + "step": 69160 + }, + { + "epoch": 1.74, + "learning_rate": 0.00039328693817048966, + "loss": 0.0618, + "step": 69170 + }, + { + "epoch": 1.74, + "learning_rate": 0.00039291008215461146, + "loss": 0.0682, + "step": 69180 + }, + { + "epoch": 1.74, + "learning_rate": 0.00039253322613873326, + "loss": 0.066, + "step": 69190 + }, + { + "epoch": 1.74, + "learning_rate": 0.00039215637012285506, + "loss": 0.0612, + "step": 69200 + }, + { + "epoch": 1.74, + "learning_rate": 0.00039177951410697686, + "loss": 0.0609, + "step": 69210 + }, + { + "epoch": 1.74, + "learning_rate": 0.00039140265809109866, + "loss": 0.0658, + "step": 69220 + }, + { + "epoch": 1.74, + "learning_rate": 0.0003910258020752205, + "loss": 0.0637, + "step": 69230 + }, + { + "epoch": 1.74, + "learning_rate": 0.0003906489460593423, + "loss": 0.0654, + "step": 69240 + }, + { + "epoch": 1.74, + "learning_rate": 0.0003902720900434641, + "loss": 0.0591, + "step": 69250 + }, + { + "epoch": 1.74, + "learning_rate": 0.0003898952340275859, + "loss": 0.067, + "step": 69260 + }, + { + "epoch": 1.74, + "learning_rate": 0.0003895183780117077, + "loss": 0.0627, + "step": 69270 + }, + { + "epoch": 1.74, + "learning_rate": 0.0003891415219958295, + "loss": 0.064, + "step": 69280 + }, + { + "epoch": 1.74, + "learning_rate": 0.0003887646659799513, + "loss": 0.0615, + "step": 69290 + }, + { + "epoch": 1.74, + "learning_rate": 0.0003883878099640731, + "loss": 0.0631, + "step": 69300 + }, + { + "epoch": 1.74, + "learning_rate": 0.00038801095394819484, + "loss": 0.0646, + "step": 69310 + }, + { + "epoch": 1.74, + "learning_rate": 0.00038763409793231664, + "loss": 0.0618, + "step": 69320 + }, + { + "epoch": 1.74, + "learning_rate": 0.00038725724191643844, + "loss": 0.0627, + "step": 69330 + }, + { + "epoch": 1.74, + "learning_rate": 0.00038688038590056024, + "loss": 0.0637, + "step": 69340 + }, + { + "epoch": 1.74, + "learning_rate": 0.00038650352988468204, + "loss": 0.066, + "step": 69350 + }, + { + "epoch": 1.74, + "learning_rate": 0.00038612667386880384, + "loss": 0.0635, + "step": 69360 + }, + { + "epoch": 1.74, + "learning_rate": 0.00038574981785292564, + "loss": 0.0645, + "step": 69370 + }, + { + "epoch": 1.74, + "learning_rate": 0.00038537296183704744, + "loss": 0.0632, + "step": 69380 + }, + { + "epoch": 1.74, + "learning_rate": 0.00038499610582116924, + "loss": 0.0679, + "step": 69390 + }, + { + "epoch": 1.74, + "learning_rate": 0.00038461924980529103, + "loss": 0.0631, + "step": 69400 + }, + { + "epoch": 1.74, + "learning_rate": 0.0003842423937894129, + "loss": 0.0632, + "step": 69410 + }, + { + "epoch": 1.74, + "learning_rate": 0.0003838655377735347, + "loss": 0.0607, + "step": 69420 + }, + { + "epoch": 1.74, + "learning_rate": 0.0003834886817576565, + "loss": 0.061, + "step": 69430 + }, + { + "epoch": 1.74, + "learning_rate": 0.0003831118257417783, + "loss": 0.0644, + "step": 69440 + }, + { + "epoch": 1.74, + "learning_rate": 0.0003827349697259001, + "loss": 0.0632, + "step": 69450 + }, + { + "epoch": 1.75, + "learning_rate": 0.0003823581137100219, + "loss": 0.0652, + "step": 69460 + }, + { + "epoch": 1.75, + "learning_rate": 0.0003819812576941437, + "loss": 0.0638, + "step": 69470 + }, + { + "epoch": 1.75, + "learning_rate": 0.0003816044016782655, + "loss": 0.0644, + "step": 69480 + }, + { + "epoch": 1.75, + "learning_rate": 0.0003812275456623873, + "loss": 0.0632, + "step": 69490 + }, + { + "epoch": 1.75, + "learning_rate": 0.0003808506896465091, + "loss": 0.0634, + "step": 69500 + }, + { + "epoch": 1.75, + "eval_cer": 0.6652205695168496, + "eval_loss": 0.05466347932815552, + "eval_runtime": 90.7872, + "eval_samples_per_second": 110.137, + "eval_steps_per_second": 6.884, + "step": 69500 + }, + { + "epoch": 1.75, + "learning_rate": 0.0003804738336306309, + "loss": 0.0635, + "step": 69510 + }, + { + "epoch": 1.75, + "learning_rate": 0.00038009697761475273, + "loss": 0.0631, + "step": 69520 + }, + { + "epoch": 1.75, + "learning_rate": 0.0003797201215988744, + "loss": 0.0653, + "step": 69530 + }, + { + "epoch": 1.75, + "learning_rate": 0.0003793432655829962, + "loss": 0.0644, + "step": 69540 + }, + { + "epoch": 1.75, + "learning_rate": 0.000378966409567118, + "loss": 0.0607, + "step": 69550 + }, + { + "epoch": 1.75, + "learning_rate": 0.0003785895535512398, + "loss": 0.0663, + "step": 69560 + }, + { + "epoch": 1.75, + "learning_rate": 0.0003782126975353616, + "loss": 0.0646, + "step": 69570 + }, + { + "epoch": 1.75, + "learning_rate": 0.00037783584151948347, + "loss": 0.0633, + "step": 69580 + }, + { + "epoch": 1.75, + "learning_rate": 0.00037745898550360527, + "loss": 0.064, + "step": 69590 + }, + { + "epoch": 1.75, + "learning_rate": 0.00037708212948772707, + "loss": 0.0619, + "step": 69600 + }, + { + "epoch": 1.75, + "learning_rate": 0.00037670527347184886, + "loss": 0.06, + "step": 69610 + }, + { + "epoch": 1.75, + "learning_rate": 0.00037632841745597066, + "loss": 0.0627, + "step": 69620 + }, + { + "epoch": 1.75, + "learning_rate": 0.00037595156144009246, + "loss": 0.0618, + "step": 69630 + }, + { + "epoch": 1.75, + "learning_rate": 0.00037557470542421426, + "loss": 0.0643, + "step": 69640 + }, + { + "epoch": 1.75, + "learning_rate": 0.00037519784940833606, + "loss": 0.0647, + "step": 69650 + }, + { + "epoch": 1.75, + "learning_rate": 0.00037482099339245786, + "loss": 0.0622, + "step": 69660 + }, + { + "epoch": 1.75, + "learning_rate": 0.00037444413737657966, + "loss": 0.0646, + "step": 69670 + }, + { + "epoch": 1.75, + "learning_rate": 0.00037406728136070146, + "loss": 0.0632, + "step": 69680 + }, + { + "epoch": 1.75, + "learning_rate": 0.00037369042534482325, + "loss": 0.0615, + "step": 69690 + }, + { + "epoch": 1.75, + "learning_rate": 0.00037331356932894505, + "loss": 0.0654, + "step": 69700 + }, + { + "epoch": 1.75, + "learning_rate": 0.00037293671331306685, + "loss": 0.0621, + "step": 69710 + }, + { + "epoch": 1.75, + "learning_rate": 0.00037255985729718865, + "loss": 0.0611, + "step": 69720 + }, + { + "epoch": 1.75, + "learning_rate": 0.00037218300128131045, + "loss": 0.0651, + "step": 69730 + }, + { + "epoch": 1.75, + "learning_rate": 0.00037180614526543225, + "loss": 0.0624, + "step": 69740 + }, + { + "epoch": 1.75, + "learning_rate": 0.00037142928924955405, + "loss": 0.0651, + "step": 69750 + }, + { + "epoch": 1.75, + "learning_rate": 0.00037105243323367585, + "loss": 0.0625, + "step": 69760 + }, + { + "epoch": 1.75, + "learning_rate": 0.00037067557721779765, + "loss": 0.0627, + "step": 69770 + }, + { + "epoch": 1.75, + "learning_rate": 0.0003702987212019195, + "loss": 0.0657, + "step": 69780 + }, + { + "epoch": 1.75, + "learning_rate": 0.0003699218651860413, + "loss": 0.0654, + "step": 69790 + }, + { + "epoch": 1.75, + "learning_rate": 0.0003695450091701631, + "loss": 0.0615, + "step": 69800 + }, + { + "epoch": 1.75, + "learning_rate": 0.00036916815315428484, + "loss": 0.0639, + "step": 69810 + }, + { + "epoch": 1.75, + "learning_rate": 0.00036879129713840664, + "loss": 0.0629, + "step": 69820 + }, + { + "epoch": 1.75, + "learning_rate": 0.00036841444112252844, + "loss": 0.0632, + "step": 69830 + }, + { + "epoch": 1.75, + "learning_rate": 0.00036803758510665024, + "loss": 0.0595, + "step": 69840 + }, + { + "epoch": 1.75, + "learning_rate": 0.00036766072909077204, + "loss": 0.0634, + "step": 69850 + }, + { + "epoch": 1.76, + "learning_rate": 0.00036728387307489383, + "loss": 0.0647, + "step": 69860 + }, + { + "epoch": 1.76, + "learning_rate": 0.0003669070170590157, + "loss": 0.0643, + "step": 69870 + }, + { + "epoch": 1.76, + "learning_rate": 0.0003665301610431375, + "loss": 0.0602, + "step": 69880 + }, + { + "epoch": 1.76, + "learning_rate": 0.0003661533050272593, + "loss": 0.065, + "step": 69890 + }, + { + "epoch": 1.76, + "learning_rate": 0.0003657764490113811, + "loss": 0.0646, + "step": 69900 + }, + { + "epoch": 1.76, + "learning_rate": 0.0003653995929955029, + "loss": 0.0644, + "step": 69910 + }, + { + "epoch": 1.76, + "learning_rate": 0.00036502273697962463, + "loss": 0.0673, + "step": 69920 + }, + { + "epoch": 1.76, + "learning_rate": 0.0003646458809637464, + "loss": 0.0615, + "step": 69930 + }, + { + "epoch": 1.76, + "learning_rate": 0.0003642690249478682, + "loss": 0.0612, + "step": 69940 + }, + { + "epoch": 1.76, + "learning_rate": 0.00036389216893199, + "loss": 0.0609, + "step": 69950 + }, + { + "epoch": 1.76, + "learning_rate": 0.0003635153129161119, + "loss": 0.0653, + "step": 69960 + }, + { + "epoch": 1.76, + "learning_rate": 0.0003631384569002337, + "loss": 0.0605, + "step": 69970 + }, + { + "epoch": 1.76, + "learning_rate": 0.0003627616008843555, + "loss": 0.064, + "step": 69980 + }, + { + "epoch": 1.76, + "learning_rate": 0.0003623847448684773, + "loss": 0.0625, + "step": 69990 + }, + { + "epoch": 1.76, + "learning_rate": 0.00036200788885259907, + "loss": 0.0642, + "step": 70000 + }, + { + "epoch": 1.76, + "eval_cer": 0.6653692696896594, + "eval_loss": 0.054389722645282745, + "eval_runtime": 90.734, + "eval_samples_per_second": 110.201, + "eval_steps_per_second": 6.888, + "step": 70000 + }, + { + "epoch": 1.76, + "learning_rate": 0.00036163103283672087, + "loss": 0.0622, + "step": 70010 + }, + { + "epoch": 1.76, + "learning_rate": 0.00036125417682084267, + "loss": 0.0612, + "step": 70020 + }, + { + "epoch": 1.76, + "learning_rate": 0.0003608773208049644, + "loss": 0.0615, + "step": 70030 + }, + { + "epoch": 1.76, + "learning_rate": 0.0003605004647890862, + "loss": 0.0621, + "step": 70040 + }, + { + "epoch": 1.76, + "learning_rate": 0.00036012360877320807, + "loss": 0.0629, + "step": 70050 + }, + { + "epoch": 1.76, + "learning_rate": 0.00035974675275732987, + "loss": 0.0632, + "step": 70060 + }, + { + "epoch": 1.76, + "learning_rate": 0.00035936989674145166, + "loss": 0.0636, + "step": 70070 + }, + { + "epoch": 1.76, + "learning_rate": 0.00035899304072557346, + "loss": 0.0664, + "step": 70080 + }, + { + "epoch": 1.76, + "learning_rate": 0.00035861618470969526, + "loss": 0.0626, + "step": 70090 + }, + { + "epoch": 1.76, + "learning_rate": 0.00035823932869381706, + "loss": 0.0607, + "step": 70100 + }, + { + "epoch": 1.76, + "learning_rate": 0.00035786247267793886, + "loss": 0.0632, + "step": 70110 + }, + { + "epoch": 1.76, + "learning_rate": 0.00035748561666206066, + "loss": 0.0652, + "step": 70120 + }, + { + "epoch": 1.76, + "learning_rate": 0.00035710876064618246, + "loss": 0.0649, + "step": 70130 + }, + { + "epoch": 1.76, + "learning_rate": 0.00035673190463030426, + "loss": 0.0622, + "step": 70140 + }, + { + "epoch": 1.76, + "learning_rate": 0.00035635504861442606, + "loss": 0.0669, + "step": 70150 + }, + { + "epoch": 1.76, + "learning_rate": 0.00035597819259854785, + "loss": 0.0627, + "step": 70160 + }, + { + "epoch": 1.76, + "learning_rate": 0.00035560133658266965, + "loss": 0.0651, + "step": 70170 + }, + { + "epoch": 1.76, + "learning_rate": 0.00035522448056679145, + "loss": 0.0624, + "step": 70180 + }, + { + "epoch": 1.76, + "learning_rate": 0.00035484762455091325, + "loss": 0.0621, + "step": 70190 + }, + { + "epoch": 1.76, + "learning_rate": 0.00035447076853503505, + "loss": 0.0648, + "step": 70200 + }, + { + "epoch": 1.76, + "learning_rate": 0.00035409391251915685, + "loss": 0.0621, + "step": 70210 + }, + { + "epoch": 1.76, + "learning_rate": 0.00035371705650327865, + "loss": 0.0623, + "step": 70220 + }, + { + "epoch": 1.76, + "learning_rate": 0.00035334020048740045, + "loss": 0.0631, + "step": 70230 + }, + { + "epoch": 1.76, + "learning_rate": 0.00035296334447152224, + "loss": 0.0619, + "step": 70240 + }, + { + "epoch": 1.76, + "learning_rate": 0.0003525864884556441, + "loss": 0.0611, + "step": 70250 + }, + { + "epoch": 1.77, + "learning_rate": 0.00035220963243976584, + "loss": 0.0656, + "step": 70260 + }, + { + "epoch": 1.77, + "learning_rate": 0.00035183277642388764, + "loss": 0.0644, + "step": 70270 + }, + { + "epoch": 1.77, + "learning_rate": 0.00035145592040800944, + "loss": 0.0662, + "step": 70280 + }, + { + "epoch": 1.77, + "learning_rate": 0.00035107906439213124, + "loss": 0.0625, + "step": 70290 + }, + { + "epoch": 1.77, + "learning_rate": 0.00035070220837625304, + "loss": 0.0634, + "step": 70300 + }, + { + "epoch": 1.77, + "learning_rate": 0.00035032535236037484, + "loss": 0.0604, + "step": 70310 + }, + { + "epoch": 1.77, + "learning_rate": 0.00034994849634449664, + "loss": 0.0602, + "step": 70320 + }, + { + "epoch": 1.77, + "learning_rate": 0.0003495716403286185, + "loss": 0.0634, + "step": 70330 + }, + { + "epoch": 1.77, + "learning_rate": 0.0003491947843127403, + "loss": 0.0613, + "step": 70340 + }, + { + "epoch": 1.77, + "learning_rate": 0.0003488179282968621, + "loss": 0.0648, + "step": 70350 + }, + { + "epoch": 1.77, + "learning_rate": 0.0003484410722809839, + "loss": 0.0603, + "step": 70360 + }, + { + "epoch": 1.77, + "learning_rate": 0.00034806421626510563, + "loss": 0.0621, + "step": 70370 + }, + { + "epoch": 1.77, + "learning_rate": 0.00034768736024922743, + "loss": 0.0659, + "step": 70380 + }, + { + "epoch": 1.77, + "learning_rate": 0.00034731050423334923, + "loss": 0.0619, + "step": 70390 + }, + { + "epoch": 1.77, + "learning_rate": 0.000346933648217471, + "loss": 0.0652, + "step": 70400 + }, + { + "epoch": 1.77, + "learning_rate": 0.0003465567922015928, + "loss": 0.0612, + "step": 70410 + }, + { + "epoch": 1.77, + "learning_rate": 0.0003461799361857147, + "loss": 0.0631, + "step": 70420 + }, + { + "epoch": 1.77, + "learning_rate": 0.0003458030801698365, + "loss": 0.0613, + "step": 70430 + }, + { + "epoch": 1.77, + "learning_rate": 0.0003454262241539583, + "loss": 0.0624, + "step": 70440 + }, + { + "epoch": 1.77, + "learning_rate": 0.0003450493681380801, + "loss": 0.0639, + "step": 70450 + }, + { + "epoch": 1.77, + "learning_rate": 0.0003446725121222019, + "loss": 0.0672, + "step": 70460 + }, + { + "epoch": 1.77, + "learning_rate": 0.00034429565610632367, + "loss": 0.0618, + "step": 70470 + }, + { + "epoch": 1.77, + "learning_rate": 0.0003439188000904454, + "loss": 0.0622, + "step": 70480 + }, + { + "epoch": 1.77, + "learning_rate": 0.0003435419440745672, + "loss": 0.0607, + "step": 70490 + }, + { + "epoch": 1.77, + "learning_rate": 0.000343165088058689, + "loss": 0.0649, + "step": 70500 + }, + { + "epoch": 1.77, + "eval_cer": 0.66524366857282, + "eval_loss": 0.054241545498371124, + "eval_runtime": 90.7441, + "eval_samples_per_second": 110.189, + "eval_steps_per_second": 6.887, + "step": 70500 + }, + { + "epoch": 1.77, + "learning_rate": 0.00034278823204281087, + "loss": 0.0606, + "step": 70510 + }, + { + "epoch": 1.77, + "learning_rate": 0.00034241137602693267, + "loss": 0.0609, + "step": 70520 + }, + { + "epoch": 1.77, + "learning_rate": 0.00034203452001105447, + "loss": 0.0649, + "step": 70530 + }, + { + "epoch": 1.77, + "learning_rate": 0.00034165766399517626, + "loss": 0.0642, + "step": 70540 + }, + { + "epoch": 1.77, + "learning_rate": 0.00034128080797929806, + "loss": 0.0622, + "step": 70550 + }, + { + "epoch": 1.77, + "learning_rate": 0.00034090395196341986, + "loss": 0.065, + "step": 70560 + }, + { + "epoch": 1.77, + "learning_rate": 0.00034052709594754166, + "loss": 0.0619, + "step": 70570 + }, + { + "epoch": 1.77, + "learning_rate": 0.00034015023993166346, + "loss": 0.0651, + "step": 70580 + }, + { + "epoch": 1.77, + "learning_rate": 0.0003397733839157852, + "loss": 0.0682, + "step": 70590 + }, + { + "epoch": 1.77, + "learning_rate": 0.00033939652789990706, + "loss": 0.0646, + "step": 70600 + }, + { + "epoch": 1.77, + "learning_rate": 0.00033901967188402886, + "loss": 0.0616, + "step": 70610 + }, + { + "epoch": 1.77, + "learning_rate": 0.00033864281586815065, + "loss": 0.0637, + "step": 70620 + }, + { + "epoch": 1.77, + "learning_rate": 0.00033826595985227245, + "loss": 0.0624, + "step": 70630 + }, + { + "epoch": 1.77, + "learning_rate": 0.00033788910383639425, + "loss": 0.0632, + "step": 70640 + }, + { + "epoch": 1.77, + "learning_rate": 0.00033751224782051605, + "loss": 0.0624, + "step": 70650 + }, + { + "epoch": 1.78, + "learning_rate": 0.00033713539180463785, + "loss": 0.0621, + "step": 70660 + }, + { + "epoch": 1.78, + "learning_rate": 0.00033675853578875965, + "loss": 0.0638, + "step": 70670 + }, + { + "epoch": 1.78, + "learning_rate": 0.00033638167977288145, + "loss": 0.0678, + "step": 70680 + }, + { + "epoch": 1.78, + "learning_rate": 0.00033600482375700325, + "loss": 0.0651, + "step": 70690 + }, + { + "epoch": 1.78, + "learning_rate": 0.00033562796774112505, + "loss": 0.0675, + "step": 70700 + }, + { + "epoch": 1.78, + "learning_rate": 0.00033525111172524684, + "loss": 0.0615, + "step": 70710 + }, + { + "epoch": 1.78, + "learning_rate": 0.00033487425570936864, + "loss": 0.0636, + "step": 70720 + }, + { + "epoch": 1.78, + "learning_rate": 0.00033449739969349044, + "loss": 0.0627, + "step": 70730 + }, + { + "epoch": 1.78, + "learning_rate": 0.00033412054367761224, + "loss": 0.0677, + "step": 70740 + }, + { + "epoch": 1.78, + "learning_rate": 0.00033374368766173404, + "loss": 0.0682, + "step": 70750 + }, + { + "epoch": 1.78, + "learning_rate": 0.00033336683164585584, + "loss": 0.0618, + "step": 70760 + }, + { + "epoch": 1.78, + "learning_rate": 0.00033298997562997764, + "loss": 0.064, + "step": 70770 + }, + { + "epoch": 1.78, + "learning_rate": 0.00033261311961409944, + "loss": 0.0645, + "step": 70780 + }, + { + "epoch": 1.78, + "learning_rate": 0.00033223626359822124, + "loss": 0.0644, + "step": 70790 + }, + { + "epoch": 1.78, + "learning_rate": 0.0003318594075823431, + "loss": 0.0653, + "step": 70800 + }, + { + "epoch": 1.78, + "learning_rate": 0.00033148255156646483, + "loss": 0.0629, + "step": 70810 + }, + { + "epoch": 1.78, + "learning_rate": 0.00033110569555058663, + "loss": 0.0617, + "step": 70820 + }, + { + "epoch": 1.78, + "learning_rate": 0.00033072883953470843, + "loss": 0.062, + "step": 70830 + }, + { + "epoch": 1.78, + "learning_rate": 0.00033035198351883023, + "loss": 0.0629, + "step": 70840 + }, + { + "epoch": 1.78, + "learning_rate": 0.00032997512750295203, + "loss": 0.0628, + "step": 70850 + }, + { + "epoch": 1.78, + "learning_rate": 0.0003295982714870738, + "loss": 0.0653, + "step": 70860 + }, + { + "epoch": 1.78, + "learning_rate": 0.0003292214154711956, + "loss": 0.0627, + "step": 70870 + }, + { + "epoch": 1.78, + "learning_rate": 0.0003288445594553175, + "loss": 0.0641, + "step": 70880 + }, + { + "epoch": 1.78, + "learning_rate": 0.0003284677034394393, + "loss": 0.0656, + "step": 70890 + }, + { + "epoch": 1.78, + "learning_rate": 0.0003280908474235611, + "loss": 0.0652, + "step": 70900 + }, + { + "epoch": 1.78, + "learning_rate": 0.0003277139914076829, + "loss": 0.0614, + "step": 70910 + }, + { + "epoch": 1.78, + "learning_rate": 0.0003273371353918046, + "loss": 0.0635, + "step": 70920 + }, + { + "epoch": 1.78, + "learning_rate": 0.0003269602793759264, + "loss": 0.0615, + "step": 70930 + }, + { + "epoch": 1.78, + "learning_rate": 0.0003265834233600482, + "loss": 0.0628, + "step": 70940 + }, + { + "epoch": 1.78, + "learning_rate": 0.00032620656734417, + "loss": 0.0638, + "step": 70950 + }, + { + "epoch": 1.78, + "learning_rate": 0.0003258297113282918, + "loss": 0.0637, + "step": 70960 + }, + { + "epoch": 1.78, + "learning_rate": 0.00032545285531241367, + "loss": 0.0605, + "step": 70970 + }, + { + "epoch": 1.78, + "learning_rate": 0.00032507599929653547, + "loss": 0.0628, + "step": 70980 + }, + { + "epoch": 1.78, + "learning_rate": 0.00032469914328065727, + "loss": 0.0627, + "step": 70990 + }, + { + "epoch": 1.78, + "learning_rate": 0.00032432228726477906, + "loss": 0.0641, + "step": 71000 + }, + { + "epoch": 1.78, + "eval_cer": 0.6652013203035408, + "eval_loss": 0.053951624780893326, + "eval_runtime": 90.7661, + "eval_samples_per_second": 110.162, + "eval_steps_per_second": 6.886, + "step": 71000 + }, + { + "epoch": 1.78, + "learning_rate": 0.00032394543124890086, + "loss": 0.0643, + "step": 71010 + }, + { + "epoch": 1.78, + "learning_rate": 0.00032356857523302266, + "loss": 0.0586, + "step": 71020 + }, + { + "epoch": 1.78, + "learning_rate": 0.0003231917192171444, + "loss": 0.0624, + "step": 71030 + }, + { + "epoch": 1.78, + "learning_rate": 0.0003228148632012662, + "loss": 0.0617, + "step": 71040 + }, + { + "epoch": 1.79, + "learning_rate": 0.000322438007185388, + "loss": 0.0641, + "step": 71050 + }, + { + "epoch": 1.79, + "learning_rate": 0.00032206115116950986, + "loss": 0.062, + "step": 71060 + }, + { + "epoch": 1.79, + "learning_rate": 0.00032168429515363166, + "loss": 0.0642, + "step": 71070 + }, + { + "epoch": 1.79, + "learning_rate": 0.00032130743913775346, + "loss": 0.0607, + "step": 71080 + }, + { + "epoch": 1.79, + "learning_rate": 0.00032093058312187525, + "loss": 0.0608, + "step": 71090 + }, + { + "epoch": 1.79, + "learning_rate": 0.00032055372710599705, + "loss": 0.0588, + "step": 71100 + }, + { + "epoch": 1.79, + "learning_rate": 0.00032017687109011885, + "loss": 0.0639, + "step": 71110 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031980001507424065, + "loss": 0.0629, + "step": 71120 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031942315905836245, + "loss": 0.0616, + "step": 71130 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031904630304248425, + "loss": 0.0612, + "step": 71140 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031866944702660605, + "loss": 0.0648, + "step": 71150 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031829259101072785, + "loss": 0.0631, + "step": 71160 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031791573499484965, + "loss": 0.0609, + "step": 71170 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031753887897897144, + "loss": 0.0603, + "step": 71180 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031716202296309324, + "loss": 0.0636, + "step": 71190 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031678516694721504, + "loss": 0.0587, + "step": 71200 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031640831093133684, + "loss": 0.0612, + "step": 71210 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031603145491545864, + "loss": 0.0611, + "step": 71220 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031565459889958044, + "loss": 0.063, + "step": 71230 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031527774288370224, + "loss": 0.0617, + "step": 71240 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031490088686782404, + "loss": 0.0621, + "step": 71250 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031452403085194583, + "loss": 0.0598, + "step": 71260 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031414717483606763, + "loss": 0.0627, + "step": 71270 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031377031882018943, + "loss": 0.0653, + "step": 71280 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031339346280431123, + "loss": 0.059, + "step": 71290 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031301660678843303, + "loss": 0.0609, + "step": 71300 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031263975077255483, + "loss": 0.0641, + "step": 71310 + }, + { + "epoch": 1.79, + "learning_rate": 0.00031226289475667663, + "loss": 0.0651, + "step": 71320 + }, + { + "epoch": 1.79, + "learning_rate": 0.0003118860387407984, + "loss": 0.063, + "step": 71330 + }, + { + "epoch": 1.79, + "learning_rate": 0.0003115091827249202, + "loss": 0.0604, + "step": 71340 + }, + { + "epoch": 1.79, + "learning_rate": 0.0003111323267090421, + "loss": 0.0629, + "step": 71350 + }, + { + "epoch": 1.79, + "learning_rate": 0.0003107554706931639, + "loss": 0.0601, + "step": 71360 + }, + { + "epoch": 1.79, + "learning_rate": 0.0003103786146772856, + "loss": 0.0604, + "step": 71370 + }, + { + "epoch": 1.79, + "learning_rate": 0.0003100017586614074, + "loss": 0.0625, + "step": 71380 + }, + { + "epoch": 1.79, + "learning_rate": 0.0003096249026455292, + "loss": 0.0602, + "step": 71390 + }, + { + "epoch": 1.79, + "learning_rate": 0.000309248046629651, + "loss": 0.064, + "step": 71400 + }, + { + "epoch": 1.79, + "learning_rate": 0.0003088711906137728, + "loss": 0.0646, + "step": 71410 + }, + { + "epoch": 1.79, + "learning_rate": 0.0003084943345978946, + "loss": 0.0625, + "step": 71420 + }, + { + "epoch": 1.79, + "learning_rate": 0.0003081174785820164, + "loss": 0.0599, + "step": 71430 + }, + { + "epoch": 1.79, + "learning_rate": 0.00030774062256613827, + "loss": 0.0649, + "step": 71440 + }, + { + "epoch": 1.8, + "learning_rate": 0.00030736376655026007, + "loss": 0.0652, + "step": 71450 + }, + { + "epoch": 1.8, + "learning_rate": 0.00030698691053438187, + "loss": 0.063, + "step": 71460 + }, + { + "epoch": 1.8, + "learning_rate": 0.00030661005451850366, + "loss": 0.0613, + "step": 71470 + }, + { + "epoch": 1.8, + "learning_rate": 0.0003062331985026254, + "loss": 0.0652, + "step": 71480 + }, + { + "epoch": 1.8, + "learning_rate": 0.0003058563424867472, + "loss": 0.062, + "step": 71490 + }, + { + "epoch": 1.8, + "learning_rate": 0.000305479486470869, + "loss": 0.0659, + "step": 71500 + }, + { + "epoch": 1.8, + "eval_cer": 0.6653043035947425, + "eval_loss": 0.05395006760954857, + "eval_runtime": 90.8279, + "eval_samples_per_second": 110.087, + "eval_steps_per_second": 6.881, + "step": 71500 + }, + { + "epoch": 1.8, + "learning_rate": 0.0003051026304549908, + "loss": 0.0621, + "step": 71510 + }, + { + "epoch": 1.8, + "learning_rate": 0.00030472577443911266, + "loss": 0.059, + "step": 71520 + }, + { + "epoch": 1.8, + "learning_rate": 0.00030434891842323446, + "loss": 0.0615, + "step": 71530 + }, + { + "epoch": 1.8, + "learning_rate": 0.00030397206240735626, + "loss": 0.0614, + "step": 71540 + }, + { + "epoch": 1.8, + "learning_rate": 0.00030359520639147806, + "loss": 0.0612, + "step": 71550 + }, + { + "epoch": 1.8, + "learning_rate": 0.00030321835037559985, + "loss": 0.0659, + "step": 71560 + }, + { + "epoch": 1.8, + "learning_rate": 0.00030284149435972165, + "loss": 0.0637, + "step": 71570 + }, + { + "epoch": 1.8, + "learning_rate": 0.00030246463834384345, + "loss": 0.063, + "step": 71580 + }, + { + "epoch": 1.8, + "learning_rate": 0.0003020877823279652, + "loss": 0.0588, + "step": 71590 + }, + { + "epoch": 1.8, + "learning_rate": 0.000301710926312087, + "loss": 0.0634, + "step": 71600 + }, + { + "epoch": 1.8, + "learning_rate": 0.00030133407029620885, + "loss": 0.0591, + "step": 71610 + }, + { + "epoch": 1.8, + "learning_rate": 0.00030095721428033065, + "loss": 0.0631, + "step": 71620 + }, + { + "epoch": 1.8, + "learning_rate": 0.00030058035826445245, + "loss": 0.0608, + "step": 71630 + }, + { + "epoch": 1.8, + "learning_rate": 0.00030020350224857424, + "loss": 0.0653, + "step": 71640 + }, + { + "epoch": 1.8, + "learning_rate": 0.00029982664623269604, + "loss": 0.065, + "step": 71650 + }, + { + "epoch": 1.8, + "learning_rate": 0.00029944979021681784, + "loss": 0.0664, + "step": 71660 + }, + { + "epoch": 1.8, + "learning_rate": 0.00029907293420093964, + "loss": 0.064, + "step": 71670 + }, + { + "epoch": 1.8, + "learning_rate": 0.00029869607818506144, + "loss": 0.0653, + "step": 71680 + }, + { + "epoch": 1.8, + "learning_rate": 0.00029831922216918324, + "loss": 0.0609, + "step": 71690 + }, + { + "epoch": 1.8, + "learning_rate": 0.00029794236615330504, + "loss": 0.06, + "step": 71700 + }, + { + "epoch": 1.8, + "learning_rate": 0.00029756551013742684, + "loss": 0.0614, + "step": 71710 + }, + { + "epoch": 1.8, + "learning_rate": 0.00029718865412154864, + "loss": 0.0588, + "step": 71720 + }, + { + "epoch": 1.8, + "learning_rate": 0.00029681179810567043, + "loss": 0.0643, + "step": 71730 + }, + { + "epoch": 1.8, + "learning_rate": 0.00029643494208979223, + "loss": 0.0627, + "step": 71740 + }, + { + "epoch": 1.8, + "learning_rate": 0.00029605808607391403, + "loss": 0.0608, + "step": 71750 + }, + { + "epoch": 1.8, + "learning_rate": 0.00029568123005803583, + "loss": 0.0638, + "step": 71760 + }, + { + "epoch": 1.8, + "learning_rate": 0.00029530437404215763, + "loss": 0.063, + "step": 71770 + }, + { + "epoch": 1.8, + "learning_rate": 0.00029492751802627943, + "loss": 0.064, + "step": 71780 + }, + { + "epoch": 1.8, + "learning_rate": 0.00029455066201040123, + "loss": 0.0607, + "step": 71790 + }, + { + "epoch": 1.8, + "learning_rate": 0.000294173805994523, + "loss": 0.0645, + "step": 71800 + }, + { + "epoch": 1.8, + "learning_rate": 0.0002937969499786448, + "loss": 0.0607, + "step": 71810 + }, + { + "epoch": 1.8, + "learning_rate": 0.0002934200939627666, + "loss": 0.0641, + "step": 71820 + }, + { + "epoch": 1.8, + "learning_rate": 0.0002930432379468884, + "loss": 0.0632, + "step": 71830 + }, + { + "epoch": 1.8, + "learning_rate": 0.0002926663819310102, + "loss": 0.065, + "step": 71840 + }, + { + "epoch": 1.81, + "learning_rate": 0.000292289525915132, + "loss": 0.0644, + "step": 71850 + }, + { + "epoch": 1.81, + "learning_rate": 0.0002919126698992538, + "loss": 0.0651, + "step": 71860 + }, + { + "epoch": 1.81, + "learning_rate": 0.0002915358138833756, + "loss": 0.0606, + "step": 71870 + }, + { + "epoch": 1.81, + "learning_rate": 0.0002911589578674974, + "loss": 0.0585, + "step": 71880 + }, + { + "epoch": 1.81, + "learning_rate": 0.0002907821018516192, + "loss": 0.0641, + "step": 71890 + }, + { + "epoch": 1.81, + "learning_rate": 0.00029040524583574107, + "loss": 0.0615, + "step": 71900 + }, + { + "epoch": 1.81, + "learning_rate": 0.00029002838981986287, + "loss": 0.0648, + "step": 71910 + }, + { + "epoch": 1.81, + "learning_rate": 0.0002896515338039846, + "loss": 0.0629, + "step": 71920 + }, + { + "epoch": 1.81, + "learning_rate": 0.0002892746777881064, + "loss": 0.0605, + "step": 71930 + }, + { + "epoch": 1.81, + "learning_rate": 0.0002888978217722282, + "loss": 0.0626, + "step": 71940 + }, + { + "epoch": 1.81, + "learning_rate": 0.00028852096575635, + "loss": 0.0632, + "step": 71950 + }, + { + "epoch": 1.81, + "learning_rate": 0.0002881441097404718, + "loss": 0.0635, + "step": 71960 + }, + { + "epoch": 1.81, + "learning_rate": 0.0002877672537245936, + "loss": 0.0633, + "step": 71970 + }, + { + "epoch": 1.81, + "learning_rate": 0.0002873903977087154, + "loss": 0.0655, + "step": 71980 + }, + { + "epoch": 1.81, + "learning_rate": 0.00028701354169283726, + "loss": 0.0627, + "step": 71990 + }, + { + "epoch": 1.81, + "learning_rate": 0.00028663668567695906, + "loss": 0.0651, + "step": 72000 + }, + { + "epoch": 1.81, + "eval_cer": 0.6652186445955187, + "eval_loss": 0.053641460835933685, + "eval_runtime": 90.6025, + "eval_samples_per_second": 110.361, + "eval_steps_per_second": 6.898, + "step": 72000 + }, + { + "epoch": 1.81, + "learning_rate": 0.00028625982966108086, + "loss": 0.0627, + "step": 72010 + }, + { + "epoch": 1.81, + "learning_rate": 0.00028588297364520265, + "loss": 0.0629, + "step": 72020 + }, + { + "epoch": 1.81, + "learning_rate": 0.00028550611762932445, + "loss": 0.0617, + "step": 72030 + }, + { + "epoch": 1.81, + "learning_rate": 0.0002851292616134462, + "loss": 0.0637, + "step": 72040 + }, + { + "epoch": 1.81, + "learning_rate": 0.000284752405597568, + "loss": 0.0618, + "step": 72050 + }, + { + "epoch": 1.81, + "learning_rate": 0.0002843755495816898, + "loss": 0.0641, + "step": 72060 + }, + { + "epoch": 1.81, + "learning_rate": 0.00028399869356581165, + "loss": 0.0624, + "step": 72070 + }, + { + "epoch": 1.81, + "learning_rate": 0.00028362183754993345, + "loss": 0.0617, + "step": 72080 + }, + { + "epoch": 1.81, + "learning_rate": 0.00028324498153405525, + "loss": 0.0627, + "step": 72090 + }, + { + "epoch": 1.81, + "learning_rate": 0.00028286812551817705, + "loss": 0.0636, + "step": 72100 + }, + { + "epoch": 1.81, + "learning_rate": 0.00028249126950229884, + "loss": 0.0631, + "step": 72110 + }, + { + "epoch": 1.81, + "learning_rate": 0.00028211441348642064, + "loss": 0.0613, + "step": 72120 + }, + { + "epoch": 1.81, + "learning_rate": 0.00028173755747054244, + "loss": 0.0608, + "step": 72130 + }, + { + "epoch": 1.81, + "learning_rate": 0.00028136070145466424, + "loss": 0.063, + "step": 72140 + }, + { + "epoch": 1.81, + "learning_rate": 0.000280983845438786, + "loss": 0.0623, + "step": 72150 + }, + { + "epoch": 1.81, + "learning_rate": 0.00028060698942290784, + "loss": 0.0613, + "step": 72160 + }, + { + "epoch": 1.81, + "learning_rate": 0.00028023013340702964, + "loss": 0.0598, + "step": 72170 + }, + { + "epoch": 1.81, + "learning_rate": 0.00027985327739115144, + "loss": 0.0657, + "step": 72180 + }, + { + "epoch": 1.81, + "learning_rate": 0.00027947642137527323, + "loss": 0.061, + "step": 72190 + }, + { + "epoch": 1.81, + "learning_rate": 0.00027909956535939503, + "loss": 0.0615, + "step": 72200 + }, + { + "epoch": 1.81, + "learning_rate": 0.00027872270934351683, + "loss": 0.0625, + "step": 72210 + }, + { + "epoch": 1.81, + "learning_rate": 0.00027834585332763863, + "loss": 0.0626, + "step": 72220 + }, + { + "epoch": 1.81, + "learning_rate": 0.00027796899731176043, + "loss": 0.0669, + "step": 72230 + }, + { + "epoch": 1.81, + "learning_rate": 0.00027759214129588223, + "loss": 0.0622, + "step": 72240 + }, + { + "epoch": 1.82, + "learning_rate": 0.00027721528528000403, + "loss": 0.0625, + "step": 72250 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002768384292641258, + "loss": 0.0602, + "step": 72260 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002764615732482476, + "loss": 0.0642, + "step": 72270 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002760847172323694, + "loss": 0.0632, + "step": 72280 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002757078612164912, + "loss": 0.0598, + "step": 72290 + }, + { + "epoch": 1.82, + "learning_rate": 0.000275331005200613, + "loss": 0.0613, + "step": 72300 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002749541491847348, + "loss": 0.0633, + "step": 72310 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002745772931688566, + "loss": 0.0616, + "step": 72320 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002742004371529784, + "loss": 0.061, + "step": 72330 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002738235811371002, + "loss": 0.0608, + "step": 72340 + }, + { + "epoch": 1.82, + "learning_rate": 0.000273446725121222, + "loss": 0.0611, + "step": 72350 + }, + { + "epoch": 1.82, + "learning_rate": 0.00027306986910534387, + "loss": 0.0646, + "step": 72360 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002726930130894656, + "loss": 0.0621, + "step": 72370 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002723161570735874, + "loss": 0.0633, + "step": 72380 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002719393010577092, + "loss": 0.0626, + "step": 72390 + }, + { + "epoch": 1.82, + "learning_rate": 0.000271562445041831, + "loss": 0.0641, + "step": 72400 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002711855890259528, + "loss": 0.0633, + "step": 72410 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002708087330100746, + "loss": 0.062, + "step": 72420 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002704318769941964, + "loss": 0.0646, + "step": 72430 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002700550209783182, + "loss": 0.0604, + "step": 72440 + }, + { + "epoch": 1.82, + "learning_rate": 0.00026967816496244006, + "loss": 0.0631, + "step": 72450 + }, + { + "epoch": 1.82, + "learning_rate": 0.00026930130894656186, + "loss": 0.0602, + "step": 72460 + }, + { + "epoch": 1.82, + "learning_rate": 0.00026892445293068366, + "loss": 0.062, + "step": 72470 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002685475969148054, + "loss": 0.0606, + "step": 72480 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002681707408989272, + "loss": 0.0629, + "step": 72490 + }, + { + "epoch": 1.82, + "learning_rate": 0.000267793884883049, + "loss": 0.0625, + "step": 72500 + }, + { + "epoch": 1.82, + "eval_cer": 0.6651657092589197, + "eval_loss": 0.05356631428003311, + "eval_runtime": 90.9229, + "eval_samples_per_second": 109.972, + "eval_steps_per_second": 6.874, + "step": 72500 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002674170288671708, + "loss": 0.064, + "step": 72510 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002670401728512926, + "loss": 0.0625, + "step": 72520 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002666633168354144, + "loss": 0.0609, + "step": 72530 + }, + { + "epoch": 1.82, + "learning_rate": 0.00026628646081953625, + "loss": 0.0611, + "step": 72540 + }, + { + "epoch": 1.82, + "learning_rate": 0.00026590960480365805, + "loss": 0.0642, + "step": 72550 + }, + { + "epoch": 1.82, + "learning_rate": 0.00026553274878777985, + "loss": 0.0605, + "step": 72560 + }, + { + "epoch": 1.82, + "learning_rate": 0.00026515589277190164, + "loss": 0.0596, + "step": 72570 + }, + { + "epoch": 1.82, + "learning_rate": 0.00026477903675602344, + "loss": 0.0594, + "step": 72580 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002644021807401452, + "loss": 0.0612, + "step": 72590 + }, + { + "epoch": 1.82, + "learning_rate": 0.000264025324724267, + "loss": 0.06, + "step": 72600 + }, + { + "epoch": 1.82, + "learning_rate": 0.0002636484687083888, + "loss": 0.0629, + "step": 72610 + }, + { + "epoch": 1.82, + "learning_rate": 0.00026327161269251064, + "loss": 0.062, + "step": 72620 + }, + { + "epoch": 1.82, + "learning_rate": 0.00026289475667663244, + "loss": 0.0625, + "step": 72630 + }, + { + "epoch": 1.82, + "learning_rate": 0.00026251790066075424, + "loss": 0.061, + "step": 72640 + }, + { + "epoch": 1.83, + "learning_rate": 0.00026214104464487604, + "loss": 0.0599, + "step": 72650 + }, + { + "epoch": 1.83, + "learning_rate": 0.00026176418862899783, + "loss": 0.0616, + "step": 72660 + }, + { + "epoch": 1.83, + "learning_rate": 0.00026138733261311963, + "loss": 0.0633, + "step": 72670 + }, + { + "epoch": 1.83, + "learning_rate": 0.00026101047659724143, + "loss": 0.0604, + "step": 72680 + }, + { + "epoch": 1.83, + "learning_rate": 0.00026063362058136323, + "loss": 0.0581, + "step": 72690 + }, + { + "epoch": 1.83, + "learning_rate": 0.000260256764565485, + "loss": 0.0636, + "step": 72700 + }, + { + "epoch": 1.83, + "learning_rate": 0.00025987990854960683, + "loss": 0.0613, + "step": 72710 + }, + { + "epoch": 1.83, + "learning_rate": 0.00025950305253372863, + "loss": 0.065, + "step": 72720 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002591261965178504, + "loss": 0.0623, + "step": 72730 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002587493405019722, + "loss": 0.0636, + "step": 72740 + }, + { + "epoch": 1.83, + "learning_rate": 0.000258372484486094, + "loss": 0.0666, + "step": 72750 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002579956284702158, + "loss": 0.0629, + "step": 72760 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002576187724543376, + "loss": 0.0617, + "step": 72770 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002572419164384594, + "loss": 0.0617, + "step": 72780 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002568650604225812, + "loss": 0.0678, + "step": 72790 + }, + { + "epoch": 1.83, + "learning_rate": 0.000256488204406703, + "loss": 0.0653, + "step": 72800 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002561113483908248, + "loss": 0.063, + "step": 72810 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002557344923749466, + "loss": 0.0597, + "step": 72820 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002553576363590684, + "loss": 0.0646, + "step": 72830 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002549807803431902, + "loss": 0.0633, + "step": 72840 + }, + { + "epoch": 1.83, + "learning_rate": 0.000254603924327312, + "loss": 0.0611, + "step": 72850 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002542270683114338, + "loss": 0.058, + "step": 72860 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002538502122955556, + "loss": 0.0618, + "step": 72870 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002534733562796774, + "loss": 0.0654, + "step": 72880 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002530965002637992, + "loss": 0.0609, + "step": 72890 + }, + { + "epoch": 1.83, + "learning_rate": 0.000252719644247921, + "loss": 0.0614, + "step": 72900 + }, + { + "epoch": 1.83, + "learning_rate": 0.00025234278823204286, + "loss": 0.0612, + "step": 72910 + }, + { + "epoch": 1.83, + "learning_rate": 0.00025196593221616466, + "loss": 0.0605, + "step": 72920 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002515890762002864, + "loss": 0.0595, + "step": 72930 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002512122201844082, + "loss": 0.0611, + "step": 72940 + }, + { + "epoch": 1.83, + "learning_rate": 0.00025083536416853, + "loss": 0.0629, + "step": 72950 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002504585081526518, + "loss": 0.063, + "step": 72960 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002500816521367736, + "loss": 0.0602, + "step": 72970 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002497047961208954, + "loss": 0.0601, + "step": 72980 + }, + { + "epoch": 1.83, + "learning_rate": 0.0002493279401050172, + "loss": 0.0614, + "step": 72990 + }, + { + "epoch": 1.83, + "learning_rate": 0.00024895108408913905, + "loss": 0.0631, + "step": 73000 + }, + { + "epoch": 1.83, + "eval_cer": 0.6650651321193817, + "eval_loss": 0.053635094314813614, + "eval_runtime": 90.7023, + "eval_samples_per_second": 110.24, + "eval_steps_per_second": 6.891, + "step": 73000 + }, + { + "epoch": 1.83, + "learning_rate": 0.00024857422807326085, + "loss": 0.0621, + "step": 73010 + }, + { + "epoch": 1.83, + "learning_rate": 0.00024819737205738265, + "loss": 0.0643, + "step": 73020 + }, + { + "epoch": 1.83, + "learning_rate": 0.00024782051604150445, + "loss": 0.0621, + "step": 73030 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002474436600256262, + "loss": 0.0642, + "step": 73040 + }, + { + "epoch": 1.84, + "learning_rate": 0.000247066804009748, + "loss": 0.0633, + "step": 73050 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002466899479938698, + "loss": 0.0609, + "step": 73060 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002463130919779916, + "loss": 0.0606, + "step": 73070 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002459362359621134, + "loss": 0.0594, + "step": 73080 + }, + { + "epoch": 1.84, + "learning_rate": 0.00024555937994623524, + "loss": 0.059, + "step": 73090 + }, + { + "epoch": 1.84, + "learning_rate": 0.00024518252393035704, + "loss": 0.0631, + "step": 73100 + }, + { + "epoch": 1.84, + "learning_rate": 0.00024480566791447884, + "loss": 0.0625, + "step": 73110 + }, + { + "epoch": 1.84, + "learning_rate": 0.00024442881189860064, + "loss": 0.064, + "step": 73120 + }, + { + "epoch": 1.84, + "learning_rate": 0.00024405195588272243, + "loss": 0.0611, + "step": 73130 + }, + { + "epoch": 1.84, + "learning_rate": 0.00024367509986684423, + "loss": 0.0629, + "step": 73140 + }, + { + "epoch": 1.84, + "learning_rate": 0.000243298243850966, + "loss": 0.0627, + "step": 73150 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002429213878350878, + "loss": 0.0621, + "step": 73160 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002425445318192096, + "loss": 0.0617, + "step": 73170 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002421676758033314, + "loss": 0.0608, + "step": 73180 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002417908197874532, + "loss": 0.0624, + "step": 73190 + }, + { + "epoch": 1.84, + "learning_rate": 0.00024141396377157503, + "loss": 0.0643, + "step": 73200 + }, + { + "epoch": 1.84, + "learning_rate": 0.00024103710775569682, + "loss": 0.0623, + "step": 73210 + }, + { + "epoch": 1.84, + "learning_rate": 0.00024066025173981862, + "loss": 0.0618, + "step": 73220 + }, + { + "epoch": 1.84, + "learning_rate": 0.00024028339572394042, + "loss": 0.0609, + "step": 73230 + }, + { + "epoch": 1.84, + "learning_rate": 0.00023990653970806222, + "loss": 0.0597, + "step": 73240 + }, + { + "epoch": 1.84, + "learning_rate": 0.00023952968369218402, + "loss": 0.065, + "step": 73250 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002391528276763058, + "loss": 0.0639, + "step": 73260 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002387759716604276, + "loss": 0.0597, + "step": 73270 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002383991156445494, + "loss": 0.0617, + "step": 73280 + }, + { + "epoch": 1.84, + "learning_rate": 0.00023802225962867122, + "loss": 0.0646, + "step": 73290 + }, + { + "epoch": 1.84, + "learning_rate": 0.00023764540361279301, + "loss": 0.0568, + "step": 73300 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002372685475969148, + "loss": 0.06, + "step": 73310 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002368916915810366, + "loss": 0.0624, + "step": 73320 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002365148355651584, + "loss": 0.0653, + "step": 73330 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002361379795492802, + "loss": 0.0644, + "step": 73340 + }, + { + "epoch": 1.84, + "learning_rate": 0.00023576112353340204, + "loss": 0.0611, + "step": 73350 + }, + { + "epoch": 1.84, + "learning_rate": 0.00023538426751752383, + "loss": 0.0641, + "step": 73360 + }, + { + "epoch": 1.84, + "learning_rate": 0.00023500741150164558, + "loss": 0.0611, + "step": 73370 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002346305554857674, + "loss": 0.0613, + "step": 73380 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002342536994698892, + "loss": 0.0643, + "step": 73390 + }, + { + "epoch": 1.84, + "learning_rate": 0.000233876843454011, + "loss": 0.0631, + "step": 73400 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002334999874381328, + "loss": 0.0676, + "step": 73410 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002331231314222546, + "loss": 0.0632, + "step": 73420 + }, + { + "epoch": 1.84, + "learning_rate": 0.0002327462754063764, + "loss": 0.0612, + "step": 73430 + }, + { + "epoch": 1.85, + "learning_rate": 0.00023236941939049822, + "loss": 0.0634, + "step": 73440 + }, + { + "epoch": 1.85, + "learning_rate": 0.00023199256337462002, + "loss": 0.0617, + "step": 73450 + }, + { + "epoch": 1.85, + "learning_rate": 0.00023161570735874182, + "loss": 0.0628, + "step": 73460 + }, + { + "epoch": 1.85, + "learning_rate": 0.00023123885134286362, + "loss": 0.0638, + "step": 73470 + }, + { + "epoch": 1.85, + "learning_rate": 0.0002308619953269854, + "loss": 0.0617, + "step": 73480 + }, + { + "epoch": 1.85, + "learning_rate": 0.0002304851393111072, + "loss": 0.0626, + "step": 73490 + }, + { + "epoch": 1.85, + "learning_rate": 0.000230108283295229, + "loss": 0.0614, + "step": 73500 + }, + { + "epoch": 1.85, + "eval_cer": 0.6650766816473669, + "eval_loss": 0.05350416526198387, + "eval_runtime": 90.6695, + "eval_samples_per_second": 110.28, + "eval_steps_per_second": 6.893, + "step": 73500 + }, + { + "epoch": 1.85, + "learning_rate": 0.0002297314272793508, + "loss": 0.0602, + "step": 73510 + }, + { + "epoch": 1.85, + "learning_rate": 0.00022935457126347262, + "loss": 0.0594, + "step": 73520 + }, + { + "epoch": 1.85, + "learning_rate": 0.00022897771524759441, + "loss": 0.0626, + "step": 73530 + }, + { + "epoch": 1.85, + "learning_rate": 0.0002286008592317162, + "loss": 0.0614, + "step": 73540 + }, + { + "epoch": 1.85, + "learning_rate": 0.000228224003215838, + "loss": 0.0646, + "step": 73550 + }, + { + "epoch": 1.85, + "learning_rate": 0.0002278471471999598, + "loss": 0.0639, + "step": 73560 + }, + { + "epoch": 1.85, + "learning_rate": 0.0002274702911840816, + "loss": 0.0618, + "step": 73570 + }, + { + "epoch": 1.85, + "learning_rate": 0.00022709343516820344, + "loss": 0.0637, + "step": 73580 + }, + { + "epoch": 1.85, + "learning_rate": 0.00022671657915232518, + "loss": 0.0614, + "step": 73590 + }, + { + "epoch": 1.85, + "learning_rate": 0.00022633972313644698, + "loss": 0.0609, + "step": 73600 + }, + { + "epoch": 1.85, + "learning_rate": 0.0002259628671205688, + "loss": 0.0601, + "step": 73610 + }, + { + "epoch": 1.85, + "learning_rate": 0.0002255860111046906, + "loss": 0.0569, + "step": 73620 + }, + { + "epoch": 1.85, + "learning_rate": 0.0002252091550888124, + "loss": 0.0641, + "step": 73630 + }, + { + "epoch": 1.85, + "learning_rate": 0.0002248322990729342, + "loss": 0.0613, + "step": 73640 + }, + { + "epoch": 1.85, + "learning_rate": 0.000224455443057056, + "loss": 0.0633, + "step": 73650 + }, + { + "epoch": 1.85, + "learning_rate": 0.0002240785870411778, + "loss": 0.0618, + "step": 73660 + }, + { + "epoch": 1.85, + "learning_rate": 0.00022370173102529963, + "loss": 0.0619, + "step": 73670 + }, + { + "epoch": 1.85, + "learning_rate": 0.00022332487500942142, + "loss": 0.0642, + "step": 73680 + }, + { + "epoch": 1.85, + "learning_rate": 0.00022294801899354322, + "loss": 0.0618, + "step": 73690 + }, + { + "epoch": 1.85, + "learning_rate": 0.000222571162977665, + "loss": 0.0605, + "step": 73700 + }, + { + "epoch": 1.85, + "learning_rate": 0.0002221943069617868, + "loss": 0.0658, + "step": 73710 + }, + { + "epoch": 1.85, + "learning_rate": 0.0002218174509459086, + "loss": 0.0605, + "step": 73720 + }, + { + "epoch": 1.85, + "learning_rate": 0.0002214405949300304, + "loss": 0.0638, + "step": 73730 + }, + { + "epoch": 1.85, + "learning_rate": 0.0002210637389141522, + "loss": 0.062, + "step": 73740 + }, + { + "epoch": 1.85, + "learning_rate": 0.000220686882898274, + "loss": 0.0607, + "step": 73750 + }, + { + "epoch": 1.85, + "learning_rate": 0.00022031002688239581, + "loss": 0.0656, + "step": 73760 + }, + { + "epoch": 1.85, + "learning_rate": 0.00021993317086651761, + "loss": 0.06, + "step": 73770 + }, + { + "epoch": 1.85, + "learning_rate": 0.0002195563148506394, + "loss": 0.0642, + "step": 73780 + }, + { + "epoch": 1.85, + "learning_rate": 0.0002191794588347612, + "loss": 0.0611, + "step": 73790 + }, + { + "epoch": 1.85, + "learning_rate": 0.000218802602818883, + "loss": 0.062, + "step": 73800 + }, + { + "epoch": 1.85, + "learning_rate": 0.00021842574680300484, + "loss": 0.0585, + "step": 73810 + }, + { + "epoch": 1.85, + "learning_rate": 0.00021804889078712658, + "loss": 0.0629, + "step": 73820 + }, + { + "epoch": 1.85, + "learning_rate": 0.00021767203477124838, + "loss": 0.0611, + "step": 73830 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002172951787553702, + "loss": 0.0585, + "step": 73840 + }, + { + "epoch": 1.86, + "learning_rate": 0.000216918322739492, + "loss": 0.0621, + "step": 73850 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002165414667236138, + "loss": 0.0632, + "step": 73860 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002161646107077356, + "loss": 0.0565, + "step": 73870 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002157877546918574, + "loss": 0.062, + "step": 73880 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002154108986759792, + "loss": 0.0601, + "step": 73890 + }, + { + "epoch": 1.86, + "learning_rate": 0.00021503404266010103, + "loss": 0.0619, + "step": 73900 + }, + { + "epoch": 1.86, + "learning_rate": 0.00021465718664422282, + "loss": 0.0621, + "step": 73910 + }, + { + "epoch": 1.86, + "learning_rate": 0.00021428033062834462, + "loss": 0.063, + "step": 73920 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002139034746124664, + "loss": 0.0603, + "step": 73930 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002135266185965882, + "loss": 0.0611, + "step": 73940 + }, + { + "epoch": 1.86, + "learning_rate": 0.00021314976258071, + "loss": 0.0607, + "step": 73950 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002127729065648318, + "loss": 0.0608, + "step": 73960 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002123960505489536, + "loss": 0.0646, + "step": 73970 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002120191945330754, + "loss": 0.0626, + "step": 73980 + }, + { + "epoch": 1.86, + "learning_rate": 0.00021164233851719722, + "loss": 0.0613, + "step": 73990 + }, + { + "epoch": 1.86, + "learning_rate": 0.00021126548250131901, + "loss": 0.0637, + "step": 74000 + }, + { + "epoch": 1.86, + "eval_cer": 0.6652446310334854, + "eval_loss": 0.05332941189408302, + "eval_runtime": 90.5983, + "eval_samples_per_second": 110.366, + "eval_steps_per_second": 6.899, + "step": 74000 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002108886264854408, + "loss": 0.0586, + "step": 74010 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002105117704695626, + "loss": 0.0622, + "step": 74020 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002101349144536844, + "loss": 0.0609, + "step": 74030 + }, + { + "epoch": 1.86, + "learning_rate": 0.00020975805843780618, + "loss": 0.0626, + "step": 74040 + }, + { + "epoch": 1.86, + "learning_rate": 0.00020938120242192798, + "loss": 0.0623, + "step": 74050 + }, + { + "epoch": 1.86, + "learning_rate": 0.00020900434640604978, + "loss": 0.0624, + "step": 74060 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002086274903901716, + "loss": 0.0633, + "step": 74070 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002082506343742934, + "loss": 0.0606, + "step": 74080 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002078737783584152, + "loss": 0.0606, + "step": 74090 + }, + { + "epoch": 1.86, + "learning_rate": 0.000207496922342537, + "loss": 0.0625, + "step": 74100 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002071200663266588, + "loss": 0.0605, + "step": 74110 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002067432103107806, + "loss": 0.0646, + "step": 74120 + }, + { + "epoch": 1.86, + "learning_rate": 0.00020636635429490243, + "loss": 0.0629, + "step": 74130 + }, + { + "epoch": 1.86, + "learning_rate": 0.00020598949827902422, + "loss": 0.0647, + "step": 74140 + }, + { + "epoch": 1.86, + "learning_rate": 0.00020561264226314597, + "loss": 0.0641, + "step": 74150 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002052357862472678, + "loss": 0.061, + "step": 74160 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002048589302313896, + "loss": 0.0626, + "step": 74170 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002044820742155114, + "loss": 0.061, + "step": 74180 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002041052181996332, + "loss": 0.0581, + "step": 74190 + }, + { + "epoch": 1.86, + "learning_rate": 0.000203728362183755, + "loss": 0.0625, + "step": 74200 + }, + { + "epoch": 1.86, + "learning_rate": 0.0002033515061678768, + "loss": 0.0598, + "step": 74210 + }, + { + "epoch": 1.86, + "learning_rate": 0.00020297465015199862, + "loss": 0.0641, + "step": 74220 + }, + { + "epoch": 1.86, + "learning_rate": 0.00020259779413612041, + "loss": 0.0615, + "step": 74230 + }, + { + "epoch": 1.87, + "learning_rate": 0.0002022209381202422, + "loss": 0.0638, + "step": 74240 + }, + { + "epoch": 1.87, + "learning_rate": 0.000201844082104364, + "loss": 0.0621, + "step": 74250 + }, + { + "epoch": 1.87, + "learning_rate": 0.00020146722608848578, + "loss": 0.0626, + "step": 74260 + }, + { + "epoch": 1.87, + "learning_rate": 0.00020109037007260758, + "loss": 0.0625, + "step": 74270 + }, + { + "epoch": 1.87, + "learning_rate": 0.00020071351405672938, + "loss": 0.0633, + "step": 74280 + }, + { + "epoch": 1.87, + "learning_rate": 0.00020033665804085118, + "loss": 0.062, + "step": 74290 + }, + { + "epoch": 1.87, + "learning_rate": 0.00019995980202497298, + "loss": 0.0593, + "step": 74300 + }, + { + "epoch": 1.87, + "learning_rate": 0.0001995829460090948, + "loss": 0.0612, + "step": 74310 + }, + { + "epoch": 1.87, + "learning_rate": 0.0001992060899932166, + "loss": 0.0609, + "step": 74320 + }, + { + "epoch": 1.87, + "learning_rate": 0.0001988292339773384, + "loss": 0.0638, + "step": 74330 + }, + { + "epoch": 1.87, + "learning_rate": 0.0001984523779614602, + "loss": 0.0621, + "step": 74340 + }, + { + "epoch": 1.87, + "learning_rate": 0.000198075521945582, + "loss": 0.0627, + "step": 74350 + }, + { + "epoch": 1.87, + "learning_rate": 0.00019769866592970383, + "loss": 0.0624, + "step": 74360 + }, + { + "epoch": 1.87, + "learning_rate": 0.00019732180991382557, + "loss": 0.0619, + "step": 74370 + }, + { + "epoch": 1.87, + "learning_rate": 0.00019694495389794737, + "loss": 0.0622, + "step": 74380 + }, + { + "epoch": 1.87, + "learning_rate": 0.0001965680978820692, + "loss": 0.0612, + "step": 74390 + }, + { + "epoch": 1.87, + "learning_rate": 0.000196191241866191, + "loss": 0.0639, + "step": 74400 + }, + { + "epoch": 1.87, + "learning_rate": 0.0001958143858503128, + "loss": 0.0642, + "step": 74410 + }, + { + "epoch": 1.87, + "learning_rate": 0.0001954375298344346, + "loss": 0.0624, + "step": 74420 + }, + { + "epoch": 1.87, + "learning_rate": 0.0001950606738185564, + "loss": 0.06, + "step": 74430 + }, + { + "epoch": 1.87, + "learning_rate": 0.0001946838178026782, + "loss": 0.0627, + "step": 74440 + }, + { + "epoch": 1.87, + "learning_rate": 0.00019430696178680002, + "loss": 0.0621, + "step": 74450 + }, + { + "epoch": 1.87, + "learning_rate": 0.00019393010577092181, + "loss": 0.0616, + "step": 74460 + }, + { + "epoch": 1.87, + "learning_rate": 0.0001935532497550436, + "loss": 0.0637, + "step": 74470 + }, + { + "epoch": 1.87, + "learning_rate": 0.00019317639373916539, + "loss": 0.0612, + "step": 74480 + }, + { + "epoch": 1.87, + "learning_rate": 0.00019279953772328718, + "loss": 0.0613, + "step": 74490 + }, + { + "epoch": 1.87, + "learning_rate": 0.00019242268170740898, + "loss": 0.0619, + "step": 74500 + }, + { + "epoch": 1.87, + "eval_cer": 0.6651796649385685, + "eval_loss": 0.05317223444581032, + "eval_runtime": 90.7609, + "eval_samples_per_second": 110.169, + "eval_steps_per_second": 6.886, + "step": 74500 + }, + { + "epoch": 1.87, + "learning_rate": 0.00019204582569153078, + "loss": 0.0611, + "step": 74510 + }, + { + "epoch": 1.87, + "learning_rate": 0.00019166896967565258, + "loss": 0.0631, + "step": 74520 + }, + { + "epoch": 1.87, + "learning_rate": 0.00019129211365977438, + "loss": 0.0604, + "step": 74530 + }, + { + "epoch": 1.87, + "learning_rate": 0.0001909152576438962, + "loss": 0.0617, + "step": 74540 + }, + { + "epoch": 1.87, + "learning_rate": 0.000190538401628018, + "loss": 0.0622, + "step": 74550 + }, + { + "epoch": 1.87, + "learning_rate": 0.0001901615456121398, + "loss": 0.0611, + "step": 74560 + }, + { + "epoch": 1.87, + "learning_rate": 0.0001897846895962616, + "loss": 0.0623, + "step": 74570 + }, + { + "epoch": 1.87, + "learning_rate": 0.0001894078335803834, + "loss": 0.0642, + "step": 74580 + }, + { + "epoch": 1.87, + "learning_rate": 0.00018903097756450517, + "loss": 0.0606, + "step": 74590 + }, + { + "epoch": 1.87, + "learning_rate": 0.00018865412154862697, + "loss": 0.061, + "step": 74600 + }, + { + "epoch": 1.87, + "learning_rate": 0.00018827726553274877, + "loss": 0.0626, + "step": 74610 + }, + { + "epoch": 1.87, + "learning_rate": 0.00018790040951687057, + "loss": 0.0606, + "step": 74620 + }, + { + "epoch": 1.87, + "learning_rate": 0.0001875235535009924, + "loss": 0.063, + "step": 74630 + }, + { + "epoch": 1.88, + "learning_rate": 0.0001871466974851142, + "loss": 0.0589, + "step": 74640 + }, + { + "epoch": 1.88, + "learning_rate": 0.000186769841469236, + "loss": 0.0607, + "step": 74650 + }, + { + "epoch": 1.88, + "learning_rate": 0.0001863929854533578, + "loss": 0.0611, + "step": 74660 + }, + { + "epoch": 1.88, + "learning_rate": 0.0001860161294374796, + "loss": 0.0629, + "step": 74670 + }, + { + "epoch": 1.88, + "learning_rate": 0.0001856392734216014, + "loss": 0.0618, + "step": 74680 + }, + { + "epoch": 1.88, + "learning_rate": 0.0001852624174057232, + "loss": 0.058, + "step": 74690 + }, + { + "epoch": 1.88, + "learning_rate": 0.000184885561389845, + "loss": 0.0639, + "step": 74700 + }, + { + "epoch": 1.88, + "learning_rate": 0.00018450870537396679, + "loss": 0.0637, + "step": 74710 + }, + { + "epoch": 1.88, + "learning_rate": 0.00018413184935808858, + "loss": 0.0634, + "step": 74720 + }, + { + "epoch": 1.88, + "learning_rate": 0.00018375499334221038, + "loss": 0.0567, + "step": 74730 + }, + { + "epoch": 1.88, + "learning_rate": 0.00018337813732633218, + "loss": 0.0576, + "step": 74740 + }, + { + "epoch": 1.88, + "learning_rate": 0.00018300128131045398, + "loss": 0.0599, + "step": 74750 + }, + { + "epoch": 1.88, + "learning_rate": 0.00018262442529457578, + "loss": 0.0596, + "step": 74760 + }, + { + "epoch": 1.88, + "learning_rate": 0.0001822475692786976, + "loss": 0.0616, + "step": 74770 + }, + { + "epoch": 1.88, + "learning_rate": 0.0001818707132628194, + "loss": 0.0602, + "step": 74780 + }, + { + "epoch": 1.88, + "learning_rate": 0.00018149385724694118, + "loss": 0.0604, + "step": 74790 + }, + { + "epoch": 1.88, + "learning_rate": 0.00018111700123106298, + "loss": 0.0608, + "step": 74800 + }, + { + "epoch": 1.88, + "learning_rate": 0.0001807401452151848, + "loss": 0.0638, + "step": 74810 + }, + { + "epoch": 1.88, + "learning_rate": 0.0001803632891993066, + "loss": 0.0636, + "step": 74820 + }, + { + "epoch": 1.88, + "learning_rate": 0.0001799864331834284, + "loss": 0.0595, + "step": 74830 + }, + { + "epoch": 1.88, + "learning_rate": 0.00017960957716755017, + "loss": 0.0616, + "step": 74840 + }, + { + "epoch": 1.88, + "learning_rate": 0.00017923272115167197, + "loss": 0.0611, + "step": 74850 + }, + { + "epoch": 1.88, + "learning_rate": 0.0001788558651357938, + "loss": 0.0591, + "step": 74860 + }, + { + "epoch": 1.88, + "learning_rate": 0.0001784790091199156, + "loss": 0.0575, + "step": 74870 + }, + { + "epoch": 1.88, + "learning_rate": 0.0001781021531040374, + "loss": 0.0632, + "step": 74880 + }, + { + "epoch": 1.88, + "learning_rate": 0.0001777252970881592, + "loss": 0.062, + "step": 74890 + }, + { + "epoch": 1.88, + "learning_rate": 0.000177348441072281, + "loss": 0.0615, + "step": 74900 + }, + { + "epoch": 1.88, + "learning_rate": 0.0001769715850564028, + "loss": 0.0619, + "step": 74910 + }, + { + "epoch": 1.88, + "learning_rate": 0.0001765947290405246, + "loss": 0.0614, + "step": 74920 + }, + { + "epoch": 1.88, + "learning_rate": 0.0001762178730246464, + "loss": 0.0631, + "step": 74930 + }, + { + "epoch": 1.88, + "learning_rate": 0.00017584101700876819, + "loss": 0.0608, + "step": 74940 + }, + { + "epoch": 1.88, + "learning_rate": 0.00017546416099288998, + "loss": 0.0625, + "step": 74950 + }, + { + "epoch": 1.88, + "learning_rate": 0.00017508730497701178, + "loss": 0.063, + "step": 74960 + }, + { + "epoch": 1.88, + "learning_rate": 0.00017471044896113358, + "loss": 0.059, + "step": 74970 + }, + { + "epoch": 1.88, + "learning_rate": 0.00017433359294525538, + "loss": 0.0625, + "step": 74980 + }, + { + "epoch": 1.88, + "learning_rate": 0.00017395673692937718, + "loss": 0.063, + "step": 74990 + }, + { + "epoch": 1.88, + "learning_rate": 0.000173579880913499, + "loss": 0.061, + "step": 75000 + }, + { + "epoch": 1.88, + "eval_cer": 0.6652123886011934, + "eval_loss": 0.053149040788412094, + "eval_runtime": 90.705, + "eval_samples_per_second": 110.236, + "eval_steps_per_second": 6.89, + "step": 75000 + }, + { + "epoch": 1.88, + "learning_rate": 0.00017320302489762078, + "loss": 0.0612, + "step": 75010 + }, + { + "epoch": 1.88, + "learning_rate": 0.00017282616888174258, + "loss": 0.0604, + "step": 75020 + }, + { + "epoch": 1.89, + "learning_rate": 0.00017244931286586438, + "loss": 0.0622, + "step": 75030 + }, + { + "epoch": 1.89, + "learning_rate": 0.0001720724568499862, + "loss": 0.0589, + "step": 75040 + }, + { + "epoch": 1.89, + "learning_rate": 0.000171695600834108, + "loss": 0.0621, + "step": 75050 + }, + { + "epoch": 1.89, + "learning_rate": 0.0001713187448182298, + "loss": 0.0597, + "step": 75060 + }, + { + "epoch": 1.89, + "learning_rate": 0.00017094188880235157, + "loss": 0.0618, + "step": 75070 + }, + { + "epoch": 1.89, + "learning_rate": 0.00017056503278647337, + "loss": 0.0644, + "step": 75080 + }, + { + "epoch": 1.89, + "learning_rate": 0.0001701881767705952, + "loss": 0.0632, + "step": 75090 + }, + { + "epoch": 1.89, + "learning_rate": 0.000169811320754717, + "loss": 0.0613, + "step": 75100 + }, + { + "epoch": 1.89, + "learning_rate": 0.0001694344647388388, + "loss": 0.0642, + "step": 75110 + }, + { + "epoch": 1.89, + "learning_rate": 0.00016905760872296056, + "loss": 0.0618, + "step": 75120 + }, + { + "epoch": 1.89, + "learning_rate": 0.0001686807527070824, + "loss": 0.0571, + "step": 75130 + }, + { + "epoch": 1.89, + "learning_rate": 0.0001683038966912042, + "loss": 0.0607, + "step": 75140 + }, + { + "epoch": 1.89, + "learning_rate": 0.000167927040675326, + "loss": 0.0586, + "step": 75150 + }, + { + "epoch": 1.89, + "learning_rate": 0.0001675501846594478, + "loss": 0.0608, + "step": 75160 + }, + { + "epoch": 1.89, + "learning_rate": 0.00016717332864356959, + "loss": 0.0623, + "step": 75170 + }, + { + "epoch": 1.89, + "learning_rate": 0.00016679647262769139, + "loss": 0.0565, + "step": 75180 + }, + { + "epoch": 1.89, + "learning_rate": 0.00016641961661181318, + "loss": 0.0645, + "step": 75190 + }, + { + "epoch": 1.89, + "learning_rate": 0.00016604276059593498, + "loss": 0.0638, + "step": 75200 + }, + { + "epoch": 1.89, + "learning_rate": 0.00016566590458005678, + "loss": 0.0612, + "step": 75210 + }, + { + "epoch": 1.89, + "learning_rate": 0.00016528904856417858, + "loss": 0.0626, + "step": 75220 + }, + { + "epoch": 1.89, + "learning_rate": 0.00016491219254830038, + "loss": 0.0621, + "step": 75230 + }, + { + "epoch": 1.89, + "learning_rate": 0.00016453533653242218, + "loss": 0.0595, + "step": 75240 + }, + { + "epoch": 1.89, + "learning_rate": 0.00016415848051654398, + "loss": 0.0615, + "step": 75250 + }, + { + "epoch": 1.89, + "learning_rate": 0.00016378162450066578, + "loss": 0.0623, + "step": 75260 + }, + { + "epoch": 1.89, + "learning_rate": 0.00016340476848478757, + "loss": 0.0596, + "step": 75270 + }, + { + "epoch": 1.89, + "learning_rate": 0.0001630279124689094, + "loss": 0.0609, + "step": 75280 + }, + { + "epoch": 1.89, + "learning_rate": 0.00016265105645303117, + "loss": 0.06, + "step": 75290 + }, + { + "epoch": 1.89, + "learning_rate": 0.00016227420043715297, + "loss": 0.0614, + "step": 75300 + }, + { + "epoch": 1.89, + "learning_rate": 0.00016189734442127477, + "loss": 0.0612, + "step": 75310 + }, + { + "epoch": 1.89, + "learning_rate": 0.0001615204884053966, + "loss": 0.0614, + "step": 75320 + }, + { + "epoch": 1.89, + "learning_rate": 0.0001611436323895184, + "loss": 0.0606, + "step": 75330 + }, + { + "epoch": 1.89, + "learning_rate": 0.00016076677637364017, + "loss": 0.0606, + "step": 75340 + }, + { + "epoch": 1.89, + "learning_rate": 0.00016038992035776197, + "loss": 0.0597, + "step": 75350 + }, + { + "epoch": 1.89, + "learning_rate": 0.0001600130643418838, + "loss": 0.0607, + "step": 75360 + }, + { + "epoch": 1.89, + "learning_rate": 0.0001596362083260056, + "loss": 0.0606, + "step": 75370 + }, + { + "epoch": 1.89, + "learning_rate": 0.0001592593523101274, + "loss": 0.0601, + "step": 75380 + }, + { + "epoch": 1.89, + "learning_rate": 0.0001588824962942492, + "loss": 0.0634, + "step": 75390 + }, + { + "epoch": 1.89, + "learning_rate": 0.00015850564027837096, + "loss": 0.0597, + "step": 75400 + }, + { + "epoch": 1.89, + "learning_rate": 0.00015812878426249279, + "loss": 0.0604, + "step": 75410 + }, + { + "epoch": 1.89, + "learning_rate": 0.00015775192824661458, + "loss": 0.0585, + "step": 75420 + }, + { + "epoch": 1.9, + "learning_rate": 0.00015737507223073638, + "loss": 0.0598, + "step": 75430 + }, + { + "epoch": 1.9, + "learning_rate": 0.00015699821621485818, + "loss": 0.0601, + "step": 75440 + }, + { + "epoch": 1.9, + "learning_rate": 0.00015662136019897998, + "loss": 0.0603, + "step": 75450 + }, + { + "epoch": 1.9, + "learning_rate": 0.00015624450418310178, + "loss": 0.0614, + "step": 75460 + }, + { + "epoch": 1.9, + "learning_rate": 0.00015586764816722358, + "loss": 0.0635, + "step": 75470 + }, + { + "epoch": 1.9, + "learning_rate": 0.00015549079215134538, + "loss": 0.0631, + "step": 75480 + }, + { + "epoch": 1.9, + "learning_rate": 0.00015511393613546718, + "loss": 0.062, + "step": 75490 + }, + { + "epoch": 1.9, + "learning_rate": 0.00015473708011958897, + "loss": 0.0598, + "step": 75500 + }, + { + "epoch": 1.9, + "eval_cer": 0.6651926581575519, + "eval_loss": 0.05298503488302231, + "eval_runtime": 91.1794, + "eval_samples_per_second": 109.663, + "eval_steps_per_second": 6.855, + "step": 75500 + }, + { + "epoch": 1.9, + "learning_rate": 0.00015436022410371077, + "loss": 0.0576, + "step": 75510 + }, + { + "epoch": 1.9, + "learning_rate": 0.00015398336808783257, + "loss": 0.062, + "step": 75520 + }, + { + "epoch": 1.9, + "learning_rate": 0.00015360651207195437, + "loss": 0.061, + "step": 75530 + }, + { + "epoch": 1.9, + "learning_rate": 0.00015322965605607617, + "loss": 0.0636, + "step": 75540 + }, + { + "epoch": 1.9, + "learning_rate": 0.000152852800040198, + "loss": 0.0624, + "step": 75550 + }, + { + "epoch": 1.9, + "learning_rate": 0.0001524759440243198, + "loss": 0.061, + "step": 75560 + }, + { + "epoch": 1.9, + "learning_rate": 0.00015209908800844157, + "loss": 0.0629, + "step": 75570 + }, + { + "epoch": 1.9, + "learning_rate": 0.00015172223199256337, + "loss": 0.0599, + "step": 75580 + }, + { + "epoch": 1.9, + "learning_rate": 0.00015134537597668516, + "loss": 0.0635, + "step": 75590 + }, + { + "epoch": 1.9, + "learning_rate": 0.000150968519960807, + "loss": 0.0559, + "step": 75600 + }, + { + "epoch": 1.9, + "learning_rate": 0.0001505916639449288, + "loss": 0.0611, + "step": 75610 + }, + { + "epoch": 1.9, + "learning_rate": 0.00015021480792905056, + "loss": 0.059, + "step": 75620 + }, + { + "epoch": 1.9, + "learning_rate": 0.00014983795191317236, + "loss": 0.0613, + "step": 75630 + }, + { + "epoch": 1.9, + "learning_rate": 0.00014946109589729419, + "loss": 0.0604, + "step": 75640 + }, + { + "epoch": 1.9, + "learning_rate": 0.00014908423988141598, + "loss": 0.0607, + "step": 75650 + }, + { + "epoch": 1.9, + "learning_rate": 0.00014870738386553778, + "loss": 0.0605, + "step": 75660 + }, + { + "epoch": 1.9, + "learning_rate": 0.00014833052784965958, + "loss": 0.0626, + "step": 75670 + }, + { + "epoch": 1.9, + "learning_rate": 0.00014795367183378138, + "loss": 0.0625, + "step": 75680 + }, + { + "epoch": 1.9, + "learning_rate": 0.00014757681581790318, + "loss": 0.0585, + "step": 75690 + }, + { + "epoch": 1.9, + "learning_rate": 0.00014719995980202498, + "loss": 0.0611, + "step": 75700 + }, + { + "epoch": 1.9, + "learning_rate": 0.00014682310378614678, + "loss": 0.0623, + "step": 75710 + }, + { + "epoch": 1.9, + "learning_rate": 0.00014644624777026858, + "loss": 0.0605, + "step": 75720 + }, + { + "epoch": 1.9, + "learning_rate": 0.00014606939175439038, + "loss": 0.0613, + "step": 75730 + }, + { + "epoch": 1.9, + "learning_rate": 0.00014569253573851217, + "loss": 0.0619, + "step": 75740 + }, + { + "epoch": 1.9, + "learning_rate": 0.00014531567972263397, + "loss": 0.0607, + "step": 75750 + }, + { + "epoch": 1.9, + "learning_rate": 0.00014493882370675577, + "loss": 0.06, + "step": 75760 + }, + { + "epoch": 1.9, + "learning_rate": 0.00014456196769087757, + "loss": 0.0591, + "step": 75770 + }, + { + "epoch": 1.9, + "learning_rate": 0.0001441851116749994, + "loss": 0.0616, + "step": 75780 + }, + { + "epoch": 1.9, + "learning_rate": 0.00014380825565912117, + "loss": 0.0623, + "step": 75790 + }, + { + "epoch": 1.9, + "learning_rate": 0.00014343139964324297, + "loss": 0.062, + "step": 75800 + }, + { + "epoch": 1.9, + "learning_rate": 0.00014305454362736477, + "loss": 0.0624, + "step": 75810 + }, + { + "epoch": 1.9, + "learning_rate": 0.00014267768761148656, + "loss": 0.0652, + "step": 75820 + }, + { + "epoch": 1.91, + "learning_rate": 0.0001423008315956084, + "loss": 0.0615, + "step": 75830 + }, + { + "epoch": 1.91, + "learning_rate": 0.0001419239755797302, + "loss": 0.0632, + "step": 75840 + }, + { + "epoch": 1.91, + "learning_rate": 0.00014154711956385196, + "loss": 0.0638, + "step": 75850 + }, + { + "epoch": 1.91, + "learning_rate": 0.00014117026354797376, + "loss": 0.0614, + "step": 75860 + }, + { + "epoch": 1.91, + "learning_rate": 0.00014079340753209559, + "loss": 0.061, + "step": 75870 + }, + { + "epoch": 1.91, + "learning_rate": 0.00014041655151621738, + "loss": 0.0582, + "step": 75880 + }, + { + "epoch": 1.91, + "learning_rate": 0.00014003969550033918, + "loss": 0.0615, + "step": 75890 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013966283948446096, + "loss": 0.0606, + "step": 75900 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013928598346858275, + "loss": 0.0621, + "step": 75910 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013890912745270458, + "loss": 0.0597, + "step": 75920 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013853227143682638, + "loss": 0.0597, + "step": 75930 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013815541542094818, + "loss": 0.0604, + "step": 75940 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013777855940506998, + "loss": 0.0604, + "step": 75950 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013740170338919178, + "loss": 0.0605, + "step": 75960 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013702484737331357, + "loss": 0.0639, + "step": 75970 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013664799135743537, + "loss": 0.0634, + "step": 75980 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013627113534155717, + "loss": 0.0606, + "step": 75990 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013589427932567897, + "loss": 0.0643, + "step": 76000 + }, + { + "epoch": 1.91, + "eval_cer": 0.6651921769272192, + "eval_loss": 0.05285988375544548, + "eval_runtime": 90.7457, + "eval_samples_per_second": 110.187, + "eval_steps_per_second": 6.887, + "step": 76000 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013551742330980077, + "loss": 0.0622, + "step": 76010 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013514056729392257, + "loss": 0.0618, + "step": 76020 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013476371127804437, + "loss": 0.0587, + "step": 76030 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013438685526216617, + "loss": 0.0587, + "step": 76040 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013400999924628797, + "loss": 0.0647, + "step": 76050 + }, + { + "epoch": 1.91, + "learning_rate": 0.0001336331432304098, + "loss": 0.0577, + "step": 76060 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013325628721453156, + "loss": 0.0638, + "step": 76070 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013287943119865336, + "loss": 0.0638, + "step": 76080 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013250257518277516, + "loss": 0.0592, + "step": 76090 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013212571916689699, + "loss": 0.0623, + "step": 76100 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013174886315101879, + "loss": 0.0623, + "step": 76110 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013137200713514056, + "loss": 0.0616, + "step": 76120 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013099515111926236, + "loss": 0.0626, + "step": 76130 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013061829510338415, + "loss": 0.0611, + "step": 76140 + }, + { + "epoch": 1.91, + "learning_rate": 0.00013024143908750598, + "loss": 0.061, + "step": 76150 + }, + { + "epoch": 1.91, + "learning_rate": 0.00012986458307162778, + "loss": 0.0583, + "step": 76160 + }, + { + "epoch": 1.91, + "learning_rate": 0.00012948772705574958, + "loss": 0.0622, + "step": 76170 + }, + { + "epoch": 1.91, + "learning_rate": 0.00012911087103987135, + "loss": 0.0591, + "step": 76180 + }, + { + "epoch": 1.91, + "learning_rate": 0.00012873401502399318, + "loss": 0.0635, + "step": 76190 + }, + { + "epoch": 1.91, + "learning_rate": 0.00012835715900811497, + "loss": 0.0619, + "step": 76200 + }, + { + "epoch": 1.91, + "learning_rate": 0.00012798030299223677, + "loss": 0.0604, + "step": 76210 + }, + { + "epoch": 1.91, + "learning_rate": 0.00012760344697635857, + "loss": 0.0595, + "step": 76220 + }, + { + "epoch": 1.92, + "learning_rate": 0.00012722659096048037, + "loss": 0.0601, + "step": 76230 + }, + { + "epoch": 1.92, + "learning_rate": 0.00012684973494460217, + "loss": 0.0608, + "step": 76240 + }, + { + "epoch": 1.92, + "learning_rate": 0.00012647287892872397, + "loss": 0.0608, + "step": 76250 + }, + { + "epoch": 1.92, + "learning_rate": 0.00012609602291284577, + "loss": 0.0606, + "step": 76260 + }, + { + "epoch": 1.92, + "learning_rate": 0.00012571916689696757, + "loss": 0.0589, + "step": 76270 + }, + { + "epoch": 1.92, + "learning_rate": 0.00012534231088108937, + "loss": 0.0594, + "step": 76280 + }, + { + "epoch": 1.92, + "learning_rate": 0.00012496545486521116, + "loss": 0.0609, + "step": 76290 + }, + { + "epoch": 1.92, + "learning_rate": 0.00012458859884933296, + "loss": 0.0627, + "step": 76300 + }, + { + "epoch": 1.92, + "learning_rate": 0.00012421174283345476, + "loss": 0.0629, + "step": 76310 + }, + { + "epoch": 1.92, + "learning_rate": 0.00012383488681757656, + "loss": 0.0601, + "step": 76320 + }, + { + "epoch": 1.92, + "learning_rate": 0.0001234580308016984, + "loss": 0.0604, + "step": 76330 + }, + { + "epoch": 1.92, + "learning_rate": 0.00012308117478582019, + "loss": 0.0608, + "step": 76340 + }, + { + "epoch": 1.92, + "learning_rate": 0.00012270431876994196, + "loss": 0.0641, + "step": 76350 + }, + { + "epoch": 1.92, + "learning_rate": 0.00012232746275406376, + "loss": 0.0595, + "step": 76360 + }, + { + "epoch": 1.92, + "learning_rate": 0.00012195060673818557, + "loss": 0.0623, + "step": 76370 + }, + { + "epoch": 1.92, + "learning_rate": 0.00012157375072230737, + "loss": 0.0612, + "step": 76380 + }, + { + "epoch": 1.92, + "learning_rate": 0.00012119689470642918, + "loss": 0.0595, + "step": 76390 + }, + { + "epoch": 1.92, + "learning_rate": 0.00012082003869055095, + "loss": 0.0604, + "step": 76400 + }, + { + "epoch": 1.92, + "learning_rate": 0.00012044318267467276, + "loss": 0.0606, + "step": 76410 + }, + { + "epoch": 1.92, + "learning_rate": 0.00012006632665879456, + "loss": 0.0601, + "step": 76420 + }, + { + "epoch": 1.92, + "learning_rate": 0.00011968947064291636, + "loss": 0.0615, + "step": 76430 + }, + { + "epoch": 1.92, + "learning_rate": 0.00011931261462703817, + "loss": 0.0646, + "step": 76440 + }, + { + "epoch": 1.92, + "learning_rate": 0.00011893575861115997, + "loss": 0.0611, + "step": 76450 + }, + { + "epoch": 1.92, + "learning_rate": 0.00011855890259528176, + "loss": 0.0622, + "step": 76460 + }, + { + "epoch": 1.92, + "learning_rate": 0.00011818204657940356, + "loss": 0.0598, + "step": 76470 + }, + { + "epoch": 1.92, + "learning_rate": 0.00011780519056352537, + "loss": 0.0623, + "step": 76480 + }, + { + "epoch": 1.92, + "learning_rate": 0.00011742833454764717, + "loss": 0.0632, + "step": 76490 + }, + { + "epoch": 1.92, + "learning_rate": 0.00011705147853176897, + "loss": 0.0609, + "step": 76500 + }, + { + "epoch": 1.92, + "eval_cer": 0.6651411665119511, + "eval_loss": 0.05271696671843529, + "eval_runtime": 90.4198, + "eval_samples_per_second": 110.584, + "eval_steps_per_second": 6.912, + "step": 76500 + }, + { + "epoch": 1.92, + "learning_rate": 0.00011667462251589075, + "loss": 0.0632, + "step": 76510 + }, + { + "epoch": 1.92, + "learning_rate": 0.00011629776650001256, + "loss": 0.0614, + "step": 76520 + }, + { + "epoch": 1.92, + "learning_rate": 0.00011592091048413436, + "loss": 0.064, + "step": 76530 + }, + { + "epoch": 1.92, + "learning_rate": 0.00011554405446825616, + "loss": 0.0609, + "step": 76540 + }, + { + "epoch": 1.92, + "learning_rate": 0.00011516719845237797, + "loss": 0.0604, + "step": 76550 + }, + { + "epoch": 1.92, + "learning_rate": 0.00011479034243649977, + "loss": 0.0609, + "step": 76560 + }, + { + "epoch": 1.92, + "learning_rate": 0.00011441348642062156, + "loss": 0.0631, + "step": 76570 + }, + { + "epoch": 1.92, + "learning_rate": 0.00011403663040474336, + "loss": 0.062, + "step": 76580 + }, + { + "epoch": 1.92, + "learning_rate": 0.00011365977438886516, + "loss": 0.0616, + "step": 76590 + }, + { + "epoch": 1.92, + "learning_rate": 0.00011328291837298697, + "loss": 0.059, + "step": 76600 + }, + { + "epoch": 1.92, + "learning_rate": 0.00011290606235710877, + "loss": 0.0602, + "step": 76610 + }, + { + "epoch": 1.92, + "learning_rate": 0.00011252920634123055, + "loss": 0.0621, + "step": 76620 + }, + { + "epoch": 1.93, + "learning_rate": 0.00011215235032535235, + "loss": 0.0595, + "step": 76630 + }, + { + "epoch": 1.93, + "learning_rate": 0.00011177549430947416, + "loss": 0.0604, + "step": 76640 + }, + { + "epoch": 1.93, + "learning_rate": 0.00011139863829359596, + "loss": 0.0627, + "step": 76650 + }, + { + "epoch": 1.93, + "learning_rate": 0.00011102178227771776, + "loss": 0.0638, + "step": 76660 + }, + { + "epoch": 1.93, + "learning_rate": 0.00011064492626183957, + "loss": 0.0595, + "step": 76670 + }, + { + "epoch": 1.93, + "learning_rate": 0.00011026807024596136, + "loss": 0.0613, + "step": 76680 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010989121423008316, + "loss": 0.0623, + "step": 76690 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010951435821420496, + "loss": 0.0575, + "step": 76700 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010913750219832677, + "loss": 0.06, + "step": 76710 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010876064618244857, + "loss": 0.0595, + "step": 76720 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010838379016657037, + "loss": 0.0584, + "step": 76730 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010800693415069215, + "loss": 0.0625, + "step": 76740 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010763007813481395, + "loss": 0.064, + "step": 76750 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010725322211893576, + "loss": 0.0598, + "step": 76760 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010687636610305756, + "loss": 0.0615, + "step": 76770 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010649951008717938, + "loss": 0.0612, + "step": 76780 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010612265407130115, + "loss": 0.0629, + "step": 76790 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010574579805542296, + "loss": 0.0595, + "step": 76800 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010536894203954476, + "loss": 0.06, + "step": 76810 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010499208602366656, + "loss": 0.061, + "step": 76820 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010461523000778837, + "loss": 0.0628, + "step": 76830 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010423837399191017, + "loss": 0.0576, + "step": 76840 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010386151797603195, + "loss": 0.0618, + "step": 76850 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010348466196015375, + "loss": 0.065, + "step": 76860 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010310780594427556, + "loss": 0.0574, + "step": 76870 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010273094992839736, + "loss": 0.0611, + "step": 76880 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010235409391251916, + "loss": 0.0585, + "step": 76890 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010197723789664095, + "loss": 0.0577, + "step": 76900 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010160038188076275, + "loss": 0.0619, + "step": 76910 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010122352586488456, + "loss": 0.0609, + "step": 76920 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010084666984900636, + "loss": 0.062, + "step": 76930 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010046981383312817, + "loss": 0.0603, + "step": 76940 + }, + { + "epoch": 1.93, + "learning_rate": 0.00010009295781724997, + "loss": 0.0619, + "step": 76950 + }, + { + "epoch": 1.93, + "learning_rate": 9.971610180137175e-05, + "loss": 0.0619, + "step": 76960 + }, + { + "epoch": 1.93, + "learning_rate": 9.933924578549355e-05, + "loss": 0.0612, + "step": 76970 + }, + { + "epoch": 1.93, + "learning_rate": 9.896238976961535e-05, + "loss": 0.0588, + "step": 76980 + }, + { + "epoch": 1.93, + "learning_rate": 9.858553375373716e-05, + "loss": 0.0613, + "step": 76990 + }, + { + "epoch": 1.93, + "learning_rate": 9.820867773785896e-05, + "loss": 0.06, + "step": 77000 + }, + { + "epoch": 1.93, + "eval_cer": 0.6651647467982543, + "eval_loss": 0.05269329249858856, + "eval_runtime": 90.4414, + "eval_samples_per_second": 110.558, + "eval_steps_per_second": 6.911, + "step": 77000 + }, + { + "epoch": 1.93, + "learning_rate": 9.783182172198075e-05, + "loss": 0.059, + "step": 77010 + }, + { + "epoch": 1.93, + "learning_rate": 9.745496570610255e-05, + "loss": 0.0612, + "step": 77020 + }, + { + "epoch": 1.94, + "learning_rate": 9.707810969022436e-05, + "loss": 0.0594, + "step": 77030 + }, + { + "epoch": 1.94, + "learning_rate": 9.670125367434616e-05, + "loss": 0.0599, + "step": 77040 + }, + { + "epoch": 1.94, + "learning_rate": 9.632439765846796e-05, + "loss": 0.0639, + "step": 77050 + }, + { + "epoch": 1.94, + "learning_rate": 9.594754164258977e-05, + "loss": 0.0599, + "step": 77060 + }, + { + "epoch": 1.94, + "learning_rate": 9.557068562671155e-05, + "loss": 0.0587, + "step": 77070 + }, + { + "epoch": 1.94, + "learning_rate": 9.519382961083335e-05, + "loss": 0.0657, + "step": 77080 + }, + { + "epoch": 1.94, + "learning_rate": 9.481697359495515e-05, + "loss": 0.0587, + "step": 77090 + }, + { + "epoch": 1.94, + "learning_rate": 9.444011757907696e-05, + "loss": 0.0648, + "step": 77100 + }, + { + "epoch": 1.94, + "learning_rate": 9.406326156319876e-05, + "loss": 0.063, + "step": 77110 + }, + { + "epoch": 1.94, + "learning_rate": 9.368640554732055e-05, + "loss": 0.0626, + "step": 77120 + }, + { + "epoch": 1.94, + "learning_rate": 9.330954953144236e-05, + "loss": 0.0587, + "step": 77130 + }, + { + "epoch": 1.94, + "learning_rate": 9.293269351556415e-05, + "loss": 0.0593, + "step": 77140 + }, + { + "epoch": 1.94, + "learning_rate": 9.255583749968596e-05, + "loss": 0.0608, + "step": 77150 + }, + { + "epoch": 1.94, + "learning_rate": 9.217898148380776e-05, + "loss": 0.0601, + "step": 77160 + }, + { + "epoch": 1.94, + "learning_rate": 9.180212546792956e-05, + "loss": 0.0618, + "step": 77170 + }, + { + "epoch": 1.94, + "learning_rate": 9.142526945205136e-05, + "loss": 0.0609, + "step": 77180 + }, + { + "epoch": 1.94, + "learning_rate": 9.104841343617315e-05, + "loss": 0.0617, + "step": 77190 + }, + { + "epoch": 1.94, + "learning_rate": 9.067155742029495e-05, + "loss": 0.0606, + "step": 77200 + }, + { + "epoch": 1.94, + "learning_rate": 9.029470140441675e-05, + "loss": 0.0592, + "step": 77210 + }, + { + "epoch": 1.94, + "learning_rate": 8.991784538853855e-05, + "loss": 0.0589, + "step": 77220 + }, + { + "epoch": 1.94, + "learning_rate": 8.954098937266035e-05, + "loss": 0.0596, + "step": 77230 + }, + { + "epoch": 1.94, + "learning_rate": 8.916413335678216e-05, + "loss": 0.0613, + "step": 77240 + }, + { + "epoch": 1.94, + "learning_rate": 8.878727734090395e-05, + "loss": 0.0617, + "step": 77250 + }, + { + "epoch": 1.94, + "learning_rate": 8.841042132502576e-05, + "loss": 0.0619, + "step": 77260 + }, + { + "epoch": 1.94, + "learning_rate": 8.803356530914756e-05, + "loss": 0.0617, + "step": 77270 + }, + { + "epoch": 1.94, + "learning_rate": 8.765670929326936e-05, + "loss": 0.0625, + "step": 77280 + }, + { + "epoch": 1.94, + "learning_rate": 8.727985327739116e-05, + "loss": 0.059, + "step": 77290 + }, + { + "epoch": 1.94, + "learning_rate": 8.690299726151296e-05, + "loss": 0.0642, + "step": 77300 + }, + { + "epoch": 1.94, + "learning_rate": 8.652614124563475e-05, + "loss": 0.0595, + "step": 77310 + }, + { + "epoch": 1.94, + "learning_rate": 8.614928522975655e-05, + "loss": 0.06, + "step": 77320 + }, + { + "epoch": 1.94, + "learning_rate": 8.577242921387835e-05, + "loss": 0.0631, + "step": 77330 + }, + { + "epoch": 1.94, + "learning_rate": 8.539557319800015e-05, + "loss": 0.0612, + "step": 77340 + }, + { + "epoch": 1.94, + "learning_rate": 8.501871718212195e-05, + "loss": 0.06, + "step": 77350 + }, + { + "epoch": 1.94, + "learning_rate": 8.464186116624375e-05, + "loss": 0.061, + "step": 77360 + }, + { + "epoch": 1.94, + "learning_rate": 8.426500515036555e-05, + "loss": 0.0617, + "step": 77370 + }, + { + "epoch": 1.94, + "learning_rate": 8.388814913448736e-05, + "loss": 0.0589, + "step": 77380 + }, + { + "epoch": 1.94, + "learning_rate": 8.351129311860914e-05, + "loss": 0.0638, + "step": 77390 + }, + { + "epoch": 1.94, + "learning_rate": 8.313443710273096e-05, + "loss": 0.0593, + "step": 77400 + }, + { + "epoch": 1.94, + "learning_rate": 8.275758108685276e-05, + "loss": 0.0609, + "step": 77410 + }, + { + "epoch": 1.95, + "learning_rate": 8.238072507097455e-05, + "loss": 0.0622, + "step": 77420 + }, + { + "epoch": 1.95, + "learning_rate": 8.200386905509635e-05, + "loss": 0.0592, + "step": 77430 + }, + { + "epoch": 1.95, + "learning_rate": 8.162701303921815e-05, + "loss": 0.0613, + "step": 77440 + }, + { + "epoch": 1.95, + "learning_rate": 8.125015702333995e-05, + "loss": 0.0625, + "step": 77450 + }, + { + "epoch": 1.95, + "learning_rate": 8.087330100746175e-05, + "loss": 0.0615, + "step": 77460 + }, + { + "epoch": 1.95, + "learning_rate": 8.049644499158355e-05, + "loss": 0.0609, + "step": 77470 + }, + { + "epoch": 1.95, + "learning_rate": 8.011958897570535e-05, + "loss": 0.0612, + "step": 77480 + }, + { + "epoch": 1.95, + "learning_rate": 7.974273295982716e-05, + "loss": 0.0612, + "step": 77490 + }, + { + "epoch": 1.95, + "learning_rate": 7.936587694394895e-05, + "loss": 0.0627, + "step": 77500 + }, + { + "epoch": 1.95, + "eval_cer": 0.6651560846522654, + "eval_loss": 0.05267711356282234, + "eval_runtime": 90.8378, + "eval_samples_per_second": 110.075, + "eval_steps_per_second": 6.88, + "step": 77500 + }, + { + "epoch": 1.95, + "learning_rate": 7.898902092807074e-05, + "loss": 0.0632, + "step": 77510 + }, + { + "epoch": 1.95, + "learning_rate": 7.861216491219256e-05, + "loss": 0.0586, + "step": 77520 + }, + { + "epoch": 1.95, + "learning_rate": 7.823530889631434e-05, + "loss": 0.0614, + "step": 77530 + }, + { + "epoch": 1.95, + "learning_rate": 7.785845288043615e-05, + "loss": 0.0623, + "step": 77540 + }, + { + "epoch": 1.95, + "learning_rate": 7.748159686455795e-05, + "loss": 0.0626, + "step": 77550 + }, + { + "epoch": 1.95, + "learning_rate": 7.710474084867975e-05, + "loss": 0.0603, + "step": 77560 + }, + { + "epoch": 1.95, + "learning_rate": 7.672788483280155e-05, + "loss": 0.0623, + "step": 77570 + }, + { + "epoch": 1.95, + "learning_rate": 7.635102881692335e-05, + "loss": 0.063, + "step": 77580 + }, + { + "epoch": 1.95, + "learning_rate": 7.597417280104515e-05, + "loss": 0.0625, + "step": 77590 + }, + { + "epoch": 1.95, + "learning_rate": 7.559731678516695e-05, + "loss": 0.0582, + "step": 77600 + }, + { + "epoch": 1.95, + "learning_rate": 7.522046076928875e-05, + "loss": 0.0616, + "step": 77610 + }, + { + "epoch": 1.95, + "learning_rate": 7.484360475341055e-05, + "loss": 0.0619, + "step": 77620 + }, + { + "epoch": 1.95, + "learning_rate": 7.446674873753236e-05, + "loss": 0.0604, + "step": 77630 + }, + { + "epoch": 1.95, + "learning_rate": 7.408989272165414e-05, + "loss": 0.0649, + "step": 77640 + }, + { + "epoch": 1.95, + "learning_rate": 7.371303670577596e-05, + "loss": 0.0632, + "step": 77650 + }, + { + "epoch": 1.95, + "learning_rate": 7.333618068989775e-05, + "loss": 0.06, + "step": 77660 + }, + { + "epoch": 1.95, + "learning_rate": 7.295932467401954e-05, + "loss": 0.059, + "step": 77670 + }, + { + "epoch": 1.95, + "learning_rate": 7.258246865814135e-05, + "loss": 0.0617, + "step": 77680 + }, + { + "epoch": 1.95, + "learning_rate": 7.220561264226314e-05, + "loss": 0.0604, + "step": 77690 + }, + { + "epoch": 1.95, + "learning_rate": 7.182875662638495e-05, + "loss": 0.0627, + "step": 77700 + }, + { + "epoch": 1.95, + "learning_rate": 7.145190061050675e-05, + "loss": 0.0601, + "step": 77710 + }, + { + "epoch": 1.95, + "learning_rate": 7.107504459462855e-05, + "loss": 0.0644, + "step": 77720 + }, + { + "epoch": 1.95, + "learning_rate": 7.069818857875035e-05, + "loss": 0.0596, + "step": 77730 + }, + { + "epoch": 1.95, + "learning_rate": 7.032133256287214e-05, + "loss": 0.0626, + "step": 77740 + }, + { + "epoch": 1.95, + "learning_rate": 6.994447654699394e-05, + "loss": 0.0589, + "step": 77750 + }, + { + "epoch": 1.95, + "learning_rate": 6.956762053111574e-05, + "loss": 0.0616, + "step": 77760 + }, + { + "epoch": 1.95, + "learning_rate": 6.919076451523755e-05, + "loss": 0.062, + "step": 77770 + }, + { + "epoch": 1.95, + "learning_rate": 6.881390849935934e-05, + "loss": 0.0619, + "step": 77780 + }, + { + "epoch": 1.95, + "learning_rate": 6.843705248348115e-05, + "loss": 0.0602, + "step": 77790 + }, + { + "epoch": 1.95, + "learning_rate": 6.806019646760295e-05, + "loss": 0.0604, + "step": 77800 + }, + { + "epoch": 1.95, + "learning_rate": 6.768334045172475e-05, + "loss": 0.0636, + "step": 77810 + }, + { + "epoch": 1.96, + "learning_rate": 6.730648443584655e-05, + "loss": 0.0588, + "step": 77820 + }, + { + "epoch": 1.96, + "learning_rate": 6.692962841996833e-05, + "loss": 0.0653, + "step": 77830 + }, + { + "epoch": 1.96, + "learning_rate": 6.655277240409015e-05, + "loss": 0.0624, + "step": 77840 + }, + { + "epoch": 1.96, + "learning_rate": 6.617591638821195e-05, + "loss": 0.0609, + "step": 77850 + }, + { + "epoch": 1.96, + "learning_rate": 6.579906037233374e-05, + "loss": 0.0611, + "step": 77860 + }, + { + "epoch": 1.96, + "learning_rate": 6.542220435645554e-05, + "loss": 0.0619, + "step": 77870 + }, + { + "epoch": 1.96, + "learning_rate": 6.504534834057734e-05, + "loss": 0.0622, + "step": 77880 + }, + { + "epoch": 1.96, + "learning_rate": 6.466849232469914e-05, + "loss": 0.0595, + "step": 77890 + }, + { + "epoch": 1.96, + "learning_rate": 6.429163630882094e-05, + "loss": 0.0605, + "step": 77900 + }, + { + "epoch": 1.96, + "learning_rate": 6.391478029294275e-05, + "loss": 0.0599, + "step": 77910 + }, + { + "epoch": 1.96, + "learning_rate": 6.353792427706454e-05, + "loss": 0.0602, + "step": 77920 + }, + { + "epoch": 1.96, + "learning_rate": 6.316106826118635e-05, + "loss": 0.0633, + "step": 77930 + }, + { + "epoch": 1.96, + "learning_rate": 6.278421224530815e-05, + "loss": 0.0625, + "step": 77940 + }, + { + "epoch": 1.96, + "learning_rate": 6.240735622942995e-05, + "loss": 0.06, + "step": 77950 + }, + { + "epoch": 1.96, + "learning_rate": 6.203050021355175e-05, + "loss": 0.059, + "step": 77960 + }, + { + "epoch": 1.96, + "learning_rate": 6.165364419767355e-05, + "loss": 0.0586, + "step": 77970 + }, + { + "epoch": 1.96, + "learning_rate": 6.127678818179534e-05, + "loss": 0.0617, + "step": 77980 + }, + { + "epoch": 1.96, + "learning_rate": 6.089993216591715e-05, + "loss": 0.0621, + "step": 77990 + }, + { + "epoch": 1.96, + "learning_rate": 6.052307615003894e-05, + "loss": 0.0607, + "step": 78000 + }, + { + "epoch": 1.96, + "eval_cer": 0.6651161425346498, + "eval_loss": 0.052589353173971176, + "eval_runtime": 90.6912, + "eval_samples_per_second": 110.253, + "eval_steps_per_second": 6.892, + "step": 78000 + }, + { + "epoch": 1.96, + "learning_rate": 6.014622013416074e-05, + "loss": 0.0597, + "step": 78010 + }, + { + "epoch": 1.96, + "learning_rate": 5.9769364118282546e-05, + "loss": 0.0611, + "step": 78020 + }, + { + "epoch": 1.96, + "learning_rate": 5.939250810240434e-05, + "loss": 0.0614, + "step": 78030 + }, + { + "epoch": 1.96, + "learning_rate": 5.9015652086526144e-05, + "loss": 0.062, + "step": 78040 + }, + { + "epoch": 1.96, + "learning_rate": 5.863879607064795e-05, + "loss": 0.0651, + "step": 78050 + }, + { + "epoch": 1.96, + "learning_rate": 5.826194005476974e-05, + "loss": 0.0595, + "step": 78060 + }, + { + "epoch": 1.96, + "learning_rate": 5.788508403889155e-05, + "loss": 0.0611, + "step": 78070 + }, + { + "epoch": 1.96, + "learning_rate": 5.750822802301334e-05, + "loss": 0.063, + "step": 78080 + }, + { + "epoch": 1.96, + "learning_rate": 5.713137200713514e-05, + "loss": 0.0613, + "step": 78090 + }, + { + "epoch": 1.96, + "learning_rate": 5.6754515991256943e-05, + "loss": 0.0603, + "step": 78100 + }, + { + "epoch": 1.96, + "learning_rate": 5.6377659975378736e-05, + "loss": 0.0592, + "step": 78110 + }, + { + "epoch": 1.96, + "learning_rate": 5.600080395950054e-05, + "loss": 0.0621, + "step": 78120 + }, + { + "epoch": 1.96, + "learning_rate": 5.562394794362235e-05, + "loss": 0.0623, + "step": 78130 + }, + { + "epoch": 1.96, + "learning_rate": 5.524709192774414e-05, + "loss": 0.06, + "step": 78140 + }, + { + "epoch": 1.96, + "learning_rate": 5.4870235911865944e-05, + "loss": 0.0623, + "step": 78150 + }, + { + "epoch": 1.96, + "learning_rate": 5.449337989598774e-05, + "loss": 0.0603, + "step": 78160 + }, + { + "epoch": 1.96, + "learning_rate": 5.4116523880109535e-05, + "loss": 0.0575, + "step": 78170 + }, + { + "epoch": 1.96, + "learning_rate": 5.373966786423134e-05, + "loss": 0.0605, + "step": 78180 + }, + { + "epoch": 1.96, + "learning_rate": 5.3362811848353147e-05, + "loss": 0.0585, + "step": 78190 + }, + { + "epoch": 1.96, + "learning_rate": 5.298595583247494e-05, + "loss": 0.0596, + "step": 78200 + }, + { + "epoch": 1.96, + "learning_rate": 5.2609099816596744e-05, + "loss": 0.0609, + "step": 78210 + }, + { + "epoch": 1.97, + "learning_rate": 5.2232243800718536e-05, + "loss": 0.0582, + "step": 78220 + }, + { + "epoch": 1.97, + "learning_rate": 5.185538778484034e-05, + "loss": 0.0607, + "step": 78230 + }, + { + "epoch": 1.97, + "learning_rate": 5.147853176896214e-05, + "loss": 0.0582, + "step": 78240 + }, + { + "epoch": 1.97, + "learning_rate": 5.110167575308393e-05, + "loss": 0.0598, + "step": 78250 + }, + { + "epoch": 1.97, + "learning_rate": 5.072481973720574e-05, + "loss": 0.0581, + "step": 78260 + }, + { + "epoch": 1.97, + "learning_rate": 5.0347963721327544e-05, + "loss": 0.0578, + "step": 78270 + }, + { + "epoch": 1.97, + "learning_rate": 4.9971107705449336e-05, + "loss": 0.0608, + "step": 78280 + }, + { + "epoch": 1.97, + "learning_rate": 4.959425168957114e-05, + "loss": 0.0587, + "step": 78290 + }, + { + "epoch": 1.97, + "learning_rate": 4.921739567369294e-05, + "loss": 0.0607, + "step": 78300 + }, + { + "epoch": 1.97, + "learning_rate": 4.884053965781474e-05, + "loss": 0.0617, + "step": 78310 + }, + { + "epoch": 1.97, + "learning_rate": 4.846368364193654e-05, + "loss": 0.0616, + "step": 78320 + }, + { + "epoch": 1.97, + "learning_rate": 4.808682762605833e-05, + "loss": 0.0586, + "step": 78330 + }, + { + "epoch": 1.97, + "learning_rate": 4.7709971610180136e-05, + "loss": 0.0585, + "step": 78340 + }, + { + "epoch": 1.97, + "learning_rate": 4.733311559430194e-05, + "loss": 0.0597, + "step": 78350 + }, + { + "epoch": 1.97, + "learning_rate": 4.6956259578423734e-05, + "loss": 0.0604, + "step": 78360 + }, + { + "epoch": 1.97, + "learning_rate": 4.657940356254554e-05, + "loss": 0.0638, + "step": 78370 + }, + { + "epoch": 1.97, + "learning_rate": 4.620254754666734e-05, + "loss": 0.0605, + "step": 78380 + }, + { + "epoch": 1.97, + "learning_rate": 4.582569153078914e-05, + "loss": 0.0664, + "step": 78390 + }, + { + "epoch": 1.97, + "learning_rate": 4.5448835514910936e-05, + "loss": 0.0597, + "step": 78400 + }, + { + "epoch": 1.97, + "learning_rate": 4.5071979499032734e-05, + "loss": 0.061, + "step": 78410 + }, + { + "epoch": 1.97, + "learning_rate": 4.469512348315453e-05, + "loss": 0.0616, + "step": 78420 + }, + { + "epoch": 1.97, + "learning_rate": 4.431826746727634e-05, + "loss": 0.0611, + "step": 78430 + }, + { + "epoch": 1.97, + "learning_rate": 4.394141145139814e-05, + "loss": 0.0631, + "step": 78440 + }, + { + "epoch": 1.97, + "learning_rate": 4.3564555435519937e-05, + "loss": 0.0592, + "step": 78450 + }, + { + "epoch": 1.97, + "learning_rate": 4.3187699419641735e-05, + "loss": 0.0617, + "step": 78460 + }, + { + "epoch": 1.97, + "learning_rate": 4.2810843403763534e-05, + "loss": 0.0619, + "step": 78470 + }, + { + "epoch": 1.97, + "learning_rate": 4.243398738788533e-05, + "loss": 0.0592, + "step": 78480 + }, + { + "epoch": 1.97, + "learning_rate": 4.205713137200713e-05, + "loss": 0.0607, + "step": 78490 + }, + { + "epoch": 1.97, + "learning_rate": 4.168027535612894e-05, + "loss": 0.0607, + "step": 78500 + }, + { + "epoch": 1.97, + "eval_cer": 0.6651493474276073, + "eval_loss": 0.052500005811452866, + "eval_runtime": 91.3787, + "eval_samples_per_second": 109.424, + "eval_steps_per_second": 6.84, + "step": 78500 + }, + { + "epoch": 1.97, + "learning_rate": 4.1303419340250736e-05, + "loss": 0.0597, + "step": 78510 + }, + { + "epoch": 1.97, + "learning_rate": 4.0926563324372535e-05, + "loss": 0.061, + "step": 78520 + }, + { + "epoch": 1.97, + "learning_rate": 4.054970730849434e-05, + "loss": 0.0643, + "step": 78530 + }, + { + "epoch": 1.97, + "learning_rate": 4.017285129261613e-05, + "loss": 0.0577, + "step": 78540 + }, + { + "epoch": 1.97, + "learning_rate": 3.979599527673793e-05, + "loss": 0.06, + "step": 78550 + }, + { + "epoch": 1.97, + "learning_rate": 3.941913926085973e-05, + "loss": 0.0619, + "step": 78560 + }, + { + "epoch": 1.97, + "learning_rate": 3.9042283244981536e-05, + "loss": 0.0619, + "step": 78570 + }, + { + "epoch": 1.97, + "learning_rate": 3.8665427229103335e-05, + "loss": 0.0575, + "step": 78580 + }, + { + "epoch": 1.97, + "learning_rate": 3.8288571213225134e-05, + "loss": 0.0604, + "step": 78590 + }, + { + "epoch": 1.97, + "learning_rate": 3.791171519734694e-05, + "loss": 0.0616, + "step": 78600 + }, + { + "epoch": 1.97, + "learning_rate": 3.753485918146874e-05, + "loss": 0.0618, + "step": 78610 + }, + { + "epoch": 1.98, + "learning_rate": 3.715800316559053e-05, + "loss": 0.0605, + "step": 78620 + }, + { + "epoch": 1.98, + "learning_rate": 3.678114714971233e-05, + "loss": 0.059, + "step": 78630 + }, + { + "epoch": 1.98, + "learning_rate": 3.6404291133834135e-05, + "loss": 0.0624, + "step": 78640 + }, + { + "epoch": 1.98, + "learning_rate": 3.6027435117955934e-05, + "loss": 0.0597, + "step": 78650 + }, + { + "epoch": 1.98, + "learning_rate": 3.565057910207773e-05, + "loss": 0.0596, + "step": 78660 + }, + { + "epoch": 1.98, + "learning_rate": 3.527372308619954e-05, + "loss": 0.0583, + "step": 78670 + }, + { + "epoch": 1.98, + "learning_rate": 3.489686707032134e-05, + "loss": 0.0632, + "step": 78680 + }, + { + "epoch": 1.98, + "learning_rate": 3.4520011054443136e-05, + "loss": 0.0659, + "step": 78690 + }, + { + "epoch": 1.98, + "learning_rate": 3.414315503856493e-05, + "loss": 0.0619, + "step": 78700 + }, + { + "epoch": 1.98, + "learning_rate": 3.3766299022686733e-05, + "loss": 0.0598, + "step": 78710 + }, + { + "epoch": 1.98, + "learning_rate": 3.338944300680853e-05, + "loss": 0.0597, + "step": 78720 + }, + { + "epoch": 1.98, + "learning_rate": 3.301258699093033e-05, + "loss": 0.06, + "step": 78730 + }, + { + "epoch": 1.98, + "learning_rate": 3.263573097505213e-05, + "loss": 0.0583, + "step": 78740 + }, + { + "epoch": 1.98, + "learning_rate": 3.2258874959173936e-05, + "loss": 0.0622, + "step": 78750 + }, + { + "epoch": 1.98, + "learning_rate": 3.1882018943295734e-05, + "loss": 0.0592, + "step": 78760 + }, + { + "epoch": 1.98, + "learning_rate": 3.150516292741753e-05, + "loss": 0.0594, + "step": 78770 + }, + { + "epoch": 1.98, + "learning_rate": 3.112830691153933e-05, + "loss": 0.0605, + "step": 78780 + }, + { + "epoch": 1.98, + "learning_rate": 3.075145089566113e-05, + "loss": 0.0601, + "step": 78790 + }, + { + "epoch": 1.98, + "learning_rate": 3.037459487978293e-05, + "loss": 0.0599, + "step": 78800 + }, + { + "epoch": 1.98, + "learning_rate": 2.999773886390473e-05, + "loss": 0.0599, + "step": 78810 + }, + { + "epoch": 1.98, + "learning_rate": 2.9620882848026534e-05, + "loss": 0.0627, + "step": 78820 + }, + { + "epoch": 1.98, + "learning_rate": 2.924402683214833e-05, + "loss": 0.0586, + "step": 78830 + }, + { + "epoch": 1.98, + "learning_rate": 2.886717081627013e-05, + "loss": 0.0597, + "step": 78840 + }, + { + "epoch": 1.98, + "learning_rate": 2.8490314800391934e-05, + "loss": 0.0602, + "step": 78850 + }, + { + "epoch": 1.98, + "learning_rate": 2.8113458784513733e-05, + "loss": 0.0621, + "step": 78860 + }, + { + "epoch": 1.98, + "learning_rate": 2.773660276863553e-05, + "loss": 0.0617, + "step": 78870 + }, + { + "epoch": 1.98, + "learning_rate": 2.7359746752757327e-05, + "loss": 0.0595, + "step": 78880 + }, + { + "epoch": 1.98, + "learning_rate": 2.6982890736879133e-05, + "loss": 0.0631, + "step": 78890 + }, + { + "epoch": 1.98, + "learning_rate": 2.660603472100093e-05, + "loss": 0.0568, + "step": 78900 + }, + { + "epoch": 1.98, + "learning_rate": 2.6229178705122727e-05, + "loss": 0.0623, + "step": 78910 + }, + { + "epoch": 1.98, + "learning_rate": 2.5852322689244533e-05, + "loss": 0.0615, + "step": 78920 + }, + { + "epoch": 1.98, + "learning_rate": 2.547546667336633e-05, + "loss": 0.0599, + "step": 78930 + }, + { + "epoch": 1.98, + "learning_rate": 2.509861065748813e-05, + "loss": 0.0592, + "step": 78940 + }, + { + "epoch": 1.98, + "learning_rate": 2.4721754641609926e-05, + "loss": 0.0628, + "step": 78950 + }, + { + "epoch": 1.98, + "learning_rate": 2.434489862573173e-05, + "loss": 0.0603, + "step": 78960 + }, + { + "epoch": 1.98, + "learning_rate": 2.396804260985353e-05, + "loss": 0.0597, + "step": 78970 + }, + { + "epoch": 1.98, + "learning_rate": 2.359118659397533e-05, + "loss": 0.0591, + "step": 78980 + }, + { + "epoch": 1.98, + "learning_rate": 2.3214330578097128e-05, + "loss": 0.0617, + "step": 78990 + }, + { + "epoch": 1.98, + "learning_rate": 2.283747456221893e-05, + "loss": 0.0608, + "step": 79000 + }, + { + "epoch": 1.98, + "eval_cer": 0.6651329855962949, + "eval_loss": 0.0524982325732708, + "eval_runtime": 90.4461, + "eval_samples_per_second": 110.552, + "eval_steps_per_second": 6.91, + "step": 79000 + }, + { + "epoch": 1.98, + "learning_rate": 2.246061854634073e-05, + "loss": 0.0608, + "step": 79010 + }, + { + "epoch": 1.99, + "learning_rate": 2.2083762530462528e-05, + "loss": 0.0595, + "step": 79020 + }, + { + "epoch": 1.99, + "learning_rate": 2.1706906514584327e-05, + "loss": 0.0613, + "step": 79030 + }, + { + "epoch": 1.99, + "learning_rate": 2.133005049870613e-05, + "loss": 0.0617, + "step": 79040 + }, + { + "epoch": 1.99, + "learning_rate": 2.0953194482827928e-05, + "loss": 0.0616, + "step": 79050 + }, + { + "epoch": 1.99, + "learning_rate": 2.0576338466949727e-05, + "loss": 0.0573, + "step": 79060 + }, + { + "epoch": 1.99, + "learning_rate": 2.0199482451071525e-05, + "loss": 0.0622, + "step": 79070 + }, + { + "epoch": 1.99, + "learning_rate": 1.9822626435193328e-05, + "loss": 0.0612, + "step": 79080 + }, + { + "epoch": 1.99, + "learning_rate": 1.944577041931513e-05, + "loss": 0.0601, + "step": 79090 + }, + { + "epoch": 1.99, + "learning_rate": 1.9068914403436925e-05, + "loss": 0.0604, + "step": 79100 + }, + { + "epoch": 1.99, + "learning_rate": 1.8692058387558728e-05, + "loss": 0.0615, + "step": 79110 + }, + { + "epoch": 1.99, + "learning_rate": 1.8315202371680526e-05, + "loss": 0.062, + "step": 79120 + }, + { + "epoch": 1.99, + "learning_rate": 1.793834635580233e-05, + "loss": 0.0617, + "step": 79130 + }, + { + "epoch": 1.99, + "learning_rate": 1.7561490339924124e-05, + "loss": 0.0614, + "step": 79140 + }, + { + "epoch": 1.99, + "learning_rate": 1.7184634324045926e-05, + "loss": 0.0594, + "step": 79150 + }, + { + "epoch": 1.99, + "learning_rate": 1.680777830816773e-05, + "loss": 0.0623, + "step": 79160 + }, + { + "epoch": 1.99, + "learning_rate": 1.6430922292289527e-05, + "loss": 0.057, + "step": 79170 + }, + { + "epoch": 1.99, + "learning_rate": 1.6054066276411326e-05, + "loss": 0.061, + "step": 79180 + }, + { + "epoch": 1.99, + "learning_rate": 1.5677210260533125e-05, + "loss": 0.0611, + "step": 79190 + }, + { + "epoch": 1.99, + "learning_rate": 1.5300354244654927e-05, + "loss": 0.0583, + "step": 79200 + }, + { + "epoch": 1.99, + "learning_rate": 1.4923498228776724e-05, + "loss": 0.0612, + "step": 79210 + }, + { + "epoch": 1.99, + "learning_rate": 1.4546642212898525e-05, + "loss": 0.0616, + "step": 79220 + }, + { + "epoch": 1.99, + "learning_rate": 1.4169786197020324e-05, + "loss": 0.0598, + "step": 79230 + }, + { + "epoch": 1.99, + "learning_rate": 1.3792930181142124e-05, + "loss": 0.0588, + "step": 79240 + }, + { + "epoch": 1.99, + "learning_rate": 1.3416074165263927e-05, + "loss": 0.059, + "step": 79250 + }, + { + "epoch": 1.99, + "learning_rate": 1.3039218149385725e-05, + "loss": 0.0625, + "step": 79260 + }, + { + "epoch": 1.99, + "learning_rate": 1.2662362133507526e-05, + "loss": 0.0611, + "step": 79270 + }, + { + "epoch": 1.99, + "learning_rate": 1.2285506117629325e-05, + "loss": 0.0597, + "step": 79280 + }, + { + "epoch": 1.99, + "learning_rate": 1.1908650101751125e-05, + "loss": 0.0572, + "step": 79290 + }, + { + "epoch": 1.99, + "learning_rate": 1.1531794085872924e-05, + "loss": 0.0631, + "step": 79300 + }, + { + "epoch": 1.99, + "learning_rate": 1.1154938069994725e-05, + "loss": 0.0641, + "step": 79310 + }, + { + "epoch": 1.99, + "learning_rate": 1.0778082054116523e-05, + "loss": 0.0587, + "step": 79320 + }, + { + "epoch": 1.99, + "learning_rate": 1.0401226038238324e-05, + "loss": 0.0644, + "step": 79330 + }, + { + "epoch": 1.99, + "learning_rate": 1.0024370022360123e-05, + "loss": 0.0589, + "step": 79340 + }, + { + "epoch": 1.99, + "learning_rate": 9.647514006481923e-06, + "loss": 0.0602, + "step": 79350 + }, + { + "epoch": 1.99, + "learning_rate": 9.270657990603724e-06, + "loss": 0.0591, + "step": 79360 + }, + { + "epoch": 1.99, + "learning_rate": 8.893801974725524e-06, + "loss": 0.0617, + "step": 79370 + }, + { + "epoch": 1.99, + "learning_rate": 8.516945958847323e-06, + "loss": 0.0602, + "step": 79380 + }, + { + "epoch": 1.99, + "learning_rate": 8.140089942969124e-06, + "loss": 0.0613, + "step": 79390 + }, + { + "epoch": 1.99, + "learning_rate": 7.763233927090923e-06, + "loss": 0.0571, + "step": 79400 + }, + { + "epoch": 2.0, + "learning_rate": 7.386377911212722e-06, + "loss": 0.0634, + "step": 79410 + }, + { + "epoch": 2.0, + "learning_rate": 7.009521895334522e-06, + "loss": 0.062, + "step": 79420 + }, + { + "epoch": 2.0, + "learning_rate": 6.632665879456322e-06, + "loss": 0.0641, + "step": 79430 + }, + { + "epoch": 2.0, + "learning_rate": 6.255809863578123e-06, + "loss": 0.0608, + "step": 79440 + }, + { + "epoch": 2.0, + "learning_rate": 5.878953847699923e-06, + "loss": 0.0603, + "step": 79450 + }, + { + "epoch": 2.0, + "learning_rate": 5.502097831821722e-06, + "loss": 0.0619, + "step": 79460 + }, + { + "epoch": 2.0, + "learning_rate": 5.125241815943522e-06, + "loss": 0.0595, + "step": 79470 + }, + { + "epoch": 2.0, + "learning_rate": 4.748385800065322e-06, + "loss": 0.0601, + "step": 79480 + }, + { + "epoch": 2.0, + "learning_rate": 4.3715297841871215e-06, + "loss": 0.0571, + "step": 79490 + }, + { + "epoch": 2.0, + "learning_rate": 3.994673768308922e-06, + "loss": 0.0609, + "step": 79500 + }, + { + "epoch": 2.0, + "eval_cer": 0.665112292691988, + "eval_loss": 0.0524970106780529, + "eval_runtime": 90.3409, + "eval_samples_per_second": 110.681, + "eval_steps_per_second": 6.918, + "step": 79500 + }, + { + "epoch": 2.0, + "learning_rate": 3.6178177524307217e-06, + "loss": 0.0622, + "step": 79510 + }, + { + "epoch": 2.0, + "learning_rate": 3.2409617365525214e-06, + "loss": 0.0615, + "step": 79520 + }, + { + "epoch": 2.0, + "learning_rate": 2.864105720674321e-06, + "loss": 0.0603, + "step": 79530 + }, + { + "epoch": 2.0, + "learning_rate": 2.4872497047961207e-06, + "loss": 0.0585, + "step": 79540 + }, + { + "epoch": 2.0, + "learning_rate": 2.110393688917921e-06, + "loss": 0.0578, + "step": 79550 + }, + { + "epoch": 2.0, + "learning_rate": 1.7335376730397205e-06, + "loss": 0.0584, + "step": 79560 + }, + { + "epoch": 2.0, + "learning_rate": 1.3566816571615204e-06, + "loss": 0.0625, + "step": 79570 + }, + { + "epoch": 2.0, + "learning_rate": 9.798256412833203e-07, + "loss": 0.0624, + "step": 79580 + }, + { + "epoch": 2.0, + "learning_rate": 6.029696254051202e-07, + "loss": 0.0634, + "step": 79590 + }, + { + "epoch": 2.0, + "learning_rate": 2.261136095269201e-07, + "loss": 0.0606, + "step": 79600 + }, + { + "epoch": 2.0, + "step": 79606, + "total_flos": 3.941634629940987e+18, + "train_loss": 0.1818607694105572, + "train_runtime": 106697.7235, + "train_samples_per_second": 191.002, + "train_steps_per_second": 0.746 + } + ], + "max_steps": 79606, + "num_train_epochs": 2, + "total_flos": 3.941634629940987e+18, + "trial_name": null, + "trial_params": null +}