{ "best_metric": 1.0, "best_model_checkpoint": "./wav2vec2-large-xlsr-am-readspeech/checkpoint-1000", "epoch": 882.3529411764706, "global_step": 300000, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.29, "learning_rate": 9.600000000000001e-07, "loss": 86.8013, "step": 100 }, { "epoch": 0.59, "learning_rate": 1.9500000000000004e-06, "loss": 89.2281, "step": 200 }, { "epoch": 0.88, "learning_rate": 2.9400000000000002e-06, "loss": 88.7762, "step": 300 }, { "epoch": 1.18, "learning_rate": 3.920000000000001e-06, "loss": 77.8155, "step": 400 }, { "epoch": 1.47, "learning_rate": 4.92e-06, "loss": 52.179, "step": 500 }, { "epoch": 1.76, "learning_rate": 5.92e-06, "loss": 35.7863, "step": 600 }, { "epoch": 2.06, "learning_rate": 6.92e-06, "loss": 26.2136, "step": 700 }, { "epoch": 2.35, "learning_rate": 7.92e-06, "loss": 20.6276, "step": 800 }, { "epoch": 2.65, "learning_rate": 8.920000000000001e-06, "loss": 15.9237, "step": 900 }, { "epoch": 2.94, "learning_rate": 9.920000000000002e-06, "loss": 11.6857, "step": 1000 }, { "epoch": 2.94, "eval_cer": 1.0, "eval_loss": 7.346815586090088, "eval_runtime": 5.3, "eval_samples_per_second": 67.735, "eval_steps_per_second": 2.264, "eval_wer": 1.0, "step": 1000 }, { "epoch": 3.24, "learning_rate": 9.999997663999142e-06, "loss": 9.1586, "step": 1100 }, { "epoch": 3.53, "learning_rate": 9.999989825813658e-06, "loss": 7.1107, "step": 1200 }, { "epoch": 3.82, "learning_rate": 9.999976467788685e-06, "loss": 5.7195, "step": 1300 }, { "epoch": 4.12, "learning_rate": 9.999957589938964e-06, "loss": 4.9527, "step": 1400 }, { "epoch": 4.41, "learning_rate": 9.999933192285338e-06, "loss": 4.5071, "step": 1500 }, { "epoch": 4.71, "learning_rate": 9.999903274854741e-06, "loss": 4.3014, "step": 1600 }, { "epoch": 5.0, "learning_rate": 9.9998678376802e-06, "loss": 4.1745, "step": 1700 }, { "epoch": 5.29, "learning_rate": 9.999826880800839e-06, "loss": 4.0713, "step": 1800 }, { "epoch": 5.59, "learning_rate": 9.999780404261869e-06, "loss": 4.0451, "step": 1900 }, { "epoch": 5.88, "learning_rate": 9.999728408114603e-06, "loss": 4.0204, "step": 2000 }, { "epoch": 5.88, "eval_cer": 1.0, "eval_loss": 3.9740476608276367, "eval_runtime": 4.9396, "eval_samples_per_second": 72.677, "eval_steps_per_second": 2.429, "eval_wer": 1.0, "step": 2000 }, { "epoch": 6.18, "learning_rate": 9.99967089241644e-06, "loss": 4.0045, "step": 2100 }, { "epoch": 6.47, "learning_rate": 9.999607857230877e-06, "loss": 3.9876, "step": 2200 }, { "epoch": 6.76, "learning_rate": 9.999539302627506e-06, "loss": 3.9874, "step": 2300 }, { "epoch": 7.06, "learning_rate": 9.999465228682003e-06, "loss": 3.9738, "step": 2400 }, { "epoch": 7.35, "learning_rate": 9.999385635476149e-06, "loss": 3.9781, "step": 2500 }, { "epoch": 7.65, "learning_rate": 9.99930052309781e-06, "loss": 3.9684, "step": 2600 }, { "epoch": 7.94, "learning_rate": 9.999209891640947e-06, "loss": 3.9763, "step": 2700 }, { "epoch": 8.24, "learning_rate": 9.999113741205614e-06, "loss": 3.9637, "step": 2800 }, { "epoch": 8.53, "learning_rate": 9.99901207189796e-06, "loss": 3.9731, "step": 2900 }, { "epoch": 8.82, "learning_rate": 9.998904883830225e-06, "loss": 3.9552, "step": 3000 }, { "epoch": 8.82, "eval_cer": 1.0, "eval_loss": 3.934492826461792, "eval_runtime": 5.2265, "eval_samples_per_second": 68.688, "eval_steps_per_second": 2.296, "eval_wer": 1.0, "step": 3000 }, { "epoch": 9.12, "learning_rate": 9.99879217712074e-06, "loss": 3.9658, "step": 3100 }, { "epoch": 9.41, "learning_rate": 9.998673951893931e-06, "loss": 3.9614, "step": 3200 }, { "epoch": 9.71, "learning_rate": 9.998550208280315e-06, "loss": 3.9444, "step": 3300 }, { "epoch": 10.0, "learning_rate": 9.9984209464165e-06, "loss": 3.9541, "step": 3400 }, { "epoch": 10.29, "learning_rate": 9.998286166445188e-06, "loss": 3.9426, "step": 3500 }, { "epoch": 10.59, "learning_rate": 9.998145868515175e-06, "loss": 3.9418, "step": 3600 }, { "epoch": 10.88, "learning_rate": 9.99800005278134e-06, "loss": 3.9312, "step": 3700 }, { "epoch": 11.18, "learning_rate": 9.997848719404663e-06, "loss": 3.996, "step": 3800 }, { "epoch": 11.47, "learning_rate": 9.99769186855221e-06, "loss": 3.933, "step": 3900 }, { "epoch": 11.76, "learning_rate": 9.997529500397141e-06, "loss": 3.9274, "step": 4000 }, { "epoch": 11.76, "eval_cer": 1.0, "eval_loss": 3.912527322769165, "eval_runtime": 5.1053, "eval_samples_per_second": 70.319, "eval_steps_per_second": 2.35, "eval_wer": 1.0, "step": 4000 }, { "epoch": 12.06, "learning_rate": 9.997361615118704e-06, "loss": 3.9269, "step": 4100 }, { "epoch": 12.35, "learning_rate": 9.997188212902243e-06, "loss": 3.9286, "step": 4200 }, { "epoch": 12.65, "learning_rate": 9.997009293939183e-06, "loss": 3.9162, "step": 4300 }, { "epoch": 12.94, "learning_rate": 9.99682485842705e-06, "loss": 3.9178, "step": 4400 }, { "epoch": 13.24, "learning_rate": 9.996634906569453e-06, "loss": 3.9131, "step": 4500 }, { "epoch": 13.53, "learning_rate": 9.996439438576094e-06, "loss": 3.9081, "step": 4600 }, { "epoch": 13.82, "learning_rate": 9.996238454662763e-06, "loss": 3.9048, "step": 4700 }, { "epoch": 14.12, "learning_rate": 9.996031955051341e-06, "loss": 3.9077, "step": 4800 }, { "epoch": 14.41, "learning_rate": 9.995819939969797e-06, "loss": 3.8908, "step": 4900 }, { "epoch": 14.71, "learning_rate": 9.995602409652191e-06, "loss": 3.8873, "step": 5000 }, { "epoch": 14.71, "eval_cer": 1.0, "eval_loss": 3.8573012351989746, "eval_runtime": 4.9589, "eval_samples_per_second": 72.395, "eval_steps_per_second": 2.42, "eval_wer": 1.0, "step": 5000 }, { "epoch": 15.0, "learning_rate": 9.995379364338668e-06, "loss": 3.8741, "step": 5100 }, { "epoch": 15.29, "learning_rate": 9.995150804275463e-06, "loss": 3.8651, "step": 5200 }, { "epoch": 15.59, "learning_rate": 9.994916729714902e-06, "loss": 3.8553, "step": 5300 }, { "epoch": 15.88, "learning_rate": 9.994677140915393e-06, "loss": 3.8397, "step": 5400 }, { "epoch": 16.18, "learning_rate": 9.994432038141437e-06, "loss": 3.828, "step": 5500 }, { "epoch": 16.47, "learning_rate": 9.994181421663621e-06, "loss": 3.802, "step": 5600 }, { "epoch": 16.76, "learning_rate": 9.993925291758616e-06, "loss": 3.7886, "step": 5700 }, { "epoch": 17.06, "learning_rate": 9.993663648709183e-06, "loss": 3.7534, "step": 5800 }, { "epoch": 17.35, "learning_rate": 9.993396492804167e-06, "loss": 3.7186, "step": 5900 }, { "epoch": 17.65, "learning_rate": 9.993123824338502e-06, "loss": 3.6704, "step": 6000 }, { "epoch": 17.65, "eval_cer": 0.9529227147901138, "eval_loss": 3.5608274936676025, "eval_runtime": 5.4159, "eval_samples_per_second": 66.286, "eval_steps_per_second": 2.216, "eval_wer": 0.9709817830082218, "step": 6000 }, { "epoch": 17.94, "learning_rate": 9.992845643613204e-06, "loss": 3.6186, "step": 6100 }, { "epoch": 18.24, "learning_rate": 9.992561950935379e-06, "loss": 3.5561, "step": 6200 }, { "epoch": 18.53, "learning_rate": 9.99227274661821e-06, "loss": 3.4841, "step": 6300 }, { "epoch": 18.82, "learning_rate": 9.991978030980974e-06, "loss": 3.3961, "step": 6400 }, { "epoch": 19.12, "learning_rate": 9.99167780434903e-06, "loss": 3.2749, "step": 6500 }, { "epoch": 19.41, "learning_rate": 9.991372067053812e-06, "loss": 3.1487, "step": 6600 }, { "epoch": 19.71, "learning_rate": 9.991060819432854e-06, "loss": 3.0266, "step": 6700 }, { "epoch": 20.0, "learning_rate": 9.990744061829757e-06, "loss": 2.8801, "step": 6800 }, { "epoch": 20.29, "learning_rate": 9.990421794594216e-06, "loss": 2.7497, "step": 6900 }, { "epoch": 20.59, "learning_rate": 9.990094018082002e-06, "loss": 2.6412, "step": 7000 }, { "epoch": 20.59, "eval_cer": 0.5278322653764004, "eval_loss": 2.214904546737671, "eval_runtime": 5.2522, "eval_samples_per_second": 68.352, "eval_steps_per_second": 2.285, "eval_wer": 0.9247138481379977, "step": 7000 }, { "epoch": 20.88, "learning_rate": 9.989760732654972e-06, "loss": 2.5238, "step": 7100 }, { "epoch": 21.18, "learning_rate": 9.98942193868106e-06, "loss": 2.4326, "step": 7200 }, { "epoch": 21.47, "learning_rate": 9.98907763653429e-06, "loss": 2.3556, "step": 7300 }, { "epoch": 21.76, "learning_rate": 9.988727826594757e-06, "loss": 2.2815, "step": 7400 }, { "epoch": 22.06, "learning_rate": 9.988372509248643e-06, "loss": 2.2246, "step": 7500 }, { "epoch": 22.35, "learning_rate": 9.988011684888205e-06, "loss": 2.1379, "step": 7600 }, { "epoch": 22.65, "learning_rate": 9.987645353911787e-06, "loss": 2.0879, "step": 7700 }, { "epoch": 22.94, "learning_rate": 9.987273516723803e-06, "loss": 2.0537, "step": 7800 }, { "epoch": 23.24, "learning_rate": 9.986896173734752e-06, "loss": 1.9776, "step": 7900 }, { "epoch": 23.53, "learning_rate": 9.986513325361209e-06, "loss": 1.952, "step": 8000 }, { "epoch": 23.53, "eval_cer": 0.3740464670241053, "eval_loss": 1.5460247993469238, "eval_runtime": 4.7627, "eval_samples_per_second": 75.378, "eval_steps_per_second": 2.52, "eval_wer": 0.8410446558117041, "step": 8000 }, { "epoch": 23.82, "learning_rate": 9.986124972025826e-06, "loss": 1.8922, "step": 8100 }, { "epoch": 24.12, "learning_rate": 9.985731114157335e-06, "loss": 1.8636, "step": 8200 }, { "epoch": 24.41, "learning_rate": 9.985331752190543e-06, "loss": 1.8044, "step": 8300 }, { "epoch": 24.71, "learning_rate": 9.984926886566336e-06, "loss": 1.79, "step": 8400 }, { "epoch": 25.0, "learning_rate": 9.98451651773167e-06, "loss": 1.7611, "step": 8500 }, { "epoch": 25.29, "learning_rate": 9.98410064613958e-06, "loss": 1.7184, "step": 8600 }, { "epoch": 25.59, "learning_rate": 9.98367927224918e-06, "loss": 1.6872, "step": 8700 }, { "epoch": 25.88, "learning_rate": 9.983252396525649e-06, "loss": 1.6614, "step": 8800 }, { "epoch": 26.18, "learning_rate": 9.982820019440246e-06, "loss": 1.638, "step": 8900 }, { "epoch": 26.47, "learning_rate": 9.982382141470308e-06, "loss": 1.6156, "step": 9000 }, { "epoch": 26.47, "eval_cer": 0.30373566976156224, "eval_loss": 1.222609519958496, "eval_runtime": 5.389, "eval_samples_per_second": 66.617, "eval_steps_per_second": 2.227, "eval_wer": 0.7757536675802031, "step": 9000 }, { "epoch": 26.76, "learning_rate": 9.981938763099232e-06, "loss": 1.5778, "step": 9100 }, { "epoch": 27.06, "learning_rate": 9.981489884816498e-06, "loss": 1.5274, "step": 9200 }, { "epoch": 27.35, "learning_rate": 9.981035507117654e-06, "loss": 1.514, "step": 9300 }, { "epoch": 27.65, "learning_rate": 9.98057563050432e-06, "loss": 1.4823, "step": 9400 }, { "epoch": 27.94, "learning_rate": 9.980110255484182e-06, "loss": 1.4603, "step": 9500 }, { "epoch": 28.24, "learning_rate": 9.979639382571006e-06, "loss": 1.4423, "step": 9600 }, { "epoch": 28.53, "learning_rate": 9.979163012284619e-06, "loss": 1.4232, "step": 9700 }, { "epoch": 28.82, "learning_rate": 9.978681145150916e-06, "loss": 1.4045, "step": 9800 }, { "epoch": 29.12, "learning_rate": 9.97819378170187e-06, "loss": 1.386, "step": 9900 }, { "epoch": 29.41, "learning_rate": 9.977700922475513e-06, "loss": 1.3531, "step": 10000 }, { "epoch": 29.41, "eval_cer": 0.257660956366331, "eval_loss": 0.9876303672790527, "eval_runtime": 5.4057, "eval_samples_per_second": 66.412, "eval_steps_per_second": 2.22, "eval_wer": 0.7182008705465097, "step": 10000 }, { "epoch": 29.71, "learning_rate": 9.977202568015948e-06, "loss": 1.3442, "step": 10100 }, { "epoch": 30.0, "learning_rate": 9.97669871887334e-06, "loss": 1.3231, "step": 10200 }, { "epoch": 30.29, "learning_rate": 9.976189375603929e-06, "loss": 1.2896, "step": 10300 }, { "epoch": 30.59, "learning_rate": 9.97567453877001e-06, "loss": 1.2658, "step": 10400 }, { "epoch": 30.88, "learning_rate": 9.975154208939948e-06, "loss": 1.2543, "step": 10500 }, { "epoch": 31.18, "learning_rate": 9.974628386688175e-06, "loss": 1.2248, "step": 10600 }, { "epoch": 31.47, "learning_rate": 9.974097072595177e-06, "loss": 1.2266, "step": 10700 }, { "epoch": 31.76, "learning_rate": 9.973560267247515e-06, "loss": 1.2195, "step": 10800 }, { "epoch": 32.06, "learning_rate": 9.973017971237804e-06, "loss": 1.1713, "step": 10900 }, { "epoch": 32.35, "learning_rate": 9.972470185164722e-06, "loss": 1.1879, "step": 11000 }, { "epoch": 32.35, "eval_cer": 0.22592737892855586, "eval_loss": 0.8309646844863892, "eval_runtime": 4.5066, "eval_samples_per_second": 79.661, "eval_steps_per_second": 2.663, "eval_wer": 0.6782202160245042, "step": 11000 }, { "epoch": 32.65, "learning_rate": 9.971916909633008e-06, "loss": 1.1622, "step": 11100 }, { "epoch": 32.94, "learning_rate": 9.971358145253464e-06, "loss": 1.1509, "step": 11200 }, { "epoch": 33.24, "learning_rate": 9.970793892642948e-06, "loss": 1.1338, "step": 11300 }, { "epoch": 33.53, "learning_rate": 9.970224152424376e-06, "loss": 1.1136, "step": 11400 }, { "epoch": 33.82, "learning_rate": 9.969648925226726e-06, "loss": 1.1073, "step": 11500 }, { "epoch": 34.12, "learning_rate": 9.969068211685031e-06, "loss": 1.0743, "step": 11600 }, { "epoch": 34.41, "learning_rate": 9.968482012440383e-06, "loss": 1.0671, "step": 11700 }, { "epoch": 34.71, "learning_rate": 9.967890328139928e-06, "loss": 1.0719, "step": 11800 }, { "epoch": 35.0, "learning_rate": 9.967293159436865e-06, "loss": 1.0557, "step": 11900 }, { "epoch": 35.29, "learning_rate": 9.966690506990456e-06, "loss": 1.0329, "step": 12000 }, { "epoch": 35.29, "eval_cer": 0.19951179111634193, "eval_loss": 0.7249646782875061, "eval_runtime": 5.2152, "eval_samples_per_second": 68.837, "eval_steps_per_second": 2.301, "eval_wer": 0.619700145091085, "step": 12000 }, { "epoch": 35.59, "learning_rate": 9.966082371466006e-06, "loss": 1.0479, "step": 12100 }, { "epoch": 35.88, "learning_rate": 9.96546875353488e-06, "loss": 1.0269, "step": 12200 }, { "epoch": 36.18, "learning_rate": 9.964849653874494e-06, "loss": 1.03, "step": 12300 }, { "epoch": 36.47, "learning_rate": 9.964225073168317e-06, "loss": 1.0069, "step": 12400 }, { "epoch": 36.76, "learning_rate": 9.963595012105866e-06, "loss": 0.9811, "step": 12500 }, { "epoch": 37.06, "learning_rate": 9.96295947138271e-06, "loss": 0.9897, "step": 12600 }, { "epoch": 37.35, "learning_rate": 9.962318451700465e-06, "loss": 0.9777, "step": 12700 }, { "epoch": 37.65, "learning_rate": 9.961671953766802e-06, "loss": 0.9655, "step": 12800 }, { "epoch": 37.94, "learning_rate": 9.961019978295433e-06, "loss": 0.9528, "step": 12900 }, { "epoch": 38.24, "learning_rate": 9.960362526006118e-06, "loss": 0.9425, "step": 13000 }, { "epoch": 38.24, "eval_cer": 0.18373218255525042, "eval_loss": 0.6471496820449829, "eval_runtime": 5.0928, "eval_samples_per_second": 70.492, "eval_steps_per_second": 2.356, "eval_wer": 0.588102531033371, "step": 13000 }, { "epoch": 38.53, "learning_rate": 9.959699597624666e-06, "loss": 0.9307, "step": 13100 }, { "epoch": 38.82, "learning_rate": 9.95903119388293e-06, "loss": 0.9336, "step": 13200 }, { "epoch": 39.12, "learning_rate": 9.958357315518809e-06, "loss": 0.9246, "step": 13300 }, { "epoch": 39.41, "learning_rate": 9.957677963276242e-06, "loss": 0.9039, "step": 13400 }, { "epoch": 39.71, "learning_rate": 9.956993137905216e-06, "loss": 0.9019, "step": 13500 }, { "epoch": 40.0, "learning_rate": 9.956302840161757e-06, "loss": 0.9067, "step": 13600 }, { "epoch": 40.29, "learning_rate": 9.955607070807934e-06, "loss": 0.8912, "step": 13700 }, { "epoch": 40.59, "learning_rate": 9.954905830611852e-06, "loss": 0.8837, "step": 13800 }, { "epoch": 40.88, "learning_rate": 9.954199120347664e-06, "loss": 0.8715, "step": 13900 }, { "epoch": 41.18, "learning_rate": 9.953486940795553e-06, "loss": 0.8704, "step": 14000 }, { "epoch": 41.18, "eval_cer": 0.17021925809685715, "eval_loss": 0.5903766751289368, "eval_runtime": 4.8914, "eval_samples_per_second": 73.395, "eval_steps_per_second": 2.453, "eval_wer": 0.556504916975657, "step": 14000 }, { "epoch": 41.47, "learning_rate": 9.952769292741748e-06, "loss": 0.8592, "step": 14100 }, { "epoch": 41.76, "learning_rate": 9.952046176978508e-06, "loss": 0.8599, "step": 14200 }, { "epoch": 42.06, "learning_rate": 9.951317594304132e-06, "loss": 0.8541, "step": 14300 }, { "epoch": 42.35, "learning_rate": 9.950583545522953e-06, "loss": 0.8308, "step": 14400 }, { "epoch": 42.65, "learning_rate": 9.94984403144534e-06, "loss": 0.8349, "step": 14500 }, { "epoch": 42.94, "learning_rate": 9.949099052887694e-06, "loss": 0.8297, "step": 14600 }, { "epoch": 43.24, "learning_rate": 9.948356142136993e-06, "loss": 0.8316, "step": 14700 }, { "epoch": 43.53, "learning_rate": 9.947600291716784e-06, "loss": 0.8122, "step": 14800 }, { "epoch": 43.82, "learning_rate": 9.946838979293566e-06, "loss": 0.8249, "step": 14900 }, { "epoch": 44.12, "learning_rate": 9.946072205707802e-06, "loss": 0.8113, "step": 15000 }, { "epoch": 44.12, "eval_cer": 0.16285253476308792, "eval_loss": 0.5454097986221313, "eval_runtime": 5.4231, "eval_samples_per_second": 66.199, "eval_steps_per_second": 2.213, "eval_wer": 0.5442527809124618, "step": 15000 }, { "epoch": 44.41, "learning_rate": 9.945299971805988e-06, "loss": 0.7922, "step": 15100 }, { "epoch": 44.71, "learning_rate": 9.944522278440648e-06, "loss": 0.7931, "step": 15200 }, { "epoch": 45.0, "learning_rate": 9.943739126470331e-06, "loss": 0.7999, "step": 15300 }, { "epoch": 45.29, "learning_rate": 9.942950516759613e-06, "loss": 0.7875, "step": 15400 }, { "epoch": 45.59, "learning_rate": 9.942156450179096e-06, "loss": 0.7786, "step": 15500 }, { "epoch": 45.88, "learning_rate": 9.941356927605407e-06, "loss": 0.7762, "step": 15600 }, { "epoch": 46.18, "learning_rate": 9.940551949921196e-06, "loss": 0.7804, "step": 15700 }, { "epoch": 46.47, "learning_rate": 9.939741518015131e-06, "loss": 0.7618, "step": 15800 }, { "epoch": 46.76, "learning_rate": 9.938925632781907e-06, "loss": 0.7633, "step": 15900 }, { "epoch": 47.06, "learning_rate": 9.938104295122233e-06, "loss": 0.751, "step": 16000 }, { "epoch": 47.06, "eval_cer": 0.15430887929907153, "eval_loss": 0.5159721970558167, "eval_runtime": 5.2316, "eval_samples_per_second": 68.622, "eval_steps_per_second": 2.294, "eval_wer": 0.524907302917943, "step": 16000 }, { "epoch": 47.35, "learning_rate": 9.937277505942848e-06, "loss": 0.7442, "step": 16100 }, { "epoch": 47.65, "learning_rate": 9.936445266156499e-06, "loss": 0.747, "step": 16200 }, { "epoch": 47.94, "learning_rate": 9.935607576681951e-06, "loss": 0.7361, "step": 16300 }, { "epoch": 48.24, "learning_rate": 9.934764438443993e-06, "loss": 0.7332, "step": 16400 }, { "epoch": 48.53, "learning_rate": 9.933915852373421e-06, "loss": 0.7431, "step": 16500 }, { "epoch": 48.82, "learning_rate": 9.933061819407052e-06, "loss": 0.7295, "step": 16600 }, { "epoch": 49.12, "learning_rate": 9.93220234048771e-06, "loss": 0.72, "step": 16700 }, { "epoch": 49.41, "learning_rate": 9.931337416564234e-06, "loss": 0.7169, "step": 16800 }, { "epoch": 49.71, "learning_rate": 9.930467048591479e-06, "loss": 0.7173, "step": 16900 }, { "epoch": 50.0, "learning_rate": 9.929591237530298e-06, "loss": 0.7202, "step": 17000 }, { "epoch": 50.0, "eval_cer": 0.14737805675428273, "eval_loss": 0.4853704273700714, "eval_runtime": 4.7551, "eval_samples_per_second": 75.498, "eval_steps_per_second": 2.524, "eval_wer": 0.5070127357730131, "step": 17000 }, { "epoch": 50.29, "learning_rate": 9.928709984347566e-06, "loss": 0.6911, "step": 17100 }, { "epoch": 50.59, "learning_rate": 9.927823290016156e-06, "loss": 0.7064, "step": 17200 }, { "epoch": 50.88, "learning_rate": 9.926940103785579e-06, "loss": 0.7016, "step": 17300 }, { "epoch": 51.18, "learning_rate": 9.926042584486431e-06, "loss": 0.7164, "step": 17400 }, { "epoch": 51.47, "learning_rate": 9.925139626983336e-06, "loss": 0.6982, "step": 17500 }, { "epoch": 51.76, "learning_rate": 9.924231232273133e-06, "loss": 0.6939, "step": 17600 }, { "epoch": 52.06, "learning_rate": 9.923317401358663e-06, "loss": 0.6864, "step": 17700 }, { "epoch": 52.35, "learning_rate": 9.922398135248766e-06, "loss": 0.6765, "step": 17800 }, { "epoch": 52.65, "learning_rate": 9.921473434958289e-06, "loss": 0.6748, "step": 17900 }, { "epoch": 52.94, "learning_rate": 9.920543301508068e-06, "loss": 0.6876, "step": 18000 }, { "epoch": 52.94, "eval_cer": 0.14423957107362365, "eval_loss": 0.46753910183906555, "eval_runtime": 4.6127, "eval_samples_per_second": 77.829, "eval_steps_per_second": 2.602, "eval_wer": 0.5110430436885378, "step": 18000 }, { "epoch": 53.24, "learning_rate": 9.919607735924945e-06, "loss": 0.6811, "step": 18100 }, { "epoch": 53.53, "learning_rate": 9.918666739241758e-06, "loss": 0.6627, "step": 18200 }, { "epoch": 53.82, "learning_rate": 9.917720312497337e-06, "loss": 0.6605, "step": 18300 }, { "epoch": 54.12, "learning_rate": 9.91676845673651e-06, "loss": 0.67, "step": 18400 }, { "epoch": 54.41, "learning_rate": 9.915811173010097e-06, "loss": 0.649, "step": 18500 }, { "epoch": 54.71, "learning_rate": 9.914848462374911e-06, "loss": 0.6546, "step": 18600 }, { "epoch": 55.0, "learning_rate": 9.913880325893755e-06, "loss": 0.6598, "step": 18700 }, { "epoch": 55.29, "learning_rate": 9.912906764635423e-06, "loss": 0.6558, "step": 18800 }, { "epoch": 55.59, "learning_rate": 9.911927779674696e-06, "loss": 0.6528, "step": 18900 }, { "epoch": 55.88, "learning_rate": 9.910943372092349e-06, "loss": 0.6503, "step": 19000 }, { "epoch": 55.88, "eval_cer": 0.13796259971230548, "eval_loss": 0.4472251534461975, "eval_runtime": 5.2128, "eval_samples_per_second": 68.869, "eval_steps_per_second": 2.302, "eval_wer": 0.4826696759632436, "step": 19000 }, { "epoch": 56.18, "learning_rate": 9.909953542975134e-06, "loss": 0.6274, "step": 19100 }, { "epoch": 56.47, "learning_rate": 9.908958293415795e-06, "loss": 0.6333, "step": 19200 }, { "epoch": 56.76, "learning_rate": 9.907957624513058e-06, "loss": 0.6317, "step": 19300 }, { "epoch": 57.06, "learning_rate": 9.90695153737163e-06, "loss": 0.6302, "step": 19400 }, { "epoch": 57.35, "learning_rate": 9.905950174956017e-06, "loss": 0.6387, "step": 19500 }, { "epoch": 57.65, "learning_rate": 9.904933308829825e-06, "loss": 0.6304, "step": 19600 }, { "epoch": 57.94, "learning_rate": 9.903911027803696e-06, "loss": 0.6136, "step": 19700 }, { "epoch": 58.24, "learning_rate": 9.902883333006202e-06, "loss": 0.6128, "step": 19800 }, { "epoch": 58.53, "learning_rate": 9.901850225571881e-06, "loss": 0.6113, "step": 19900 }, { "epoch": 58.82, "learning_rate": 9.900811706641256e-06, "loss": 0.629, "step": 20000 }, { "epoch": 58.82, "eval_cer": 0.13430103308486988, "eval_loss": 0.43461212515830994, "eval_runtime": 4.8127, "eval_samples_per_second": 74.594, "eval_steps_per_second": 2.493, "eval_wer": 0.46912784136708047, "step": 20000 }, { "epoch": 59.12, "learning_rate": 9.89976777736082e-06, "loss": 0.6202, "step": 20100 }, { "epoch": 59.41, "learning_rate": 9.898718438883044e-06, "loss": 0.6079, "step": 20200 }, { "epoch": 59.71, "learning_rate": 9.89766369236636e-06, "loss": 0.6134, "step": 20300 }, { "epoch": 60.0, "learning_rate": 9.89660353897518e-06, "loss": 0.6198, "step": 20400 }, { "epoch": 60.29, "learning_rate": 9.895537979879882e-06, "loss": 0.6029, "step": 20500 }, { "epoch": 60.59, "learning_rate": 9.89446701625681e-06, "loss": 0.6027, "step": 20600 }, { "epoch": 60.88, "learning_rate": 9.893390649288274e-06, "loss": 0.6029, "step": 20700 }, { "epoch": 61.18, "learning_rate": 9.892308880162558e-06, "loss": 0.5978, "step": 20800 }, { "epoch": 61.47, "learning_rate": 9.891221710073895e-06, "loss": 0.5906, "step": 20900 }, { "epoch": 61.76, "learning_rate": 9.890129140222492e-06, "loss": 0.5847, "step": 21000 }, { "epoch": 61.76, "eval_cer": 0.13168562835098732, "eval_loss": 0.421942800283432, "eval_runtime": 4.6895, "eval_samples_per_second": 76.554, "eval_steps_per_second": 2.559, "eval_wer": 0.47573754634854104, "step": 21000 }, { "epoch": 62.06, "learning_rate": 9.889031171814516e-06, "loss": 0.5831, "step": 21100 }, { "epoch": 62.35, "learning_rate": 9.887927806062085e-06, "loss": 0.5945, "step": 21200 }, { "epoch": 62.65, "learning_rate": 9.886819044183287e-06, "loss": 0.5786, "step": 21300 }, { "epoch": 62.94, "learning_rate": 9.885704887402158e-06, "loss": 0.5858, "step": 21400 }, { "epoch": 63.24, "learning_rate": 9.8845853369487e-06, "loss": 0.5825, "step": 21500 }, { "epoch": 63.53, "learning_rate": 9.883460394058857e-06, "loss": 0.5805, "step": 21600 }, { "epoch": 63.82, "learning_rate": 9.882330059974536e-06, "loss": 0.58, "step": 21700 }, { "epoch": 64.12, "learning_rate": 9.881194335943589e-06, "loss": 0.5717, "step": 21800 }, { "epoch": 64.41, "learning_rate": 9.880053223219826e-06, "loss": 0.5771, "step": 21900 }, { "epoch": 64.71, "learning_rate": 9.878906723062995e-06, "loss": 0.5777, "step": 22000 }, { "epoch": 64.71, "eval_cer": 0.12732662046118304, "eval_loss": 0.4089703857898712, "eval_runtime": 4.8857, "eval_samples_per_second": 73.48, "eval_steps_per_second": 2.456, "eval_wer": 0.4549411575044333, "step": 22000 }, { "epoch": 65.0, "learning_rate": 9.877754836738805e-06, "loss": 0.565, "step": 22100 }, { "epoch": 65.29, "learning_rate": 9.876597565518899e-06, "loss": 0.5735, "step": 22200 }, { "epoch": 65.59, "learning_rate": 9.875434910680871e-06, "loss": 0.5607, "step": 22300 }, { "epoch": 65.88, "learning_rate": 9.87426687350826e-06, "loss": 0.5723, "step": 22400 }, { "epoch": 66.18, "learning_rate": 9.87309345529054e-06, "loss": 0.5574, "step": 22500 }, { "epoch": 66.47, "learning_rate": 9.871914657323133e-06, "loss": 0.5535, "step": 22600 }, { "epoch": 66.76, "learning_rate": 9.870730480907395e-06, "loss": 0.5475, "step": 22700 }, { "epoch": 67.06, "learning_rate": 9.869540927350623e-06, "loss": 0.5536, "step": 22800 }, { "epoch": 67.35, "learning_rate": 9.868345997966044e-06, "loss": 0.5532, "step": 22900 }, { "epoch": 67.65, "learning_rate": 9.867157723711235e-06, "loss": 0.5609, "step": 23000 }, { "epoch": 67.65, "eval_cer": 0.12440608517501417, "eval_loss": 0.40106838941574097, "eval_runtime": 5.3761, "eval_samples_per_second": 66.777, "eval_steps_per_second": 2.232, "eval_wer": 0.45010478800580367, "step": 23000 }, { "epoch": 67.94, "learning_rate": 9.86595210035974e-06, "loss": 0.5303, "step": 23100 }, { "epoch": 68.24, "learning_rate": 9.864741105142399e-06, "loss": 0.536, "step": 23200 }, { "epoch": 68.53, "learning_rate": 9.863524739396117e-06, "loss": 0.5378, "step": 23300 }, { "epoch": 68.82, "learning_rate": 9.86230300446372e-06, "loss": 0.55, "step": 23400 }, { "epoch": 69.12, "learning_rate": 9.861075901693973e-06, "loss": 0.5482, "step": 23500 }, { "epoch": 69.41, "learning_rate": 9.859843432441557e-06, "loss": 0.539, "step": 23600 }, { "epoch": 69.71, "learning_rate": 9.858605598067082e-06, "loss": 0.5286, "step": 23700 }, { "epoch": 70.0, "learning_rate": 9.857362399937081e-06, "loss": 0.5451, "step": 23800 }, { "epoch": 70.29, "learning_rate": 9.856113839424007e-06, "loss": 0.5403, "step": 23900 }, { "epoch": 70.59, "learning_rate": 9.854859917906234e-06, "loss": 0.5287, "step": 24000 }, { "epoch": 70.59, "eval_cer": 0.1208752887842727, "eval_loss": 0.39059486985206604, "eval_runtime": 5.0091, "eval_samples_per_second": 71.669, "eval_steps_per_second": 2.396, "eval_wer": 0.4380138642592294, "step": 24000 }, { "epoch": 70.88, "learning_rate": 9.853600636768053e-06, "loss": 0.5235, "step": 24100 }, { "epoch": 71.18, "learning_rate": 9.852335997399674e-06, "loss": 0.5141, "step": 24200 }, { "epoch": 71.47, "learning_rate": 9.85106600119722e-06, "loss": 0.5232, "step": 24300 }, { "epoch": 71.76, "learning_rate": 9.84979064956273e-06, "loss": 0.514, "step": 24400 }, { "epoch": 72.06, "learning_rate": 9.848509943904152e-06, "loss": 0.5304, "step": 24500 }, { "epoch": 72.35, "learning_rate": 9.84722388563535e-06, "loss": 0.5154, "step": 24600 }, { "epoch": 72.65, "learning_rate": 9.845932476176093e-06, "loss": 0.5131, "step": 24700 }, { "epoch": 72.94, "learning_rate": 9.844635716952054e-06, "loss": 0.5105, "step": 24800 }, { "epoch": 73.24, "learning_rate": 9.843333609394823e-06, "loss": 0.5116, "step": 24900 }, { "epoch": 73.53, "learning_rate": 9.842026154941883e-06, "loss": 0.5048, "step": 25000 }, { "epoch": 73.53, "eval_cer": 0.1172137221568371, "eval_loss": 0.38722869753837585, "eval_runtime": 5.2278, "eval_samples_per_second": 68.671, "eval_steps_per_second": 2.295, "eval_wer": 0.42237626954699337, "step": 25000 }, { "epoch": 73.82, "learning_rate": 9.840713355036629e-06, "loss": 0.5126, "step": 25100 }, { "epoch": 74.12, "learning_rate": 9.839395211128352e-06, "loss": 0.5006, "step": 25200 }, { "epoch": 74.41, "learning_rate": 9.838071724672239e-06, "loss": 0.5051, "step": 25300 }, { "epoch": 74.71, "learning_rate": 9.836742897129383e-06, "loss": 0.507, "step": 25400 }, { "epoch": 75.0, "learning_rate": 9.835422098064685e-06, "loss": 0.5031, "step": 25500 }, { "epoch": 75.29, "learning_rate": 9.834082646129353e-06, "loss": 0.4998, "step": 25600 }, { "epoch": 75.59, "learning_rate": 9.832737857511103e-06, "loss": 0.4934, "step": 25700 }, { "epoch": 75.88, "learning_rate": 9.83138773369454e-06, "loss": 0.5012, "step": 25800 }, { "epoch": 76.18, "learning_rate": 9.830032276170158e-06, "loss": 0.4894, "step": 25900 }, { "epoch": 76.47, "learning_rate": 9.828671486434347e-06, "loss": 0.481, "step": 26000 }, { "epoch": 76.47, "eval_cer": 0.11594960986879387, "eval_loss": 0.38624435663223267, "eval_runtime": 4.6342, "eval_samples_per_second": 77.468, "eval_steps_per_second": 2.589, "eval_wer": 0.4201192971142995, "step": 26000 }, { "epoch": 76.76, "learning_rate": 9.827305365989374e-06, "loss": 0.4965, "step": 26100 }, { "epoch": 77.06, "learning_rate": 9.825933916343396e-06, "loss": 0.4878, "step": 26200 }, { "epoch": 77.35, "learning_rate": 9.824557139010453e-06, "loss": 0.4873, "step": 26300 }, { "epoch": 77.65, "learning_rate": 9.823175035510463e-06, "loss": 0.4824, "step": 26400 }, { "epoch": 77.94, "learning_rate": 9.821787607369233e-06, "loss": 0.4853, "step": 26500 }, { "epoch": 78.24, "learning_rate": 9.820394856118438e-06, "loss": 0.4765, "step": 26600 }, { "epoch": 78.53, "learning_rate": 9.818996783295635e-06, "loss": 0.4826, "step": 26700 }, { "epoch": 78.82, "learning_rate": 9.817593390444255e-06, "loss": 0.4766, "step": 26800 }, { "epoch": 79.12, "learning_rate": 9.816184679113603e-06, "loss": 0.4784, "step": 26900 }, { "epoch": 79.41, "learning_rate": 9.814770650858849e-06, "loss": 0.4762, "step": 27000 }, { "epoch": 79.41, "eval_cer": 0.11289830434593087, "eval_loss": 0.3742750585079193, "eval_runtime": 4.6829, "eval_samples_per_second": 76.661, "eval_steps_per_second": 2.562, "eval_wer": 0.4112526197001451, "step": 27000 }, { "epoch": 79.71, "learning_rate": 9.813351307241043e-06, "loss": 0.481, "step": 27100 }, { "epoch": 80.0, "learning_rate": 9.811926649827097e-06, "loss": 0.4865, "step": 27200 }, { "epoch": 80.29, "learning_rate": 9.810496680189789e-06, "loss": 0.4767, "step": 27300 }, { "epoch": 80.59, "learning_rate": 9.809061399907764e-06, "loss": 0.4693, "step": 27400 }, { "epoch": 80.88, "learning_rate": 9.807620810565528e-06, "loss": 0.4666, "step": 27500 }, { "epoch": 81.18, "learning_rate": 9.806174913753448e-06, "loss": 0.4701, "step": 27600 }, { "epoch": 81.47, "learning_rate": 9.804723711067753e-06, "loss": 0.4746, "step": 27700 }, { "epoch": 81.76, "learning_rate": 9.803267204110525e-06, "loss": 0.469, "step": 27800 }, { "epoch": 82.06, "learning_rate": 9.801805394489707e-06, "loss": 0.4672, "step": 27900 }, { "epoch": 82.35, "learning_rate": 9.80033828381909e-06, "loss": 0.457, "step": 28000 }, { "epoch": 82.35, "eval_cer": 0.11137265158449937, "eval_loss": 0.3707512617111206, "eval_runtime": 4.6031, "eval_samples_per_second": 77.991, "eval_steps_per_second": 2.607, "eval_wer": 0.4064162502015154, "step": 28000 }, { "epoch": 82.65, "learning_rate": 9.798865873718322e-06, "loss": 0.4656, "step": 28100 }, { "epoch": 82.94, "learning_rate": 9.7973881658129e-06, "loss": 0.459, "step": 28200 }, { "epoch": 83.24, "learning_rate": 9.79590516173417e-06, "loss": 0.4512, "step": 28300 }, { "epoch": 83.53, "learning_rate": 9.794416863119322e-06, "loss": 0.4469, "step": 28400 }, { "epoch": 83.82, "learning_rate": 9.792923271611394e-06, "loss": 0.4683, "step": 28500 }, { "epoch": 84.12, "learning_rate": 9.791424388859268e-06, "loss": 0.4602, "step": 28600 }, { "epoch": 84.41, "learning_rate": 9.789920216517665e-06, "loss": 0.4606, "step": 28700 }, { "epoch": 84.71, "learning_rate": 9.788410756247145e-06, "loss": 0.45, "step": 28800 }, { "epoch": 85.0, "learning_rate": 9.78689600971411e-06, "loss": 0.4629, "step": 28900 }, { "epoch": 85.29, "learning_rate": 9.785375978590792e-06, "loss": 0.4471, "step": 29000 }, { "epoch": 85.29, "eval_cer": 0.10819057582494224, "eval_loss": 0.36229872703552246, "eval_runtime": 4.7496, "eval_samples_per_second": 75.585, "eval_steps_per_second": 2.527, "eval_wer": 0.3954538126712881, "step": 29000 }, { "epoch": 85.59, "learning_rate": 9.783850664555262e-06, "loss": 0.4499, "step": 29100 }, { "epoch": 85.88, "learning_rate": 9.782320069291418e-06, "loss": 0.4433, "step": 29200 }, { "epoch": 86.18, "learning_rate": 9.780784194488996e-06, "loss": 0.4469, "step": 29300 }, { "epoch": 86.47, "learning_rate": 9.779243041843552e-06, "loss": 0.4439, "step": 29400 }, { "epoch": 86.76, "learning_rate": 9.777696613056476e-06, "loss": 0.4418, "step": 29500 }, { "epoch": 87.06, "learning_rate": 9.776144909834977e-06, "loss": 0.4423, "step": 29600 }, { "epoch": 87.35, "learning_rate": 9.77460352974585e-06, "loss": 0.432, "step": 29700 }, { "epoch": 87.65, "learning_rate": 9.773041335501925e-06, "loss": 0.4438, "step": 29800 }, { "epoch": 87.94, "learning_rate": 9.771473871962867e-06, "loss": 0.4341, "step": 29900 }, { "epoch": 88.24, "learning_rate": 9.769901140859106e-06, "loss": 0.4398, "step": 30000 }, { "epoch": 88.24, "eval_cer": 0.10762390479926769, "eval_loss": 0.35913577675819397, "eval_runtime": 4.6645, "eval_samples_per_second": 76.965, "eval_steps_per_second": 2.573, "eval_wer": 0.3954538126712881, "step": 30000 }, { "epoch": 88.53, "learning_rate": 9.768323143926892e-06, "loss": 0.4313, "step": 30100 }, { "epoch": 88.82, "learning_rate": 9.766739882908285e-06, "loss": 0.4258, "step": 30200 }, { "epoch": 89.12, "learning_rate": 9.765151359551158e-06, "loss": 0.4304, "step": 30300 }, { "epoch": 89.41, "learning_rate": 9.763557575609193e-06, "loss": 0.4465, "step": 30400 }, { "epoch": 89.71, "learning_rate": 9.761958532841882e-06, "loss": 0.4321, "step": 30500 }, { "epoch": 90.0, "learning_rate": 9.760354233014517e-06, "loss": 0.4274, "step": 30600 }, { "epoch": 90.29, "learning_rate": 9.758744677898202e-06, "loss": 0.4369, "step": 30700 }, { "epoch": 90.59, "learning_rate": 9.757129869269835e-06, "loss": 0.4213, "step": 30800 }, { "epoch": 90.88, "learning_rate": 9.755509808912114e-06, "loss": 0.4364, "step": 30900 }, { "epoch": 91.18, "learning_rate": 9.753884498613542e-06, "loss": 0.4254, "step": 31000 }, { "epoch": 91.18, "eval_cer": 0.10474695959199685, "eval_loss": 0.3557164967060089, "eval_runtime": 4.7708, "eval_samples_per_second": 75.249, "eval_steps_per_second": 2.515, "eval_wer": 0.37901015637594715, "step": 31000 }, { "epoch": 91.47, "learning_rate": 9.75225394016841e-06, "loss": 0.412, "step": 31100 }, { "epoch": 91.76, "learning_rate": 9.750618135376806e-06, "loss": 0.421, "step": 31200 }, { "epoch": 92.06, "learning_rate": 9.74897708604461e-06, "loss": 0.4324, "step": 31300 }, { "epoch": 92.35, "learning_rate": 9.747330793983493e-06, "loss": 0.415, "step": 31400 }, { "epoch": 92.65, "learning_rate": 9.745679261010912e-06, "loss": 0.422, "step": 31500 }, { "epoch": 92.94, "learning_rate": 9.74402248895011e-06, "loss": 0.4192, "step": 31600 }, { "epoch": 93.24, "learning_rate": 9.74236047963011e-06, "loss": 0.4083, "step": 31700 }, { "epoch": 93.53, "learning_rate": 9.740709933242481e-06, "loss": 0.4127, "step": 31800 }, { "epoch": 93.82, "learning_rate": 9.739037507241007e-06, "loss": 0.4061, "step": 31900 }, { "epoch": 94.12, "learning_rate": 9.737359849483607e-06, "loss": 0.4166, "step": 32000 }, { "epoch": 94.12, "eval_cer": 0.1032648969094634, "eval_loss": 0.3532021641731262, "eval_runtime": 5.0385, "eval_samples_per_second": 71.251, "eval_steps_per_second": 2.382, "eval_wer": 0.3785265194260842, "step": 32000 }, { "epoch": 94.41, "learning_rate": 9.73567696182237e-06, "loss": 0.4109, "step": 32100 }, { "epoch": 94.71, "learning_rate": 9.733988846115149e-06, "loss": 0.4132, "step": 32200 }, { "epoch": 95.0, "learning_rate": 9.732295504225576e-06, "loss": 0.4151, "step": 32300 }, { "epoch": 95.29, "learning_rate": 9.73059693802305e-06, "loss": 0.4015, "step": 32400 }, { "epoch": 95.59, "learning_rate": 9.728893149382734e-06, "loss": 0.4102, "step": 32500 }, { "epoch": 95.88, "learning_rate": 9.727184140185564e-06, "loss": 0.4153, "step": 32600 }, { "epoch": 96.18, "learning_rate": 9.725469912318232e-06, "loss": 0.4144, "step": 32700 }, { "epoch": 96.47, "learning_rate": 9.723750467673199e-06, "loss": 0.4073, "step": 32800 }, { "epoch": 96.76, "learning_rate": 9.722025808148674e-06, "loss": 0.3992, "step": 32900 }, { "epoch": 97.06, "learning_rate": 9.720295935648633e-06, "loss": 0.4, "step": 33000 }, { "epoch": 97.06, "eval_cer": 0.10322130683056537, "eval_loss": 0.34583190083503723, "eval_runtime": 4.6042, "eval_samples_per_second": 77.972, "eval_steps_per_second": 2.606, "eval_wer": 0.3833628889247139, "step": 33000 }, { "epoch": 97.35, "learning_rate": 9.718560852082806e-06, "loss": 0.401, "step": 33100 }, { "epoch": 97.65, "learning_rate": 9.716820559366672e-06, "loss": 0.4072, "step": 33200 }, { "epoch": 97.94, "learning_rate": 9.715075059421456e-06, "loss": 0.4067, "step": 33300 }, { "epoch": 98.24, "learning_rate": 9.713324354174148e-06, "loss": 0.4008, "step": 33400 }, { "epoch": 98.53, "learning_rate": 9.711568445557466e-06, "loss": 0.4097, "step": 33500 }, { "epoch": 98.82, "learning_rate": 9.709807335509887e-06, "loss": 0.3962, "step": 33600 }, { "epoch": 99.12, "learning_rate": 9.70804102597562e-06, "loss": 0.3883, "step": 33700 }, { "epoch": 99.41, "learning_rate": 9.706269518904619e-06, "loss": 0.3923, "step": 33800 }, { "epoch": 99.71, "learning_rate": 9.704510608990784e-06, "loss": 0.395, "step": 33900 }, { "epoch": 100.0, "learning_rate": 9.702728764645592e-06, "loss": 0.4022, "step": 34000 }, { "epoch": 100.0, "eval_cer": 0.10160847391133777, "eval_loss": 0.34906402230262756, "eval_runtime": 4.8096, "eval_samples_per_second": 74.642, "eval_steps_per_second": 2.495, "eval_wer": 0.3683701434789618, "step": 34000 }, { "epoch": 100.29, "learning_rate": 9.700941728628244e-06, "loss": 0.3898, "step": 34100 }, { "epoch": 100.59, "learning_rate": 9.699149502911573e-06, "loss": 0.3897, "step": 34200 }, { "epoch": 100.88, "learning_rate": 9.697352089474145e-06, "loss": 0.3872, "step": 34300 }, { "epoch": 101.18, "learning_rate": 9.69554949030025e-06, "loss": 0.3732, "step": 34400 }, { "epoch": 101.47, "learning_rate": 9.693741707379902e-06, "loss": 0.3864, "step": 34500 }, { "epoch": 101.76, "learning_rate": 9.691928742708842e-06, "loss": 0.3826, "step": 34600 }, { "epoch": 102.06, "learning_rate": 9.690110598288529e-06, "loss": 0.3873, "step": 34700 }, { "epoch": 102.35, "learning_rate": 9.688287276126135e-06, "loss": 0.385, "step": 34800 }, { "epoch": 102.65, "learning_rate": 9.686458778234561e-06, "loss": 0.3854, "step": 34900 }, { "epoch": 102.94, "learning_rate": 9.684625106632409e-06, "loss": 0.3896, "step": 35000 }, { "epoch": 102.94, "eval_cer": 0.10012641122880432, "eval_loss": 0.3409387767314911, "eval_runtime": 58.5958, "eval_samples_per_second": 6.127, "eval_steps_per_second": 0.205, "eval_wer": 0.3688537804288248, "step": 35000 }, { "epoch": 103.24, "learning_rate": 9.682786263343997e-06, "loss": 0.3738, "step": 35100 }, { "epoch": 103.53, "learning_rate": 9.680942250399357e-06, "loss": 0.3861, "step": 35200 }, { "epoch": 103.82, "learning_rate": 9.679093069834222e-06, "loss": 0.3821, "step": 35300 }, { "epoch": 104.12, "learning_rate": 9.677238723690032e-06, "loss": 0.3817, "step": 35400 }, { "epoch": 104.41, "learning_rate": 9.67537921401393e-06, "loss": 0.3838, "step": 35500 }, { "epoch": 104.71, "learning_rate": 9.67351454285876e-06, "loss": 0.3896, "step": 35600 }, { "epoch": 105.0, "learning_rate": 9.671644712283061e-06, "loss": 0.3829, "step": 35700 }, { "epoch": 105.29, "learning_rate": 9.669769724351072e-06, "loss": 0.3738, "step": 35800 }, { "epoch": 105.59, "learning_rate": 9.667889581132725e-06, "loss": 0.3801, "step": 35900 }, { "epoch": 105.88, "learning_rate": 9.666004284703638e-06, "loss": 0.3816, "step": 36000 }, { "epoch": 105.88, "eval_cer": 0.09733664617932958, "eval_loss": 0.3380275368690491, "eval_runtime": 34.8574, "eval_samples_per_second": 10.299, "eval_steps_per_second": 0.344, "eval_wer": 0.35563437046590357, "step": 36000 }, { "epoch": 106.18, "learning_rate": 9.664132767111955e-06, "loss": 0.3751, "step": 36100 }, { "epoch": 106.47, "learning_rate": 9.66223722199109e-06, "loss": 0.3835, "step": 36200 }, { "epoch": 106.76, "learning_rate": 9.66033652989952e-06, "loss": 0.379, "step": 36300 }, { "epoch": 107.06, "learning_rate": 9.658430692935558e-06, "loss": 0.3625, "step": 36400 }, { "epoch": 107.35, "learning_rate": 9.656519713203187e-06, "loss": 0.3571, "step": 36500 }, { "epoch": 107.65, "learning_rate": 9.654603592812074e-06, "loss": 0.3687, "step": 36600 }, { "epoch": 107.94, "learning_rate": 9.652682333877558e-06, "loss": 0.3668, "step": 36700 }, { "epoch": 108.24, "learning_rate": 9.65075593852065e-06, "loss": 0.3718, "step": 36800 }, { "epoch": 108.53, "learning_rate": 9.648824408868035e-06, "loss": 0.3668, "step": 36900 }, { "epoch": 108.82, "learning_rate": 9.646887747052065e-06, "loss": 0.3647, "step": 37000 }, { "epoch": 108.82, "eval_cer": 0.09681356523255306, "eval_loss": 0.33798158168792725, "eval_runtime": 35.9194, "eval_samples_per_second": 9.995, "eval_steps_per_second": 0.334, "eval_wer": 0.3541834596163147, "step": 37000 }, { "epoch": 109.12, "learning_rate": 9.644945955210753e-06, "loss": 0.3667, "step": 37100 }, { "epoch": 109.41, "learning_rate": 9.642999035487783e-06, "loss": 0.3653, "step": 37200 }, { "epoch": 109.71, "learning_rate": 9.641046990032494e-06, "loss": 0.3671, "step": 37300 }, { "epoch": 110.0, "learning_rate": 9.639089820999886e-06, "loss": 0.3664, "step": 37400 }, { "epoch": 110.29, "learning_rate": 9.637127530550618e-06, "loss": 0.3663, "step": 37500 }, { "epoch": 110.59, "learning_rate": 9.635160120850996e-06, "loss": 0.3561, "step": 37600 }, { "epoch": 110.88, "learning_rate": 9.633187594072984e-06, "loss": 0.3648, "step": 37700 }, { "epoch": 111.18, "learning_rate": 9.631209952394191e-06, "loss": 0.3632, "step": 37800 }, { "epoch": 111.47, "learning_rate": 9.629227197997876e-06, "loss": 0.3618, "step": 37900 }, { "epoch": 111.76, "learning_rate": 9.62723933307294e-06, "loss": 0.3607, "step": 38000 }, { "epoch": 111.76, "eval_cer": 0.09485201168214115, "eval_loss": 0.33785539865493774, "eval_runtime": 22.4984, "eval_samples_per_second": 15.957, "eval_steps_per_second": 0.533, "eval_wer": 0.3478961792680961, "step": 38000 }, { "epoch": 112.06, "learning_rate": 9.625246359813927e-06, "loss": 0.3587, "step": 38100 }, { "epoch": 112.35, "learning_rate": 9.62324828042102e-06, "loss": 0.3528, "step": 38200 }, { "epoch": 112.65, "learning_rate": 9.621245097100039e-06, "loss": 0.3506, "step": 38300 }, { "epoch": 112.94, "learning_rate": 9.619236812062436e-06, "loss": 0.3573, "step": 38400 }, { "epoch": 113.24, "learning_rate": 9.617223427525302e-06, "loss": 0.3528, "step": 38500 }, { "epoch": 113.53, "learning_rate": 9.615204945711349e-06, "loss": 0.3503, "step": 38600 }, { "epoch": 113.82, "learning_rate": 9.613181368848924e-06, "loss": 0.3521, "step": 38700 }, { "epoch": 114.12, "learning_rate": 9.611173011070848e-06, "loss": 0.3508, "step": 38800 }, { "epoch": 114.41, "learning_rate": 9.60913930171365e-06, "loss": 0.3445, "step": 38900 }, { "epoch": 114.71, "learning_rate": 9.607100504004268e-06, "loss": 0.3561, "step": 39000 }, { "epoch": 114.71, "eval_cer": 0.09432893073536464, "eval_loss": 0.33478814363479614, "eval_runtime": 23.7686, "eval_samples_per_second": 15.104, "eval_steps_per_second": 0.505, "eval_wer": 0.349347090117685, "step": 39000 }, { "epoch": 115.0, "learning_rate": 9.605056620193475e-06, "loss": 0.3502, "step": 39100 }, { "epoch": 115.29, "learning_rate": 9.603007652537659e-06, "loss": 0.351, "step": 39200 }, { "epoch": 115.59, "learning_rate": 9.600953603298815e-06, "loss": 0.3366, "step": 39300 }, { "epoch": 115.88, "learning_rate": 9.598894474744556e-06, "loss": 0.344, "step": 39400 }, { "epoch": 116.18, "learning_rate": 9.596830269148097e-06, "loss": 0.3349, "step": 39500 }, { "epoch": 116.47, "learning_rate": 9.594760988788259e-06, "loss": 0.3499, "step": 39600 }, { "epoch": 116.76, "learning_rate": 9.592686635949466e-06, "loss": 0.337, "step": 39700 }, { "epoch": 117.06, "learning_rate": 9.590607212921742e-06, "loss": 0.3441, "step": 39800 }, { "epoch": 117.35, "learning_rate": 9.588522722000706e-06, "loss": 0.3356, "step": 39900 }, { "epoch": 117.65, "learning_rate": 9.586433165487577e-06, "loss": 0.344, "step": 40000 }, { "epoch": 117.65, "eval_cer": 0.0920622466326664, "eval_loss": 0.33385178446769714, "eval_runtime": 22.867, "eval_samples_per_second": 15.699, "eval_steps_per_second": 0.525, "eval_wer": 0.3417701112364985, "step": 40000 }, { "epoch": 117.94, "learning_rate": 9.584359516942819e-06, "loss": 0.3554, "step": 40100 }, { "epoch": 118.24, "learning_rate": 9.582259886769778e-06, "loss": 0.3421, "step": 40200 }, { "epoch": 118.53, "learning_rate": 9.580155197918625e-06, "loss": 0.3341, "step": 40300 }, { "epoch": 118.82, "learning_rate": 9.578045452712876e-06, "loss": 0.3332, "step": 40400 }, { "epoch": 119.12, "learning_rate": 9.575930653481624e-06, "loss": 0.3365, "step": 40500 }, { "epoch": 119.41, "learning_rate": 9.573810802559544e-06, "loss": 0.338, "step": 40600 }, { "epoch": 119.71, "learning_rate": 9.571685902286891e-06, "loss": 0.3389, "step": 40700 }, { "epoch": 120.0, "learning_rate": 9.569555955009488e-06, "loss": 0.3331, "step": 40800 }, { "epoch": 120.29, "learning_rate": 9.567420963078737e-06, "loss": 0.3195, "step": 40900 }, { "epoch": 120.59, "learning_rate": 9.565280928851602e-06, "loss": 0.337, "step": 41000 }, { "epoch": 120.59, "eval_cer": 0.09219301686936053, "eval_loss": 0.33047986030578613, "eval_runtime": 4.9286, "eval_samples_per_second": 72.84, "eval_steps_per_second": 2.435, "eval_wer": 0.3414476866032565, "step": 41000 }, { "epoch": 120.88, "learning_rate": 9.563135854690617e-06, "loss": 0.3345, "step": 41100 }, { "epoch": 121.18, "learning_rate": 9.560985742963882e-06, "loss": 0.3337, "step": 41200 }, { "epoch": 121.47, "learning_rate": 9.558830596045055e-06, "loss": 0.3205, "step": 41300 }, { "epoch": 121.76, "learning_rate": 9.556670416313354e-06, "loss": 0.3442, "step": 41400 }, { "epoch": 122.06, "learning_rate": 9.554505206153552e-06, "loss": 0.3381, "step": 41500 }, { "epoch": 122.35, "learning_rate": 9.552334967955979e-06, "loss": 0.3314, "step": 41600 }, { "epoch": 122.65, "learning_rate": 9.55015970411651e-06, "loss": 0.3291, "step": 41700 }, { "epoch": 122.94, "learning_rate": 9.547979417036575e-06, "loss": 0.3297, "step": 41800 }, { "epoch": 123.24, "learning_rate": 9.54579410912314e-06, "loss": 0.3262, "step": 41900 }, { "epoch": 123.53, "learning_rate": 9.543603782788727e-06, "loss": 0.3297, "step": 42000 }, { "epoch": 123.53, "eval_cer": 0.09036223355564274, "eval_loss": 0.33064666390419006, "eval_runtime": 4.4896, "eval_samples_per_second": 79.963, "eval_steps_per_second": 2.673, "eval_wer": 0.3311300983395131, "step": 42000 }, { "epoch": 123.82, "learning_rate": 9.541408440451385e-06, "loss": 0.3193, "step": 42100 }, { "epoch": 124.12, "learning_rate": 9.539208084534708e-06, "loss": 0.324, "step": 42200 }, { "epoch": 124.41, "learning_rate": 9.537002717467826e-06, "loss": 0.3244, "step": 42300 }, { "epoch": 124.71, "learning_rate": 9.534792341685395e-06, "loss": 0.3289, "step": 42400 }, { "epoch": 125.0, "learning_rate": 9.532576959627604e-06, "loss": 0.3297, "step": 42500 }, { "epoch": 125.29, "learning_rate": 9.530356573740171e-06, "loss": 0.3193, "step": 42600 }, { "epoch": 125.59, "learning_rate": 9.528131186474335e-06, "loss": 0.3198, "step": 42700 }, { "epoch": 125.88, "learning_rate": 9.525900800286855e-06, "loss": 0.3172, "step": 42800 }, { "epoch": 126.18, "learning_rate": 9.523665417640016e-06, "loss": 0.3288, "step": 42900 }, { "epoch": 126.47, "learning_rate": 9.521425041001606e-06, "loss": 0.3229, "step": 43000 }, { "epoch": 126.47, "eval_cer": 0.09123403513360359, "eval_loss": 0.33507028222084045, "eval_runtime": 4.4014, "eval_samples_per_second": 81.566, "eval_steps_per_second": 2.726, "eval_wer": 0.33548283088827985, "step": 43000 }, { "epoch": 126.76, "learning_rate": 9.519179672844941e-06, "loss": 0.3121, "step": 43100 }, { "epoch": 127.06, "learning_rate": 9.516929315648835e-06, "loss": 0.3136, "step": 43200 }, { "epoch": 127.35, "learning_rate": 9.51467397189762e-06, "loss": 0.3205, "step": 43300 }, { "epoch": 127.65, "learning_rate": 9.512413644081122e-06, "loss": 0.322, "step": 43400 }, { "epoch": 127.94, "learning_rate": 9.510148334694681e-06, "loss": 0.3181, "step": 43500 }, { "epoch": 128.24, "learning_rate": 9.50787804623913e-06, "loss": 0.3117, "step": 43600 }, { "epoch": 128.53, "learning_rate": 9.505602781220798e-06, "loss": 0.3191, "step": 43700 }, { "epoch": 128.82, "learning_rate": 9.503322542151511e-06, "loss": 0.3155, "step": 43800 }, { "epoch": 129.12, "learning_rate": 9.501037331548584e-06, "loss": 0.3125, "step": 43900 }, { "epoch": 129.41, "learning_rate": 9.49874715193482e-06, "loss": 0.3099, "step": 44000 }, { "epoch": 129.41, "eval_cer": 0.08870581055751711, "eval_loss": 0.3309319317340851, "eval_runtime": 4.8326, "eval_samples_per_second": 74.288, "eval_steps_per_second": 2.483, "eval_wer": 0.3283894889569563, "step": 44000 }, { "epoch": 129.71, "learning_rate": 9.496452005838512e-06, "loss": 0.314, "step": 44100 }, { "epoch": 130.0, "learning_rate": 9.494151895793431e-06, "loss": 0.3089, "step": 44200 }, { "epoch": 130.29, "learning_rate": 9.491846824338831e-06, "loss": 0.3162, "step": 44300 }, { "epoch": 130.59, "learning_rate": 9.48953679401944e-06, "loss": 0.3042, "step": 44400 }, { "epoch": 130.88, "learning_rate": 9.487221807385463e-06, "loss": 0.3177, "step": 44500 }, { "epoch": 131.18, "learning_rate": 9.484901866992578e-06, "loss": 0.3209, "step": 44600 }, { "epoch": 131.47, "learning_rate": 9.48260024881784e-06, "loss": 0.3126, "step": 44700 }, { "epoch": 131.76, "learning_rate": 9.480270458069627e-06, "loss": 0.2984, "step": 44800 }, { "epoch": 132.06, "learning_rate": 9.477935721236585e-06, "loss": 0.3085, "step": 44900 }, { "epoch": 132.35, "learning_rate": 9.475596040896196e-06, "loss": 0.3123, "step": 45000 }, { "epoch": 132.35, "eval_cer": 0.09040582363454078, "eval_loss": 0.33625489473342896, "eval_runtime": 5.2006, "eval_samples_per_second": 69.03, "eval_steps_per_second": 2.307, "eval_wer": 0.3364501047880058, "step": 45000 }, { "epoch": 132.65, "learning_rate": 9.473251419631397e-06, "loss": 0.3057, "step": 45100 }, { "epoch": 132.94, "learning_rate": 9.47090186003058e-06, "loss": 0.302, "step": 45200 }, { "epoch": 133.24, "learning_rate": 9.468547364687589e-06, "loss": 0.3071, "step": 45300 }, { "epoch": 133.53, "learning_rate": 9.466187936201714e-06, "loss": 0.2985, "step": 45400 }, { "epoch": 133.82, "learning_rate": 9.463823577177698e-06, "loss": 0.3045, "step": 45500 }, { "epoch": 134.12, "learning_rate": 9.461454290225717e-06, "loss": 0.31, "step": 45600 }, { "epoch": 134.41, "learning_rate": 9.4590800779614e-06, "loss": 0.3005, "step": 45700 }, { "epoch": 134.71, "learning_rate": 9.4567009430058e-06, "loss": 0.2996, "step": 45800 }, { "epoch": 135.0, "learning_rate": 9.454316887985417e-06, "loss": 0.2984, "step": 45900 }, { "epoch": 135.29, "learning_rate": 9.45192791553217e-06, "loss": 0.3057, "step": 46000 }, { "epoch": 135.29, "eval_cer": 0.0899263327666623, "eval_loss": 0.329167902469635, "eval_runtime": 5.0924, "eval_samples_per_second": 70.498, "eval_steps_per_second": 2.356, "eval_wer": 0.3359664678381428, "step": 46000 }, { "epoch": 135.59, "learning_rate": 9.44953402828342e-06, "loss": 0.3065, "step": 46100 }, { "epoch": 135.88, "learning_rate": 9.447135228881942e-06, "loss": 0.2978, "step": 46200 }, { "epoch": 136.18, "learning_rate": 9.44473151997594e-06, "loss": 0.2965, "step": 46300 }, { "epoch": 136.47, "learning_rate": 9.44232290421904e-06, "loss": 0.2928, "step": 46400 }, { "epoch": 136.76, "learning_rate": 9.439909384270277e-06, "loss": 0.3002, "step": 46500 }, { "epoch": 137.06, "learning_rate": 9.437490962794108e-06, "loss": 0.3014, "step": 46600 }, { "epoch": 137.35, "learning_rate": 9.435067642460396e-06, "loss": 0.2988, "step": 46700 }, { "epoch": 137.65, "learning_rate": 9.432639425944417e-06, "loss": 0.2897, "step": 46800 }, { "epoch": 137.94, "learning_rate": 9.430206315926848e-06, "loss": 0.301, "step": 46900 }, { "epoch": 138.24, "learning_rate": 9.427768315093772e-06, "loss": 0.304, "step": 47000 }, { "epoch": 138.24, "eval_cer": 0.08805195937404647, "eval_loss": 0.32851627469062805, "eval_runtime": 5.1462, "eval_samples_per_second": 69.76, "eval_steps_per_second": 2.332, "eval_wer": 0.3300016121231662, "step": 47000 }, { "epoch": 138.53, "learning_rate": 9.425325426136666e-06, "loss": 0.3, "step": 47100 }, { "epoch": 138.82, "learning_rate": 9.422877651752406e-06, "loss": 0.3031, "step": 47200 }, { "epoch": 139.12, "learning_rate": 9.42044954537496e-06, "loss": 0.2905, "step": 47300 }, { "epoch": 139.41, "learning_rate": 9.417992057035348e-06, "loss": 0.2997, "step": 47400 }, { "epoch": 139.71, "learning_rate": 9.415529691364405e-06, "loss": 0.3007, "step": 47500 }, { "epoch": 140.0, "learning_rate": 9.413062451080509e-06, "loss": 0.2976, "step": 47600 }, { "epoch": 140.29, "learning_rate": 9.410590338907417e-06, "loss": 0.2914, "step": 47700 }, { "epoch": 140.59, "learning_rate": 9.40811335757427e-06, "loss": 0.2941, "step": 47800 }, { "epoch": 140.88, "learning_rate": 9.405631509815582e-06, "loss": 0.3046, "step": 47900 }, { "epoch": 141.18, "learning_rate": 9.403144798371238e-06, "loss": 0.2888, "step": 48000 }, { "epoch": 141.18, "eval_cer": 0.0869622074015954, "eval_loss": 0.3325551450252533, "eval_runtime": 4.8817, "eval_samples_per_second": 73.54, "eval_steps_per_second": 2.458, "eval_wer": 0.3282282766403353, "step": 48000 }, { "epoch": 141.47, "learning_rate": 9.40065322598649e-06, "loss": 0.2881, "step": 48100 }, { "epoch": 141.76, "learning_rate": 9.398156795411963e-06, "loss": 0.2817, "step": 48200 }, { "epoch": 142.06, "learning_rate": 9.395680546289059e-06, "loss": 0.2959, "step": 48300 }, { "epoch": 142.35, "learning_rate": 9.393174456121325e-06, "loss": 0.2927, "step": 48400 }, { "epoch": 142.65, "learning_rate": 9.390663516020151e-06, "loss": 0.2758, "step": 48500 }, { "epoch": 142.94, "learning_rate": 9.388147728757537e-06, "loss": 0.2924, "step": 48600 }, { "epoch": 143.24, "learning_rate": 9.385627097110841e-06, "loss": 0.2873, "step": 48700 }, { "epoch": 143.53, "learning_rate": 9.38310162386276e-06, "loss": 0.2857, "step": 48800 }, { "epoch": 143.82, "learning_rate": 9.380571311801346e-06, "loss": 0.2893, "step": 48900 }, { "epoch": 144.12, "learning_rate": 9.378036163719985e-06, "loss": 0.2832, "step": 49000 }, { "epoch": 144.12, "eval_cer": 0.0869622074015954, "eval_loss": 0.33355438709259033, "eval_runtime": 5.3667, "eval_samples_per_second": 66.894, "eval_steps_per_second": 2.236, "eval_wer": 0.3266161534741254, "step": 49000 }, { "epoch": 144.41, "learning_rate": 9.375496182417404e-06, "loss": 0.2903, "step": 49100 }, { "epoch": 144.71, "learning_rate": 9.372951370697672e-06, "loss": 0.2803, "step": 49200 }, { "epoch": 145.0, "learning_rate": 9.370401731370179e-06, "loss": 0.2853, "step": 49300 }, { "epoch": 145.29, "learning_rate": 9.367847267249653e-06, "loss": 0.287, "step": 49400 }, { "epoch": 145.59, "learning_rate": 9.365287981156147e-06, "loss": 0.2842, "step": 49500 }, { "epoch": 145.88, "learning_rate": 9.362723875915033e-06, "loss": 0.2797, "step": 49600 }, { "epoch": 146.18, "learning_rate": 9.360154954357012e-06, "loss": 0.2833, "step": 49700 }, { "epoch": 146.47, "learning_rate": 9.357581219318092e-06, "loss": 0.2881, "step": 49800 }, { "epoch": 146.76, "learning_rate": 9.355002673639604e-06, "loss": 0.2759, "step": 49900 }, { "epoch": 147.06, "learning_rate": 9.352419320168182e-06, "loss": 0.2812, "step": 50000 }, { "epoch": 147.06, "eval_cer": 0.08652630661261497, "eval_loss": 0.3421614170074463, "eval_runtime": 5.2345, "eval_samples_per_second": 68.583, "eval_steps_per_second": 2.292, "eval_wer": 0.32210220860873773, "step": 50000 }, { "epoch": 147.35, "learning_rate": 9.34983116175577e-06, "loss": 0.2795, "step": 50100 }, { "epoch": 147.65, "learning_rate": 9.347238201259622e-06, "loss": 0.2813, "step": 50200 }, { "epoch": 147.94, "learning_rate": 9.344640441542285e-06, "loss": 0.2888, "step": 50300 }, { "epoch": 148.24, "learning_rate": 9.342037885471612e-06, "loss": 0.2841, "step": 50400 }, { "epoch": 148.53, "learning_rate": 9.339430535920744e-06, "loss": 0.2747, "step": 50500 }, { "epoch": 148.82, "learning_rate": 9.336818395768117e-06, "loss": 0.2747, "step": 50600 }, { "epoch": 149.12, "learning_rate": 9.334201467897458e-06, "loss": 0.2762, "step": 50700 }, { "epoch": 149.41, "learning_rate": 9.331579755197777e-06, "loss": 0.2795, "step": 50800 }, { "epoch": 149.71, "learning_rate": 9.32897954917077e-06, "loss": 0.2718, "step": 50900 }, { "epoch": 150.0, "learning_rate": 9.32634832327718e-06, "loss": 0.2809, "step": 51000 }, { "epoch": 150.0, "eval_cer": 0.0866570768493091, "eval_loss": 0.3332664370536804, "eval_runtime": 4.6401, "eval_samples_per_second": 77.369, "eval_steps_per_second": 2.586, "eval_wer": 0.32532645494115753, "step": 51000 }, { "epoch": 150.29, "learning_rate": 9.323712321224206e-06, "loss": 0.2733, "step": 51100 }, { "epoch": 150.59, "learning_rate": 9.321071545921912e-06, "loss": 0.2667, "step": 51200 }, { "epoch": 150.88, "learning_rate": 9.318426000285638e-06, "loss": 0.285, "step": 51300 }, { "epoch": 151.18, "learning_rate": 9.315775687235985e-06, "loss": 0.2748, "step": 51400 }, { "epoch": 151.47, "learning_rate": 9.313120609698822e-06, "loss": 0.2712, "step": 51500 }, { "epoch": 151.76, "learning_rate": 9.310460770605275e-06, "loss": 0.27, "step": 51600 }, { "epoch": 152.06, "learning_rate": 9.307796172891725e-06, "loss": 0.278, "step": 51700 }, { "epoch": 152.35, "learning_rate": 9.30512681949981e-06, "loss": 0.2729, "step": 51800 }, { "epoch": 152.65, "learning_rate": 9.302452713376417e-06, "loss": 0.2729, "step": 51900 }, { "epoch": 152.94, "learning_rate": 9.299773857473677e-06, "loss": 0.2714, "step": 52000 }, { "epoch": 152.94, "eval_cer": 0.08609040582363454, "eval_loss": 0.32614585757255554, "eval_runtime": 4.6598, "eval_samples_per_second": 77.042, "eval_steps_per_second": 2.575, "eval_wer": 0.3238755440915686, "step": 52000 }, { "epoch": 153.24, "learning_rate": 9.297090254748968e-06, "loss": 0.2639, "step": 52100 }, { "epoch": 153.53, "learning_rate": 9.294401908164907e-06, "loss": 0.2636, "step": 52200 }, { "epoch": 153.82, "learning_rate": 9.291708820689352e-06, "loss": 0.274, "step": 52300 }, { "epoch": 154.12, "learning_rate": 9.289010995295385e-06, "loss": 0.2677, "step": 52400 }, { "epoch": 154.41, "learning_rate": 9.286308434961327e-06, "loss": 0.2707, "step": 52500 }, { "epoch": 154.71, "learning_rate": 9.283601142670726e-06, "loss": 0.2779, "step": 52600 }, { "epoch": 155.0, "learning_rate": 9.28088912141235e-06, "loss": 0.2754, "step": 52700 }, { "epoch": 155.29, "learning_rate": 9.278172374180191e-06, "loss": 0.2692, "step": 52800 }, { "epoch": 155.59, "learning_rate": 9.275450903973456e-06, "loss": 0.2626, "step": 52900 }, { "epoch": 155.88, "learning_rate": 9.272724713796566e-06, "loss": 0.2672, "step": 53000 }, { "epoch": 155.88, "eval_cer": 0.08548014471906194, "eval_loss": 0.3363560140132904, "eval_runtime": 5.1126, "eval_samples_per_second": 70.218, "eval_steps_per_second": 2.347, "eval_wer": 0.3203288731259068, "step": 53000 }, { "epoch": 156.18, "learning_rate": 9.269993806659154e-06, "loss": 0.2577, "step": 53100 }, { "epoch": 156.47, "learning_rate": 9.26725818557606e-06, "loss": 0.2576, "step": 53200 }, { "epoch": 156.76, "learning_rate": 9.26451785356733e-06, "loss": 0.2611, "step": 53300 }, { "epoch": 157.06, "learning_rate": 9.261772813658206e-06, "loss": 0.2618, "step": 53400 }, { "epoch": 157.35, "learning_rate": 9.259023068879129e-06, "loss": 0.2622, "step": 53500 }, { "epoch": 157.65, "learning_rate": 9.25626862226574e-06, "loss": 0.2703, "step": 53600 }, { "epoch": 157.94, "learning_rate": 9.253509476858861e-06, "loss": 0.2649, "step": 53700 }, { "epoch": 158.24, "learning_rate": 9.25074563570451e-06, "loss": 0.2642, "step": 53800 }, { "epoch": 158.53, "learning_rate": 9.247977101853883e-06, "loss": 0.2607, "step": 53900 }, { "epoch": 158.82, "learning_rate": 9.245203878363358e-06, "loss": 0.2697, "step": 54000 }, { "epoch": 158.82, "eval_cer": 0.08343141101085393, "eval_loss": 0.3369295001029968, "eval_runtime": 5.4163, "eval_samples_per_second": 66.282, "eval_steps_per_second": 2.216, "eval_wer": 0.3117846203449944, "step": 54000 }, { "epoch": 159.12, "learning_rate": 9.242425968294492e-06, "loss": 0.2545, "step": 54100 }, { "epoch": 159.41, "learning_rate": 9.239643374714014e-06, "loss": 0.2519, "step": 54200 }, { "epoch": 159.71, "learning_rate": 9.236856100693828e-06, "loss": 0.2657, "step": 54300 }, { "epoch": 160.0, "learning_rate": 9.234064149310995e-06, "loss": 0.2644, "step": 54400 }, { "epoch": 160.29, "learning_rate": 9.23126752364775e-06, "loss": 0.2577, "step": 54500 }, { "epoch": 160.59, "learning_rate": 9.228466226791484e-06, "loss": 0.2632, "step": 54600 }, { "epoch": 160.88, "learning_rate": 9.225660261834746e-06, "loss": 0.2579, "step": 54700 }, { "epoch": 161.18, "learning_rate": 9.222849631875233e-06, "loss": 0.2599, "step": 54800 }, { "epoch": 161.47, "learning_rate": 9.220034340015803e-06, "loss": 0.2576, "step": 54900 }, { "epoch": 161.76, "learning_rate": 9.217214389364448e-06, "loss": 0.2557, "step": 55000 }, { "epoch": 161.76, "eval_cer": 0.08504424393008152, "eval_loss": 0.33482369780540466, "eval_runtime": 4.9338, "eval_samples_per_second": 72.764, "eval_steps_per_second": 2.432, "eval_wer": 0.31678220216024505, "step": 55000 }, { "epoch": 162.06, "learning_rate": 9.214418052132991e-06, "loss": 0.2633, "step": 55100 }, { "epoch": 162.35, "learning_rate": 9.211588839752508e-06, "loss": 0.2735, "step": 55200 }, { "epoch": 162.65, "learning_rate": 9.208754977903685e-06, "loss": 0.2596, "step": 55300 }, { "epoch": 162.94, "learning_rate": 9.205916469715018e-06, "loss": 0.2607, "step": 55400 }, { "epoch": 163.24, "learning_rate": 9.203073318320138e-06, "loss": 0.2635, "step": 55500 }, { "epoch": 163.53, "learning_rate": 9.200225526857794e-06, "loss": 0.2498, "step": 55600 }, { "epoch": 163.82, "learning_rate": 9.197373098471868e-06, "loss": 0.2624, "step": 55700 }, { "epoch": 164.12, "learning_rate": 9.194516036311354e-06, "loss": 0.2563, "step": 55800 }, { "epoch": 164.41, "learning_rate": 9.191654343530363e-06, "loss": 0.2477, "step": 55900 }, { "epoch": 164.71, "learning_rate": 9.188788023288119e-06, "loss": 0.2481, "step": 56000 }, { "epoch": 164.71, "eval_cer": 0.084521162983305, "eval_loss": 0.3317776620388031, "eval_runtime": 4.9296, "eval_samples_per_second": 72.825, "eval_steps_per_second": 2.434, "eval_wer": 0.3143640174109302, "step": 56000 }, { "epoch": 165.0, "learning_rate": 9.185917078748954e-06, "loss": 0.2539, "step": 56100 }, { "epoch": 165.29, "learning_rate": 9.183041513082305e-06, "loss": 0.2472, "step": 56200 }, { "epoch": 165.59, "learning_rate": 9.180161329462708e-06, "loss": 0.2495, "step": 56300 }, { "epoch": 165.88, "learning_rate": 9.177276531069804e-06, "loss": 0.2523, "step": 56400 }, { "epoch": 166.18, "learning_rate": 9.174387121088321e-06, "loss": 0.2498, "step": 56500 }, { "epoch": 166.47, "learning_rate": 9.171493102708084e-06, "loss": 0.2514, "step": 56600 }, { "epoch": 166.76, "learning_rate": 9.168594479124003e-06, "loss": 0.2484, "step": 56700 }, { "epoch": 167.06, "learning_rate": 9.165691253536068e-06, "loss": 0.2464, "step": 56800 }, { "epoch": 167.35, "learning_rate": 9.162783429149358e-06, "loss": 0.2405, "step": 56900 }, { "epoch": 167.65, "learning_rate": 9.15987100917402e-06, "loss": 0.254, "step": 57000 }, { "epoch": 167.65, "eval_cer": 0.08356218124754806, "eval_loss": 0.3432825803756714, "eval_runtime": 4.4479, "eval_samples_per_second": 80.713, "eval_steps_per_second": 2.698, "eval_wer": 0.3121070449782363, "step": 57000 }, { "epoch": 167.94, "learning_rate": 9.156953996825281e-06, "loss": 0.2475, "step": 57100 }, { "epoch": 168.24, "learning_rate": 9.154032395323438e-06, "loss": 0.254, "step": 57200 }, { "epoch": 168.53, "learning_rate": 9.151106207893846e-06, "loss": 0.2501, "step": 57300 }, { "epoch": 168.82, "learning_rate": 9.148175437766935e-06, "loss": 0.2431, "step": 57400 }, { "epoch": 169.12, "learning_rate": 9.145240088178183e-06, "loss": 0.2534, "step": 57500 }, { "epoch": 169.41, "learning_rate": 9.142329584267872e-06, "loss": 0.2476, "step": 57600 }, { "epoch": 169.71, "learning_rate": 9.139385131195785e-06, "loss": 0.2359, "step": 57700 }, { "epoch": 170.0, "learning_rate": 9.136436108366091e-06, "loss": 0.2545, "step": 57800 }, { "epoch": 170.29, "learning_rate": 9.133482519034428e-06, "loss": 0.2479, "step": 57900 }, { "epoch": 170.59, "learning_rate": 9.13052436646147e-06, "loss": 0.2454, "step": 58000 }, { "epoch": 170.59, "eval_cer": 0.08212370864391265, "eval_loss": 0.3390425443649292, "eval_runtime": 4.4296, "eval_samples_per_second": 81.045, "eval_steps_per_second": 2.709, "eval_wer": 0.3088827986458165, "step": 58000 }, { "epoch": 170.88, "learning_rate": 9.127561653912929e-06, "loss": 0.2439, "step": 58100 }, { "epoch": 171.18, "learning_rate": 9.12459438465955e-06, "loss": 0.2415, "step": 58200 }, { "epoch": 171.47, "learning_rate": 9.121622561977108e-06, "loss": 0.251, "step": 58300 }, { "epoch": 171.76, "learning_rate": 9.118646189146411e-06, "loss": 0.2406, "step": 58400 }, { "epoch": 172.06, "learning_rate": 9.115665269453284e-06, "loss": 0.2458, "step": 58500 }, { "epoch": 172.35, "learning_rate": 9.11267980618857e-06, "loss": 0.2376, "step": 58600 }, { "epoch": 172.65, "learning_rate": 9.109689802648138e-06, "loss": 0.2432, "step": 58700 }, { "epoch": 172.94, "learning_rate": 9.106695262132857e-06, "loss": 0.2409, "step": 58800 }, { "epoch": 173.24, "learning_rate": 9.10369618794861e-06, "loss": 0.2432, "step": 58900 }, { "epoch": 173.53, "learning_rate": 9.10069258340629e-06, "loss": 0.239, "step": 59000 }, { "epoch": 173.53, "eval_cer": 0.08295192014297546, "eval_loss": 0.34216058254241943, "eval_runtime": 5.0698, "eval_samples_per_second": 70.811, "eval_steps_per_second": 2.367, "eval_wer": 0.3133967435112043, "step": 59000 }, { "epoch": 173.82, "learning_rate": 9.097684451821783e-06, "loss": 0.237, "step": 59100 }, { "epoch": 174.12, "learning_rate": 9.094671796515979e-06, "loss": 0.2288, "step": 59200 }, { "epoch": 174.41, "learning_rate": 9.091654620814756e-06, "loss": 0.2372, "step": 59300 }, { "epoch": 174.71, "learning_rate": 9.088632928048988e-06, "loss": 0.2379, "step": 59400 }, { "epoch": 175.0, "learning_rate": 9.085606721554536e-06, "loss": 0.2377, "step": 59500 }, { "epoch": 175.29, "learning_rate": 9.082576004672238e-06, "loss": 0.2292, "step": 59600 }, { "epoch": 175.59, "learning_rate": 9.079540780747916e-06, "loss": 0.2307, "step": 59700 }, { "epoch": 175.88, "learning_rate": 9.076501053132367e-06, "loss": 0.2442, "step": 59800 }, { "epoch": 176.18, "learning_rate": 9.07345682518136e-06, "loss": 0.2385, "step": 59900 }, { "epoch": 176.47, "learning_rate": 9.070408100255632e-06, "loss": 0.2358, "step": 60000 }, { "epoch": 176.47, "eval_cer": 0.08247242927509699, "eval_loss": 0.34609493613243103, "eval_runtime": 5.0633, "eval_samples_per_second": 70.902, "eval_steps_per_second": 2.37, "eval_wer": 0.31194583266161535, "step": 60000 }, { "epoch": 176.76, "learning_rate": 9.067354881720881e-06, "loss": 0.2394, "step": 60100 }, { "epoch": 177.06, "learning_rate": 9.064297172947772e-06, "loss": 0.2336, "step": 60200 }, { "epoch": 177.35, "learning_rate": 9.061265621467159e-06, "loss": 0.2455, "step": 60300 }, { "epoch": 177.65, "learning_rate": 9.058198987167215e-06, "loss": 0.2339, "step": 60400 }, { "epoch": 177.94, "learning_rate": 9.05512787273675e-06, "loss": 0.2365, "step": 60500 }, { "epoch": 178.24, "learning_rate": 9.052052281566177e-06, "loss": 0.2398, "step": 60600 }, { "epoch": 178.53, "learning_rate": 9.04897221705086e-06, "loss": 0.2351, "step": 60700 }, { "epoch": 178.82, "learning_rate": 9.045887682591096e-06, "loss": 0.2369, "step": 60800 }, { "epoch": 179.12, "learning_rate": 9.042798681592122e-06, "loss": 0.2355, "step": 60900 }, { "epoch": 179.41, "learning_rate": 9.039705217464103e-06, "loss": 0.2321, "step": 61000 }, { "epoch": 179.41, "eval_cer": 0.08168780785493222, "eval_loss": 0.3485713005065918, "eval_runtime": 4.9102, "eval_samples_per_second": 73.113, "eval_steps_per_second": 2.444, "eval_wer": 0.3075931001128486, "step": 61000 }, { "epoch": 179.71, "learning_rate": 9.036607293622126e-06, "loss": 0.24, "step": 61100 }, { "epoch": 180.0, "learning_rate": 9.033504913486213e-06, "loss": 0.2412, "step": 61200 }, { "epoch": 180.29, "learning_rate": 9.030398080481293e-06, "loss": 0.2303, "step": 61300 }, { "epoch": 180.59, "learning_rate": 9.027286798037222e-06, "loss": 0.2324, "step": 61400 }, { "epoch": 180.88, "learning_rate": 9.024171069588759e-06, "loss": 0.2271, "step": 61500 }, { "epoch": 181.18, "learning_rate": 9.0210821222651e-06, "loss": 0.2296, "step": 61600 }, { "epoch": 181.47, "learning_rate": 9.01795755650591e-06, "loss": 0.2331, "step": 61700 }, { "epoch": 181.76, "learning_rate": 9.014828555041533e-06, "loss": 0.233, "step": 61800 }, { "epoch": 182.06, "learning_rate": 9.011695121326294e-06, "loss": 0.2292, "step": 61900 }, { "epoch": 182.35, "learning_rate": 9.008557258819412e-06, "loss": 0.2254, "step": 62000 }, { "epoch": 182.35, "eval_cer": 0.08125190706595178, "eval_loss": 0.3570455014705658, "eval_runtime": 4.4496, "eval_samples_per_second": 80.681, "eval_steps_per_second": 2.697, "eval_wer": 0.3048524907302918, "step": 62000 }, { "epoch": 182.65, "learning_rate": 9.005414970984991e-06, "loss": 0.2275, "step": 62100 }, { "epoch": 182.94, "learning_rate": 9.002268261292025e-06, "loss": 0.2326, "step": 62200 }, { "epoch": 183.24, "learning_rate": 8.999117133214384e-06, "loss": 0.2203, "step": 62300 }, { "epoch": 183.53, "learning_rate": 8.995961590230823e-06, "loss": 0.2262, "step": 62400 }, { "epoch": 183.82, "learning_rate": 8.992801635824966e-06, "loss": 0.2349, "step": 62500 }, { "epoch": 184.12, "learning_rate": 8.989637273485308e-06, "loss": 0.2266, "step": 62600 }, { "epoch": 184.41, "learning_rate": 8.986468506705211e-06, "loss": 0.2297, "step": 62700 }, { "epoch": 184.71, "learning_rate": 8.983295338982898e-06, "loss": 0.2277, "step": 62800 }, { "epoch": 185.0, "learning_rate": 8.980117773821452e-06, "loss": 0.2191, "step": 62900 }, { "epoch": 185.29, "learning_rate": 8.976935814728811e-06, "loss": 0.2243, "step": 63000 }, { "epoch": 185.29, "eval_cer": 0.081469857460442, "eval_loss": 0.3529977798461914, "eval_runtime": 5.5886, "eval_samples_per_second": 64.238, "eval_steps_per_second": 2.147, "eval_wer": 0.30146703208125103, "step": 63000 }, { "epoch": 185.59, "learning_rate": 8.973749465217761e-06, "loss": 0.2322, "step": 63100 }, { "epoch": 185.88, "learning_rate": 8.970558728805939e-06, "loss": 0.2267, "step": 63200 }, { "epoch": 186.18, "learning_rate": 8.96736360901582e-06, "loss": 0.2199, "step": 63300 }, { "epoch": 186.47, "learning_rate": 8.964164109374725e-06, "loss": 0.2243, "step": 63400 }, { "epoch": 186.76, "learning_rate": 8.9609602334148e-06, "loss": 0.2279, "step": 63500 }, { "epoch": 187.06, "learning_rate": 8.957751984673035e-06, "loss": 0.2254, "step": 63600 }, { "epoch": 187.35, "learning_rate": 8.954539366691238e-06, "loss": 0.2284, "step": 63700 }, { "epoch": 187.65, "learning_rate": 8.951354574451317e-06, "loss": 0.225, "step": 63800 }, { "epoch": 187.94, "learning_rate": 8.948133272238002e-06, "loss": 0.2196, "step": 63900 }, { "epoch": 188.24, "learning_rate": 8.944907611403423e-06, "loss": 0.2238, "step": 64000 }, { "epoch": 188.24, "eval_cer": 0.08094677651366548, "eval_loss": 0.35666173696517944, "eval_runtime": 5.2701, "eval_samples_per_second": 68.12, "eval_steps_per_second": 2.277, "eval_wer": 0.2988876350153152, "step": 64000 }, { "epoch": 188.53, "learning_rate": 8.941677595508617e-06, "loss": 0.2272, "step": 64100 }, { "epoch": 188.82, "learning_rate": 8.938443228119427e-06, "loss": 0.23, "step": 64200 }, { "epoch": 189.12, "learning_rate": 8.935204512806494e-06, "loss": 0.2261, "step": 64300 }, { "epoch": 189.41, "learning_rate": 8.931993905234649e-06, "loss": 0.2222, "step": 64400 }, { "epoch": 189.71, "learning_rate": 8.928746548195306e-06, "loss": 0.2331, "step": 64500 }, { "epoch": 190.0, "learning_rate": 8.925494853937067e-06, "loss": 0.2166, "step": 64600 }, { "epoch": 190.29, "learning_rate": 8.922238826049705e-06, "loss": 0.2224, "step": 64700 }, { "epoch": 190.59, "learning_rate": 8.918978468127777e-06, "loss": 0.213, "step": 64800 }, { "epoch": 190.88, "learning_rate": 8.915713783770622e-06, "loss": 0.2186, "step": 64900 }, { "epoch": 191.18, "learning_rate": 8.912444776582354e-06, "loss": 0.2143, "step": 65000 }, { "epoch": 191.18, "eval_cer": 0.08016215509350072, "eval_loss": 0.3535269796848297, "eval_runtime": 4.4256, "eval_samples_per_second": 81.12, "eval_steps_per_second": 2.712, "eval_wer": 0.3001773335482831, "step": 65000 }, { "epoch": 191.47, "learning_rate": 8.909171450171858e-06, "loss": 0.2201, "step": 65100 }, { "epoch": 191.76, "learning_rate": 8.90589380815279e-06, "loss": 0.215, "step": 65200 }, { "epoch": 192.06, "learning_rate": 8.902611854143569e-06, "loss": 0.218, "step": 65300 }, { "epoch": 192.35, "learning_rate": 8.899325591767371e-06, "loss": 0.2169, "step": 65400 }, { "epoch": 192.65, "learning_rate": 8.896035024652135e-06, "loss": 0.218, "step": 65500 }, { "epoch": 192.94, "learning_rate": 8.892740156430548e-06, "loss": 0.2225, "step": 65600 }, { "epoch": 193.24, "learning_rate": 8.889440990740048e-06, "loss": 0.2191, "step": 65700 }, { "epoch": 193.53, "learning_rate": 8.886137531222812e-06, "loss": 0.2262, "step": 65800 }, { "epoch": 193.82, "learning_rate": 8.882829781525762e-06, "loss": 0.219, "step": 65900 }, { "epoch": 194.12, "learning_rate": 8.879517745300557e-06, "loss": 0.2068, "step": 66000 }, { "epoch": 194.12, "eval_cer": 0.0793339435944379, "eval_loss": 0.35546955466270447, "eval_runtime": 4.9742, "eval_samples_per_second": 72.173, "eval_steps_per_second": 2.412, "eval_wer": 0.2992100596485571, "step": 66000 }, { "epoch": 194.41, "learning_rate": 8.876201426203583e-06, "loss": 0.2166, "step": 66100 }, { "epoch": 194.71, "learning_rate": 8.872880827895957e-06, "loss": 0.2128, "step": 66200 }, { "epoch": 195.0, "learning_rate": 8.869555954043525e-06, "loss": 0.2172, "step": 66300 }, { "epoch": 195.29, "learning_rate": 8.866226808316844e-06, "loss": 0.2199, "step": 66400 }, { "epoch": 195.59, "learning_rate": 8.862893394391192e-06, "loss": 0.2214, "step": 66500 }, { "epoch": 195.88, "learning_rate": 8.859555715946561e-06, "loss": 0.2143, "step": 66600 }, { "epoch": 196.18, "learning_rate": 8.856213776667646e-06, "loss": 0.2128, "step": 66700 }, { "epoch": 196.47, "learning_rate": 8.85286758024385e-06, "loss": 0.2083, "step": 66800 }, { "epoch": 196.76, "learning_rate": 8.84951713036927e-06, "loss": 0.2139, "step": 66900 }, { "epoch": 197.06, "learning_rate": 8.846162430742708e-06, "loss": 0.2177, "step": 67000 }, { "epoch": 197.06, "eval_cer": 0.0796390741467242, "eval_loss": 0.3596145808696747, "eval_runtime": 4.9633, "eval_samples_per_second": 72.331, "eval_steps_per_second": 2.418, "eval_wer": 0.300822182814767, "step": 67000 }, { "epoch": 197.35, "learning_rate": 8.842803485067648e-06, "loss": 0.2133, "step": 67100 }, { "epoch": 197.65, "learning_rate": 8.839440297052269e-06, "loss": 0.2151, "step": 67200 }, { "epoch": 197.94, "learning_rate": 8.836072870409429e-06, "loss": 0.229, "step": 67300 }, { "epoch": 198.24, "learning_rate": 8.832701208856665e-06, "loss": 0.2118, "step": 67400 }, { "epoch": 198.53, "learning_rate": 8.829325316116191e-06, "loss": 0.2137, "step": 67500 }, { "epoch": 198.82, "learning_rate": 8.825945195914893e-06, "loss": 0.2113, "step": 67600 }, { "epoch": 199.12, "learning_rate": 8.822560851984324e-06, "loss": 0.2267, "step": 67700 }, { "epoch": 199.41, "learning_rate": 8.819172288060696e-06, "loss": 0.2123, "step": 67800 }, { "epoch": 199.71, "learning_rate": 8.815779507884882e-06, "loss": 0.2234, "step": 67900 }, { "epoch": 200.0, "learning_rate": 8.812382515202413e-06, "loss": 0.214, "step": 68000 }, { "epoch": 200.0, "eval_cer": 0.08020574517239876, "eval_loss": 0.3504684865474701, "eval_runtime": 4.4424, "eval_samples_per_second": 80.812, "eval_steps_per_second": 2.701, "eval_wer": 0.3000161212316621, "step": 68000 }, { "epoch": 200.29, "learning_rate": 8.808981313763467e-06, "loss": 0.2106, "step": 68100 }, { "epoch": 200.59, "learning_rate": 8.805575907322868e-06, "loss": 0.2152, "step": 68200 }, { "epoch": 200.88, "learning_rate": 8.80216629964008e-06, "loss": 0.221, "step": 68300 }, { "epoch": 201.18, "learning_rate": 8.798752494479213e-06, "loss": 0.2061, "step": 68400 }, { "epoch": 201.47, "learning_rate": 8.795334495609003e-06, "loss": 0.2031, "step": 68500 }, { "epoch": 201.76, "learning_rate": 8.79191230680282e-06, "loss": 0.2065, "step": 68600 }, { "epoch": 202.06, "learning_rate": 8.78848593183866e-06, "loss": 0.2109, "step": 68700 }, { "epoch": 202.35, "learning_rate": 8.785055374499135e-06, "loss": 0.2076, "step": 68800 }, { "epoch": 202.65, "learning_rate": 8.781620638571478e-06, "loss": 0.2059, "step": 68900 }, { "epoch": 202.94, "learning_rate": 8.778181727847537e-06, "loss": 0.2027, "step": 69000 }, { "epoch": 202.94, "eval_cer": 0.0793339435944379, "eval_loss": 0.3646654784679413, "eval_runtime": 4.806, "eval_samples_per_second": 74.698, "eval_steps_per_second": 2.497, "eval_wer": 0.2956633886828954, "step": 69000 }, { "epoch": 203.24, "learning_rate": 8.774738646123767e-06, "loss": 0.1986, "step": 69100 }, { "epoch": 203.53, "learning_rate": 8.771291397201227e-06, "loss": 0.206, "step": 69200 }, { "epoch": 203.82, "learning_rate": 8.76787451960502e-06, "loss": 0.2011, "step": 69300 }, { "epoch": 204.12, "learning_rate": 8.764418989283467e-06, "loss": 0.2044, "step": 69400 }, { "epoch": 204.41, "learning_rate": 8.760959303155737e-06, "loss": 0.2121, "step": 69500 }, { "epoch": 204.71, "learning_rate": 8.757495465041219e-06, "loss": 0.2046, "step": 69600 }, { "epoch": 205.0, "learning_rate": 8.75402747876389e-06, "loss": 0.2066, "step": 69700 }, { "epoch": 205.29, "learning_rate": 8.750555348152299e-06, "loss": 0.2158, "step": 69800 }, { "epoch": 205.59, "learning_rate": 8.747079077039577e-06, "loss": 0.1984, "step": 69900 }, { "epoch": 205.88, "learning_rate": 8.743598669263422e-06, "loss": 0.2062, "step": 70000 }, { "epoch": 205.88, "eval_cer": 0.0796390741467242, "eval_loss": 0.3702377378940582, "eval_runtime": 4.7589, "eval_samples_per_second": 75.438, "eval_steps_per_second": 2.522, "eval_wer": 0.2975979364823472, "step": 70000 }, { "epoch": 206.18, "learning_rate": 8.740114128666103e-06, "loss": 0.2108, "step": 70100 }, { "epoch": 206.47, "learning_rate": 8.736625459094445e-06, "loss": 0.2085, "step": 70200 }, { "epoch": 206.76, "learning_rate": 8.733132664399839e-06, "loss": 0.2036, "step": 70300 }, { "epoch": 207.06, "learning_rate": 8.729635748438225e-06, "loss": 0.2005, "step": 70400 }, { "epoch": 207.35, "learning_rate": 8.726134715070092e-06, "loss": 0.207, "step": 70500 }, { "epoch": 207.65, "learning_rate": 8.722629568160476e-06, "loss": 0.2073, "step": 70600 }, { "epoch": 207.94, "learning_rate": 8.71912031157896e-06, "loss": 0.2015, "step": 70700 }, { "epoch": 208.24, "learning_rate": 8.71560694919965e-06, "loss": 0.1977, "step": 70800 }, { "epoch": 208.53, "learning_rate": 8.712089484901201e-06, "loss": 0.2027, "step": 70900 }, { "epoch": 208.82, "learning_rate": 8.708567922566781e-06, "loss": 0.2097, "step": 71000 }, { "epoch": 208.82, "eval_cer": 0.07981343446231638, "eval_loss": 0.3614213764667511, "eval_runtime": 4.5359, "eval_samples_per_second": 79.147, "eval_steps_per_second": 2.646, "eval_wer": 0.2972755118491053, "step": 71000 }, { "epoch": 209.12, "learning_rate": 8.705042266084098e-06, "loss": 0.2017, "step": 71100 }, { "epoch": 209.41, "learning_rate": 8.701512519345366e-06, "loss": 0.202, "step": 71200 }, { "epoch": 209.71, "learning_rate": 8.69797868624732e-06, "loss": 0.2067, "step": 71300 }, { "epoch": 210.0, "learning_rate": 8.69444077069121e-06, "loss": 0.2098, "step": 71400 }, { "epoch": 210.29, "learning_rate": 8.690898776582786e-06, "loss": 0.2027, "step": 71500 }, { "epoch": 210.59, "learning_rate": 8.687352707832303e-06, "loss": 0.1998, "step": 71600 }, { "epoch": 210.88, "learning_rate": 8.683802568354519e-06, "loss": 0.2014, "step": 71700 }, { "epoch": 211.18, "learning_rate": 8.680248362068677e-06, "loss": 0.1935, "step": 71800 }, { "epoch": 211.47, "learning_rate": 8.676690092898518e-06, "loss": 0.2037, "step": 71900 }, { "epoch": 211.76, "learning_rate": 8.673127764772264e-06, "loss": 0.2041, "step": 72000 }, { "epoch": 211.76, "eval_cer": 0.0793339435944379, "eval_loss": 0.3621172606945038, "eval_runtime": 4.7752, "eval_samples_per_second": 75.18, "eval_steps_per_second": 2.513, "eval_wer": 0.2964694502660003, "step": 72000 }, { "epoch": 212.06, "learning_rate": 8.66956138162262e-06, "loss": 0.2003, "step": 72100 }, { "epoch": 212.35, "learning_rate": 8.665990947386765e-06, "loss": 0.1893, "step": 72200 }, { "epoch": 212.65, "learning_rate": 8.662416466006352e-06, "loss": 0.1984, "step": 72300 }, { "epoch": 212.94, "learning_rate": 8.658837941427502e-06, "loss": 0.2038, "step": 72400 }, { "epoch": 213.24, "learning_rate": 8.655255377600802e-06, "loss": 0.2029, "step": 72500 }, { "epoch": 213.53, "learning_rate": 8.65166877848129e-06, "loss": 0.2029, "step": 72600 }, { "epoch": 213.82, "learning_rate": 8.648078148028466e-06, "loss": 0.1899, "step": 72700 }, { "epoch": 214.12, "learning_rate": 8.644483490206283e-06, "loss": 0.1949, "step": 72800 }, { "epoch": 214.41, "learning_rate": 8.640920815698158e-06, "loss": 0.2023, "step": 72900 }, { "epoch": 214.71, "learning_rate": 8.637318155221476e-06, "loss": 0.2099, "step": 73000 }, { "epoch": 214.71, "eval_cer": 0.07837496185868097, "eval_loss": 0.3655032813549042, "eval_runtime": 5.0092, "eval_samples_per_second": 71.667, "eval_steps_per_second": 2.396, "eval_wer": 0.29614702563275835, "step": 73000 }, { "epoch": 215.0, "learning_rate": 8.633711479254145e-06, "loss": 0.1991, "step": 73100 }, { "epoch": 215.29, "learning_rate": 8.630100791777824e-06, "loss": 0.1907, "step": 73200 }, { "epoch": 215.59, "learning_rate": 8.626486096778608e-06, "loss": 0.1894, "step": 73300 }, { "epoch": 215.88, "learning_rate": 8.622867398247007e-06, "loss": 0.193, "step": 73400 }, { "epoch": 216.18, "learning_rate": 8.619244700177962e-06, "loss": 0.1929, "step": 73500 }, { "epoch": 216.47, "learning_rate": 8.615618006570818e-06, "loss": 0.192, "step": 73600 }, { "epoch": 216.76, "learning_rate": 8.611987321429341e-06, "loss": 0.1951, "step": 73700 }, { "epoch": 217.06, "learning_rate": 8.608352648761697e-06, "loss": 0.1962, "step": 73800 }, { "epoch": 217.35, "learning_rate": 8.604713992580456e-06, "loss": 0.1981, "step": 73900 }, { "epoch": 217.65, "learning_rate": 8.601071356902584e-06, "loss": 0.2009, "step": 74000 }, { "epoch": 217.65, "eval_cer": 0.07854932217427314, "eval_loss": 0.36690473556518555, "eval_runtime": 4.8416, "eval_samples_per_second": 74.149, "eval_steps_per_second": 2.479, "eval_wer": 0.2948573270997904, "step": 74000 }, { "epoch": 217.94, "learning_rate": 8.597424745749446e-06, "loss": 0.1953, "step": 74100 }, { "epoch": 218.24, "learning_rate": 8.59377416314679e-06, "loss": 0.1933, "step": 74200 }, { "epoch": 218.53, "learning_rate": 8.59011961312475e-06, "loss": 0.1988, "step": 74300 }, { "epoch": 218.82, "learning_rate": 8.58646109971784e-06, "loss": 0.1955, "step": 74400 }, { "epoch": 219.12, "learning_rate": 8.58279862696495e-06, "loss": 0.1873, "step": 74500 }, { "epoch": 219.41, "learning_rate": 8.57913219890934e-06, "loss": 0.1928, "step": 74600 }, { "epoch": 219.71, "learning_rate": 8.575461819598637e-06, "loss": 0.1936, "step": 74700 }, { "epoch": 220.0, "learning_rate": 8.57178749308483e-06, "loss": 0.1883, "step": 74800 }, { "epoch": 220.29, "learning_rate": 8.568109223424269e-06, "loss": 0.1984, "step": 74900 }, { "epoch": 220.59, "learning_rate": 8.56442701467765e-06, "loss": 0.188, "step": 75000 }, { "epoch": 220.59, "eval_cer": 0.07911599319994769, "eval_loss": 0.3651310205459595, "eval_runtime": 4.7688, "eval_samples_per_second": 75.282, "eval_steps_per_second": 2.516, "eval_wer": 0.2963082379493793, "step": 75000 }, { "epoch": 220.88, "learning_rate": 8.560740870910022e-06, "loss": 0.1876, "step": 75100 }, { "epoch": 221.18, "learning_rate": 8.55705079619078e-06, "loss": 0.188, "step": 75200 }, { "epoch": 221.47, "learning_rate": 8.553356794593654e-06, "loss": 0.1815, "step": 75300 }, { "epoch": 221.76, "learning_rate": 8.549658870196714e-06, "loss": 0.1993, "step": 75400 }, { "epoch": 222.06, "learning_rate": 8.545957027082354e-06, "loss": 0.1927, "step": 75500 }, { "epoch": 222.35, "learning_rate": 8.542251269337301e-06, "loss": 0.1961, "step": 75600 }, { "epoch": 222.65, "learning_rate": 8.538541601052601e-06, "loss": 0.1909, "step": 75700 }, { "epoch": 222.94, "learning_rate": 8.534828026323619e-06, "loss": 0.1906, "step": 75800 }, { "epoch": 223.24, "learning_rate": 8.531110549250025e-06, "loss": 0.1893, "step": 75900 }, { "epoch": 223.53, "learning_rate": 8.527389173935807e-06, "loss": 0.1904, "step": 76000 }, { "epoch": 223.53, "eval_cer": 0.07854932217427314, "eval_loss": 0.3699847459793091, "eval_runtime": 4.7309, "eval_samples_per_second": 75.884, "eval_steps_per_second": 2.537, "eval_wer": 0.2943736901499275, "step": 76000 }, { "epoch": 223.82, "learning_rate": 8.523663904489252e-06, "loss": 0.1924, "step": 76100 }, { "epoch": 224.12, "learning_rate": 8.519934745022946e-06, "loss": 0.1919, "step": 76200 }, { "epoch": 224.41, "learning_rate": 8.516201699653767e-06, "loss": 0.1839, "step": 76300 }, { "epoch": 224.71, "learning_rate": 8.51246477250289e-06, "loss": 0.1907, "step": 76400 }, { "epoch": 225.0, "learning_rate": 8.50876139492468e-06, "loss": 0.1808, "step": 76500 }, { "epoch": 225.29, "learning_rate": 8.50501675530586e-06, "loss": 0.1896, "step": 76600 }, { "epoch": 225.59, "learning_rate": 8.501268246253185e-06, "loss": 0.1865, "step": 76700 }, { "epoch": 225.88, "learning_rate": 8.497515871904896e-06, "loss": 0.1868, "step": 76800 }, { "epoch": 226.18, "learning_rate": 8.493759636403502e-06, "loss": 0.1851, "step": 76900 }, { "epoch": 226.47, "learning_rate": 8.489999543895777e-06, "loss": 0.1901, "step": 77000 }, { "epoch": 226.47, "eval_cer": 0.07850573209537509, "eval_loss": 0.37494558095932007, "eval_runtime": 4.7868, "eval_samples_per_second": 74.998, "eval_steps_per_second": 2.507, "eval_wer": 0.2937288408834435, "step": 77000 }, { "epoch": 226.76, "learning_rate": 8.486235598532748e-06, "loss": 0.1895, "step": 77100 }, { "epoch": 227.06, "learning_rate": 8.482467804469701e-06, "loss": 0.1884, "step": 77200 }, { "epoch": 227.35, "learning_rate": 8.478696165866164e-06, "loss": 0.1808, "step": 77300 }, { "epoch": 227.65, "learning_rate": 8.474920686885921e-06, "loss": 0.1905, "step": 77400 }, { "epoch": 227.94, "learning_rate": 8.471141371696981e-06, "loss": 0.187, "step": 77500 }, { "epoch": 228.24, "learning_rate": 8.467358224471598e-06, "loss": 0.1942, "step": 77600 }, { "epoch": 228.53, "learning_rate": 8.463571249386255e-06, "loss": 0.187, "step": 77700 }, { "epoch": 228.82, "learning_rate": 8.459780450621655e-06, "loss": 0.1821, "step": 77800 }, { "epoch": 229.12, "learning_rate": 8.45598583236273e-06, "loss": 0.1905, "step": 77900 }, { "epoch": 229.41, "learning_rate": 8.452187398798625e-06, "loss": 0.1857, "step": 78000 }, { "epoch": 229.41, "eval_cer": 0.07802624122749661, "eval_loss": 0.3787274658679962, "eval_runtime": 4.6442, "eval_samples_per_second": 77.301, "eval_steps_per_second": 2.584, "eval_wer": 0.29098823150088665, "step": 78000 }, { "epoch": 229.71, "learning_rate": 8.448385154122697e-06, "loss": 0.1909, "step": 78100 }, { "epoch": 230.0, "learning_rate": 8.444579102532511e-06, "loss": 0.178, "step": 78200 }, { "epoch": 230.29, "learning_rate": 8.440769248229831e-06, "loss": 0.1833, "step": 78300 }, { "epoch": 230.59, "learning_rate": 8.436955595420629e-06, "loss": 0.1824, "step": 78400 }, { "epoch": 230.88, "learning_rate": 8.433138148315059e-06, "loss": 0.1811, "step": 78500 }, { "epoch": 231.18, "learning_rate": 8.429316911127469e-06, "loss": 0.1839, "step": 78600 }, { "epoch": 231.47, "learning_rate": 8.42549188807639e-06, "loss": 0.1871, "step": 78700 }, { "epoch": 231.76, "learning_rate": 8.421663083384539e-06, "loss": 0.1796, "step": 78800 }, { "epoch": 232.06, "learning_rate": 8.417830501278794e-06, "loss": 0.1853, "step": 78900 }, { "epoch": 232.35, "learning_rate": 8.413994145990216e-06, "loss": 0.1796, "step": 79000 }, { "epoch": 232.35, "eval_cer": 0.078418551937579, "eval_loss": 0.3776050806045532, "eval_runtime": 4.6833, "eval_samples_per_second": 76.656, "eval_steps_per_second": 2.562, "eval_wer": 0.2943736901499275, "step": 79000 }, { "epoch": 232.65, "learning_rate": 8.410154021754026e-06, "loss": 0.1848, "step": 79100 }, { "epoch": 232.94, "learning_rate": 8.406310132809604e-06, "loss": 0.182, "step": 79200 }, { "epoch": 233.24, "learning_rate": 8.402462483400494e-06, "loss": 0.1849, "step": 79300 }, { "epoch": 233.53, "learning_rate": 8.398611077774382e-06, "loss": 0.1856, "step": 79400 }, { "epoch": 233.82, "learning_rate": 8.394755920183107e-06, "loss": 0.1754, "step": 79500 }, { "epoch": 234.12, "learning_rate": 8.390897014882645e-06, "loss": 0.1732, "step": 79600 }, { "epoch": 234.41, "learning_rate": 8.387034366133113e-06, "loss": 0.1879, "step": 79700 }, { "epoch": 234.71, "learning_rate": 8.383167978198762e-06, "loss": 0.1751, "step": 79800 }, { "epoch": 235.0, "learning_rate": 8.379297855347966e-06, "loss": 0.1849, "step": 79900 }, { "epoch": 235.29, "learning_rate": 8.37542400185323e-06, "loss": 0.1836, "step": 80000 }, { "epoch": 235.29, "eval_cer": 0.078418551937579, "eval_loss": 0.38717299699783325, "eval_runtime": 4.8192, "eval_samples_per_second": 74.494, "eval_steps_per_second": 2.49, "eval_wer": 0.2930839916169595, "step": 80000 }, { "epoch": 235.59, "learning_rate": 8.371546421991167e-06, "loss": 0.1776, "step": 80100 }, { "epoch": 235.88, "learning_rate": 8.367665120042513e-06, "loss": 0.179, "step": 80200 }, { "epoch": 236.18, "learning_rate": 8.363780100292104e-06, "loss": 0.1853, "step": 80300 }, { "epoch": 236.47, "learning_rate": 8.359891367028895e-06, "loss": 0.1792, "step": 80400 }, { "epoch": 236.76, "learning_rate": 8.356037867317286e-06, "loss": 0.1834, "step": 80500 }, { "epoch": 237.06, "learning_rate": 8.352141756939638e-06, "loss": 0.1799, "step": 80600 }, { "epoch": 237.35, "learning_rate": 8.348241945897569e-06, "loss": 0.1832, "step": 80700 }, { "epoch": 237.65, "learning_rate": 8.344338438496354e-06, "loss": 0.1799, "step": 80800 }, { "epoch": 237.94, "learning_rate": 8.340431239045348e-06, "loss": 0.1772, "step": 80900 }, { "epoch": 238.24, "learning_rate": 8.336520351857981e-06, "loss": 0.1833, "step": 81000 }, { "epoch": 238.24, "eval_cer": 0.07889804280545748, "eval_loss": 0.3830723762512207, "eval_runtime": 4.9874, "eval_samples_per_second": 71.981, "eval_steps_per_second": 2.406, "eval_wer": 0.2930839916169595, "step": 81000 }, { "epoch": 238.53, "learning_rate": 8.33260578125176e-06, "loss": 0.1729, "step": 81100 }, { "epoch": 238.82, "learning_rate": 8.32868753154825e-06, "loss": 0.1789, "step": 81200 }, { "epoch": 239.12, "learning_rate": 8.324765607073083e-06, "loss": 0.1753, "step": 81300 }, { "epoch": 239.41, "learning_rate": 8.320840012155949e-06, "loss": 0.1704, "step": 81400 }, { "epoch": 239.71, "learning_rate": 8.316910751130583e-06, "loss": 0.1784, "step": 81500 }, { "epoch": 240.0, "learning_rate": 8.312977828334777e-06, "loss": 0.1784, "step": 81600 }, { "epoch": 240.29, "learning_rate": 8.309041248110355e-06, "loss": 0.178, "step": 81700 }, { "epoch": 240.59, "learning_rate": 8.305101014803185e-06, "loss": 0.1754, "step": 81800 }, { "epoch": 240.88, "learning_rate": 8.301157132763172e-06, "loss": 0.1795, "step": 81900 }, { "epoch": 241.18, "learning_rate": 8.297209606344238e-06, "loss": 0.1702, "step": 82000 }, { "epoch": 241.18, "eval_cer": 0.07824419162198684, "eval_loss": 0.3892400562763214, "eval_runtime": 4.742, "eval_samples_per_second": 75.706, "eval_steps_per_second": 2.531, "eval_wer": 0.2914718684507496, "step": 82000 }, { "epoch": 241.47, "learning_rate": 8.29325843990434e-06, "loss": 0.1775, "step": 82100 }, { "epoch": 241.76, "learning_rate": 8.289303637805442e-06, "loss": 0.1759, "step": 82200 }, { "epoch": 242.06, "learning_rate": 8.285345204413531e-06, "loss": 0.1819, "step": 82300 }, { "epoch": 242.35, "learning_rate": 8.281383144098599e-06, "loss": 0.1693, "step": 82400 }, { "epoch": 242.65, "learning_rate": 8.277417461234639e-06, "loss": 0.1743, "step": 82500 }, { "epoch": 242.94, "learning_rate": 8.27344816019965e-06, "loss": 0.1764, "step": 82600 }, { "epoch": 243.24, "learning_rate": 8.269475245375624e-06, "loss": 0.1715, "step": 82700 }, { "epoch": 243.53, "learning_rate": 8.265498721148536e-06, "loss": 0.1747, "step": 82800 }, { "epoch": 243.82, "learning_rate": 8.261598229793867e-06, "loss": 0.1758, "step": 82900 }, { "epoch": 244.12, "learning_rate": 8.257614571903827e-06, "loss": 0.1782, "step": 83000 }, { "epoch": 244.12, "eval_cer": 0.07833137177978292, "eval_loss": 0.38854503631591797, "eval_runtime": 4.6398, "eval_samples_per_second": 77.374, "eval_steps_per_second": 2.586, "eval_wer": 0.29340641625020153, "step": 83000 }, { "epoch": 244.41, "learning_rate": 8.253627317704554e-06, "loss": 0.1749, "step": 83100 }, { "epoch": 244.71, "learning_rate": 8.24963647159786e-06, "loss": 0.1746, "step": 83200 }, { "epoch": 245.0, "learning_rate": 8.245642037989519e-06, "loss": 0.1728, "step": 83300 }, { "epoch": 245.29, "learning_rate": 8.241644021289268e-06, "loss": 0.1726, "step": 83400 }, { "epoch": 245.59, "learning_rate": 8.237642425910796e-06, "loss": 0.1696, "step": 83500 }, { "epoch": 245.88, "learning_rate": 8.233637256271744e-06, "loss": 0.1729, "step": 83600 }, { "epoch": 246.18, "learning_rate": 8.229628516793703e-06, "loss": 0.172, "step": 83700 }, { "epoch": 246.47, "learning_rate": 8.2256162119022e-06, "loss": 0.1728, "step": 83800 }, { "epoch": 246.76, "learning_rate": 8.2216003460267e-06, "loss": 0.1773, "step": 83900 }, { "epoch": 247.06, "learning_rate": 8.217580923600598e-06, "loss": 0.1701, "step": 84000 }, { "epoch": 247.06, "eval_cer": 0.07737239004402598, "eval_loss": 0.3914085924625397, "eval_runtime": 4.7341, "eval_samples_per_second": 75.833, "eval_steps_per_second": 2.535, "eval_wer": 0.2895373206512978, "step": 84000 }, { "epoch": 247.35, "learning_rate": 8.21355794906122e-06, "loss": 0.1728, "step": 84100 }, { "epoch": 247.65, "learning_rate": 8.209531426849805e-06, "loss": 0.1745, "step": 84200 }, { "epoch": 247.94, "learning_rate": 8.205501361411516e-06, "loss": 0.1684, "step": 84300 }, { "epoch": 248.24, "learning_rate": 8.201467757195422e-06, "loss": 0.17, "step": 84400 }, { "epoch": 248.53, "learning_rate": 8.197430618654507e-06, "loss": 0.1723, "step": 84500 }, { "epoch": 248.82, "learning_rate": 8.193389950245647e-06, "loss": 0.1755, "step": 84600 }, { "epoch": 249.12, "learning_rate": 8.18934575642962e-06, "loss": 0.1714, "step": 84700 }, { "epoch": 249.41, "learning_rate": 8.185298041671098e-06, "loss": 0.167, "step": 84800 }, { "epoch": 249.71, "learning_rate": 8.181246810438635e-06, "loss": 0.1716, "step": 84900 }, { "epoch": 250.0, "learning_rate": 8.177192067204668e-06, "loss": 0.1694, "step": 85000 }, { "epoch": 250.0, "eval_cer": 0.07815701146419075, "eval_loss": 0.3912142217159271, "eval_runtime": 4.7431, "eval_samples_per_second": 75.689, "eval_steps_per_second": 2.53, "eval_wer": 0.2903433822344027, "step": 85000 }, { "epoch": 250.29, "learning_rate": 8.173174416300648e-06, "loss": 0.1667, "step": 85100 }, { "epoch": 250.59, "learning_rate": 8.169112697504755e-06, "loss": 0.1663, "step": 85200 }, { "epoch": 250.88, "learning_rate": 8.16504748010306e-06, "loss": 0.1759, "step": 85300 }, { "epoch": 251.18, "learning_rate": 8.160978768583436e-06, "loss": 0.1643, "step": 85400 }, { "epoch": 251.47, "learning_rate": 8.156906567437623e-06, "loss": 0.1659, "step": 85500 }, { "epoch": 251.76, "learning_rate": 8.15283088116121e-06, "loss": 0.1669, "step": 85600 }, { "epoch": 252.06, "learning_rate": 8.148751714253633e-06, "loss": 0.168, "step": 85700 }, { "epoch": 252.35, "learning_rate": 8.14466907121817e-06, "loss": 0.1734, "step": 85800 }, { "epoch": 252.65, "learning_rate": 8.140582956561936e-06, "loss": 0.1641, "step": 85900 }, { "epoch": 252.94, "learning_rate": 8.13649337479588e-06, "loss": 0.17, "step": 86000 }, { "epoch": 252.94, "eval_cer": 0.07772111067521033, "eval_loss": 0.404951274394989, "eval_runtime": 4.4459, "eval_samples_per_second": 80.749, "eval_steps_per_second": 2.699, "eval_wer": 0.29131065613412865, "step": 86000 }, { "epoch": 253.24, "learning_rate": 8.132400330434778e-06, "loss": 0.1724, "step": 86100 }, { "epoch": 253.53, "learning_rate": 8.128303827997228e-06, "loss": 0.1713, "step": 86200 }, { "epoch": 253.82, "learning_rate": 8.12420387200565e-06, "loss": 0.1699, "step": 86300 }, { "epoch": 254.12, "learning_rate": 8.120100466986268e-06, "loss": 0.163, "step": 86400 }, { "epoch": 254.41, "learning_rate": 8.115993617469121e-06, "loss": 0.1714, "step": 86500 }, { "epoch": 254.71, "learning_rate": 8.11188332798805e-06, "loss": 0.1717, "step": 86600 }, { "epoch": 255.0, "learning_rate": 8.10776960308069e-06, "loss": 0.1671, "step": 86700 }, { "epoch": 255.29, "learning_rate": 8.10365244728847e-06, "loss": 0.1674, "step": 86800 }, { "epoch": 255.59, "learning_rate": 8.099531865156609e-06, "loss": 0.1612, "step": 86900 }, { "epoch": 255.88, "learning_rate": 8.095407861234105e-06, "loss": 0.1654, "step": 87000 }, { "epoch": 255.88, "eval_cer": 0.07676212893945338, "eval_loss": 0.3947739899158478, "eval_runtime": 4.6602, "eval_samples_per_second": 77.036, "eval_steps_per_second": 2.575, "eval_wer": 0.2882476221183298, "step": 87000 }, { "epoch": 256.18, "learning_rate": 8.091280440073735e-06, "loss": 0.1648, "step": 87100 }, { "epoch": 256.47, "learning_rate": 8.08714960623205e-06, "loss": 0.1632, "step": 87200 }, { "epoch": 256.76, "learning_rate": 8.083015364269366e-06, "loss": 0.1645, "step": 87300 }, { "epoch": 257.06, "learning_rate": 8.078877718749765e-06, "loss": 0.162, "step": 87400 }, { "epoch": 257.35, "learning_rate": 8.07473667424108e-06, "loss": 0.1624, "step": 87500 }, { "epoch": 257.65, "learning_rate": 8.070592235314904e-06, "loss": 0.1625, "step": 87600 }, { "epoch": 257.94, "learning_rate": 8.066444406546573e-06, "loss": 0.1648, "step": 87700 }, { "epoch": 258.24, "learning_rate": 8.062293192515168e-06, "loss": 0.17, "step": 87800 }, { "epoch": 258.53, "learning_rate": 8.0581385978035e-06, "loss": 0.1681, "step": 87900 }, { "epoch": 258.82, "learning_rate": 8.053980626998121e-06, "loss": 0.1638, "step": 88000 }, { "epoch": 258.82, "eval_cer": 0.0775031602807201, "eval_loss": 0.40064844489097595, "eval_runtime": 4.8954, "eval_samples_per_second": 73.334, "eval_steps_per_second": 2.451, "eval_wer": 0.29098823150088665, "step": 88000 }, { "epoch": 259.12, "learning_rate": 8.049819284689309e-06, "loss": 0.1636, "step": 88100 }, { "epoch": 259.41, "learning_rate": 8.045654575471056e-06, "loss": 0.1604, "step": 88200 }, { "epoch": 259.71, "learning_rate": 8.041486503941082e-06, "loss": 0.1713, "step": 88300 }, { "epoch": 260.0, "learning_rate": 8.037315074700811e-06, "loss": 0.1648, "step": 88400 }, { "epoch": 260.29, "learning_rate": 8.033140292355377e-06, "loss": 0.1635, "step": 88500 }, { "epoch": 260.59, "learning_rate": 8.028962161513614e-06, "loss": 0.1645, "step": 88600 }, { "epoch": 260.88, "learning_rate": 8.024780686788054e-06, "loss": 0.1615, "step": 88700 }, { "epoch": 261.18, "learning_rate": 8.020595872794921e-06, "loss": 0.1629, "step": 88800 }, { "epoch": 261.47, "learning_rate": 8.016407724154126e-06, "loss": 0.1644, "step": 88900 }, { "epoch": 261.76, "learning_rate": 8.012216245489255e-06, "loss": 0.1599, "step": 89000 }, { "epoch": 261.76, "eval_cer": 0.07654417854496316, "eval_loss": 0.40178772807121277, "eval_runtime": 4.5847, "eval_samples_per_second": 78.303, "eval_steps_per_second": 2.617, "eval_wer": 0.286313074318878, "step": 89000 }, { "epoch": 262.06, "learning_rate": 8.00806340591371e-06, "loss": 0.1659, "step": 89100 }, { "epoch": 262.35, "learning_rate": 8.003865314270893e-06, "loss": 0.1621, "step": 89200 }, { "epoch": 262.65, "learning_rate": 7.99966390645045e-06, "loss": 0.1645, "step": 89300 }, { "epoch": 262.94, "learning_rate": 7.995459187090606e-06, "loss": 0.1664, "step": 89400 }, { "epoch": 263.24, "learning_rate": 7.99125116083325e-06, "loss": 0.1548, "step": 89500 }, { "epoch": 263.53, "learning_rate": 7.98703983232392e-06, "loss": 0.1647, "step": 89600 }, { "epoch": 263.82, "learning_rate": 7.98282520621179e-06, "loss": 0.159, "step": 89700 }, { "epoch": 264.12, "learning_rate": 7.978607287149686e-06, "loss": 0.1754, "step": 89800 }, { "epoch": 264.41, "learning_rate": 7.974386079794062e-06, "loss": 0.1626, "step": 89900 }, { "epoch": 264.71, "learning_rate": 7.970203849953575e-06, "loss": 0.1627, "step": 90000 }, { "epoch": 264.71, "eval_cer": 0.07684930909724946, "eval_loss": 0.39812856912612915, "eval_runtime": 5.3822, "eval_samples_per_second": 66.701, "eval_steps_per_second": 2.23, "eval_wer": 0.28453973883604705, "step": 90000 }, { "epoch": 265.0, "learning_rate": 7.9659761127614e-06, "loss": 0.1689, "step": 90100 }, { "epoch": 265.29, "learning_rate": 7.961745101220146e-06, "loss": 0.1623, "step": 90200 }, { "epoch": 265.59, "learning_rate": 7.957510820000723e-06, "loss": 0.1558, "step": 90300 }, { "epoch": 265.88, "learning_rate": 7.95327327377765e-06, "loss": 0.1607, "step": 90400 }, { "epoch": 266.18, "learning_rate": 7.949032467229056e-06, "loss": 0.1588, "step": 90500 }, { "epoch": 266.47, "learning_rate": 7.94478840503666e-06, "loss": 0.1731, "step": 90600 }, { "epoch": 266.76, "learning_rate": 7.94054109188578e-06, "loss": 0.164, "step": 90700 }, { "epoch": 267.06, "learning_rate": 7.936290532465327e-06, "loss": 0.1632, "step": 90800 }, { "epoch": 267.35, "learning_rate": 7.932036731467787e-06, "loss": 0.1602, "step": 90900 }, { "epoch": 267.65, "learning_rate": 7.927779693589236e-06, "loss": 0.1624, "step": 91000 }, { "epoch": 267.65, "eval_cer": 0.07645699838716707, "eval_loss": 0.40907594561576843, "eval_runtime": 5.3309, "eval_samples_per_second": 67.344, "eval_steps_per_second": 2.251, "eval_wer": 0.28776398516846685, "step": 91000 }, { "epoch": 267.94, "learning_rate": 7.923519423529306e-06, "loss": 0.1629, "step": 91100 }, { "epoch": 268.24, "learning_rate": 7.919255925991218e-06, "loss": 0.1559, "step": 91200 }, { "epoch": 268.53, "learning_rate": 7.91498920568174e-06, "loss": 0.1572, "step": 91300 }, { "epoch": 268.82, "learning_rate": 7.910719267311208e-06, "loss": 0.1595, "step": 91400 }, { "epoch": 269.12, "learning_rate": 7.906446115593504e-06, "loss": 0.1653, "step": 91500 }, { "epoch": 269.41, "learning_rate": 7.90216975524606e-06, "loss": 0.1601, "step": 91600 }, { "epoch": 269.71, "learning_rate": 7.897890190989852e-06, "loss": 0.1628, "step": 91700 }, { "epoch": 270.0, "learning_rate": 7.893607427549386e-06, "loss": 0.1616, "step": 91800 }, { "epoch": 270.29, "learning_rate": 7.889321469652712e-06, "loss": 0.1594, "step": 91900 }, { "epoch": 270.59, "learning_rate": 7.885032322031397e-06, "loss": 0.1612, "step": 92000 }, { "epoch": 270.59, "eval_cer": 0.07641340830826904, "eval_loss": 0.4112890660762787, "eval_runtime": 4.7995, "eval_samples_per_second": 74.799, "eval_steps_per_second": 2.5, "eval_wer": 0.2887312590681928, "step": 92000 }, { "epoch": 270.88, "learning_rate": 7.880739989420528e-06, "loss": 0.1572, "step": 92100 }, { "epoch": 271.18, "learning_rate": 7.876444476558717e-06, "loss": 0.1645, "step": 92200 }, { "epoch": 271.47, "learning_rate": 7.87214578818808e-06, "loss": 0.1638, "step": 92300 }, { "epoch": 271.76, "learning_rate": 7.86784392905424e-06, "loss": 0.1569, "step": 92400 }, { "epoch": 272.06, "learning_rate": 7.863538903906323e-06, "loss": 0.1581, "step": 92500 }, { "epoch": 272.35, "learning_rate": 7.859230717496947e-06, "loss": 0.1641, "step": 92600 }, { "epoch": 272.65, "learning_rate": 7.854919374582222e-06, "loss": 0.1574, "step": 92700 }, { "epoch": 272.94, "learning_rate": 7.850604879921739e-06, "loss": 0.1504, "step": 92800 }, { "epoch": 273.24, "learning_rate": 7.846287238278573e-06, "loss": 0.1584, "step": 92900 }, { "epoch": 273.53, "learning_rate": 7.841966454419276e-06, "loss": 0.1559, "step": 93000 }, { "epoch": 273.53, "eval_cer": 0.07702366941284164, "eval_loss": 0.41579774022102356, "eval_runtime": 4.6321, "eval_samples_per_second": 77.503, "eval_steps_per_second": 2.591, "eval_wer": 0.28776398516846685, "step": 93000 }, { "epoch": 273.82, "learning_rate": 7.837642533113857e-06, "loss": 0.1609, "step": 93100 }, { "epoch": 274.12, "learning_rate": 7.8333154791358e-06, "loss": 0.1566, "step": 93200 }, { "epoch": 274.41, "learning_rate": 7.828985297262043e-06, "loss": 0.1611, "step": 93300 }, { "epoch": 274.71, "learning_rate": 7.824651992272978e-06, "loss": 0.1665, "step": 93400 }, { "epoch": 275.0, "learning_rate": 7.820315568952442e-06, "loss": 0.1487, "step": 93500 }, { "epoch": 275.29, "learning_rate": 7.81597603208772e-06, "loss": 0.1605, "step": 93600 }, { "epoch": 275.59, "learning_rate": 7.811633386469528e-06, "loss": 0.164, "step": 93700 }, { "epoch": 275.88, "learning_rate": 7.80728763689202e-06, "loss": 0.1566, "step": 93800 }, { "epoch": 276.18, "learning_rate": 7.80293878815277e-06, "loss": 0.1577, "step": 93900 }, { "epoch": 276.47, "learning_rate": 7.798630379785097e-06, "loss": 0.155, "step": 94000 }, { "epoch": 276.47, "eval_cer": 0.0757595571247984, "eval_loss": 0.41765499114990234, "eval_runtime": 4.7179, "eval_samples_per_second": 76.093, "eval_steps_per_second": 2.543, "eval_wer": 0.2843785265194261, "step": 94000 }, { "epoch": 276.76, "learning_rate": 7.794275378000553e-06, "loss": 0.158, "step": 94100 }, { "epoch": 277.06, "learning_rate": 7.789917291419415e-06, "loss": 0.1537, "step": 94200 }, { "epoch": 277.35, "learning_rate": 7.785556124852882e-06, "loss": 0.1545, "step": 94300 }, { "epoch": 277.65, "learning_rate": 7.78119188311555e-06, "loss": 0.1583, "step": 94400 }, { "epoch": 277.94, "learning_rate": 7.776824571025409e-06, "loss": 0.1493, "step": 94500 }, { "epoch": 278.24, "learning_rate": 7.772454193403844e-06, "loss": 0.156, "step": 94600 }, { "epoch": 278.53, "learning_rate": 7.768080755075625e-06, "loss": 0.1642, "step": 94700 }, { "epoch": 278.82, "learning_rate": 7.76370426086889e-06, "loss": 0.1466, "step": 94800 }, { "epoch": 279.12, "learning_rate": 7.759324715615161e-06, "loss": 0.1542, "step": 94900 }, { "epoch": 279.41, "learning_rate": 7.754942124149329e-06, "loss": 0.162, "step": 95000 }, { "epoch": 279.41, "eval_cer": 0.07510570594132776, "eval_loss": 0.41507747769355774, "eval_runtime": 4.8011, "eval_samples_per_second": 74.775, "eval_steps_per_second": 2.499, "eval_wer": 0.2838948895695631, "step": 95000 }, { "epoch": 279.71, "learning_rate": 7.750556491309638e-06, "loss": 0.1493, "step": 95100 }, { "epoch": 280.0, "learning_rate": 7.7461678219377e-06, "loss": 0.1503, "step": 95200 }, { "epoch": 280.29, "learning_rate": 7.741776120878473e-06, "loss": 0.1486, "step": 95300 }, { "epoch": 280.59, "learning_rate": 7.737381392980263e-06, "loss": 0.1515, "step": 95400 }, { "epoch": 280.88, "learning_rate": 7.732983643094722e-06, "loss": 0.1532, "step": 95500 }, { "epoch": 281.18, "learning_rate": 7.728582876076831e-06, "loss": 0.1558, "step": 95600 }, { "epoch": 281.47, "learning_rate": 7.724179096784907e-06, "loss": 0.1523, "step": 95700 }, { "epoch": 281.76, "learning_rate": 7.719772310080592e-06, "loss": 0.1518, "step": 95800 }, { "epoch": 282.06, "learning_rate": 7.715362520828843e-06, "loss": 0.1553, "step": 95900 }, { "epoch": 282.35, "learning_rate": 7.71094973389794e-06, "loss": 0.1483, "step": 96000 }, { "epoch": 282.35, "eval_cer": 0.07619545791377882, "eval_loss": 0.4204952120780945, "eval_runtime": 4.5847, "eval_samples_per_second": 78.304, "eval_steps_per_second": 2.617, "eval_wer": 0.28453973883604705, "step": 96000 }, { "epoch": 282.65, "learning_rate": 7.706533954159466e-06, "loss": 0.1479, "step": 96100 }, { "epoch": 282.94, "learning_rate": 7.702115186488308e-06, "loss": 0.1518, "step": 96200 }, { "epoch": 283.24, "learning_rate": 7.697693435762656e-06, "loss": 0.1515, "step": 96300 }, { "epoch": 283.53, "learning_rate": 7.693268706863994e-06, "loss": 0.1527, "step": 96400 }, { "epoch": 283.82, "learning_rate": 7.688841004677086e-06, "loss": 0.145, "step": 96500 }, { "epoch": 284.12, "learning_rate": 7.684410334089984e-06, "loss": 0.1493, "step": 96600 }, { "epoch": 284.41, "learning_rate": 7.679976699994016e-06, "loss": 0.1547, "step": 96700 }, { "epoch": 284.71, "learning_rate": 7.675540107283781e-06, "loss": 0.1471, "step": 96800 }, { "epoch": 285.0, "learning_rate": 7.671100560857147e-06, "loss": 0.1592, "step": 96900 }, { "epoch": 285.29, "learning_rate": 7.666702505148194e-06, "loss": 0.1566, "step": 97000 }, { "epoch": 285.29, "eval_cer": 0.07549801665141014, "eval_loss": 0.424325555562973, "eval_runtime": 5.013, "eval_samples_per_second": 71.614, "eval_steps_per_second": 2.394, "eval_wer": 0.2843785265194261, "step": 97000 }, { "epoch": 285.59, "learning_rate": 7.662257095410217e-06, "loss": 0.1477, "step": 97100 }, { "epoch": 285.88, "learning_rate": 7.657808746619888e-06, "loss": 0.1592, "step": 97200 }, { "epoch": 286.18, "learning_rate": 7.65335746368805e-06, "loss": 0.1451, "step": 97300 }, { "epoch": 286.47, "learning_rate": 7.64890325152879e-06, "loss": 0.1537, "step": 97400 }, { "epoch": 286.76, "learning_rate": 7.644446115059424e-06, "loss": 0.151, "step": 97500 }, { "epoch": 287.06, "learning_rate": 7.6400306741939e-06, "loss": 0.1557, "step": 97600 }, { "epoch": 287.35, "learning_rate": 7.635567732989454e-06, "loss": 0.1524, "step": 97700 }, { "epoch": 287.65, "learning_rate": 7.631101882196917e-06, "loss": 0.1494, "step": 97800 }, { "epoch": 287.94, "learning_rate": 7.626633126746452e-06, "loss": 0.1485, "step": 97900 }, { "epoch": 288.24, "learning_rate": 7.622161471571434e-06, "loss": 0.143, "step": 98000 }, { "epoch": 288.24, "eval_cer": 0.07684930909724946, "eval_loss": 0.4253920018672943, "eval_runtime": 4.609, "eval_samples_per_second": 77.891, "eval_steps_per_second": 2.604, "eval_wer": 0.29018216991778173, "step": 98000 }, { "epoch": 288.53, "learning_rate": 7.617686921608436e-06, "loss": 0.1556, "step": 98100 }, { "epoch": 288.82, "learning_rate": 7.613209481797228e-06, "loss": 0.1475, "step": 98200 }, { "epoch": 289.12, "learning_rate": 7.60872915708077e-06, "loss": 0.1514, "step": 98300 }, { "epoch": 289.41, "learning_rate": 7.604245952405205e-06, "loss": 0.1576, "step": 98400 }, { "epoch": 289.71, "learning_rate": 7.599759872719859e-06, "loss": 0.142, "step": 98500 }, { "epoch": 290.0, "learning_rate": 7.595270922977229e-06, "loss": 0.1549, "step": 98600 }, { "epoch": 290.29, "learning_rate": 7.590779108132982e-06, "loss": 0.1465, "step": 98700 }, { "epoch": 290.59, "learning_rate": 7.5862844331459475e-06, "loss": 0.1434, "step": 98800 }, { "epoch": 290.88, "learning_rate": 7.581786902978113e-06, "loss": 0.1414, "step": 98900 }, { "epoch": 291.18, "learning_rate": 7.577286522594618e-06, "loss": 0.1463, "step": 99000 }, { "epoch": 291.18, "eval_cer": 0.07532365633581797, "eval_loss": 0.4343777000904083, "eval_runtime": 4.7592, "eval_samples_per_second": 75.433, "eval_steps_per_second": 2.521, "eval_wer": 0.2826051910365952, "step": 99000 }, { "epoch": 291.47, "learning_rate": 7.572783296963745e-06, "loss": 0.1457, "step": 99100 }, { "epoch": 291.76, "learning_rate": 7.568277231056922e-06, "loss": 0.1504, "step": 99200 }, { "epoch": 292.06, "learning_rate": 7.563768329848713e-06, "loss": 0.1503, "step": 99300 }, { "epoch": 292.35, "learning_rate": 7.559256598316809e-06, "loss": 0.1444, "step": 99400 }, { "epoch": 292.65, "learning_rate": 7.5547420414420294e-06, "loss": 0.1469, "step": 99500 }, { "epoch": 292.94, "learning_rate": 7.5502246642083056e-06, "loss": 0.1487, "step": 99600 }, { "epoch": 293.24, "learning_rate": 7.545704471602689e-06, "loss": 0.1445, "step": 99700 }, { "epoch": 293.53, "learning_rate": 7.541226712540208e-06, "loss": 0.146, "step": 99800 }, { "epoch": 293.82, "learning_rate": 7.5367009321935426e-06, "loss": 0.1479, "step": 99900 }, { "epoch": 294.12, "learning_rate": 7.53217235140478e-06, "loss": 0.149, "step": 100000 }, { "epoch": 294.12, "eval_cer": 0.07610827775598274, "eval_loss": 0.4314731955528259, "eval_runtime": 4.9571, "eval_samples_per_second": 72.421, "eval_steps_per_second": 2.421, "eval_wer": 0.2847009511526681, "step": 100000 }, { "epoch": 294.41, "learning_rate": 7.527640975173338e-06, "loss": 0.1434, "step": 100100 }, { "epoch": 294.71, "learning_rate": 7.523106808501723e-06, "loss": 0.1478, "step": 100200 }, { "epoch": 295.0, "learning_rate": 7.5185698563955214e-06, "loss": 0.1441, "step": 100300 }, { "epoch": 295.29, "learning_rate": 7.514030123863388e-06, "loss": 0.1417, "step": 100400 }, { "epoch": 295.59, "learning_rate": 7.509487615917055e-06, "loss": 0.1458, "step": 100500 }, { "epoch": 295.88, "learning_rate": 7.504942337571315e-06, "loss": 0.1491, "step": 100600 }, { "epoch": 296.18, "learning_rate": 7.500394293844018e-06, "loss": 0.1427, "step": 100700 }, { "epoch": 296.47, "learning_rate": 7.495843489756072e-06, "loss": 0.153, "step": 100800 }, { "epoch": 296.76, "learning_rate": 7.491289930331425e-06, "loss": 0.1457, "step": 100900 }, { "epoch": 297.06, "learning_rate": 7.486733620597073e-06, "loss": 0.144, "step": 101000 }, { "epoch": 297.06, "eval_cer": 0.07554160673030819, "eval_loss": 0.4298832416534424, "eval_runtime": 5.3958, "eval_samples_per_second": 66.533, "eval_steps_per_second": 2.224, "eval_wer": 0.2834112526197001, "step": 101000 }, { "epoch": 297.35, "learning_rate": 7.482174565583045e-06, "loss": 0.138, "step": 101100 }, { "epoch": 297.65, "learning_rate": 7.4776127703224025e-06, "loss": 0.1473, "step": 101200 }, { "epoch": 297.94, "learning_rate": 7.4730482398512305e-06, "loss": 0.1439, "step": 101300 }, { "epoch": 298.24, "learning_rate": 7.468480979208635e-06, "loss": 0.1396, "step": 101400 }, { "epoch": 298.53, "learning_rate": 7.463910993436735e-06, "loss": 0.1436, "step": 101500 }, { "epoch": 298.82, "learning_rate": 7.4593382875806576e-06, "loss": 0.147, "step": 101600 }, { "epoch": 299.12, "learning_rate": 7.454762866688535e-06, "loss": 0.1414, "step": 101700 }, { "epoch": 299.41, "learning_rate": 7.4501847358114945e-06, "loss": 0.1399, "step": 101800 }, { "epoch": 299.71, "learning_rate": 7.445603900003656e-06, "loss": 0.1494, "step": 101900 }, { "epoch": 300.0, "learning_rate": 7.441020364322124e-06, "loss": 0.1415, "step": 102000 }, { "epoch": 300.0, "eval_cer": 0.07610827775598274, "eval_loss": 0.4383721649646759, "eval_runtime": 5.4378, "eval_samples_per_second": 66.019, "eval_steps_per_second": 2.207, "eval_wer": 0.28518458810253106, "step": 102000 }, { "epoch": 300.29, "learning_rate": 7.4364341338269885e-06, "loss": 0.1471, "step": 102100 }, { "epoch": 300.59, "learning_rate": 7.431845213581309e-06, "loss": 0.145, "step": 102200 }, { "epoch": 300.88, "learning_rate": 7.427253608651116e-06, "loss": 0.1422, "step": 102300 }, { "epoch": 301.18, "learning_rate": 7.422659324105404e-06, "loss": 0.1493, "step": 102400 }, { "epoch": 301.47, "learning_rate": 7.4180623650161274e-06, "loss": 0.1512, "step": 102500 }, { "epoch": 301.76, "learning_rate": 7.413462736458192e-06, "loss": 0.1461, "step": 102600 }, { "epoch": 302.06, "learning_rate": 7.408860443509448e-06, "loss": 0.1468, "step": 102700 }, { "epoch": 302.35, "learning_rate": 7.404255491250691e-06, "loss": 0.1334, "step": 102800 }, { "epoch": 302.65, "learning_rate": 7.3996478847656525e-06, "loss": 0.1459, "step": 102900 }, { "epoch": 302.94, "learning_rate": 7.39503762914099e-06, "loss": 0.1456, "step": 103000 }, { "epoch": 302.94, "eval_cer": 0.0748441654679395, "eval_loss": 0.4347250163555145, "eval_runtime": 4.8036, "eval_samples_per_second": 74.735, "eval_steps_per_second": 2.498, "eval_wer": 0.2801870062872803, "step": 103000 }, { "epoch": 303.24, "learning_rate": 7.390424729466288e-06, "loss": 0.1469, "step": 103100 }, { "epoch": 303.53, "learning_rate": 7.3858091908340515e-06, "loss": 0.14, "step": 103200 }, { "epoch": 303.82, "learning_rate": 7.381191018339697e-06, "loss": 0.1417, "step": 103300 }, { "epoch": 304.12, "learning_rate": 7.376570217081548e-06, "loss": 0.1355, "step": 103400 }, { "epoch": 304.41, "learning_rate": 7.371946792160831e-06, "loss": 0.1428, "step": 103500 }, { "epoch": 304.71, "learning_rate": 7.367320748681672e-06, "loss": 0.1422, "step": 103600 }, { "epoch": 305.0, "learning_rate": 7.362692091751083e-06, "loss": 0.1432, "step": 103700 }, { "epoch": 305.29, "learning_rate": 7.3580608264789614e-06, "loss": 0.1523, "step": 103800 }, { "epoch": 305.59, "learning_rate": 7.353426957978087e-06, "loss": 0.1367, "step": 103900 }, { "epoch": 305.88, "learning_rate": 7.348790491364114e-06, "loss": 0.1442, "step": 104000 }, { "epoch": 305.88, "eval_cer": 0.07562878688810427, "eval_loss": 0.4230651557445526, "eval_runtime": 4.398, "eval_samples_per_second": 81.628, "eval_steps_per_second": 2.729, "eval_wer": 0.28244397871997423, "step": 104000 }, { "epoch": 306.18, "learning_rate": 7.3441514317555615e-06, "loss": 0.1306, "step": 104100 }, { "epoch": 306.47, "learning_rate": 7.339509784273812e-06, "loss": 0.1443, "step": 104200 }, { "epoch": 306.76, "learning_rate": 7.334865554043108e-06, "loss": 0.1424, "step": 104300 }, { "epoch": 307.06, "learning_rate": 7.33021874619054e-06, "loss": 0.1352, "step": 104400 }, { "epoch": 307.35, "learning_rate": 7.325569365846044e-06, "loss": 0.1362, "step": 104500 }, { "epoch": 307.65, "learning_rate": 7.320917418142398e-06, "loss": 0.143, "step": 104600 }, { "epoch": 307.94, "learning_rate": 7.3162629082152136e-06, "loss": 0.1449, "step": 104700 }, { "epoch": 308.24, "learning_rate": 7.311605841202931e-06, "loss": 0.142, "step": 104800 }, { "epoch": 308.53, "learning_rate": 7.306946222246813e-06, "loss": 0.151, "step": 104900 }, { "epoch": 308.82, "learning_rate": 7.302284056490938e-06, "loss": 0.1357, "step": 105000 }, { "epoch": 308.82, "eval_cer": 0.07510570594132776, "eval_loss": 0.44283321499824524, "eval_runtime": 4.9758, "eval_samples_per_second": 72.149, "eval_steps_per_second": 2.412, "eval_wer": 0.28131549250362725, "step": 105000 }, { "epoch": 309.12, "learning_rate": 7.297619349082201e-06, "loss": 0.1349, "step": 105100 }, { "epoch": 309.41, "learning_rate": 7.292952105170298e-06, "loss": 0.1374, "step": 105200 }, { "epoch": 309.71, "learning_rate": 7.288282329907726e-06, "loss": 0.143, "step": 105300 }, { "epoch": 310.0, "learning_rate": 7.28361002844978e-06, "loss": 0.1453, "step": 105400 }, { "epoch": 310.29, "learning_rate": 7.27893520595454e-06, "loss": 0.142, "step": 105500 }, { "epoch": 310.59, "learning_rate": 7.274257867582868e-06, "loss": 0.135, "step": 105600 }, { "epoch": 310.88, "learning_rate": 7.269578018498409e-06, "loss": 0.1452, "step": 105700 }, { "epoch": 311.18, "learning_rate": 7.264942499799369e-06, "loss": 0.1379, "step": 105800 }, { "epoch": 311.47, "learning_rate": 7.260257669769517e-06, "loss": 0.1339, "step": 105900 }, { "epoch": 311.76, "learning_rate": 7.255570344482677e-06, "loss": 0.1446, "step": 106000 }, { "epoch": 311.76, "eval_cer": 0.07532365633581797, "eval_loss": 0.44697633385658264, "eval_runtime": 5.0129, "eval_samples_per_second": 71.616, "eval_steps_per_second": 2.394, "eval_wer": 0.2842173142028051, "step": 106000 }, { "epoch": 312.06, "learning_rate": 7.250880529113518e-06, "loss": 0.1406, "step": 106100 }, { "epoch": 312.35, "learning_rate": 7.246188228839456e-06, "loss": 0.1378, "step": 106200 }, { "epoch": 312.65, "learning_rate": 7.241493448840649e-06, "loss": 0.1446, "step": 106300 }, { "epoch": 312.94, "learning_rate": 7.236796194299992e-06, "loss": 0.1424, "step": 106400 }, { "epoch": 313.24, "learning_rate": 7.232096470403117e-06, "loss": 0.1387, "step": 106500 }, { "epoch": 313.53, "learning_rate": 7.227394282338378e-06, "loss": 0.1411, "step": 106600 }, { "epoch": 313.82, "learning_rate": 7.222689635296852e-06, "loss": 0.1337, "step": 106700 }, { "epoch": 314.12, "learning_rate": 7.217982534472326e-06, "loss": 0.1403, "step": 106800 }, { "epoch": 314.41, "learning_rate": 7.213320092658842e-06, "loss": 0.1401, "step": 106900 }, { "epoch": 314.71, "learning_rate": 7.208608124268647e-06, "loss": 0.1345, "step": 107000 }, { "epoch": 314.71, "eval_cer": 0.07471339523124537, "eval_loss": 0.457571417093277, "eval_runtime": 4.9987, "eval_samples_per_second": 71.818, "eval_steps_per_second": 2.401, "eval_wer": 0.28083185555376433, "step": 107000 }, { "epoch": 315.0, "learning_rate": 7.20389371764102e-06, "loss": 0.1436, "step": 107100 }, { "epoch": 315.29, "learning_rate": 7.199176877980525e-06, "loss": 0.1302, "step": 107200 }, { "epoch": 315.59, "learning_rate": 7.194457610494413e-06, "loss": 0.1348, "step": 107300 }, { "epoch": 315.88, "learning_rate": 7.189735920392614e-06, "loss": 0.1376, "step": 107400 }, { "epoch": 316.18, "learning_rate": 7.185011812887735e-06, "loss": 0.1341, "step": 107500 }, { "epoch": 316.47, "learning_rate": 7.180285293195048e-06, "loss": 0.1361, "step": 107600 }, { "epoch": 316.76, "learning_rate": 7.1755563665324905e-06, "loss": 0.1361, "step": 107700 }, { "epoch": 317.06, "learning_rate": 7.170825038120654e-06, "loss": 0.1341, "step": 107800 }, { "epoch": 317.35, "learning_rate": 7.1660913131827855e-06, "loss": 0.1393, "step": 107900 }, { "epoch": 317.65, "learning_rate": 7.161355196944777e-06, "loss": 0.137, "step": 108000 }, { "epoch": 317.65, "eval_cer": 0.07562878688810427, "eval_loss": 0.45369425415992737, "eval_runtime": 4.9175, "eval_samples_per_second": 73.004, "eval_steps_per_second": 2.44, "eval_wer": 0.285990649685636, "step": 108000 }, { "epoch": 317.94, "learning_rate": 7.156616694635158e-06, "loss": 0.1378, "step": 108100 }, { "epoch": 318.24, "learning_rate": 7.151875811485094e-06, "loss": 0.1325, "step": 108200 }, { "epoch": 318.53, "learning_rate": 7.147132552728379e-06, "loss": 0.1417, "step": 108300 }, { "epoch": 318.82, "learning_rate": 7.142386923601428e-06, "loss": 0.1339, "step": 108400 }, { "epoch": 319.12, "learning_rate": 7.137638929343274e-06, "loss": 0.143, "step": 108500 }, { "epoch": 319.41, "learning_rate": 7.132888575195561e-06, "loss": 0.1337, "step": 108600 }, { "epoch": 319.71, "learning_rate": 7.128135866402539e-06, "loss": 0.1351, "step": 108700 }, { "epoch": 320.0, "learning_rate": 7.123380808211055e-06, "loss": 0.1378, "step": 108800 }, { "epoch": 320.29, "learning_rate": 7.118623405870554e-06, "loss": 0.135, "step": 108900 }, { "epoch": 320.59, "learning_rate": 7.113863664633064e-06, "loss": 0.1318, "step": 109000 }, { "epoch": 320.59, "eval_cer": 0.07523647617802189, "eval_loss": 0.4415852725505829, "eval_runtime": 5.3729, "eval_samples_per_second": 66.817, "eval_steps_per_second": 2.233, "eval_wer": 0.28163791713686925, "step": 109000 }, { "epoch": 320.88, "learning_rate": 7.109101589753197e-06, "loss": 0.1359, "step": 109100 }, { "epoch": 321.18, "learning_rate": 7.1043371864881424e-06, "loss": 0.13, "step": 109200 }, { "epoch": 321.47, "learning_rate": 7.099570460097659e-06, "loss": 0.1373, "step": 109300 }, { "epoch": 321.76, "learning_rate": 7.094849117742743e-06, "loss": 0.1411, "step": 109400 }, { "epoch": 322.06, "learning_rate": 7.090077783990845e-06, "loss": 0.1401, "step": 109500 }, { "epoch": 322.35, "learning_rate": 7.0853041428554725e-06, "loss": 0.1341, "step": 109600 }, { "epoch": 322.65, "learning_rate": 7.080528199606582e-06, "loss": 0.1352, "step": 109700 }, { "epoch": 322.94, "learning_rate": 7.075749959516676e-06, "loss": 0.1343, "step": 109800 }, { "epoch": 323.24, "learning_rate": 7.0709694278607836e-06, "loss": 0.142, "step": 109900 }, { "epoch": 323.53, "learning_rate": 7.066186609916472e-06, "loss": 0.137, "step": 110000 }, { "epoch": 323.53, "eval_cer": 0.07414672420557081, "eval_loss": 0.4473969638347626, "eval_runtime": 4.4522, "eval_samples_per_second": 80.635, "eval_steps_per_second": 2.695, "eval_wer": 0.27760760922134453, "step": 110000 }, { "epoch": 323.82, "learning_rate": 7.06140151096383e-06, "loss": 0.1354, "step": 110100 }, { "epoch": 324.12, "learning_rate": 7.056614136285462e-06, "loss": 0.1351, "step": 110200 }, { "epoch": 324.41, "learning_rate": 7.051824491166489e-06, "loss": 0.1303, "step": 110300 }, { "epoch": 324.71, "learning_rate": 7.047032580894535e-06, "loss": 0.1328, "step": 110400 }, { "epoch": 325.0, "learning_rate": 7.042238410759725e-06, "loss": 0.129, "step": 110500 }, { "epoch": 325.29, "learning_rate": 7.0374419860546804e-06, "loss": 0.1365, "step": 110600 }, { "epoch": 325.59, "learning_rate": 7.032643312074512e-06, "loss": 0.1309, "step": 110700 }, { "epoch": 325.88, "learning_rate": 7.027842394116812e-06, "loss": 0.1313, "step": 110800 }, { "epoch": 326.18, "learning_rate": 7.02303923748165e-06, "loss": 0.1343, "step": 110900 }, { "epoch": 326.47, "learning_rate": 7.018233847471566e-06, "loss": 0.1351, "step": 111000 }, { "epoch": 326.47, "eval_cer": 0.07571596704590035, "eval_loss": 0.45716190338134766, "eval_runtime": 4.8972, "eval_samples_per_second": 73.307, "eval_steps_per_second": 2.45, "eval_wer": 0.28357246493632116, "step": 111000 }, { "epoch": 326.76, "learning_rate": 7.0134262293915704e-06, "loss": 0.1296, "step": 111100 }, { "epoch": 327.06, "learning_rate": 7.008616388549128e-06, "loss": 0.1242, "step": 111200 }, { "epoch": 327.35, "learning_rate": 7.003804330254161e-06, "loss": 0.1326, "step": 111300 }, { "epoch": 327.65, "learning_rate": 6.998990059819037e-06, "loss": 0.1379, "step": 111400 }, { "epoch": 327.94, "learning_rate": 6.994173582558566e-06, "loss": 0.1339, "step": 111500 }, { "epoch": 328.24, "learning_rate": 6.989354903789993e-06, "loss": 0.139, "step": 111600 }, { "epoch": 328.53, "learning_rate": 6.984534028833002e-06, "loss": 0.1295, "step": 111700 }, { "epoch": 328.82, "learning_rate": 6.97971096300969e-06, "loss": 0.1318, "step": 111800 }, { "epoch": 329.12, "learning_rate": 6.974885711644581e-06, "loss": 0.1331, "step": 111900 }, { "epoch": 329.41, "learning_rate": 6.9700582800646064e-06, "loss": 0.1357, "step": 112000 }, { "epoch": 329.41, "eval_cer": 0.0754544265725121, "eval_loss": 0.4541434347629547, "eval_runtime": 4.8992, "eval_samples_per_second": 73.277, "eval_steps_per_second": 2.449, "eval_wer": 0.28212155408673223, "step": 112000 }, { "epoch": 329.71, "learning_rate": 6.965228673599105e-06, "loss": 0.1317, "step": 112100 }, { "epoch": 330.0, "learning_rate": 6.960396897579821e-06, "loss": 0.1278, "step": 112200 }, { "epoch": 330.29, "learning_rate": 6.9555629573408886e-06, "loss": 0.1307, "step": 112300 }, { "epoch": 330.59, "learning_rate": 6.950726858218837e-06, "loss": 0.1302, "step": 112400 }, { "epoch": 330.88, "learning_rate": 6.945888605552571e-06, "loss": 0.1333, "step": 112500 }, { "epoch": 331.18, "learning_rate": 6.94104820468338e-06, "loss": 0.1276, "step": 112600 }, { "epoch": 331.47, "learning_rate": 6.93620566095492e-06, "loss": 0.1303, "step": 112700 }, { "epoch": 331.76, "learning_rate": 6.931360979713216e-06, "loss": 0.1302, "step": 112800 }, { "epoch": 332.06, "learning_rate": 6.926514166306653e-06, "loss": 0.1292, "step": 112900 }, { "epoch": 332.35, "learning_rate": 6.921665226085965e-06, "loss": 0.1362, "step": 113000 }, { "epoch": 332.35, "eval_cer": 0.0760646876770847, "eval_loss": 0.44597867131233215, "eval_runtime": 5.0068, "eval_samples_per_second": 71.703, "eval_steps_per_second": 2.397, "eval_wer": 0.2866354989521199, "step": 113000 }, { "epoch": 332.65, "learning_rate": 6.9168141644042386e-06, "loss": 0.1331, "step": 113100 }, { "epoch": 332.94, "learning_rate": 6.9119609866169e-06, "loss": 0.1309, "step": 113200 }, { "epoch": 333.24, "learning_rate": 6.907105698081715e-06, "loss": 0.1275, "step": 113300 }, { "epoch": 333.53, "learning_rate": 6.9022483041587785e-06, "loss": 0.1323, "step": 113400 }, { "epoch": 333.82, "learning_rate": 6.897486020635022e-06, "loss": 0.129, "step": 113500 }, { "epoch": 334.12, "learning_rate": 6.892624473866769e-06, "loss": 0.1377, "step": 113600 }, { "epoch": 334.41, "learning_rate": 6.8877608376976024e-06, "loss": 0.1258, "step": 113700 }, { "epoch": 334.71, "learning_rate": 6.88289511749683e-06, "loss": 0.1307, "step": 113800 }, { "epoch": 335.0, "learning_rate": 6.878027318636063e-06, "loss": 0.1331, "step": 113900 }, { "epoch": 335.29, "learning_rate": 6.873157446489203e-06, "loss": 0.1279, "step": 114000 }, { "epoch": 335.29, "eval_cer": 0.07371082341659038, "eval_loss": 0.4529751241207123, "eval_runtime": 4.2881, "eval_samples_per_second": 83.72, "eval_steps_per_second": 2.798, "eval_wer": 0.2758342737385136, "step": 114000 }, { "epoch": 335.59, "learning_rate": 6.868285506432445e-06, "loss": 0.1319, "step": 114100 }, { "epoch": 335.88, "learning_rate": 6.863411503844266e-06, "loss": 0.1291, "step": 114200 }, { "epoch": 336.18, "learning_rate": 6.858535444105418e-06, "loss": 0.1266, "step": 114300 }, { "epoch": 336.47, "learning_rate": 6.8536573325989285e-06, "loss": 0.1277, "step": 114400 }, { "epoch": 336.76, "learning_rate": 6.848777174710084e-06, "loss": 0.1297, "step": 114500 }, { "epoch": 337.06, "learning_rate": 6.843894975826434e-06, "loss": 0.1306, "step": 114600 }, { "epoch": 337.35, "learning_rate": 6.839010741337779e-06, "loss": 0.1285, "step": 114700 }, { "epoch": 337.65, "learning_rate": 6.834124476636171e-06, "loss": 0.1291, "step": 114800 }, { "epoch": 337.94, "learning_rate": 6.829236187115898e-06, "loss": 0.1378, "step": 114900 }, { "epoch": 338.24, "learning_rate": 6.8243458781734866e-06, "loss": 0.1345, "step": 115000 }, { "epoch": 338.24, "eval_cer": 0.07427749444226495, "eval_loss": 0.47045978903770447, "eval_runtime": 5.4296, "eval_samples_per_second": 66.119, "eval_steps_per_second": 2.21, "eval_wer": 0.27873609543769146, "step": 115000 }, { "epoch": 338.53, "learning_rate": 6.81945355520769e-06, "loss": 0.1245, "step": 115100 }, { "epoch": 338.82, "learning_rate": 6.81455922361949e-06, "loss": 0.1318, "step": 115200 }, { "epoch": 339.12, "learning_rate": 6.8096628888120795e-06, "loss": 0.1235, "step": 115300 }, { "epoch": 339.41, "learning_rate": 6.804764556190868e-06, "loss": 0.1266, "step": 115400 }, { "epoch": 339.71, "learning_rate": 6.7998642311634675e-06, "loss": 0.1291, "step": 115500 }, { "epoch": 340.0, "learning_rate": 6.794961919139691e-06, "loss": 0.1256, "step": 115600 }, { "epoch": 340.29, "learning_rate": 6.790057625531546e-06, "loss": 0.1342, "step": 115700 }, { "epoch": 340.59, "learning_rate": 6.785151355753222e-06, "loss": 0.1247, "step": 115800 }, { "epoch": 340.88, "learning_rate": 6.780243115221098e-06, "loss": 0.1296, "step": 115900 }, { "epoch": 341.18, "learning_rate": 6.775332909353724e-06, "loss": 0.132, "step": 116000 }, { "epoch": 341.18, "eval_cer": 0.07466980515234732, "eval_loss": 0.4567488431930542, "eval_runtime": 5.3257, "eval_samples_per_second": 67.409, "eval_steps_per_second": 2.253, "eval_wer": 0.27841367080444945, "step": 116000 }, { "epoch": 341.47, "learning_rate": 6.770420743571821e-06, "loss": 0.1232, "step": 116100 }, { "epoch": 341.76, "learning_rate": 6.765506623298272e-06, "loss": 0.1265, "step": 116200 }, { "epoch": 342.06, "learning_rate": 6.760590553958122e-06, "loss": 0.1267, "step": 116300 }, { "epoch": 342.35, "learning_rate": 6.755672540978561e-06, "loss": 0.126, "step": 116400 }, { "epoch": 342.65, "learning_rate": 6.750752589788931e-06, "loss": 0.1285, "step": 116500 }, { "epoch": 342.94, "learning_rate": 6.74583070582071e-06, "loss": 0.1268, "step": 116600 }, { "epoch": 343.24, "learning_rate": 6.740906894507514e-06, "loss": 0.1268, "step": 116700 }, { "epoch": 343.53, "learning_rate": 6.735981161285079e-06, "loss": 0.1222, "step": 116800 }, { "epoch": 343.82, "learning_rate": 6.73105351159127e-06, "loss": 0.1282, "step": 116900 }, { "epoch": 344.12, "learning_rate": 6.7261239508660655e-06, "loss": 0.1282, "step": 117000 }, { "epoch": 344.12, "eval_cer": 0.07462621507344928, "eval_loss": 0.45933759212493896, "eval_runtime": 4.7882, "eval_samples_per_second": 74.976, "eval_steps_per_second": 2.506, "eval_wer": 0.28002579397065935, "step": 117000 }, { "epoch": 344.41, "learning_rate": 6.721192484551554e-06, "loss": 0.1233, "step": 117100 }, { "epoch": 344.71, "learning_rate": 6.716259118091923e-06, "loss": 0.1296, "step": 117200 }, { "epoch": 345.0, "learning_rate": 6.711323856933466e-06, "loss": 0.1248, "step": 117300 }, { "epoch": 345.29, "learning_rate": 6.706386706524562e-06, "loss": 0.1272, "step": 117400 }, { "epoch": 345.59, "learning_rate": 6.701447672315678e-06, "loss": 0.1314, "step": 117500 }, { "epoch": 345.88, "learning_rate": 6.696506759759362e-06, "loss": 0.1268, "step": 117600 }, { "epoch": 346.18, "learning_rate": 6.691563974310231e-06, "loss": 0.1285, "step": 117700 }, { "epoch": 346.47, "learning_rate": 6.686619321424976e-06, "loss": 0.1218, "step": 117800 }, { "epoch": 346.76, "learning_rate": 6.681672806562342e-06, "loss": 0.1261, "step": 117900 }, { "epoch": 347.06, "learning_rate": 6.676724435183138e-06, "loss": 0.1297, "step": 118000 }, { "epoch": 347.06, "eval_cer": 0.07497493570463362, "eval_loss": 0.4662339687347412, "eval_runtime": 4.4705, "eval_samples_per_second": 80.304, "eval_steps_per_second": 2.684, "eval_wer": 0.28034821860390136, "step": 118000 }, { "epoch": 347.35, "learning_rate": 6.671774212750215e-06, "loss": 0.1214, "step": 118100 }, { "epoch": 347.65, "learning_rate": 6.666822144728472e-06, "loss": 0.1347, "step": 118200 }, { "epoch": 347.94, "learning_rate": 6.661868236584843e-06, "loss": 0.1279, "step": 118300 }, { "epoch": 348.24, "learning_rate": 6.656912493788296e-06, "loss": 0.1223, "step": 118400 }, { "epoch": 348.53, "learning_rate": 6.651954921809825e-06, "loss": 0.1335, "step": 118500 }, { "epoch": 348.82, "learning_rate": 6.64699552612244e-06, "loss": 0.1201, "step": 118600 }, { "epoch": 349.12, "learning_rate": 6.642034312201164e-06, "loss": 0.1347, "step": 118700 }, { "epoch": 349.41, "learning_rate": 6.637071285523029e-06, "loss": 0.1183, "step": 118800 }, { "epoch": 349.71, "learning_rate": 6.6321561088346606e-06, "loss": 0.1266, "step": 118900 }, { "epoch": 350.0, "learning_rate": 6.627189491072736e-06, "loss": 0.1237, "step": 119000 }, { "epoch": 350.0, "eval_cer": 0.07458262499455125, "eval_loss": 0.4724867343902588, "eval_runtime": 4.6268, "eval_samples_per_second": 77.592, "eval_steps_per_second": 2.594, "eval_wer": 0.2817991294534902, "step": 119000 }, { "epoch": 350.29, "learning_rate": 6.622221076942194e-06, "loss": 0.1275, "step": 119100 }, { "epoch": 350.59, "learning_rate": 6.617250871928014e-06, "loss": 0.1247, "step": 119200 }, { "epoch": 350.88, "learning_rate": 6.612278881517154e-06, "loss": 0.1222, "step": 119300 }, { "epoch": 351.18, "learning_rate": 6.607354857694247e-06, "loss": 0.1243, "step": 119400 }, { "epoch": 351.47, "learning_rate": 6.602379330675764e-06, "loss": 0.1328, "step": 119500 }, { "epoch": 351.76, "learning_rate": 6.5974020346783354e-06, "loss": 0.1303, "step": 119600 }, { "epoch": 352.06, "learning_rate": 6.592422975196755e-06, "loss": 0.1245, "step": 119700 }, { "epoch": 352.35, "learning_rate": 6.5874421577277505e-06, "loss": 0.1286, "step": 119800 }, { "epoch": 352.65, "learning_rate": 6.582459587769996e-06, "loss": 0.1287, "step": 119900 }, { "epoch": 352.94, "learning_rate": 6.577475270824101e-06, "loss": 0.1278, "step": 120000 }, { "epoch": 352.94, "eval_cer": 0.07379800357438647, "eval_loss": 0.46413475275039673, "eval_runtime": 4.9638, "eval_samples_per_second": 72.324, "eval_steps_per_second": 2.418, "eval_wer": 0.2769627599548605, "step": 120000 }, { "epoch": 353.24, "learning_rate": 6.572489212392604e-06, "loss": 0.1223, "step": 120100 }, { "epoch": 353.53, "learning_rate": 6.567501417979963e-06, "loss": 0.1258, "step": 120200 }, { "epoch": 353.82, "learning_rate": 6.562511893092552e-06, "loss": 0.1242, "step": 120300 }, { "epoch": 354.12, "learning_rate": 6.557520643238662e-06, "loss": 0.1243, "step": 120400 }, { "epoch": 354.41, "learning_rate": 6.552527673928481e-06, "loss": 0.1278, "step": 120500 }, { "epoch": 354.71, "learning_rate": 6.547532990674099e-06, "loss": 0.1259, "step": 120600 }, { "epoch": 355.0, "learning_rate": 6.5425365989894976e-06, "loss": 0.122, "step": 120700 }, { "epoch": 355.29, "learning_rate": 6.537538504390543e-06, "loss": 0.1225, "step": 120800 }, { "epoch": 355.59, "learning_rate": 6.532538712394982e-06, "loss": 0.1256, "step": 120900 }, { "epoch": 355.88, "learning_rate": 6.527537228522437e-06, "loss": 0.1294, "step": 121000 }, { "epoch": 355.88, "eval_cer": 0.07419031428446886, "eval_loss": 0.4756881296634674, "eval_runtime": 4.9381, "eval_samples_per_second": 72.7, "eval_steps_per_second": 2.43, "eval_wer": 0.2790585200709334, "step": 121000 }, { "epoch": 356.18, "learning_rate": 6.522534058294396e-06, "loss": 0.1159, "step": 121100 }, { "epoch": 356.47, "learning_rate": 6.51752920723421e-06, "loss": 0.1259, "step": 121200 }, { "epoch": 356.76, "learning_rate": 6.5125226808670865e-06, "loss": 0.1215, "step": 121300 }, { "epoch": 357.06, "learning_rate": 6.5075144847200775e-06, "loss": 0.122, "step": 121400 }, { "epoch": 357.35, "learning_rate": 6.502504624322086e-06, "loss": 0.1248, "step": 121500 }, { "epoch": 357.65, "learning_rate": 6.497493105203845e-06, "loss": 0.1208, "step": 121600 }, { "epoch": 357.94, "learning_rate": 6.492479932897925e-06, "loss": 0.1218, "step": 121700 }, { "epoch": 358.24, "learning_rate": 6.487515269276015e-06, "loss": 0.1193, "step": 121800 }, { "epoch": 358.53, "learning_rate": 6.482498823593491e-06, "loss": 0.1177, "step": 121900 }, { "epoch": 358.82, "learning_rate": 6.477480741276527e-06, "loss": 0.1238, "step": 122000 }, { "epoch": 358.82, "eval_cer": 0.07449544483675516, "eval_loss": 0.48461535573005676, "eval_runtime": 4.649, "eval_samples_per_second": 77.221, "eval_steps_per_second": 2.581, "eval_wer": 0.2774463969047235, "step": 122000 }, { "epoch": 359.12, "learning_rate": 6.472461027864931e-06, "loss": 0.1186, "step": 122100 }, { "epoch": 359.41, "learning_rate": 6.467439688900324e-06, "loss": 0.1233, "step": 122200 }, { "epoch": 359.71, "learning_rate": 6.46241672992611e-06, "loss": 0.1199, "step": 122300 }, { "epoch": 360.0, "learning_rate": 6.457392156487486e-06, "loss": 0.1133, "step": 122400 }, { "epoch": 360.29, "learning_rate": 6.452365974131434e-06, "loss": 0.1211, "step": 122500 }, { "epoch": 360.59, "learning_rate": 6.447338188406705e-06, "loss": 0.1204, "step": 122600 }, { "epoch": 360.88, "learning_rate": 6.442308804863825e-06, "loss": 0.1291, "step": 122700 }, { "epoch": 361.18, "learning_rate": 6.437277829055086e-06, "loss": 0.1222, "step": 122800 }, { "epoch": 361.47, "learning_rate": 6.432245266534533e-06, "loss": 0.122, "step": 122900 }, { "epoch": 361.76, "learning_rate": 6.4272111228579685e-06, "loss": 0.1259, "step": 123000 }, { "epoch": 361.76, "eval_cer": 0.07388518373218256, "eval_loss": 0.47283557057380676, "eval_runtime": 5.3824, "eval_samples_per_second": 66.699, "eval_steps_per_second": 2.23, "eval_wer": 0.2774463969047235, "step": 123000 }, { "epoch": 362.06, "learning_rate": 6.4221754035829305e-06, "loss": 0.1164, "step": 123100 }, { "epoch": 362.35, "learning_rate": 6.417138114268706e-06, "loss": 0.1214, "step": 123200 }, { "epoch": 362.65, "learning_rate": 6.412099260476314e-06, "loss": 0.1232, "step": 123300 }, { "epoch": 362.94, "learning_rate": 6.4070588477684956e-06, "loss": 0.1279, "step": 123400 }, { "epoch": 363.24, "learning_rate": 6.4020168817097175e-06, "loss": 0.1245, "step": 123500 }, { "epoch": 363.53, "learning_rate": 6.396973367866159e-06, "loss": 0.1182, "step": 123600 }, { "epoch": 363.82, "learning_rate": 6.391928311805709e-06, "loss": 0.1142, "step": 123700 }, { "epoch": 364.12, "learning_rate": 6.386881719097959e-06, "loss": 0.1221, "step": 123800 }, { "epoch": 364.41, "learning_rate": 6.3818335953141955e-06, "loss": 0.1157, "step": 123900 }, { "epoch": 364.71, "learning_rate": 6.376783946027399e-06, "loss": 0.1188, "step": 124000 }, { "epoch": 364.71, "eval_cer": 0.07558519680920622, "eval_loss": 0.4801531732082367, "eval_runtime": 4.7837, "eval_samples_per_second": 75.046, "eval_steps_per_second": 2.509, "eval_wer": 0.2809930678703853, "step": 124000 }, { "epoch": 365.0, "learning_rate": 6.37173277681223e-06, "loss": 0.1251, "step": 124100 }, { "epoch": 365.29, "learning_rate": 6.366680093245028e-06, "loss": 0.1198, "step": 124200 }, { "epoch": 365.59, "learning_rate": 6.361625900903804e-06, "loss": 0.1168, "step": 124300 }, { "epoch": 365.88, "learning_rate": 6.356570205368238e-06, "loss": 0.1275, "step": 124400 }, { "epoch": 366.18, "learning_rate": 6.3515130122196656e-06, "loss": 0.121, "step": 124500 }, { "epoch": 366.47, "learning_rate": 6.346454327041079e-06, "loss": 0.1218, "step": 124600 }, { "epoch": 366.76, "learning_rate": 6.341394155417111e-06, "loss": 0.1177, "step": 124700 }, { "epoch": 367.06, "learning_rate": 6.336332502934044e-06, "loss": 0.1193, "step": 124800 }, { "epoch": 367.35, "learning_rate": 6.331269375179788e-06, "loss": 0.115, "step": 124900 }, { "epoch": 367.65, "learning_rate": 6.3262047777438884e-06, "loss": 0.1203, "step": 125000 }, { "epoch": 367.65, "eval_cer": 0.07405954404777472, "eval_loss": 0.4863865375518799, "eval_runtime": 5.4102, "eval_samples_per_second": 66.357, "eval_steps_per_second": 2.218, "eval_wer": 0.2761566983717556, "step": 125000 }, { "epoch": 367.94, "learning_rate": 6.321138716217509e-06, "loss": 0.1207, "step": 125100 }, { "epoch": 368.24, "learning_rate": 6.31607119619343e-06, "loss": 0.1183, "step": 125200 }, { "epoch": 368.53, "learning_rate": 6.31100222326604e-06, "loss": 0.1204, "step": 125300 }, { "epoch": 368.82, "learning_rate": 6.305931803031335e-06, "loss": 0.1168, "step": 125400 }, { "epoch": 369.12, "learning_rate": 6.3008599410869085e-06, "loss": 0.1181, "step": 125500 }, { "epoch": 369.41, "learning_rate": 6.295786643031946e-06, "loss": 0.1203, "step": 125600 }, { "epoch": 369.71, "learning_rate": 6.290711914467214e-06, "loss": 0.1233, "step": 125700 }, { "epoch": 370.0, "learning_rate": 6.285635760995063e-06, "loss": 0.1258, "step": 125800 }, { "epoch": 370.29, "learning_rate": 6.280608970954318e-06, "loss": 0.1191, "step": 125900 }, { "epoch": 370.59, "learning_rate": 6.275529998589889e-06, "loss": 0.1203, "step": 126000 }, { "epoch": 370.59, "eval_cer": 0.07401595396887668, "eval_loss": 0.4892123341560364, "eval_runtime": 4.6022, "eval_samples_per_second": 78.006, "eval_steps_per_second": 2.607, "eval_wer": 0.2769627599548605, "step": 126000 }, { "epoch": 370.88, "learning_rate": 6.270449618078422e-06, "loss": 0.1201, "step": 126100 }, { "epoch": 371.18, "learning_rate": 6.2653678350285066e-06, "loss": 0.1213, "step": 126200 }, { "epoch": 371.47, "learning_rate": 6.260284655050277e-06, "loss": 0.1264, "step": 126300 }, { "epoch": 371.76, "learning_rate": 6.255200083755416e-06, "loss": 0.1181, "step": 126400 }, { "epoch": 372.06, "learning_rate": 6.250114126757135e-06, "loss": 0.1226, "step": 126500 }, { "epoch": 372.35, "learning_rate": 6.245026789670181e-06, "loss": 0.1249, "step": 126600 }, { "epoch": 372.65, "learning_rate": 6.239938078110822e-06, "loss": 0.1211, "step": 126700 }, { "epoch": 372.94, "learning_rate": 6.2348479976968425e-06, "loss": 0.1227, "step": 126800 }, { "epoch": 373.24, "learning_rate": 6.22975655404754e-06, "loss": 0.1192, "step": 126900 }, { "epoch": 373.53, "learning_rate": 6.224714687498088e-06, "loss": 0.1167, "step": 127000 }, { "epoch": 373.53, "eval_cer": 0.07475698531014341, "eval_loss": 0.49567899107933044, "eval_runtime": 5.3774, "eval_samples_per_second": 66.761, "eval_steps_per_second": 2.232, "eval_wer": 0.28163791713686925, "step": 127000 }, { "epoch": 373.82, "learning_rate": 6.21962054773413e-06, "loss": 0.1229, "step": 127100 }, { "epoch": 374.12, "learning_rate": 6.2145250615455e-06, "loss": 0.1165, "step": 127200 }, { "epoch": 374.41, "learning_rate": 6.209428234557462e-06, "loss": 0.1258, "step": 127300 }, { "epoch": 374.71, "learning_rate": 6.204330072396759e-06, "loss": 0.1203, "step": 127400 }, { "epoch": 375.0, "learning_rate": 6.199230580691613e-06, "loss": 0.1226, "step": 127500 }, { "epoch": 375.29, "learning_rate": 6.194129765071708e-06, "loss": 0.1153, "step": 127600 }, { "epoch": 375.59, "learning_rate": 6.189027631168194e-06, "loss": 0.1205, "step": 127700 }, { "epoch": 375.88, "learning_rate": 6.183924184613672e-06, "loss": 0.1221, "step": 127800 }, { "epoch": 376.18, "learning_rate": 6.178819431042198e-06, "loss": 0.1199, "step": 127900 }, { "epoch": 376.47, "learning_rate": 6.1737133760892655e-06, "loss": 0.1173, "step": 128000 }, { "epoch": 376.47, "eval_cer": 0.07462621507344928, "eval_loss": 0.4890415072441101, "eval_runtime": 4.8418, "eval_samples_per_second": 74.147, "eval_steps_per_second": 2.478, "eval_wer": 0.2801870062872803, "step": 128000 }, { "epoch": 376.76, "learning_rate": 6.168606025391807e-06, "loss": 0.1158, "step": 128100 }, { "epoch": 377.06, "learning_rate": 6.163497384588187e-06, "loss": 0.1153, "step": 128200 }, { "epoch": 377.35, "learning_rate": 6.158387459318186e-06, "loss": 0.1216, "step": 128300 }, { "epoch": 377.65, "learning_rate": 6.153276255223016e-06, "loss": 0.1168, "step": 128400 }, { "epoch": 377.94, "learning_rate": 6.148163777945292e-06, "loss": 0.118, "step": 128500 }, { "epoch": 378.24, "learning_rate": 6.143050033129035e-06, "loss": 0.115, "step": 128600 }, { "epoch": 378.53, "learning_rate": 6.137935026419669e-06, "loss": 0.1152, "step": 128700 }, { "epoch": 378.82, "learning_rate": 6.132818763464003e-06, "loss": 0.1227, "step": 128800 }, { "epoch": 379.12, "learning_rate": 6.127701249910245e-06, "loss": 0.1223, "step": 128900 }, { "epoch": 379.41, "learning_rate": 6.122582491407975e-06, "loss": 0.1184, "step": 129000 }, { "epoch": 379.41, "eval_cer": 0.07388518373218256, "eval_loss": 0.4918311536312103, "eval_runtime": 4.5282, "eval_samples_per_second": 79.281, "eval_steps_per_second": 2.65, "eval_wer": 0.2737385136224408, "step": 129000 }, { "epoch": 379.71, "learning_rate": 6.117462493608148e-06, "loss": 0.1195, "step": 129100 }, { "epoch": 380.0, "learning_rate": 6.112341262163092e-06, "loss": 0.1158, "step": 129200 }, { "epoch": 380.29, "learning_rate": 6.10721880272649e-06, "loss": 0.1154, "step": 129300 }, { "epoch": 380.59, "learning_rate": 6.102095120953385e-06, "loss": 0.1211, "step": 129400 }, { "epoch": 380.88, "learning_rate": 6.09697022250017e-06, "loss": 0.1211, "step": 129500 }, { "epoch": 381.18, "learning_rate": 6.091844113024581e-06, "loss": 0.1209, "step": 129600 }, { "epoch": 381.47, "learning_rate": 6.086716798185686e-06, "loss": 0.1197, "step": 129700 }, { "epoch": 381.76, "learning_rate": 6.081588283643892e-06, "loss": 0.1169, "step": 129800 }, { "epoch": 382.06, "learning_rate": 6.0764585750609215e-06, "loss": 0.1198, "step": 129900 }, { "epoch": 382.35, "learning_rate": 6.071327678099823e-06, "loss": 0.1142, "step": 130000 }, { "epoch": 382.35, "eval_cer": 0.07401595396887668, "eval_loss": 0.4911036491394043, "eval_runtime": 5.3976, "eval_samples_per_second": 66.51, "eval_steps_per_second": 2.223, "eval_wer": 0.2774463969047235, "step": 130000 }, { "epoch": 382.65, "learning_rate": 6.066195598424953e-06, "loss": 0.1159, "step": 130100 }, { "epoch": 382.94, "learning_rate": 6.0610623417019734e-06, "loss": 0.1172, "step": 130200 }, { "epoch": 383.24, "learning_rate": 6.055927913597847e-06, "loss": 0.1167, "step": 130300 }, { "epoch": 383.53, "learning_rate": 6.0507923197808275e-06, "loss": 0.1167, "step": 130400 }, { "epoch": 383.82, "learning_rate": 6.045655565920457e-06, "loss": 0.1305, "step": 130500 }, { "epoch": 384.12, "learning_rate": 6.040517657687562e-06, "loss": 0.1127, "step": 130600 }, { "epoch": 384.41, "learning_rate": 6.035378600754237e-06, "loss": 0.1232, "step": 130700 }, { "epoch": 384.71, "learning_rate": 6.030238400793849e-06, "loss": 0.1166, "step": 130800 }, { "epoch": 385.0, "learning_rate": 6.025097063481024e-06, "loss": 0.1152, "step": 130900 }, { "epoch": 385.29, "learning_rate": 6.019954594491645e-06, "loss": 0.1118, "step": 131000 }, { "epoch": 385.29, "eval_cer": 0.07610827775598274, "eval_loss": 0.49062150716781616, "eval_runtime": 4.4732, "eval_samples_per_second": 80.256, "eval_steps_per_second": 2.683, "eval_wer": 0.2847009511526681, "step": 131000 }, { "epoch": 385.59, "learning_rate": 6.014810999502842e-06, "loss": 0.1142, "step": 131100 }, { "epoch": 385.88, "learning_rate": 6.009666284192995e-06, "loss": 0.1225, "step": 131200 }, { "epoch": 386.18, "learning_rate": 6.004571918040052e-06, "loss": 0.1195, "step": 131300 }, { "epoch": 386.47, "learning_rate": 5.99942499018966e-06, "loss": 0.1158, "step": 131400 }, { "epoch": 386.76, "learning_rate": 5.994276959003917e-06, "loss": 0.1169, "step": 131500 }, { "epoch": 387.06, "learning_rate": 5.989127830166097e-06, "loss": 0.1152, "step": 131600 }, { "epoch": 387.35, "learning_rate": 5.983977609360683e-06, "loss": 0.1156, "step": 131700 }, { "epoch": 387.65, "learning_rate": 5.978826302273363e-06, "loss": 0.1097, "step": 131800 }, { "epoch": 387.94, "learning_rate": 5.973673914591029e-06, "loss": 0.115, "step": 131900 }, { "epoch": 388.24, "learning_rate": 5.968520452001762e-06, "loss": 0.1156, "step": 132000 }, { "epoch": 388.24, "eval_cer": 0.07462621507344928, "eval_loss": 0.49032217264175415, "eval_runtime": 4.9494, "eval_samples_per_second": 72.533, "eval_steps_per_second": 2.425, "eval_wer": 0.2793809447041754, "step": 132000 }, { "epoch": 388.53, "learning_rate": 5.963365920194832e-06, "loss": 0.111, "step": 132100 }, { "epoch": 388.82, "learning_rate": 5.958210324860687e-06, "loss": 0.1128, "step": 132200 }, { "epoch": 389.12, "learning_rate": 5.953053671690952e-06, "loss": 0.1155, "step": 132300 }, { "epoch": 389.41, "learning_rate": 5.947947548620953e-06, "loss": 0.1136, "step": 132400 }, { "epoch": 389.71, "learning_rate": 5.9427888072958684e-06, "loss": 0.1123, "step": 132500 }, { "epoch": 390.0, "learning_rate": 5.937629025160088e-06, "loss": 0.12, "step": 132600 }, { "epoch": 390.29, "learning_rate": 5.9324682079098565e-06, "loss": 0.1158, "step": 132700 }, { "epoch": 390.59, "learning_rate": 5.927306361242563e-06, "loss": 0.1151, "step": 132800 }, { "epoch": 390.88, "learning_rate": 5.922143490856731e-06, "loss": 0.1119, "step": 132900 }, { "epoch": 391.18, "learning_rate": 5.9169796024520155e-06, "loss": 0.1102, "step": 133000 }, { "epoch": 391.18, "eval_cer": 0.07471339523124537, "eval_loss": 0.5015389919281006, "eval_runtime": 4.6902, "eval_samples_per_second": 76.543, "eval_steps_per_second": 2.559, "eval_wer": 0.27889730775431243, "step": 133000 }, { "epoch": 391.47, "learning_rate": 5.911814701729196e-06, "loss": 0.1132, "step": 133100 }, { "epoch": 391.76, "learning_rate": 5.906648794390167e-06, "loss": 0.1146, "step": 133200 }, { "epoch": 392.06, "learning_rate": 5.9014818861379375e-06, "loss": 0.112, "step": 133300 }, { "epoch": 392.35, "learning_rate": 5.89631398267662e-06, "loss": 0.1116, "step": 133400 }, { "epoch": 392.65, "learning_rate": 5.891145089711425e-06, "loss": 0.1121, "step": 133500 }, { "epoch": 392.94, "learning_rate": 5.885975212948656e-06, "loss": 0.1157, "step": 133600 }, { "epoch": 393.24, "learning_rate": 5.880804358095702e-06, "loss": 0.1101, "step": 133700 }, { "epoch": 393.53, "learning_rate": 5.875632530861034e-06, "loss": 0.1167, "step": 133800 }, { "epoch": 393.82, "learning_rate": 5.870511469659539e-06, "loss": 0.1119, "step": 133900 }, { "epoch": 394.12, "learning_rate": 5.8653377243724815e-06, "loss": 0.1191, "step": 134000 }, { "epoch": 394.12, "eval_cer": 0.07475698531014341, "eval_loss": 0.5096559524536133, "eval_runtime": 5.1149, "eval_samples_per_second": 70.188, "eval_steps_per_second": 2.346, "eval_wer": 0.2779300338545865, "step": 134000 }, { "epoch": 394.41, "learning_rate": 5.86016302377841e-06, "loss": 0.1136, "step": 134100 }, { "epoch": 394.71, "learning_rate": 5.854987373590043e-06, "loss": 0.1159, "step": 134200 }, { "epoch": 395.0, "learning_rate": 5.8498107795211376e-06, "loss": 0.1145, "step": 134300 }, { "epoch": 395.29, "learning_rate": 5.8446332472865054e-06, "loss": 0.1102, "step": 134400 }, { "epoch": 395.59, "learning_rate": 5.839454782601983e-06, "loss": 0.1104, "step": 134500 }, { "epoch": 395.88, "learning_rate": 5.834275391184444e-06, "loss": 0.1101, "step": 134600 }, { "epoch": 396.18, "learning_rate": 5.829095078751781e-06, "loss": 0.1105, "step": 134700 }, { "epoch": 396.47, "learning_rate": 5.823913851022901e-06, "loss": 0.1167, "step": 134800 }, { "epoch": 396.76, "learning_rate": 5.818731713717729e-06, "loss": 0.1175, "step": 134900 }, { "epoch": 397.06, "learning_rate": 5.813548672557189e-06, "loss": 0.1129, "step": 135000 }, { "epoch": 397.06, "eval_cer": 0.07366723333769234, "eval_loss": 0.5002287030220032, "eval_runtime": 5.5456, "eval_samples_per_second": 64.736, "eval_steps_per_second": 2.164, "eval_wer": 0.2763179106883766, "step": 135000 }, { "epoch": 397.35, "learning_rate": 5.808364733263202e-06, "loss": 0.1121, "step": 135100 }, { "epoch": 397.65, "learning_rate": 5.803179901558684e-06, "loss": 0.1149, "step": 135200 }, { "epoch": 397.94, "learning_rate": 5.797994183167534e-06, "loss": 0.1112, "step": 135300 }, { "epoch": 398.24, "learning_rate": 5.792807583814628e-06, "loss": 0.1118, "step": 135400 }, { "epoch": 398.53, "learning_rate": 5.787620109225819e-06, "loss": 0.1175, "step": 135500 }, { "epoch": 398.82, "learning_rate": 5.782431765127925e-06, "loss": 0.1092, "step": 135600 }, { "epoch": 399.12, "learning_rate": 5.777242557248722e-06, "loss": 0.1143, "step": 135700 }, { "epoch": 399.41, "learning_rate": 5.772052491316941e-06, "loss": 0.1126, "step": 135800 }, { "epoch": 399.71, "learning_rate": 5.766861573062257e-06, "loss": 0.1176, "step": 135900 }, { "epoch": 400.0, "learning_rate": 5.761669808215291e-06, "loss": 0.1097, "step": 136000 }, { "epoch": 400.0, "eval_cer": 0.07488775554683753, "eval_loss": 0.5063867568969727, "eval_runtime": 4.6813, "eval_samples_per_second": 76.689, "eval_steps_per_second": 2.563, "eval_wer": 0.2809930678703853, "step": 136000 }, { "epoch": 400.29, "learning_rate": 5.756477202507598e-06, "loss": 0.1192, "step": 136100 }, { "epoch": 400.59, "learning_rate": 5.751283761671659e-06, "loss": 0.1035, "step": 136200 }, { "epoch": 400.88, "learning_rate": 5.746089491440875e-06, "loss": 0.1048, "step": 136300 }, { "epoch": 401.18, "learning_rate": 5.740894397549567e-06, "loss": 0.106, "step": 136400 }, { "epoch": 401.47, "learning_rate": 5.735698485732963e-06, "loss": 0.1065, "step": 136500 }, { "epoch": 401.76, "learning_rate": 5.730501761727196e-06, "loss": 0.1117, "step": 136600 }, { "epoch": 402.06, "learning_rate": 5.725304231269293e-06, "loss": 0.1157, "step": 136700 }, { "epoch": 402.35, "learning_rate": 5.720105900097174e-06, "loss": 0.1119, "step": 136800 }, { "epoch": 402.65, "learning_rate": 5.7149067739496375e-06, "loss": 0.1088, "step": 136900 }, { "epoch": 402.94, "learning_rate": 5.709706858566368e-06, "loss": 0.1049, "step": 137000 }, { "epoch": 402.94, "eval_cer": 0.07288261191752757, "eval_loss": 0.497284859418869, "eval_runtime": 4.9493, "eval_samples_per_second": 72.535, "eval_steps_per_second": 2.425, "eval_wer": 0.2732548766725778, "step": 137000 }, { "epoch": 403.24, "learning_rate": 5.704506159687914e-06, "loss": 0.1091, "step": 137100 }, { "epoch": 403.53, "learning_rate": 5.699304683055693e-06, "loss": 0.1183, "step": 137200 }, { "epoch": 403.82, "learning_rate": 5.69410243441198e-06, "loss": 0.1084, "step": 137300 }, { "epoch": 404.12, "learning_rate": 5.6888994194999015e-06, "loss": 0.1108, "step": 137400 }, { "epoch": 404.41, "learning_rate": 5.683695644063432e-06, "loss": 0.1056, "step": 137500 }, { "epoch": 404.71, "learning_rate": 5.6784911138473804e-06, "loss": 0.1134, "step": 137600 }, { "epoch": 405.0, "learning_rate": 5.6732858345973975e-06, "loss": 0.113, "step": 137700 }, { "epoch": 405.29, "learning_rate": 5.6680798120599556e-06, "loss": 0.1164, "step": 137800 }, { "epoch": 405.59, "learning_rate": 5.662873051982345e-06, "loss": 0.117, "step": 137900 }, { "epoch": 405.88, "learning_rate": 5.657665560112675e-06, "loss": 0.117, "step": 138000 }, { "epoch": 405.88, "eval_cer": 0.0742339043633669, "eval_loss": 0.5041438341140747, "eval_runtime": 5.2679, "eval_samples_per_second": 68.149, "eval_steps_per_second": 2.278, "eval_wer": 0.2790585200709334, "step": 138000 }, { "epoch": 406.18, "learning_rate": 5.652457342199862e-06, "loss": 0.1129, "step": 138100 }, { "epoch": 406.47, "learning_rate": 5.647248403993621e-06, "loss": 0.1138, "step": 138200 }, { "epoch": 406.76, "learning_rate": 5.642038751244467e-06, "loss": 0.1099, "step": 138300 }, { "epoch": 407.06, "learning_rate": 5.636828389703699e-06, "loss": 0.1094, "step": 138400 }, { "epoch": 407.35, "learning_rate": 5.631617325123402e-06, "loss": 0.1055, "step": 138500 }, { "epoch": 407.65, "learning_rate": 5.626405563256434e-06, "loss": 0.1122, "step": 138600 }, { "epoch": 407.94, "learning_rate": 5.62124523779462e-06, "loss": 0.1102, "step": 138700 }, { "epoch": 408.24, "learning_rate": 5.616032105445265e-06, "loss": 0.1095, "step": 138800 }, { "epoch": 408.53, "learning_rate": 5.610818293014856e-06, "loss": 0.1117, "step": 138900 }, { "epoch": 408.82, "learning_rate": 5.605603806259288e-06, "loss": 0.1082, "step": 139000 }, { "epoch": 408.82, "eval_cer": 0.07218517065515889, "eval_loss": 0.5032652616500854, "eval_runtime": 4.4402, "eval_samples_per_second": 80.853, "eval_steps_per_second": 2.703, "eval_wer": 0.2713203288731259, "step": 139000 }, { "epoch": 409.12, "learning_rate": 5.600388650935198e-06, "loss": 0.1117, "step": 139100 }, { "epoch": 409.41, "learning_rate": 5.595172832799962e-06, "loss": 0.1055, "step": 139200 }, { "epoch": 409.71, "learning_rate": 5.589956357611688e-06, "loss": 0.1079, "step": 139300 }, { "epoch": 410.0, "learning_rate": 5.584739231129208e-06, "loss": 0.1094, "step": 139400 }, { "epoch": 410.29, "learning_rate": 5.579521459112074e-06, "loss": 0.1046, "step": 139500 }, { "epoch": 410.59, "learning_rate": 5.574303047320551e-06, "loss": 0.1145, "step": 139600 }, { "epoch": 410.88, "learning_rate": 5.569136195093107e-06, "loss": 0.1112, "step": 139700 }, { "epoch": 411.18, "learning_rate": 5.563916527290414e-06, "loss": 0.1119, "step": 139800 }, { "epoch": 411.47, "learning_rate": 5.558696236940708e-06, "loss": 0.1083, "step": 139900 }, { "epoch": 411.76, "learning_rate": 5.553475329807039e-06, "loss": 0.1119, "step": 140000 }, { "epoch": 411.76, "eval_cer": 0.073318512706508, "eval_loss": 0.5045868754386902, "eval_runtime": 4.7184, "eval_samples_per_second": 76.085, "eval_steps_per_second": 2.543, "eval_wer": 0.27518942447202965, "step": 140000 }, { "epoch": 412.06, "learning_rate": 5.548253811653128e-06, "loss": 0.1071, "step": 140100 }, { "epoch": 412.35, "learning_rate": 5.543031688243378e-06, "loss": 0.1126, "step": 140200 }, { "epoch": 412.65, "learning_rate": 5.537808965342856e-06, "loss": 0.1018, "step": 140300 }, { "epoch": 412.94, "learning_rate": 5.5325856487172936e-06, "loss": 0.1087, "step": 140400 }, { "epoch": 413.24, "learning_rate": 5.527361744133073e-06, "loss": 0.1081, "step": 140500 }, { "epoch": 413.53, "learning_rate": 5.522137257357233e-06, "loss": 0.108, "step": 140600 }, { "epoch": 413.82, "learning_rate": 5.516912194157449e-06, "loss": 0.1138, "step": 140700 }, { "epoch": 414.12, "learning_rate": 5.5116865603020355e-06, "loss": 0.1073, "step": 140800 }, { "epoch": 414.41, "learning_rate": 5.5064603615599364e-06, "loss": 0.1084, "step": 140900 }, { "epoch": 414.71, "learning_rate": 5.5012336037007165e-06, "loss": 0.113, "step": 141000 }, { "epoch": 414.71, "eval_cer": 0.0739287738110806, "eval_loss": 0.5068278908729553, "eval_runtime": 4.4954, "eval_samples_per_second": 79.86, "eval_steps_per_second": 2.669, "eval_wer": 0.27712397227148156, "step": 141000 }, { "epoch": 415.0, "learning_rate": 5.496006292494563e-06, "loss": 0.1068, "step": 141100 }, { "epoch": 415.29, "learning_rate": 5.490778433712272e-06, "loss": 0.1119, "step": 141200 }, { "epoch": 415.59, "learning_rate": 5.485550033125242e-06, "loss": 0.1073, "step": 141300 }, { "epoch": 415.88, "learning_rate": 5.480321096505472e-06, "loss": 0.1052, "step": 141400 }, { "epoch": 416.18, "learning_rate": 5.475091629625551e-06, "loss": 0.1095, "step": 141500 }, { "epoch": 416.47, "learning_rate": 5.469861638258653e-06, "loss": 0.1113, "step": 141600 }, { "epoch": 416.76, "learning_rate": 5.4646311281785355e-06, "loss": 0.1081, "step": 141700 }, { "epoch": 417.06, "learning_rate": 5.459400105159525e-06, "loss": 0.1029, "step": 141800 }, { "epoch": 417.35, "learning_rate": 5.454168574976514e-06, "loss": 0.1133, "step": 141900 }, { "epoch": 417.65, "learning_rate": 5.4489365434049535e-06, "loss": 0.1091, "step": 142000 }, { "epoch": 417.65, "eval_cer": 0.07275184168083344, "eval_loss": 0.5030051469802856, "eval_runtime": 5.6004, "eval_samples_per_second": 64.103, "eval_steps_per_second": 2.143, "eval_wer": 0.2748669998387877, "step": 142000 }, { "epoch": 417.94, "learning_rate": 5.443704016220852e-06, "loss": 0.1109, "step": 142100 }, { "epoch": 418.24, "learning_rate": 5.438470999200765e-06, "loss": 0.1039, "step": 142200 }, { "epoch": 418.53, "learning_rate": 5.433237498121785e-06, "loss": 0.1073, "step": 142300 }, { "epoch": 418.82, "learning_rate": 5.428003518761542e-06, "loss": 0.1132, "step": 142400 }, { "epoch": 419.12, "learning_rate": 5.422769066898191e-06, "loss": 0.1089, "step": 142500 }, { "epoch": 419.41, "learning_rate": 5.417534148310413e-06, "loss": 0.1145, "step": 142600 }, { "epoch": 419.71, "learning_rate": 5.412298768777399e-06, "loss": 0.1076, "step": 142700 }, { "epoch": 420.0, "learning_rate": 5.407062934078855e-06, "loss": 0.106, "step": 142800 }, { "epoch": 420.29, "learning_rate": 5.401826649994986e-06, "loss": 0.1088, "step": 142900 }, { "epoch": 420.59, "learning_rate": 5.39658992230649e-06, "loss": 0.1079, "step": 143000 }, { "epoch": 420.59, "eval_cer": 0.0736236432587943, "eval_loss": 0.5185303688049316, "eval_runtime": 4.7112, "eval_samples_per_second": 76.202, "eval_steps_per_second": 2.547, "eval_wer": 0.27551184910527166, "step": 143000 }, { "epoch": 420.88, "learning_rate": 5.39135275679456e-06, "loss": 0.1097, "step": 143100 }, { "epoch": 421.18, "learning_rate": 5.38611515924087e-06, "loss": 0.108, "step": 143200 }, { "epoch": 421.47, "learning_rate": 5.380877135427571e-06, "loss": 0.107, "step": 143300 }, { "epoch": 421.76, "learning_rate": 5.3756386911372885e-06, "loss": 0.1098, "step": 143400 }, { "epoch": 422.06, "learning_rate": 5.370399832153105e-06, "loss": 0.1081, "step": 143500 }, { "epoch": 422.35, "learning_rate": 5.365160564258564e-06, "loss": 0.1028, "step": 143600 }, { "epoch": 422.65, "learning_rate": 5.359920893237661e-06, "loss": 0.1014, "step": 143700 }, { "epoch": 422.94, "learning_rate": 5.354680824874838e-06, "loss": 0.1069, "step": 143800 }, { "epoch": 423.24, "learning_rate": 5.349440364954974e-06, "loss": 0.1084, "step": 143900 }, { "epoch": 423.53, "learning_rate": 5.34419951926338e-06, "loss": 0.1076, "step": 144000 }, { "epoch": 423.53, "eval_cer": 0.07405954404777472, "eval_loss": 0.5147412419319153, "eval_runtime": 4.5037, "eval_samples_per_second": 79.712, "eval_steps_per_second": 2.664, "eval_wer": 0.2785748831210704, "step": 144000 }, { "epoch": 423.82, "learning_rate": 5.338958293585792e-06, "loss": 0.1043, "step": 144100 }, { "epoch": 424.12, "learning_rate": 5.33376911154043e-06, "loss": 0.1108, "step": 144200 }, { "epoch": 424.41, "learning_rate": 5.328527146905228e-06, "loss": 0.1142, "step": 144300 }, { "epoch": 424.71, "learning_rate": 5.3232848195858635e-06, "loss": 0.1071, "step": 144400 }, { "epoch": 425.0, "learning_rate": 5.3180421353697085e-06, "loss": 0.1034, "step": 144500 }, { "epoch": 425.29, "learning_rate": 5.312799100044533e-06, "loss": 0.1069, "step": 144600 }, { "epoch": 425.59, "learning_rate": 5.3075557193984864e-06, "loss": 0.1037, "step": 144700 }, { "epoch": 425.88, "learning_rate": 5.302311999220111e-06, "loss": 0.108, "step": 144800 }, { "epoch": 426.18, "learning_rate": 5.297067945298313e-06, "loss": 0.1121, "step": 144900 }, { "epoch": 426.47, "learning_rate": 5.291823563422372e-06, "loss": 0.107, "step": 145000 }, { "epoch": 426.47, "eval_cer": 0.07292620199642562, "eval_loss": 0.5176792740821838, "eval_runtime": 4.7997, "eval_samples_per_second": 74.796, "eval_steps_per_second": 2.5, "eval_wer": 0.2737385136224408, "step": 145000 }, { "epoch": 426.76, "learning_rate": 5.28657885938193e-06, "loss": 0.1021, "step": 145100 }, { "epoch": 427.06, "learning_rate": 5.281333838966982e-06, "loss": 0.1001, "step": 145200 }, { "epoch": 427.35, "learning_rate": 5.276088507967876e-06, "loss": 0.1103, "step": 145300 }, { "epoch": 427.65, "learning_rate": 5.2708428721752995e-06, "loss": 0.1074, "step": 145400 }, { "epoch": 427.94, "learning_rate": 5.265596937380277e-06, "loss": 0.1005, "step": 145500 }, { "epoch": 428.24, "learning_rate": 5.260350709374167e-06, "loss": 0.1044, "step": 145600 }, { "epoch": 428.53, "learning_rate": 5.255104193948646e-06, "loss": 0.1069, "step": 145700 }, { "epoch": 428.82, "learning_rate": 5.24985739689571e-06, "loss": 0.1122, "step": 145800 }, { "epoch": 429.12, "learning_rate": 5.2446103240076685e-06, "loss": 0.1052, "step": 145900 }, { "epoch": 429.41, "learning_rate": 5.239362981077132e-06, "loss": 0.1082, "step": 146000 }, { "epoch": 429.41, "eval_cer": 0.07344928294320213, "eval_loss": 0.51496821641922, "eval_runtime": 4.8758, "eval_samples_per_second": 73.63, "eval_steps_per_second": 2.461, "eval_wer": 0.2764791230049976, "step": 146000 }, { "epoch": 429.71, "learning_rate": 5.23411537389701e-06, "loss": 0.1047, "step": 146100 }, { "epoch": 430.0, "learning_rate": 5.2288675082605045e-06, "loss": 0.1101, "step": 146200 }, { "epoch": 430.29, "learning_rate": 5.223619389961103e-06, "loss": 0.1032, "step": 146300 }, { "epoch": 430.59, "learning_rate": 5.218371024792572e-06, "loss": 0.0983, "step": 146400 }, { "epoch": 430.88, "learning_rate": 5.213122418548948e-06, "loss": 0.1118, "step": 146500 }, { "epoch": 431.18, "learning_rate": 5.2078735770245385e-06, "loss": 0.1063, "step": 146600 }, { "epoch": 431.47, "learning_rate": 5.202624506013904e-06, "loss": 0.1084, "step": 146700 }, { "epoch": 431.76, "learning_rate": 5.197375211311864e-06, "loss": 0.1056, "step": 146800 }, { "epoch": 432.06, "learning_rate": 5.192178194899027e-06, "loss": 0.1106, "step": 146900 }, { "epoch": 432.35, "learning_rate": 5.186928472291934e-06, "loss": 0.1018, "step": 147000 }, { "epoch": 432.35, "eval_cer": 0.07375441349548843, "eval_loss": 0.5148587822914124, "eval_runtime": 5.1845, "eval_samples_per_second": 69.245, "eval_steps_per_second": 2.315, "eval_wer": 0.2742221505723037, "step": 147000 }, { "epoch": 432.65, "learning_rate": 5.181678543321391e-06, "loss": 0.1075, "step": 147100 }, { "epoch": 432.94, "learning_rate": 5.176428413783156e-06, "loss": 0.1031, "step": 147200 }, { "epoch": 433.24, "learning_rate": 5.171178089473222e-06, "loss": 0.1064, "step": 147300 }, { "epoch": 433.53, "learning_rate": 5.165927576187788e-06, "loss": 0.1091, "step": 147400 }, { "epoch": 433.82, "learning_rate": 5.160676879723263e-06, "loss": 0.1027, "step": 147500 }, { "epoch": 434.12, "learning_rate": 5.155426005876261e-06, "loss": 0.1088, "step": 147600 }, { "epoch": 434.41, "learning_rate": 5.150174960443588e-06, "loss": 0.1016, "step": 147700 }, { "epoch": 434.71, "learning_rate": 5.14492374922224e-06, "loss": 0.1046, "step": 147800 }, { "epoch": 435.0, "learning_rate": 5.139672378009402e-06, "loss": 0.1044, "step": 147900 }, { "epoch": 435.29, "learning_rate": 5.134420852602428e-06, "loss": 0.1028, "step": 148000 }, { "epoch": 435.29, "eval_cer": 0.07292620199642562, "eval_loss": 0.5164076685905457, "eval_runtime": 5.4, "eval_samples_per_second": 66.482, "eval_steps_per_second": 2.222, "eval_wer": 0.2748669998387877, "step": 148000 }, { "epoch": 435.59, "learning_rate": 5.129169178798846e-06, "loss": 0.1016, "step": 148100 }, { "epoch": 435.88, "learning_rate": 5.1239173623963465e-06, "loss": 0.1081, "step": 148200 }, { "epoch": 436.18, "learning_rate": 5.118665409192778e-06, "loss": 0.1082, "step": 148300 }, { "epoch": 436.47, "learning_rate": 5.113465846457636e-06, "loss": 0.0973, "step": 148400 }, { "epoch": 436.76, "learning_rate": 5.108213638269423e-06, "loss": 0.1, "step": 148500 }, { "epoch": 437.06, "learning_rate": 5.102961310616583e-06, "loss": 0.1126, "step": 148600 }, { "epoch": 437.35, "learning_rate": 5.09770886929753e-06, "loss": 0.096, "step": 148700 }, { "epoch": 437.65, "learning_rate": 5.092456320110802e-06, "loss": 0.1005, "step": 148800 }, { "epoch": 437.94, "learning_rate": 5.087203668855059e-06, "loss": 0.1019, "step": 148900 }, { "epoch": 438.24, "learning_rate": 5.081950921329067e-06, "loss": 0.1031, "step": 149000 }, { "epoch": 438.24, "eval_cer": 0.07318774246981387, "eval_loss": 0.5136764049530029, "eval_runtime": 5.3659, "eval_samples_per_second": 66.903, "eval_steps_per_second": 2.236, "eval_wer": 0.2747057875221667, "step": 149000 }, { "epoch": 438.53, "learning_rate": 5.076698083331706e-06, "loss": 0.1097, "step": 149100 }, { "epoch": 438.82, "learning_rate": 5.07144516066195e-06, "loss": 0.1034, "step": 149200 }, { "epoch": 439.12, "learning_rate": 5.066192159118869e-06, "loss": 0.1075, "step": 149300 }, { "epoch": 439.41, "learning_rate": 5.060939084501621e-06, "loss": 0.1065, "step": 149400 }, { "epoch": 439.71, "learning_rate": 5.055685942609444e-06, "loss": 0.1049, "step": 149500 }, { "epoch": 440.0, "learning_rate": 5.050432739241649e-06, "loss": 0.1031, "step": 149600 }, { "epoch": 440.29, "learning_rate": 5.045179480197614e-06, "loss": 0.1079, "step": 149700 }, { "epoch": 440.59, "learning_rate": 5.039926171276781e-06, "loss": 0.1001, "step": 149800 }, { "epoch": 440.88, "learning_rate": 5.03467281827865e-06, "loss": 0.1063, "step": 149900 }, { "epoch": 441.18, "learning_rate": 5.02941942700276e-06, "loss": 0.1101, "step": 150000 }, { "epoch": 441.18, "eval_cer": 0.0720979904973628, "eval_loss": 0.5085006356239319, "eval_runtime": 4.5834, "eval_samples_per_second": 78.325, "eval_steps_per_second": 2.618, "eval_wer": 0.27035305497339995, "step": 150000 }, { "epoch": 441.47, "learning_rate": 5.024166003248703e-06, "loss": 0.1019, "step": 150100 }, { "epoch": 441.76, "learning_rate": 5.018912552816099e-06, "loss": 0.1026, "step": 150200 }, { "epoch": 442.06, "learning_rate": 5.0136590815046005e-06, "loss": 0.1031, "step": 150300 }, { "epoch": 442.35, "learning_rate": 5.008405595113883e-06, "loss": 0.1048, "step": 150400 }, { "epoch": 442.65, "learning_rate": 5.003152099443643e-06, "loss": 0.1062, "step": 150500 }, { "epoch": 442.94, "learning_rate": 4.997898600293576e-06, "loss": 0.1024, "step": 150600 }, { "epoch": 443.24, "learning_rate": 4.992645103463394e-06, "loss": 0.106, "step": 150700 }, { "epoch": 443.53, "learning_rate": 4.9873916147527965e-06, "loss": 0.1097, "step": 150800 }, { "epoch": 443.82, "learning_rate": 4.9821381399614795e-06, "loss": 0.1016, "step": 150900 }, { "epoch": 444.12, "learning_rate": 4.976937219323197e-06, "loss": 0.1037, "step": 151000 }, { "epoch": 444.12, "eval_cer": 0.07188004010287259, "eval_loss": 0.5222977995872498, "eval_runtime": 5.3886, "eval_samples_per_second": 66.622, "eval_steps_per_second": 2.227, "eval_wer": 0.2709979042398839, "step": 151000 }, { "epoch": 444.41, "learning_rate": 4.971683789485565e-06, "loss": 0.1015, "step": 151100 }, { "epoch": 444.71, "learning_rate": 4.966430390908183e-06, "loss": 0.1074, "step": 151200 }, { "epoch": 445.0, "learning_rate": 4.961177029390647e-06, "loss": 0.0986, "step": 151300 }, { "epoch": 445.29, "learning_rate": 4.955923710732511e-06, "loss": 0.1052, "step": 151400 }, { "epoch": 445.59, "learning_rate": 4.950670440733284e-06, "loss": 0.1072, "step": 151500 }, { "epoch": 445.88, "learning_rate": 4.945417225192419e-06, "loss": 0.1041, "step": 151600 }, { "epoch": 446.18, "learning_rate": 4.940164069909305e-06, "loss": 0.101, "step": 151700 }, { "epoch": 446.47, "learning_rate": 4.934910980683273e-06, "loss": 0.105, "step": 151800 }, { "epoch": 446.76, "learning_rate": 4.929657963313573e-06, "loss": 0.1043, "step": 151900 }, { "epoch": 447.06, "learning_rate": 4.924405023599384e-06, "loss": 0.101, "step": 152000 }, { "epoch": 447.06, "eval_cer": 0.07257748136524127, "eval_loss": 0.5275741815567017, "eval_runtime": 4.7697, "eval_samples_per_second": 75.267, "eval_steps_per_second": 2.516, "eval_wer": 0.2745445752055457, "step": 152000 }, { "epoch": 447.35, "learning_rate": 4.919152167339793e-06, "loss": 0.1, "step": 152100 }, { "epoch": 447.65, "learning_rate": 4.913899400333793e-06, "loss": 0.1068, "step": 152200 }, { "epoch": 447.94, "learning_rate": 4.908646728380285e-06, "loss": 0.1072, "step": 152300 }, { "epoch": 448.24, "learning_rate": 4.90339415727806e-06, "loss": 0.0946, "step": 152400 }, { "epoch": 448.53, "learning_rate": 4.898141692825804e-06, "loss": 0.1033, "step": 152500 }, { "epoch": 448.82, "learning_rate": 4.892889340822079e-06, "loss": 0.1096, "step": 152600 }, { "epoch": 449.12, "learning_rate": 4.88763710706532e-06, "loss": 0.0976, "step": 152700 }, { "epoch": 449.41, "learning_rate": 4.882384997353843e-06, "loss": 0.1001, "step": 152800 }, { "epoch": 449.71, "learning_rate": 4.877133017485817e-06, "loss": 0.1071, "step": 152900 }, { "epoch": 450.0, "learning_rate": 4.871881173259271e-06, "loss": 0.11, "step": 153000 }, { "epoch": 450.0, "eval_cer": 0.07144413931389215, "eval_loss": 0.5202327370643616, "eval_runtime": 4.6964, "eval_samples_per_second": 76.442, "eval_steps_per_second": 2.555, "eval_wer": 0.2680960825407061, "step": 153000 }, { "epoch": 450.29, "learning_rate": 4.866629470472086e-06, "loss": 0.0997, "step": 153100 }, { "epoch": 450.59, "learning_rate": 4.861377914921982e-06, "loss": 0.1028, "step": 153200 }, { "epoch": 450.88, "learning_rate": 4.856126512406523e-06, "loss": 0.1034, "step": 153300 }, { "epoch": 451.18, "learning_rate": 4.850875268723097e-06, "loss": 0.0986, "step": 153400 }, { "epoch": 451.47, "learning_rate": 4.845624189668923e-06, "loss": 0.0993, "step": 153500 }, { "epoch": 451.76, "learning_rate": 4.8403732810410364e-06, "loss": 0.1028, "step": 153600 }, { "epoch": 452.06, "learning_rate": 4.835122548636279e-06, "loss": 0.1034, "step": 153700 }, { "epoch": 452.35, "learning_rate": 4.829871998251308e-06, "loss": 0.1045, "step": 153800 }, { "epoch": 452.65, "learning_rate": 4.82462163568257e-06, "loss": 0.0997, "step": 153900 }, { "epoch": 452.94, "learning_rate": 4.819371466726311e-06, "loss": 0.101, "step": 154000 }, { "epoch": 452.94, "eval_cer": 0.07235953097075105, "eval_loss": 0.5265692472457886, "eval_runtime": 5.2446, "eval_samples_per_second": 68.452, "eval_steps_per_second": 2.288, "eval_wer": 0.27067547960664196, "step": 154000 }, { "epoch": 453.24, "learning_rate": 4.814121497178561e-06, "loss": 0.1029, "step": 154100 }, { "epoch": 453.53, "learning_rate": 4.808871732835127e-06, "loss": 0.1099, "step": 154200 }, { "epoch": 453.82, "learning_rate": 4.803622179491595e-06, "loss": 0.1007, "step": 154300 }, { "epoch": 454.12, "learning_rate": 4.798372842943313e-06, "loss": 0.1024, "step": 154400 }, { "epoch": 454.41, "learning_rate": 4.793123728985394e-06, "loss": 0.1029, "step": 154500 }, { "epoch": 454.71, "learning_rate": 4.787874843412701e-06, "loss": 0.1021, "step": 154600 }, { "epoch": 455.0, "learning_rate": 4.782626192019848e-06, "loss": 0.1064, "step": 154700 }, { "epoch": 455.29, "learning_rate": 4.77737778060119e-06, "loss": 0.106, "step": 154800 }, { "epoch": 455.59, "learning_rate": 4.7721296149508145e-06, "loss": 0.1033, "step": 154900 }, { "epoch": 455.88, "learning_rate": 4.766881700862543e-06, "loss": 0.0996, "step": 155000 }, { "epoch": 455.88, "eval_cer": 0.0717928599450765, "eval_loss": 0.5203773975372314, "eval_runtime": 4.9467, "eval_samples_per_second": 72.574, "eval_steps_per_second": 2.426, "eval_wer": 0.26777365790746416, "step": 155000 }, { "epoch": 456.18, "learning_rate": 4.7616340441299125e-06, "loss": 0.0956, "step": 155100 }, { "epoch": 456.47, "learning_rate": 4.75638665054618e-06, "loss": 0.1047, "step": 155200 }, { "epoch": 456.76, "learning_rate": 4.751139525904315e-06, "loss": 0.1088, "step": 155300 }, { "epoch": 457.06, "learning_rate": 4.745892675996981e-06, "loss": 0.1061, "step": 155400 }, { "epoch": 457.35, "learning_rate": 4.740646106616548e-06, "loss": 0.0984, "step": 155500 }, { "epoch": 457.65, "learning_rate": 4.7353998235550695e-06, "loss": 0.0978, "step": 155600 }, { "epoch": 457.94, "learning_rate": 4.7301538326042854e-06, "loss": 0.1028, "step": 155700 }, { "epoch": 458.24, "learning_rate": 4.724908139555617e-06, "loss": 0.1034, "step": 155800 }, { "epoch": 458.53, "learning_rate": 4.719662750200145e-06, "loss": 0.0987, "step": 155900 }, { "epoch": 458.82, "learning_rate": 4.714522568855664e-06, "loss": 0.1012, "step": 156000 }, { "epoch": 458.82, "eval_cer": 0.07161849962948433, "eval_loss": 0.5153563618659973, "eval_runtime": 5.0809, "eval_samples_per_second": 70.657, "eval_steps_per_second": 2.362, "eval_wer": 0.26954699339029503, "step": 156000 }, { "epoch": 459.12, "learning_rate": 4.709277797896285e-06, "loss": 0.0998, "step": 156100 }, { "epoch": 459.41, "learning_rate": 4.704033347885536e-06, "loss": 0.0976, "step": 156200 }, { "epoch": 459.71, "learning_rate": 4.698789224613135e-06, "loss": 0.103, "step": 156300 }, { "epoch": 460.0, "learning_rate": 4.6935454338684375e-06, "loss": 0.1093, "step": 156400 }, { "epoch": 460.29, "learning_rate": 4.68830198144043e-06, "loss": 0.1001, "step": 156500 }, { "epoch": 460.59, "learning_rate": 4.683058873117732e-06, "loss": 0.098, "step": 156600 }, { "epoch": 460.88, "learning_rate": 4.677816114688576e-06, "loss": 0.0984, "step": 156700 }, { "epoch": 461.18, "learning_rate": 4.672573711940808e-06, "loss": 0.0993, "step": 156800 }, { "epoch": 461.47, "learning_rate": 4.6673316706618886e-06, "loss": 0.1009, "step": 156900 }, { "epoch": 461.76, "learning_rate": 4.662089996638871e-06, "loss": 0.1033, "step": 157000 }, { "epoch": 461.76, "eval_cer": 0.07192363018177063, "eval_loss": 0.5216103792190552, "eval_runtime": 4.9964, "eval_samples_per_second": 71.851, "eval_steps_per_second": 2.402, "eval_wer": 0.269708205706916, "step": 157000 }, { "epoch": 462.06, "learning_rate": 4.656848695658411e-06, "loss": 0.1007, "step": 157100 }, { "epoch": 462.35, "learning_rate": 4.651607773506746e-06, "loss": 0.0969, "step": 157200 }, { "epoch": 462.65, "learning_rate": 4.646367235969696e-06, "loss": 0.0991, "step": 157300 }, { "epoch": 462.94, "learning_rate": 4.641127088832661e-06, "loss": 0.0989, "step": 157400 }, { "epoch": 463.24, "learning_rate": 4.635887337880604e-06, "loss": 0.1087, "step": 157500 }, { "epoch": 463.53, "learning_rate": 4.630647988898058e-06, "loss": 0.0969, "step": 157600 }, { "epoch": 463.82, "learning_rate": 4.625409047669106e-06, "loss": 0.1004, "step": 157700 }, { "epoch": 464.12, "learning_rate": 4.620170519977379e-06, "loss": 0.0976, "step": 157800 }, { "epoch": 464.41, "learning_rate": 4.614932411606059e-06, "loss": 0.0994, "step": 157900 }, { "epoch": 464.71, "learning_rate": 4.6096947283378616e-06, "loss": 0.1053, "step": 158000 }, { "epoch": 464.71, "eval_cer": 0.07188004010287259, "eval_loss": 0.516394317150116, "eval_runtime": 4.9144, "eval_samples_per_second": 73.051, "eval_steps_per_second": 2.442, "eval_wer": 0.270030630340158, "step": 158000 }, { "epoch": 465.0, "learning_rate": 4.60445747595503e-06, "loss": 0.1061, "step": 158100 }, { "epoch": 465.29, "learning_rate": 4.599273026216009e-06, "loss": 0.1009, "step": 158200 }, { "epoch": 465.59, "learning_rate": 4.594036648495641e-06, "loss": 0.0989, "step": 158300 }, { "epoch": 465.88, "learning_rate": 4.5888007189466934e-06, "loss": 0.0972, "step": 158400 }, { "epoch": 466.18, "learning_rate": 4.583565243349476e-06, "loss": 0.0979, "step": 158500 }, { "epoch": 466.47, "learning_rate": 4.578330227483797e-06, "loss": 0.1039, "step": 158600 }, { "epoch": 466.76, "learning_rate": 4.573095677128959e-06, "loss": 0.1023, "step": 158700 }, { "epoch": 467.06, "learning_rate": 4.567861598063745e-06, "loss": 0.1064, "step": 158800 }, { "epoch": 467.35, "learning_rate": 4.562627996066427e-06, "loss": 0.0988, "step": 158900 }, { "epoch": 467.65, "learning_rate": 4.557394876914746e-06, "loss": 0.0974, "step": 159000 }, { "epoch": 467.65, "eval_cer": 0.07196722026066867, "eval_loss": 0.5301560163497925, "eval_runtime": 4.5122, "eval_samples_per_second": 79.561, "eval_steps_per_second": 2.659, "eval_wer": 0.26793487022408513, "step": 159000 }, { "epoch": 467.94, "learning_rate": 4.552162246385904e-06, "loss": 0.0982, "step": 159100 }, { "epoch": 468.24, "learning_rate": 4.546930110256574e-06, "loss": 0.1025, "step": 159200 }, { "epoch": 468.53, "learning_rate": 4.541698474302873e-06, "loss": 0.1005, "step": 159300 }, { "epoch": 468.82, "learning_rate": 4.5364673443003755e-06, "loss": 0.1037, "step": 159400 }, { "epoch": 469.12, "learning_rate": 4.531236726024092e-06, "loss": 0.1026, "step": 159500 }, { "epoch": 469.41, "learning_rate": 4.526006625248465e-06, "loss": 0.1028, "step": 159600 }, { "epoch": 469.71, "learning_rate": 4.520777047747376e-06, "loss": 0.0948, "step": 159700 }, { "epoch": 470.0, "learning_rate": 4.515547999294117e-06, "loss": 0.0978, "step": 159800 }, { "epoch": 470.29, "learning_rate": 4.510319485661405e-06, "loss": 0.094, "step": 159900 }, { "epoch": 470.59, "learning_rate": 4.5050915126213605e-06, "loss": 0.1016, "step": 160000 }, { "epoch": 470.59, "eval_cer": 0.07192363018177063, "eval_loss": 0.5172093510627747, "eval_runtime": 4.8089, "eval_samples_per_second": 74.653, "eval_steps_per_second": 2.495, "eval_wer": 0.26906335644043206, "step": 160000 }, { "epoch": 470.88, "learning_rate": 4.49986408594551e-06, "loss": 0.0979, "step": 160100 }, { "epoch": 471.18, "learning_rate": 4.494637211404779e-06, "loss": 0.0997, "step": 160200 }, { "epoch": 471.47, "learning_rate": 4.489410894769476e-06, "loss": 0.0984, "step": 160300 }, { "epoch": 471.76, "learning_rate": 4.484185141809304e-06, "loss": 0.0979, "step": 160400 }, { "epoch": 472.06, "learning_rate": 4.478959958293334e-06, "loss": 0.096, "step": 160500 }, { "epoch": 472.35, "learning_rate": 4.473735349990016e-06, "loss": 0.095, "step": 160600 }, { "epoch": 472.65, "learning_rate": 4.4685113226671594e-06, "loss": 0.0991, "step": 160700 }, { "epoch": 472.94, "learning_rate": 4.4632878820919336e-06, "loss": 0.1013, "step": 160800 }, { "epoch": 473.24, "learning_rate": 4.458065034030865e-06, "loss": 0.0981, "step": 160900 }, { "epoch": 473.53, "learning_rate": 4.452842784249817e-06, "loss": 0.0947, "step": 161000 }, { "epoch": 473.53, "eval_cer": 0.07266466152303735, "eval_loss": 0.5281272530555725, "eval_runtime": 5.2217, "eval_samples_per_second": 68.751, "eval_steps_per_second": 2.298, "eval_wer": 0.27196517813960985, "step": 161000 }, { "epoch": 473.82, "learning_rate": 4.447621138514001e-06, "loss": 0.102, "step": 161100 }, { "epoch": 474.12, "learning_rate": 4.4424001025879575e-06, "loss": 0.1006, "step": 161200 }, { "epoch": 474.41, "learning_rate": 4.437179682235552e-06, "loss": 0.0982, "step": 161300 }, { "epoch": 474.71, "learning_rate": 4.4319598832199765e-06, "loss": 0.1011, "step": 161400 }, { "epoch": 475.0, "learning_rate": 4.426740711303728e-06, "loss": 0.0995, "step": 161500 }, { "epoch": 475.29, "learning_rate": 4.4215221722486214e-06, "loss": 0.0995, "step": 161600 }, { "epoch": 475.59, "learning_rate": 4.416304271815767e-06, "loss": 0.0993, "step": 161700 }, { "epoch": 475.88, "learning_rate": 4.411087015765568e-06, "loss": 0.0985, "step": 161800 }, { "epoch": 476.18, "learning_rate": 4.4058704098577235e-06, "loss": 0.0943, "step": 161900 }, { "epoch": 476.47, "learning_rate": 4.400654459851207e-06, "loss": 0.101, "step": 162000 }, { "epoch": 476.47, "eval_cer": 0.07222876073405693, "eval_loss": 0.5367242693901062, "eval_runtime": 5.1506, "eval_samples_per_second": 69.7, "eval_steps_per_second": 2.33, "eval_wer": 0.2709979042398839, "step": 162000 }, { "epoch": 476.76, "learning_rate": 4.395439171504275e-06, "loss": 0.0996, "step": 162100 }, { "epoch": 477.06, "learning_rate": 4.390224550574449e-06, "loss": 0.0986, "step": 162200 }, { "epoch": 477.35, "learning_rate": 4.385010602818511e-06, "loss": 0.0921, "step": 162300 }, { "epoch": 477.65, "learning_rate": 4.37979733399251e-06, "loss": 0.1047, "step": 162400 }, { "epoch": 477.94, "learning_rate": 4.374584749851735e-06, "loss": 0.1039, "step": 162500 }, { "epoch": 478.24, "learning_rate": 4.369372856150725e-06, "loss": 0.1004, "step": 162600 }, { "epoch": 478.53, "learning_rate": 4.364161658643255e-06, "loss": 0.0994, "step": 162700 }, { "epoch": 478.82, "learning_rate": 4.358951163082328e-06, "loss": 0.0951, "step": 162800 }, { "epoch": 479.12, "learning_rate": 4.353741375220182e-06, "loss": 0.0997, "step": 162900 }, { "epoch": 479.41, "learning_rate": 4.348532300808261e-06, "loss": 0.0984, "step": 163000 }, { "epoch": 479.41, "eval_cer": 0.07227235081295497, "eval_loss": 0.5390114784240723, "eval_runtime": 5.3346, "eval_samples_per_second": 67.297, "eval_steps_per_second": 2.249, "eval_wer": 0.2718039658229889, "step": 163000 }, { "epoch": 479.71, "learning_rate": 4.343323945597232e-06, "loss": 0.0976, "step": 163100 }, { "epoch": 480.0, "learning_rate": 4.338116315336962e-06, "loss": 0.0963, "step": 163200 }, { "epoch": 480.29, "learning_rate": 4.332961481136282e-06, "loss": 0.0989, "step": 163300 }, { "epoch": 480.59, "learning_rate": 4.3277553106309965e-06, "loss": 0.097, "step": 163400 }, { "epoch": 480.88, "learning_rate": 4.322549882263777e-06, "loss": 0.0983, "step": 163500 }, { "epoch": 481.18, "learning_rate": 4.317345201781263e-06, "loss": 0.0927, "step": 163600 }, { "epoch": 481.47, "learning_rate": 4.312141274929265e-06, "loss": 0.0952, "step": 163700 }, { "epoch": 481.76, "learning_rate": 4.306938107452762e-06, "loss": 0.0965, "step": 163800 }, { "epoch": 482.06, "learning_rate": 4.3017357050958994e-06, "loss": 0.1033, "step": 163900 }, { "epoch": 482.35, "learning_rate": 4.296534073601972e-06, "loss": 0.0995, "step": 164000 }, { "epoch": 482.35, "eval_cer": 0.07100823852491173, "eval_loss": 0.5308058261871338, "eval_runtime": 4.9229, "eval_samples_per_second": 72.925, "eval_steps_per_second": 2.438, "eval_wer": 0.2672900209576012, "step": 164000 }, { "epoch": 482.65, "learning_rate": 4.291333218713423e-06, "loss": 0.0936, "step": 164100 }, { "epoch": 482.94, "learning_rate": 4.286133146171844e-06, "loss": 0.0969, "step": 164200 }, { "epoch": 483.24, "learning_rate": 4.2809338617179585e-06, "loss": 0.0991, "step": 164300 }, { "epoch": 483.53, "learning_rate": 4.275735371091624e-06, "loss": 0.0983, "step": 164400 }, { "epoch": 483.82, "learning_rate": 4.270537680031817e-06, "loss": 0.0979, "step": 164500 }, { "epoch": 484.12, "learning_rate": 4.26534079427663e-06, "loss": 0.1016, "step": 164600 }, { "epoch": 484.41, "learning_rate": 4.260144719563275e-06, "loss": 0.099, "step": 164700 }, { "epoch": 484.71, "learning_rate": 4.25494946162806e-06, "loss": 0.1006, "step": 164800 }, { "epoch": 485.0, "learning_rate": 4.249755026206398e-06, "loss": 0.0931, "step": 164900 }, { "epoch": 485.29, "learning_rate": 4.244561419032788e-06, "loss": 0.0954, "step": 165000 }, { "epoch": 485.29, "eval_cer": 0.07174926986617845, "eval_loss": 0.5440545678138733, "eval_runtime": 5.088, "eval_samples_per_second": 70.558, "eval_steps_per_second": 2.358, "eval_wer": 0.2666451716911172, "step": 165000 }, { "epoch": 485.59, "learning_rate": 4.239368645840816e-06, "loss": 0.1025, "step": 165100 }, { "epoch": 485.88, "learning_rate": 4.234176712363151e-06, "loss": 0.1006, "step": 165200 }, { "epoch": 486.18, "learning_rate": 4.228985624331532e-06, "loss": 0.1006, "step": 165300 }, { "epoch": 486.47, "learning_rate": 4.223795387476766e-06, "loss": 0.1019, "step": 165400 }, { "epoch": 486.76, "learning_rate": 4.218606007528718e-06, "loss": 0.1005, "step": 165500 }, { "epoch": 487.06, "learning_rate": 4.213417490216308e-06, "loss": 0.0988, "step": 165600 }, { "epoch": 487.35, "learning_rate": 4.208229841267508e-06, "loss": 0.1007, "step": 165700 }, { "epoch": 487.65, "learning_rate": 4.203043066409322e-06, "loss": 0.0926, "step": 165800 }, { "epoch": 487.94, "learning_rate": 4.197857171367799e-06, "loss": 0.0971, "step": 165900 }, { "epoch": 488.24, "learning_rate": 4.192672161868012e-06, "loss": 0.0983, "step": 166000 }, { "epoch": 488.24, "eval_cer": 0.07231594089185302, "eval_loss": 0.5344653725624084, "eval_runtime": 5.4383, "eval_samples_per_second": 66.014, "eval_steps_per_second": 2.207, "eval_wer": 0.270514267290021, "step": 166000 }, { "epoch": 488.53, "learning_rate": 4.187488043634053e-06, "loss": 0.0942, "step": 166100 }, { "epoch": 488.82, "learning_rate": 4.1823048223890385e-06, "loss": 0.1031, "step": 166200 }, { "epoch": 489.12, "learning_rate": 4.177122503855086e-06, "loss": 0.0953, "step": 166300 }, { "epoch": 489.41, "learning_rate": 4.171941093753323e-06, "loss": 0.0953, "step": 166400 }, { "epoch": 489.71, "learning_rate": 4.166760597803871e-06, "loss": 0.0945, "step": 166500 }, { "epoch": 490.0, "learning_rate": 4.161581021725842e-06, "loss": 0.0958, "step": 166600 }, { "epoch": 490.29, "learning_rate": 4.156402371237335e-06, "loss": 0.0953, "step": 166700 }, { "epoch": 490.59, "learning_rate": 4.1512246520554224e-06, "loss": 0.0997, "step": 166800 }, { "epoch": 490.88, "learning_rate": 4.146047869896156e-06, "loss": 0.0972, "step": 166900 }, { "epoch": 491.18, "learning_rate": 4.140872030474547e-06, "loss": 0.103, "step": 167000 }, { "epoch": 491.18, "eval_cer": 0.07231594089185302, "eval_loss": 0.5379437208175659, "eval_runtime": 4.8891, "eval_samples_per_second": 73.428, "eval_steps_per_second": 2.454, "eval_wer": 0.2713203288731259, "step": 167000 }, { "epoch": 491.47, "learning_rate": 4.135697139504564e-06, "loss": 0.0962, "step": 167100 }, { "epoch": 491.76, "learning_rate": 4.130523202699138e-06, "loss": 0.0972, "step": 167200 }, { "epoch": 492.06, "learning_rate": 4.1253502257701364e-06, "loss": 0.1022, "step": 167300 }, { "epoch": 492.35, "learning_rate": 4.120178214428373e-06, "loss": 0.0895, "step": 167400 }, { "epoch": 492.65, "learning_rate": 4.115058879957378e-06, "loss": 0.0959, "step": 167500 }, { "epoch": 492.94, "learning_rate": 4.109888807119945e-06, "loss": 0.0977, "step": 167600 }, { "epoch": 493.24, "learning_rate": 4.104719716938696e-06, "loss": 0.0994, "step": 167700 }, { "epoch": 493.53, "learning_rate": 4.099551615120152e-06, "loss": 0.0979, "step": 167800 }, { "epoch": 493.82, "learning_rate": 4.094384507369739e-06, "loss": 0.0988, "step": 167900 }, { "epoch": 494.12, "learning_rate": 4.089218399391795e-06, "loss": 0.0948, "step": 168000 }, { "epoch": 494.12, "eval_cer": 0.07131336907719803, "eval_loss": 0.5431644320487976, "eval_runtime": 4.7451, "eval_samples_per_second": 75.657, "eval_steps_per_second": 2.529, "eval_wer": 0.2653554731581493, "step": 168000 }, { "epoch": 494.41, "learning_rate": 4.084104942918741e-06, "loss": 0.0947, "step": 168100 }, { "epoch": 494.71, "learning_rate": 4.0789408414543055e-06, "loss": 0.0927, "step": 168200 }, { "epoch": 495.0, "learning_rate": 4.073777756811685e-06, "loss": 0.0954, "step": 168300 }, { "epoch": 495.29, "learning_rate": 4.068615694690766e-06, "loss": 0.0966, "step": 168400 }, { "epoch": 495.59, "learning_rate": 4.063454660790316e-06, "loss": 0.0959, "step": 168500 }, { "epoch": 495.88, "learning_rate": 4.05829466080796e-06, "loss": 0.0946, "step": 168600 }, { "epoch": 496.18, "learning_rate": 4.053135700440182e-06, "loss": 0.0995, "step": 168700 }, { "epoch": 496.47, "learning_rate": 4.047977785382323e-06, "loss": 0.0941, "step": 168800 }, { "epoch": 496.76, "learning_rate": 4.042820921328565e-06, "loss": 0.0924, "step": 168900 }, { "epoch": 497.06, "learning_rate": 4.037716666796161e-06, "loss": 0.0916, "step": 169000 }, { "epoch": 497.06, "eval_cer": 0.07183645002397454, "eval_loss": 0.5349707007408142, "eval_runtime": 5.3743, "eval_samples_per_second": 66.799, "eval_steps_per_second": 2.233, "eval_wer": 0.269708205706916, "step": 169000 }, { "epoch": 497.35, "learning_rate": 4.0325619111764545e-06, "loss": 0.0976, "step": 169100 }, { "epoch": 497.65, "learning_rate": 4.0274082235795125e-06, "loss": 0.0961, "step": 169200 }, { "epoch": 497.94, "learning_rate": 4.022255609694858e-06, "loss": 0.0924, "step": 169300 }, { "epoch": 498.24, "learning_rate": 4.017104075210819e-06, "loss": 0.0984, "step": 169400 }, { "epoch": 498.53, "learning_rate": 4.011953625814535e-06, "loss": 0.0939, "step": 169500 }, { "epoch": 498.82, "learning_rate": 4.006804267191951e-06, "loss": 0.1, "step": 169600 }, { "epoch": 499.12, "learning_rate": 4.001656005027803e-06, "loss": 0.0974, "step": 169700 }, { "epoch": 499.41, "learning_rate": 3.996508845005622e-06, "loss": 0.0932, "step": 169800 }, { "epoch": 499.71, "learning_rate": 3.991362792807717e-06, "loss": 0.0986, "step": 169900 }, { "epoch": 500.0, "learning_rate": 3.986217854115173e-06, "loss": 0.0955, "step": 170000 }, { "epoch": 500.0, "eval_cer": 0.07157490955058629, "eval_loss": 0.5349684953689575, "eval_runtime": 4.8795, "eval_samples_per_second": 73.573, "eval_steps_per_second": 2.459, "eval_wer": 0.27083669192326293, "step": 170000 }, { "epoch": 500.29, "learning_rate": 3.981074034607853e-06, "loss": 0.0901, "step": 170100 }, { "epoch": 500.59, "learning_rate": 3.97593133996438e-06, "loss": 0.0926, "step": 170200 }, { "epoch": 500.88, "learning_rate": 3.970789775862133e-06, "loss": 0.1036, "step": 170300 }, { "epoch": 501.18, "learning_rate": 3.9656493479772475e-06, "loss": 0.0972, "step": 170400 }, { "epoch": 501.47, "learning_rate": 3.960510061984599e-06, "loss": 0.0938, "step": 170500 }, { "epoch": 501.76, "learning_rate": 3.95537192355781e-06, "loss": 0.0953, "step": 170600 }, { "epoch": 502.06, "learning_rate": 3.950234938369229e-06, "loss": 0.097, "step": 170700 }, { "epoch": 502.35, "learning_rate": 3.9450991120899345e-06, "loss": 0.0993, "step": 170800 }, { "epoch": 502.65, "learning_rate": 3.939964450389728e-06, "loss": 0.0974, "step": 170900 }, { "epoch": 502.94, "learning_rate": 3.934830958937119e-06, "loss": 0.1022, "step": 171000 }, { "epoch": 502.94, "eval_cer": 0.07083387820931956, "eval_loss": 0.5352509021759033, "eval_runtime": 5.2076, "eval_samples_per_second": 68.938, "eval_steps_per_second": 2.304, "eval_wer": 0.2653554731581493, "step": 171000 }, { "epoch": 503.24, "learning_rate": 3.929698643399334e-06, "loss": 0.0976, "step": 171100 }, { "epoch": 503.53, "learning_rate": 3.924567509442289e-06, "loss": 0.0972, "step": 171200 }, { "epoch": 503.82, "learning_rate": 3.919437562730608e-06, "loss": 0.0917, "step": 171300 }, { "epoch": 504.12, "learning_rate": 3.914308808927598e-06, "loss": 0.0919, "step": 171400 }, { "epoch": 504.41, "learning_rate": 3.909181253695248e-06, "loss": 0.0967, "step": 171500 }, { "epoch": 504.71, "learning_rate": 3.9040549026942304e-06, "loss": 0.0962, "step": 171600 }, { "epoch": 505.0, "learning_rate": 3.8989297615838775e-06, "loss": 0.1009, "step": 171700 }, { "epoch": 505.29, "learning_rate": 3.893805836022198e-06, "loss": 0.0947, "step": 171800 }, { "epoch": 505.59, "learning_rate": 3.888683131665849e-06, "loss": 0.0963, "step": 171900 }, { "epoch": 505.88, "learning_rate": 3.883561654170144e-06, "loss": 0.0928, "step": 172000 }, { "epoch": 505.88, "eval_cer": 0.07166208970838238, "eval_loss": 0.5374095439910889, "eval_runtime": 4.9233, "eval_samples_per_second": 72.919, "eval_steps_per_second": 2.437, "eval_wer": 0.2653554731581493, "step": 172000 }, { "epoch": 506.18, "learning_rate": 3.878441409189042e-06, "loss": 0.0975, "step": 172100 }, { "epoch": 506.47, "learning_rate": 3.8733224023751394e-06, "loss": 0.0945, "step": 172200 }, { "epoch": 506.76, "learning_rate": 3.868204639379668e-06, "loss": 0.096, "step": 172300 }, { "epoch": 507.06, "learning_rate": 3.863088125852486e-06, "loss": 0.0946, "step": 172400 }, { "epoch": 507.35, "learning_rate": 3.857972867442068e-06, "loss": 0.0915, "step": 172500 }, { "epoch": 507.65, "learning_rate": 3.852858869795512e-06, "loss": 0.0966, "step": 172600 }, { "epoch": 507.94, "learning_rate": 3.847746138558514e-06, "loss": 0.0907, "step": 172700 }, { "epoch": 508.24, "learning_rate": 3.842634679375379e-06, "loss": 0.0976, "step": 172800 }, { "epoch": 508.53, "learning_rate": 3.837524497889005e-06, "loss": 0.1, "step": 172900 }, { "epoch": 508.82, "learning_rate": 3.832415599740879e-06, "loss": 0.0965, "step": 173000 }, { "epoch": 508.82, "eval_cer": 0.07144413931389215, "eval_loss": 0.5368661880493164, "eval_runtime": 5.3628, "eval_samples_per_second": 66.942, "eval_steps_per_second": 2.238, "eval_wer": 0.2682572948573271, "step": 173000 }, { "epoch": 509.12, "learning_rate": 3.827307990571073e-06, "loss": 0.09, "step": 173100 }, { "epoch": 509.41, "learning_rate": 3.822201676018233e-06, "loss": 0.103, "step": 173200 }, { "epoch": 509.71, "learning_rate": 3.817096661719582e-06, "loss": 0.0981, "step": 173300 }, { "epoch": 510.0, "learning_rate": 3.8119929533108995e-06, "loss": 0.0987, "step": 173400 }, { "epoch": 510.29, "learning_rate": 3.806890556426529e-06, "loss": 0.0963, "step": 173500 }, { "epoch": 510.59, "learning_rate": 3.801789476699365e-06, "loss": 0.0938, "step": 173600 }, { "epoch": 510.88, "learning_rate": 3.7966897197608445e-06, "loss": 0.0927, "step": 173700 }, { "epoch": 511.18, "learning_rate": 3.7915912912409496e-06, "loss": 0.095, "step": 173800 }, { "epoch": 511.47, "learning_rate": 3.7864941967681905e-06, "loss": 0.0991, "step": 173900 }, { "epoch": 511.76, "learning_rate": 3.7813984419696097e-06, "loss": 0.0903, "step": 174000 }, { "epoch": 511.76, "eval_cer": 0.07201081033956672, "eval_loss": 0.5484318137168884, "eval_runtime": 4.907, "eval_samples_per_second": 73.161, "eval_steps_per_second": 2.445, "eval_wer": 0.270514267290021, "step": 174000 }, { "epoch": 512.06, "learning_rate": 3.776304032470769e-06, "loss": 0.0956, "step": 174100 }, { "epoch": 512.35, "learning_rate": 3.771210973895741e-06, "loss": 0.089, "step": 174200 }, { "epoch": 512.65, "learning_rate": 3.7661701821540377e-06, "loss": 0.0915, "step": 174300 }, { "epoch": 512.94, "learning_rate": 3.7610798286434015e-06, "loss": 0.0941, "step": 174400 }, { "epoch": 513.24, "learning_rate": 3.755990842863646e-06, "loss": 0.0977, "step": 174500 }, { "epoch": 513.53, "learning_rate": 3.750903230432862e-06, "loss": 0.0973, "step": 174600 }, { "epoch": 513.82, "learning_rate": 3.7458169969676174e-06, "loss": 0.0957, "step": 174700 }, { "epoch": 514.12, "learning_rate": 3.740732148082967e-06, "loss": 0.0926, "step": 174800 }, { "epoch": 514.41, "learning_rate": 3.735648689392428e-06, "loss": 0.095, "step": 174900 }, { "epoch": 514.71, "learning_rate": 3.7305666265079883e-06, "loss": 0.0947, "step": 175000 }, { "epoch": 514.71, "eval_cer": 0.07153131947168824, "eval_loss": 0.5374939441680908, "eval_runtime": 5.2741, "eval_samples_per_second": 68.069, "eval_steps_per_second": 2.275, "eval_wer": 0.26712880864098015, "step": 175000 }, { "epoch": 515.0, "learning_rate": 3.7254859650400955e-06, "loss": 0.0919, "step": 175100 }, { "epoch": 515.29, "learning_rate": 3.720406710597645e-06, "loss": 0.0903, "step": 175200 }, { "epoch": 515.59, "learning_rate": 3.7153288687879858e-06, "loss": 0.0929, "step": 175300 }, { "epoch": 515.88, "learning_rate": 3.7102524452169e-06, "loss": 0.0922, "step": 175400 }, { "epoch": 516.18, "learning_rate": 3.705177445488609e-06, "loss": 0.0971, "step": 175500 }, { "epoch": 516.47, "learning_rate": 3.7001038752057626e-06, "loss": 0.093, "step": 175600 }, { "epoch": 516.76, "learning_rate": 3.695031739969428e-06, "loss": 0.0887, "step": 175700 }, { "epoch": 517.06, "learning_rate": 3.6899610453790945e-06, "loss": 0.0924, "step": 175800 }, { "epoch": 517.35, "learning_rate": 3.6848917970326547e-06, "loss": 0.0946, "step": 175900 }, { "epoch": 517.65, "learning_rate": 3.679824000526408e-06, "loss": 0.1018, "step": 176000 }, { "epoch": 517.65, "eval_cer": 0.07109541868270781, "eval_loss": 0.5277024507522583, "eval_runtime": 5.1447, "eval_samples_per_second": 69.78, "eval_steps_per_second": 2.332, "eval_wer": 0.2672900209576012, "step": 176000 }, { "epoch": 517.94, "learning_rate": 3.674757661455051e-06, "loss": 0.0893, "step": 176100 }, { "epoch": 518.24, "learning_rate": 3.66969278541167e-06, "loss": 0.0914, "step": 176200 }, { "epoch": 518.53, "learning_rate": 3.664629377987739e-06, "loss": 0.0916, "step": 176300 }, { "epoch": 518.82, "learning_rate": 3.659567444773108e-06, "loss": 0.0939, "step": 176400 }, { "epoch": 519.12, "learning_rate": 3.654506991355996e-06, "loss": 0.0963, "step": 176500 }, { "epoch": 519.41, "learning_rate": 3.6494480233229978e-06, "loss": 0.0929, "step": 176600 }, { "epoch": 519.71, "learning_rate": 3.64439054625906e-06, "loss": 0.0916, "step": 176700 }, { "epoch": 520.0, "learning_rate": 3.6393851181263416e-06, "loss": 0.0896, "step": 176800 }, { "epoch": 520.29, "learning_rate": 3.6343306246998226e-06, "loss": 0.0928, "step": 176900 }, { "epoch": 520.59, "learning_rate": 3.629277638931521e-06, "loss": 0.0889, "step": 177000 }, { "epoch": 520.59, "eval_cer": 0.07070310797262543, "eval_loss": 0.5390043258666992, "eval_runtime": 4.8192, "eval_samples_per_second": 74.493, "eval_steps_per_second": 2.49, "eval_wer": 0.2653554731581493, "step": 177000 }, { "epoch": 520.88, "learning_rate": 3.6242261663997854e-06, "loss": 0.0883, "step": 177100 }, { "epoch": 521.18, "learning_rate": 3.6191762126812878e-06, "loss": 0.096, "step": 177200 }, { "epoch": 521.47, "learning_rate": 3.6141277833510248e-06, "loss": 0.0906, "step": 177300 }, { "epoch": 521.76, "learning_rate": 3.609080883982315e-06, "loss": 0.0884, "step": 177400 }, { "epoch": 522.06, "learning_rate": 3.6040355201467834e-06, "loss": 0.0902, "step": 177500 }, { "epoch": 522.35, "learning_rate": 3.598991697414361e-06, "loss": 0.092, "step": 177600 }, { "epoch": 522.65, "learning_rate": 3.5939494213532784e-06, "loss": 0.0931, "step": 177700 }, { "epoch": 522.94, "learning_rate": 3.5889086975300547e-06, "loss": 0.0945, "step": 177800 }, { "epoch": 523.24, "learning_rate": 3.583869531509503e-06, "loss": 0.0915, "step": 177900 }, { "epoch": 523.53, "learning_rate": 3.578831928854708e-06, "loss": 0.091, "step": 178000 }, { "epoch": 523.53, "eval_cer": 0.0720979904973628, "eval_loss": 0.5432314276695251, "eval_runtime": 5.2897, "eval_samples_per_second": 67.868, "eval_steps_per_second": 2.269, "eval_wer": 0.2685797194905691, "step": 178000 }, { "epoch": 523.82, "learning_rate": 3.573795895127036e-06, "loss": 0.0902, "step": 178100 }, { "epoch": 524.12, "learning_rate": 3.568811772666565e-06, "loss": 0.0872, "step": 178200 }, { "epoch": 524.41, "learning_rate": 3.5637788776423364e-06, "loss": 0.0873, "step": 178300 }, { "epoch": 524.71, "learning_rate": 3.55874756816335e-06, "loss": 0.0884, "step": 178400 }, { "epoch": 525.0, "learning_rate": 3.5537178497840207e-06, "loss": 0.0956, "step": 178500 }, { "epoch": 525.29, "learning_rate": 3.5486897280570045e-06, "loss": 0.0907, "step": 178600 }, { "epoch": 525.59, "learning_rate": 3.5436632085332013e-06, "loss": 0.0923, "step": 178700 }, { "epoch": 525.88, "learning_rate": 3.538638296761735e-06, "loss": 0.0912, "step": 178800 }, { "epoch": 526.18, "learning_rate": 3.533614998289961e-06, "loss": 0.0942, "step": 178900 }, { "epoch": 526.47, "learning_rate": 3.5285933186634514e-06, "loss": 0.095, "step": 179000 }, { "epoch": 526.47, "eval_cer": 0.0705723377359313, "eval_loss": 0.5412935018539429, "eval_runtime": 4.9199, "eval_samples_per_second": 72.97, "eval_steps_per_second": 2.439, "eval_wer": 0.26068031597614055, "step": 179000 }, { "epoch": 526.76, "learning_rate": 3.5235732634259866e-06, "loss": 0.0962, "step": 179100 }, { "epoch": 527.06, "learning_rate": 3.518554838119562e-06, "loss": 0.0937, "step": 179200 }, { "epoch": 527.35, "learning_rate": 3.513538048284366e-06, "loss": 0.0938, "step": 179300 }, { "epoch": 527.65, "learning_rate": 3.5085228994587883e-06, "loss": 0.0929, "step": 179400 }, { "epoch": 527.94, "learning_rate": 3.5035093971794004e-06, "loss": 0.092, "step": 179500 }, { "epoch": 528.24, "learning_rate": 3.498497546980959e-06, "loss": 0.0938, "step": 179600 }, { "epoch": 528.53, "learning_rate": 3.493487354396401e-06, "loss": 0.0941, "step": 179700 }, { "epoch": 528.82, "learning_rate": 3.4884788249568245e-06, "loss": 0.0949, "step": 179800 }, { "epoch": 529.12, "learning_rate": 3.4834719641915003e-06, "loss": 0.0889, "step": 179900 }, { "epoch": 529.41, "learning_rate": 3.478466777627851e-06, "loss": 0.0941, "step": 180000 }, { "epoch": 529.41, "eval_cer": 0.07161849962948433, "eval_loss": 0.5512475371360779, "eval_runtime": 5.4027, "eval_samples_per_second": 66.448, "eval_steps_per_second": 2.221, "eval_wer": 0.2682572948573271, "step": 180000 }, { "epoch": 529.71, "learning_rate": 3.473463270791453e-06, "loss": 0.0892, "step": 180100 }, { "epoch": 530.0, "learning_rate": 3.4684614492060307e-06, "loss": 0.0917, "step": 180200 }, { "epoch": 530.29, "learning_rate": 3.463511311314118e-06, "loss": 0.0914, "step": 180300 }, { "epoch": 530.59, "learning_rate": 3.4585128598041152e-06, "loss": 0.0944, "step": 180400 }, { "epoch": 530.88, "learning_rate": 3.4535161100498956e-06, "loss": 0.0882, "step": 180500 }, { "epoch": 531.18, "learning_rate": 3.4485210675677183e-06, "loss": 0.0977, "step": 180600 }, { "epoch": 531.47, "learning_rate": 3.4435277378719652e-06, "loss": 0.0932, "step": 180700 }, { "epoch": 531.76, "learning_rate": 3.438536126475119e-06, "loss": 0.093, "step": 180800 }, { "epoch": 532.06, "learning_rate": 3.433546238887773e-06, "loss": 0.0926, "step": 180900 }, { "epoch": 532.35, "learning_rate": 3.4285580806186124e-06, "loss": 0.0911, "step": 181000 }, { "epoch": 532.35, "eval_cer": 0.07135695915609608, "eval_loss": 0.5525036454200745, "eval_runtime": 5.4419, "eval_samples_per_second": 65.969, "eval_steps_per_second": 2.205, "eval_wer": 0.27035305497339995, "step": 181000 }, { "epoch": 532.65, "learning_rate": 3.4235716571744144e-06, "loss": 0.0887, "step": 181100 }, { "epoch": 532.94, "learning_rate": 3.418586974060044e-06, "loss": 0.0947, "step": 181200 }, { "epoch": 533.24, "learning_rate": 3.413604036778442e-06, "loss": 0.0918, "step": 181300 }, { "epoch": 533.53, "learning_rate": 3.4086228508306187e-06, "loss": 0.0907, "step": 181400 }, { "epoch": 533.82, "learning_rate": 3.4036434217156587e-06, "loss": 0.0874, "step": 181500 }, { "epoch": 534.12, "learning_rate": 3.398665754930701e-06, "loss": 0.0905, "step": 181600 }, { "epoch": 534.41, "learning_rate": 3.393689855970944e-06, "loss": 0.095, "step": 181700 }, { "epoch": 534.71, "learning_rate": 3.388715730329629e-06, "loss": 0.088, "step": 181800 }, { "epoch": 535.0, "learning_rate": 3.3837433834980416e-06, "loss": 0.0935, "step": 181900 }, { "epoch": 535.29, "learning_rate": 3.3787728209655064e-06, "loss": 0.0906, "step": 182000 }, { "epoch": 535.29, "eval_cer": 0.07113900876160587, "eval_loss": 0.5467122793197632, "eval_runtime": 5.3361, "eval_samples_per_second": 67.278, "eval_steps_per_second": 2.249, "eval_wer": 0.26632274705787523, "step": 182000 }, { "epoch": 535.59, "learning_rate": 3.3738040482193736e-06, "loss": 0.0893, "step": 182100 }, { "epoch": 535.88, "learning_rate": 3.3688370707450233e-06, "loss": 0.0942, "step": 182200 }, { "epoch": 536.18, "learning_rate": 3.3638718940258498e-06, "loss": 0.0911, "step": 182300 }, { "epoch": 536.47, "learning_rate": 3.358908523543255e-06, "loss": 0.0968, "step": 182400 }, { "epoch": 536.76, "learning_rate": 3.3539469647766575e-06, "loss": 0.0864, "step": 182500 }, { "epoch": 537.06, "learning_rate": 3.3489872232034666e-06, "loss": 0.0909, "step": 182600 }, { "epoch": 537.35, "learning_rate": 3.3440293042990925e-06, "loss": 0.0878, "step": 182700 }, { "epoch": 537.65, "learning_rate": 3.339073213536926e-06, "loss": 0.0873, "step": 182800 }, { "epoch": 537.94, "learning_rate": 3.334118956388345e-06, "loss": 0.0927, "step": 182900 }, { "epoch": 538.24, "learning_rate": 3.3291665383227007e-06, "loss": 0.092, "step": 183000 }, { "epoch": 538.24, "eval_cer": 0.0717928599450765, "eval_loss": 0.5496759414672852, "eval_runtime": 4.3873, "eval_samples_per_second": 81.827, "eval_steps_per_second": 2.735, "eval_wer": 0.2684185071739481, "step": 183000 }, { "epoch": 538.53, "learning_rate": 3.3242159648073158e-06, "loss": 0.0873, "step": 183100 }, { "epoch": 538.82, "learning_rate": 3.3192672413074744e-06, "loss": 0.0883, "step": 183200 }, { "epoch": 539.12, "learning_rate": 3.3143203732864228e-06, "loss": 0.0908, "step": 183300 }, { "epoch": 539.41, "learning_rate": 3.3093753662053494e-06, "loss": 0.0873, "step": 183400 }, { "epoch": 539.71, "learning_rate": 3.304432225523402e-06, "loss": 0.0892, "step": 183500 }, { "epoch": 540.0, "learning_rate": 3.299490956697653e-06, "loss": 0.0878, "step": 183600 }, { "epoch": 540.29, "learning_rate": 3.29455156518312e-06, "loss": 0.09, "step": 183700 }, { "epoch": 540.59, "learning_rate": 3.2896140564327445e-06, "loss": 0.0868, "step": 183800 }, { "epoch": 540.88, "learning_rate": 3.2846784358973847e-06, "loss": 0.0949, "step": 183900 }, { "epoch": 541.18, "learning_rate": 3.2797447090258226e-06, "loss": 0.0885, "step": 184000 }, { "epoch": 541.18, "eval_cer": 0.07074669805152348, "eval_loss": 0.5454766154289246, "eval_runtime": 5.0489, "eval_samples_per_second": 71.104, "eval_steps_per_second": 2.377, "eval_wer": 0.26229243914235045, "step": 184000 }, { "epoch": 541.47, "learning_rate": 3.274812881264742e-06, "loss": 0.0859, "step": 184100 }, { "epoch": 541.76, "learning_rate": 3.2698829580587354e-06, "loss": 0.0914, "step": 184200 }, { "epoch": 542.06, "learning_rate": 3.264954944850292e-06, "loss": 0.0912, "step": 184300 }, { "epoch": 542.35, "learning_rate": 3.260028847079787e-06, "loss": 0.0925, "step": 184400 }, { "epoch": 542.65, "learning_rate": 3.2551046701854907e-06, "loss": 0.0923, "step": 184500 }, { "epoch": 542.94, "learning_rate": 3.250231632556272e-06, "loss": 0.0877, "step": 184600 }, { "epoch": 543.24, "learning_rate": 3.2453112943763365e-06, "loss": 0.0889, "step": 184700 }, { "epoch": 543.53, "learning_rate": 3.2403928933203477e-06, "loss": 0.0902, "step": 184800 }, { "epoch": 543.82, "learning_rate": 3.2354764348180695e-06, "loss": 0.0907, "step": 184900 }, { "epoch": 544.12, "learning_rate": 3.2305619242971294e-06, "loss": 0.0849, "step": 185000 }, { "epoch": 544.12, "eval_cer": 0.07153131947168824, "eval_loss": 0.550433337688446, "eval_runtime": 5.0702, "eval_samples_per_second": 70.805, "eval_steps_per_second": 2.367, "eval_wer": 0.2664839593744962, "step": 185000 }, { "epoch": 544.41, "learning_rate": 3.225649367182997e-06, "loss": 0.095, "step": 185100 }, { "epoch": 544.71, "learning_rate": 3.2207387688989895e-06, "loss": 0.0894, "step": 185200 }, { "epoch": 545.0, "learning_rate": 3.2158301348662623e-06, "loss": 0.0883, "step": 185300 }, { "epoch": 545.29, "learning_rate": 3.210923470503799e-06, "loss": 0.0947, "step": 185400 }, { "epoch": 545.59, "learning_rate": 3.2060187812284127e-06, "loss": 0.088, "step": 185500 }, { "epoch": 545.88, "learning_rate": 3.2011160724547318e-06, "loss": 0.0869, "step": 185600 }, { "epoch": 546.18, "learning_rate": 3.1962153495951995e-06, "loss": 0.0904, "step": 185700 }, { "epoch": 546.47, "learning_rate": 3.1913166180600718e-06, "loss": 0.0917, "step": 185800 }, { "epoch": 546.76, "learning_rate": 3.186419883257398e-06, "loss": 0.0874, "step": 185900 }, { "epoch": 547.06, "learning_rate": 3.18152515059303e-06, "loss": 0.0912, "step": 186000 }, { "epoch": 547.06, "eval_cer": 0.07100823852491173, "eval_loss": 0.5470239520072937, "eval_runtime": 5.3768, "eval_samples_per_second": 66.768, "eval_steps_per_second": 2.232, "eval_wer": 0.2653554731581493, "step": 186000 }, { "epoch": 547.35, "learning_rate": 3.176632425470604e-06, "loss": 0.0929, "step": 186100 }, { "epoch": 547.65, "learning_rate": 3.1717417132915425e-06, "loss": 0.0891, "step": 186200 }, { "epoch": 547.94, "learning_rate": 3.166853019455049e-06, "loss": 0.0859, "step": 186300 }, { "epoch": 548.24, "learning_rate": 3.1619663493580914e-06, "loss": 0.0941, "step": 186400 }, { "epoch": 548.53, "learning_rate": 3.157081708395412e-06, "loss": 0.0942, "step": 186500 }, { "epoch": 548.82, "learning_rate": 3.1521991019595033e-06, "loss": 0.0865, "step": 186600 }, { "epoch": 549.12, "learning_rate": 3.1473185354406226e-06, "loss": 0.0926, "step": 186700 }, { "epoch": 549.41, "learning_rate": 3.142440014226766e-06, "loss": 0.0888, "step": 186800 }, { "epoch": 549.71, "learning_rate": 3.1375635437036746e-06, "loss": 0.0925, "step": 186900 }, { "epoch": 550.0, "learning_rate": 3.1326891292548302e-06, "loss": 0.0928, "step": 187000 }, { "epoch": 550.0, "eval_cer": 0.07061592781482935, "eval_loss": 0.5491250157356262, "eval_runtime": 5.2902, "eval_samples_per_second": 67.862, "eval_steps_per_second": 2.268, "eval_wer": 0.26438819925842333, "step": 187000 }, { "epoch": 550.29, "learning_rate": 3.1278167762614365e-06, "loss": 0.0886, "step": 187100 }, { "epoch": 550.59, "learning_rate": 3.1229464901024297e-06, "loss": 0.0886, "step": 187200 }, { "epoch": 550.88, "learning_rate": 3.1180782761544575e-06, "loss": 0.093, "step": 187300 }, { "epoch": 551.18, "learning_rate": 3.1132121397918824e-06, "loss": 0.0903, "step": 187400 }, { "epoch": 551.47, "learning_rate": 3.108348086386777e-06, "loss": 0.0916, "step": 187500 }, { "epoch": 551.76, "learning_rate": 3.103486121308907e-06, "loss": 0.0902, "step": 187600 }, { "epoch": 552.06, "learning_rate": 3.09862624992574e-06, "loss": 0.0911, "step": 187700 }, { "epoch": 552.35, "learning_rate": 3.0937684776024274e-06, "loss": 0.0921, "step": 187800 }, { "epoch": 552.65, "learning_rate": 3.0889128097018036e-06, "loss": 0.0908, "step": 187900 }, { "epoch": 552.94, "learning_rate": 3.084059251584384e-06, "loss": 0.0904, "step": 188000 }, { "epoch": 552.94, "eval_cer": 0.0714877293927902, "eval_loss": 0.5426270365715027, "eval_runtime": 4.6484, "eval_samples_per_second": 77.231, "eval_steps_per_second": 2.582, "eval_wer": 0.2651942608415283, "step": 188000 }, { "epoch": 553.24, "learning_rate": 3.0792563125505725e-06, "loss": 0.0897, "step": 188100 }, { "epoch": 553.53, "learning_rate": 3.0744069688402957e-06, "loss": 0.0876, "step": 188200 }, { "epoch": 553.82, "learning_rate": 3.069559750927237e-06, "loss": 0.0913, "step": 188300 }, { "epoch": 554.12, "learning_rate": 3.0647146641625786e-06, "loss": 0.0878, "step": 188400 }, { "epoch": 554.41, "learning_rate": 3.059871713895155e-06, "loss": 0.0893, "step": 188500 }, { "epoch": 554.71, "learning_rate": 3.0550309054714367e-06, "loss": 0.0894, "step": 188600 }, { "epoch": 555.0, "learning_rate": 3.0501922442355305e-06, "loss": 0.0933, "step": 188700 }, { "epoch": 555.29, "learning_rate": 3.045355735529175e-06, "loss": 0.0917, "step": 188800 }, { "epoch": 555.59, "learning_rate": 3.0405213846917307e-06, "loss": 0.0883, "step": 188900 }, { "epoch": 555.88, "learning_rate": 3.0356891970601797e-06, "loss": 0.0876, "step": 189000 }, { "epoch": 555.88, "eval_cer": 0.07105182860380978, "eval_loss": 0.5487252473831177, "eval_runtime": 5.1579, "eval_samples_per_second": 69.602, "eval_steps_per_second": 2.327, "eval_wer": 0.26422698694180236, "step": 189000 }, { "epoch": 556.18, "learning_rate": 3.030859177969111e-06, "loss": 0.0936, "step": 189100 }, { "epoch": 556.47, "learning_rate": 3.0260313327507186e-06, "loss": 0.0902, "step": 189200 }, { "epoch": 556.76, "learning_rate": 3.0212056667348028e-06, "loss": 0.0921, "step": 189300 }, { "epoch": 557.06, "learning_rate": 3.016382185248753e-06, "loss": 0.0905, "step": 189400 }, { "epoch": 557.35, "learning_rate": 3.0115608936175523e-06, "loss": 0.0867, "step": 189500 }, { "epoch": 557.65, "learning_rate": 3.0067417971637597e-06, "loss": 0.0923, "step": 189600 }, { "epoch": 557.94, "learning_rate": 3.0019249012075125e-06, "loss": 0.0951, "step": 189700 }, { "epoch": 558.24, "learning_rate": 2.9971102110665225e-06, "loss": 0.0875, "step": 189800 }, { "epoch": 558.53, "learning_rate": 2.992297732056062e-06, "loss": 0.09, "step": 189900 }, { "epoch": 558.82, "learning_rate": 2.987487469488968e-06, "loss": 0.0913, "step": 190000 }, { "epoch": 558.82, "eval_cer": 0.07113900876160587, "eval_loss": 0.5487645268440247, "eval_runtime": 4.7526, "eval_samples_per_second": 75.537, "eval_steps_per_second": 2.525, "eval_wer": 0.2637433499919394, "step": 190000 }, { "epoch": 559.12, "learning_rate": 2.982727498068645e-06, "loss": 0.0897, "step": 190100 }, { "epoch": 559.41, "learning_rate": 2.977921662020099e-06, "loss": 0.0906, "step": 190200 }, { "epoch": 559.71, "learning_rate": 2.9731180582856704e-06, "loss": 0.0901, "step": 190300 }, { "epoch": 560.0, "learning_rate": 2.9683166921683935e-06, "loss": 0.087, "step": 190400 }, { "epoch": 560.29, "learning_rate": 2.963517568968831e-06, "loss": 0.0888, "step": 190500 }, { "epoch": 560.59, "learning_rate": 2.9587206939850745e-06, "loss": 0.0902, "step": 190600 }, { "epoch": 560.88, "learning_rate": 2.9539260725127276e-06, "loss": 0.0884, "step": 190700 }, { "epoch": 561.18, "learning_rate": 2.9491337098449125e-06, "loss": 0.0893, "step": 190800 }, { "epoch": 561.47, "learning_rate": 2.9443436112722536e-06, "loss": 0.0901, "step": 190900 }, { "epoch": 561.76, "learning_rate": 2.9395557820828742e-06, "loss": 0.0926, "step": 191000 }, { "epoch": 561.76, "eval_cer": 0.07144413931389215, "eval_loss": 0.5500932335853577, "eval_runtime": 5.4728, "eval_samples_per_second": 65.597, "eval_steps_per_second": 2.193, "eval_wer": 0.26632274705787523, "step": 191000 }, { "epoch": 562.06, "learning_rate": 2.934770227562399e-06, "loss": 0.0911, "step": 191100 }, { "epoch": 562.35, "learning_rate": 2.929986952993933e-06, "loss": 0.0954, "step": 191200 }, { "epoch": 562.65, "learning_rate": 2.925205963658071e-06, "loss": 0.0898, "step": 191300 }, { "epoch": 562.94, "learning_rate": 2.9204272648328835e-06, "loss": 0.0911, "step": 191400 }, { "epoch": 563.24, "learning_rate": 2.915650861793908e-06, "loss": 0.0887, "step": 191500 }, { "epoch": 563.53, "learning_rate": 2.910876759814154e-06, "loss": 0.089, "step": 191600 }, { "epoch": 563.82, "learning_rate": 2.9061049641640858e-06, "loss": 0.0856, "step": 191700 }, { "epoch": 564.12, "learning_rate": 2.9013354801116246e-06, "loss": 0.0859, "step": 191800 }, { "epoch": 564.41, "learning_rate": 2.8965683129221395e-06, "loss": 0.0957, "step": 191900 }, { "epoch": 564.71, "learning_rate": 2.891803467858435e-06, "loss": 0.0842, "step": 192000 }, { "epoch": 564.71, "eval_cer": 0.07157490955058629, "eval_loss": 0.5528156757354736, "eval_runtime": 4.4134, "eval_samples_per_second": 81.344, "eval_steps_per_second": 2.719, "eval_wer": 0.2666451716911172, "step": 192000 }, { "epoch": 565.0, "learning_rate": 2.8870409501807633e-06, "loss": 0.0866, "step": 192100 }, { "epoch": 565.29, "learning_rate": 2.8822807651468005e-06, "loss": 0.0891, "step": 192200 }, { "epoch": 565.59, "learning_rate": 2.8775229180116483e-06, "loss": 0.0882, "step": 192300 }, { "epoch": 565.88, "learning_rate": 2.8727674140278293e-06, "loss": 0.0932, "step": 192400 }, { "epoch": 566.18, "learning_rate": 2.868014258445274e-06, "loss": 0.0873, "step": 192500 }, { "epoch": 566.47, "learning_rate": 2.863263456511328e-06, "loss": 0.0933, "step": 192600 }, { "epoch": 566.76, "learning_rate": 2.858515013470734e-06, "loss": 0.0903, "step": 192700 }, { "epoch": 567.06, "learning_rate": 2.8537689345656307e-06, "loss": 0.091, "step": 192800 }, { "epoch": 567.35, "learning_rate": 2.8490252250355505e-06, "loss": 0.0909, "step": 192900 }, { "epoch": 567.65, "learning_rate": 2.8442838901174e-06, "loss": 0.0863, "step": 193000 }, { "epoch": 567.65, "eval_cer": 0.07126977899829999, "eval_loss": 0.5538076162338257, "eval_runtime": 4.856, "eval_samples_per_second": 73.929, "eval_steps_per_second": 2.471, "eval_wer": 0.26616153474125426, "step": 193000 }, { "epoch": 567.94, "learning_rate": 2.839592312798779e-06, "loss": 0.0894, "step": 193100 }, { "epoch": 568.24, "learning_rate": 2.834855718928081e-06, "loss": 0.0901, "step": 193200 }, { "epoch": 568.53, "learning_rate": 2.830121515312029e-06, "loss": 0.0875, "step": 193300 }, { "epoch": 568.82, "learning_rate": 2.8253897071770427e-06, "loss": 0.0842, "step": 193400 }, { "epoch": 569.12, "learning_rate": 2.8206602997468963e-06, "loss": 0.0935, "step": 193500 }, { "epoch": 569.41, "learning_rate": 2.8159332982427146e-06, "loss": 0.0919, "step": 193600 }, { "epoch": 569.71, "learning_rate": 2.8112087078829664e-06, "loss": 0.0862, "step": 193700 }, { "epoch": 570.0, "learning_rate": 2.8064865338834586e-06, "loss": 0.0903, "step": 193800 }, { "epoch": 570.29, "learning_rate": 2.8017667814573297e-06, "loss": 0.0929, "step": 193900 }, { "epoch": 570.59, "learning_rate": 2.7970494558150456e-06, "loss": 0.0885, "step": 194000 }, { "epoch": 570.59, "eval_cer": 0.0708774682882176, "eval_loss": 0.543542742729187, "eval_runtime": 4.864, "eval_samples_per_second": 73.807, "eval_steps_per_second": 2.467, "eval_wer": 0.2653554731581493, "step": 194000 }, { "epoch": 570.88, "learning_rate": 2.792334562164394e-06, "loss": 0.0874, "step": 194100 }, { "epoch": 571.18, "learning_rate": 2.7876221057104745e-06, "loss": 0.0906, "step": 194200 }, { "epoch": 571.47, "learning_rate": 2.7829120916557005e-06, "loss": 0.0891, "step": 194300 }, { "epoch": 571.76, "learning_rate": 2.778204525199786e-06, "loss": 0.0887, "step": 194400 }, { "epoch": 572.06, "learning_rate": 2.773499411539744e-06, "loss": 0.0853, "step": 194500 }, { "epoch": 572.35, "learning_rate": 2.768796755869879e-06, "loss": 0.0846, "step": 194600 }, { "epoch": 572.65, "learning_rate": 2.764096563381784e-06, "loss": 0.0835, "step": 194700 }, { "epoch": 572.94, "learning_rate": 2.759398839264329e-06, "loss": 0.0919, "step": 194800 }, { "epoch": 573.24, "learning_rate": 2.754703588703663e-06, "loss": 0.0872, "step": 194900 }, { "epoch": 573.53, "learning_rate": 2.7500108168832006e-06, "loss": 0.0875, "step": 195000 }, { "epoch": 573.53, "eval_cer": 0.07065951789372739, "eval_loss": 0.5488081574440002, "eval_runtime": 5.0704, "eval_samples_per_second": 70.803, "eval_steps_per_second": 2.367, "eval_wer": 0.26261486377559246, "step": 195000 }, { "epoch": 573.82, "learning_rate": 2.745320528983624e-06, "loss": 0.0898, "step": 195100 }, { "epoch": 574.12, "learning_rate": 2.7406327301828693e-06, "loss": 0.0853, "step": 195200 }, { "epoch": 574.41, "learning_rate": 2.7359474256561273e-06, "loss": 0.0854, "step": 195300 }, { "epoch": 574.71, "learning_rate": 2.731264620575834e-06, "loss": 0.093, "step": 195400 }, { "epoch": 575.0, "learning_rate": 2.7265843201116658e-06, "loss": 0.087, "step": 195500 }, { "epoch": 575.29, "learning_rate": 2.7219065294305363e-06, "loss": 0.0918, "step": 195600 }, { "epoch": 575.59, "learning_rate": 2.7172312536965857e-06, "loss": 0.09, "step": 195700 }, { "epoch": 575.88, "learning_rate": 2.7125584980711784e-06, "loss": 0.0884, "step": 195800 }, { "epoch": 576.18, "learning_rate": 2.7078882677128983e-06, "loss": 0.0837, "step": 195900 }, { "epoch": 576.47, "learning_rate": 2.7032205677775385e-06, "loss": 0.0924, "step": 196000 }, { "epoch": 576.47, "eval_cer": 0.07079028813042151, "eval_loss": 0.5483184456825256, "eval_runtime": 4.8631, "eval_samples_per_second": 73.821, "eval_steps_per_second": 2.468, "eval_wer": 0.26454941157504436, "step": 196000 }, { "epoch": 576.76, "learning_rate": 2.6985554034181022e-06, "loss": 0.0909, "step": 196100 }, { "epoch": 577.06, "learning_rate": 2.6939393934276265e-06, "loss": 0.0874, "step": 196200 }, { "epoch": 577.35, "learning_rate": 2.6893258785973584e-06, "loss": 0.0861, "step": 196300 }, { "epoch": 577.65, "learning_rate": 2.684668300784915e-06, "loss": 0.0831, "step": 196400 }, { "epoch": 577.94, "learning_rate": 2.680013279029546e-06, "loss": 0.0918, "step": 196500 }, { "epoch": 578.24, "learning_rate": 2.675360818470253e-06, "loss": 0.0898, "step": 196600 }, { "epoch": 578.53, "learning_rate": 2.670710924243214e-06, "loss": 0.0918, "step": 196700 }, { "epoch": 578.82, "learning_rate": 2.6660636014817764e-06, "loss": 0.0897, "step": 196800 }, { "epoch": 579.12, "learning_rate": 2.6614188553164387e-06, "loss": 0.0912, "step": 196900 }, { "epoch": 579.41, "learning_rate": 2.656776690874868e-06, "loss": 0.0884, "step": 197000 }, { "epoch": 579.41, "eval_cer": 0.07092105836711564, "eval_loss": 0.5512089133262634, "eval_runtime": 4.8465, "eval_samples_per_second": 74.074, "eval_steps_per_second": 2.476, "eval_wer": 0.26551668547477025, "step": 197000 }, { "epoch": 579.71, "learning_rate": 2.652137113281874e-06, "loss": 0.0817, "step": 197100 }, { "epoch": 580.0, "learning_rate": 2.6475001276594115e-06, "loss": 0.0875, "step": 197200 }, { "epoch": 580.29, "learning_rate": 2.6428657391265756e-06, "loss": 0.085, "step": 197300 }, { "epoch": 580.59, "learning_rate": 2.638233952799588e-06, "loss": 0.0851, "step": 197400 }, { "epoch": 580.88, "learning_rate": 2.633604773791808e-06, "loss": 0.089, "step": 197500 }, { "epoch": 581.18, "learning_rate": 2.628978207213708e-06, "loss": 0.0921, "step": 197600 }, { "epoch": 581.47, "learning_rate": 2.624354258172881e-06, "loss": 0.0889, "step": 197700 }, { "epoch": 581.76, "learning_rate": 2.6197329317740304e-06, "loss": 0.0874, "step": 197800 }, { "epoch": 582.06, "learning_rate": 2.6151142331189556e-06, "loss": 0.0807, "step": 197900 }, { "epoch": 582.35, "learning_rate": 2.610498167306569e-06, "loss": 0.0904, "step": 198000 }, { "epoch": 582.35, "eval_cer": 0.07079028813042151, "eval_loss": 0.5547834038734436, "eval_runtime": 4.9397, "eval_samples_per_second": 72.676, "eval_steps_per_second": 2.429, "eval_wer": 0.26600032242463323, "step": 198000 }, { "epoch": 582.65, "learning_rate": 2.605884739432867e-06, "loss": 0.0887, "step": 198100 }, { "epoch": 582.94, "learning_rate": 2.601273954590936e-06, "loss": 0.0895, "step": 198200 }, { "epoch": 583.24, "learning_rate": 2.596665817870947e-06, "loss": 0.085, "step": 198300 }, { "epoch": 583.53, "learning_rate": 2.59206033436014e-06, "loss": 0.084, "step": 198400 }, { "epoch": 583.82, "learning_rate": 2.5874575091428383e-06, "loss": 0.0945, "step": 198500 }, { "epoch": 584.12, "learning_rate": 2.5828573473004157e-06, "loss": 0.0809, "step": 198600 }, { "epoch": 584.41, "learning_rate": 2.5782598539113205e-06, "loss": 0.0859, "step": 198700 }, { "epoch": 584.71, "learning_rate": 2.5737109689990237e-06, "loss": 0.0896, "step": 198800 }, { "epoch": 585.0, "learning_rate": 2.569118800928999e-06, "loss": 0.087, "step": 198900 }, { "epoch": 585.29, "learning_rate": 2.564529316479245e-06, "loss": 0.0882, "step": 199000 }, { "epoch": 585.29, "eval_cer": 0.07092105836711564, "eval_loss": 0.5537840723991394, "eval_runtime": 4.9542, "eval_samples_per_second": 72.464, "eval_steps_per_second": 2.422, "eval_wer": 0.2656778977913913, "step": 199000 }, { "epoch": 585.59, "learning_rate": 2.559942520716414e-06, "loss": 0.0905, "step": 199100 }, { "epoch": 585.88, "learning_rate": 2.5553584187041926e-06, "loss": 0.0917, "step": 199200 }, { "epoch": 586.18, "learning_rate": 2.5507770155032917e-06, "loss": 0.085, "step": 199300 }, { "epoch": 586.47, "learning_rate": 2.5461983161714442e-06, "loss": 0.0868, "step": 199400 }, { "epoch": 586.76, "learning_rate": 2.5416223257633977e-06, "loss": 0.0875, "step": 199500 }, { "epoch": 587.06, "learning_rate": 2.5370490493309086e-06, "loss": 0.0869, "step": 199600 }, { "epoch": 587.35, "learning_rate": 2.5324784919227373e-06, "loss": 0.0861, "step": 199700 }, { "epoch": 587.65, "learning_rate": 2.527910658584643e-06, "loss": 0.0874, "step": 199800 }, { "epoch": 587.94, "learning_rate": 2.5233455543593778e-06, "loss": 0.0922, "step": 199900 }, { "epoch": 588.24, "learning_rate": 2.5187831842866795e-06, "loss": 0.0917, "step": 200000 }, { "epoch": 588.24, "eval_cer": 0.07031079726254305, "eval_loss": 0.5549612045288086, "eval_runtime": 4.6478, "eval_samples_per_second": 77.24, "eval_steps_per_second": 2.582, "eval_wer": 0.2650330485249073, "step": 200000 }, { "epoch": 588.53, "learning_rate": 2.5142235534032688e-06, "loss": 0.0845, "step": 200100 }, { "epoch": 588.82, "learning_rate": 2.5096666667428427e-06, "loss": 0.0859, "step": 200200 }, { "epoch": 589.12, "learning_rate": 2.5051125293360667e-06, "loss": 0.0898, "step": 200300 }, { "epoch": 589.41, "learning_rate": 2.5005611462105746e-06, "loss": 0.0914, "step": 200400 }, { "epoch": 589.71, "learning_rate": 2.4960125223909555e-06, "loss": 0.0874, "step": 200500 }, { "epoch": 590.0, "learning_rate": 2.4914666628987555e-06, "loss": 0.0931, "step": 200600 }, { "epoch": 590.29, "learning_rate": 2.486923572752467e-06, "loss": 0.0875, "step": 200700 }, { "epoch": 590.59, "learning_rate": 2.4823832569675267e-06, "loss": 0.0855, "step": 200800 }, { "epoch": 590.88, "learning_rate": 2.4778457205563067e-06, "loss": 0.0874, "step": 200900 }, { "epoch": 591.18, "learning_rate": 2.4733109685281124e-06, "loss": 0.086, "step": 201000 }, { "epoch": 591.18, "eval_cer": 0.07048515757813521, "eval_loss": 0.5632910132408142, "eval_runtime": 5.3132, "eval_samples_per_second": 67.568, "eval_steps_per_second": 2.259, "eval_wer": 0.2648718362082863, "step": 201000 }, { "epoch": 591.47, "learning_rate": 2.468779005889174e-06, "loss": 0.0856, "step": 201100 }, { "epoch": 591.76, "learning_rate": 2.4642498376426442e-06, "loss": 0.0864, "step": 201200 }, { "epoch": 592.06, "learning_rate": 2.4597234687885885e-06, "loss": 0.0915, "step": 201300 }, { "epoch": 592.35, "learning_rate": 2.455199904323983e-06, "loss": 0.0937, "step": 201400 }, { "epoch": 592.65, "learning_rate": 2.4506791492427086e-06, "loss": 0.0884, "step": 201500 }, { "epoch": 592.94, "learning_rate": 2.446161208535543e-06, "loss": 0.0841, "step": 201600 }, { "epoch": 593.24, "learning_rate": 2.4416460871901585e-06, "loss": 0.0819, "step": 201700 }, { "epoch": 593.53, "learning_rate": 2.4371337901911142e-06, "loss": 0.0884, "step": 201800 }, { "epoch": 593.82, "learning_rate": 2.4326243225198505e-06, "loss": 0.088, "step": 201900 }, { "epoch": 594.12, "learning_rate": 2.4281176891546858e-06, "loss": 0.0851, "step": 202000 }, { "epoch": 594.12, "eval_cer": 0.07061592781482935, "eval_loss": 0.5610267519950867, "eval_runtime": 5.3517, "eval_samples_per_second": 67.082, "eval_steps_per_second": 2.242, "eval_wer": 0.2651942608415283, "step": 202000 }, { "epoch": 594.41, "learning_rate": 2.4236138950708086e-06, "loss": 0.0849, "step": 202100 }, { "epoch": 594.71, "learning_rate": 2.419112945240274e-06, "loss": 0.0862, "step": 202200 }, { "epoch": 595.0, "learning_rate": 2.4146148446319944e-06, "loss": 0.0856, "step": 202300 }, { "epoch": 595.29, "learning_rate": 2.41011959821174e-06, "loss": 0.0894, "step": 202400 }, { "epoch": 595.59, "learning_rate": 2.4056272109421286e-06, "loss": 0.087, "step": 202500 }, { "epoch": 595.88, "learning_rate": 2.401137687782621e-06, "loss": 0.0889, "step": 202600 }, { "epoch": 596.18, "learning_rate": 2.3966510336895166e-06, "loss": 0.0854, "step": 202700 }, { "epoch": 596.47, "learning_rate": 2.3921672536159486e-06, "loss": 0.0866, "step": 202800 }, { "epoch": 596.76, "learning_rate": 2.387686352511875e-06, "loss": 0.0875, "step": 202900 }, { "epoch": 597.06, "learning_rate": 2.383208335324078e-06, "loss": 0.0852, "step": 203000 }, { "epoch": 597.06, "eval_cer": 0.07035438734144109, "eval_loss": 0.5522825717926025, "eval_runtime": 4.7713, "eval_samples_per_second": 75.241, "eval_steps_per_second": 2.515, "eval_wer": 0.2624536514589715, "step": 203000 }, { "epoch": 597.35, "learning_rate": 2.3787332069961545e-06, "loss": 0.0834, "step": 203100 }, { "epoch": 597.65, "learning_rate": 2.3742609724685123e-06, "loss": 0.0891, "step": 203200 }, { "epoch": 597.94, "learning_rate": 2.3697916366783653e-06, "loss": 0.0892, "step": 203300 }, { "epoch": 598.24, "learning_rate": 2.3653252045597257e-06, "loss": 0.0858, "step": 203400 }, { "epoch": 598.53, "learning_rate": 2.3608616810434028e-06, "loss": 0.0838, "step": 203500 }, { "epoch": 598.82, "learning_rate": 2.3564010710569924e-06, "loss": 0.0852, "step": 203600 }, { "epoch": 599.12, "learning_rate": 2.3519433795248748e-06, "loss": 0.0938, "step": 203700 }, { "epoch": 599.41, "learning_rate": 2.3474886113682097e-06, "loss": 0.0864, "step": 203800 }, { "epoch": 599.71, "learning_rate": 2.3430367715049235e-06, "loss": 0.0871, "step": 203900 }, { "epoch": 600.0, "learning_rate": 2.33858786484972e-06, "loss": 0.0871, "step": 204000 }, { "epoch": 600.0, "eval_cer": 0.0711825988405039, "eval_loss": 0.5549289584159851, "eval_runtime": 4.6864, "eval_samples_per_second": 76.604, "eval_steps_per_second": 2.561, "eval_wer": 0.2680960825407061, "step": 204000 }, { "epoch": 600.29, "learning_rate": 2.334141896314057e-06, "loss": 0.0874, "step": 204100 }, { "epoch": 600.59, "learning_rate": 2.329698870806151e-06, "loss": 0.0827, "step": 204200 }, { "epoch": 600.88, "learning_rate": 2.325258793230972e-06, "loss": 0.0825, "step": 204300 }, { "epoch": 601.18, "learning_rate": 2.320821668490227e-06, "loss": 0.0812, "step": 204400 }, { "epoch": 601.47, "learning_rate": 2.3163875014823745e-06, "loss": 0.082, "step": 204500 }, { "epoch": 601.76, "learning_rate": 2.3119562971026018e-06, "loss": 0.086, "step": 204600 }, { "epoch": 602.06, "learning_rate": 2.3075280602428245e-06, "loss": 0.0839, "step": 204700 }, { "epoch": 602.35, "learning_rate": 2.3031027957916875e-06, "loss": 0.0848, "step": 204800 }, { "epoch": 602.65, "learning_rate": 2.298680508634544e-06, "loss": 0.0843, "step": 204900 }, { "epoch": 602.94, "learning_rate": 2.294261203653473e-06, "loss": 0.0852, "step": 205000 }, { "epoch": 602.94, "eval_cer": 0.07096464844601369, "eval_loss": 0.5612467527389526, "eval_runtime": 4.9666, "eval_samples_per_second": 72.282, "eval_steps_per_second": 2.416, "eval_wer": 0.2666451716911172, "step": 205000 }, { "epoch": 603.24, "learning_rate": 2.2898890341045833e-06, "loss": 0.087, "step": 205100 }, { "epoch": 603.53, "learning_rate": 2.2854756781652714e-06, "loss": 0.0855, "step": 205200 }, { "epoch": 603.82, "learning_rate": 2.281065318979769e-06, "loss": 0.0866, "step": 205300 }, { "epoch": 604.12, "learning_rate": 2.276657961416981e-06, "loss": 0.0895, "step": 205400 }, { "epoch": 604.41, "learning_rate": 2.2722536103424977e-06, "loss": 0.0823, "step": 205500 }, { "epoch": 604.71, "learning_rate": 2.2678522706185918e-06, "loss": 0.083, "step": 205600 }, { "epoch": 605.0, "learning_rate": 2.2634539471042104e-06, "loss": 0.0893, "step": 205700 }, { "epoch": 605.29, "learning_rate": 2.2590586446549725e-06, "loss": 0.0835, "step": 205800 }, { "epoch": 605.59, "learning_rate": 2.2546663681231596e-06, "loss": 0.0869, "step": 205900 }, { "epoch": 605.88, "learning_rate": 2.250277122357714e-06, "loss": 0.083, "step": 206000 }, { "epoch": 605.88, "eval_cer": 0.07092105836711564, "eval_loss": 0.562522292137146, "eval_runtime": 4.7678, "eval_samples_per_second": 75.296, "eval_steps_per_second": 2.517, "eval_wer": 0.2648718362082863, "step": 206000 }, { "epoch": 606.18, "learning_rate": 2.245890912204233e-06, "loss": 0.0843, "step": 206100 }, { "epoch": 606.47, "learning_rate": 2.2415077425049604e-06, "loss": 0.085, "step": 206200 }, { "epoch": 606.76, "learning_rate": 2.2371714042527648e-06, "loss": 0.0867, "step": 206300 }, { "epoch": 607.06, "learning_rate": 2.2327942994500047e-06, "loss": 0.0816, "step": 206400 }, { "epoch": 607.35, "learning_rate": 2.228420249559719e-06, "loss": 0.0853, "step": 206500 }, { "epoch": 607.65, "learning_rate": 2.224049259410736e-06, "loss": 0.087, "step": 206600 }, { "epoch": 607.94, "learning_rate": 2.2196813338284906e-06, "loss": 0.0845, "step": 206700 }, { "epoch": 608.24, "learning_rate": 2.2153164776350483e-06, "loss": 0.0828, "step": 206800 }, { "epoch": 608.53, "learning_rate": 2.2109546956490803e-06, "loss": 0.0845, "step": 206900 }, { "epoch": 608.82, "learning_rate": 2.2065959926858566e-06, "loss": 0.0859, "step": 207000 }, { "epoch": 608.82, "eval_cer": 0.0708774682882176, "eval_loss": 0.5508594512939453, "eval_runtime": 5.2083, "eval_samples_per_second": 68.928, "eval_steps_per_second": 2.304, "eval_wer": 0.26390456230856035, "step": 207000 }, { "epoch": 609.12, "learning_rate": 2.202240373557264e-06, "loss": 0.0869, "step": 207100 }, { "epoch": 609.41, "learning_rate": 2.197887843071768e-06, "loss": 0.089, "step": 207200 }, { "epoch": 609.71, "learning_rate": 2.19353840603444e-06, "loss": 0.0842, "step": 207300 }, { "epoch": 610.0, "learning_rate": 2.189192067246923e-06, "loss": 0.0879, "step": 207400 }, { "epoch": 610.29, "learning_rate": 2.184848831507445e-06, "loss": 0.0901, "step": 207500 }, { "epoch": 610.59, "learning_rate": 2.180508703610814e-06, "loss": 0.0862, "step": 207600 }, { "epoch": 610.88, "learning_rate": 2.176171688348395e-06, "loss": 0.0821, "step": 207700 }, { "epoch": 611.18, "learning_rate": 2.1718377905081306e-06, "loss": 0.082, "step": 207800 }, { "epoch": 611.47, "learning_rate": 2.167507014874508e-06, "loss": 0.0832, "step": 207900 }, { "epoch": 611.76, "learning_rate": 2.1631793662285754e-06, "loss": 0.0842, "step": 208000 }, { "epoch": 611.76, "eval_cer": 0.07013643694695088, "eval_loss": 0.5625478625297546, "eval_runtime": 4.8229, "eval_samples_per_second": 74.437, "eval_steps_per_second": 2.488, "eval_wer": 0.2648718362082863, "step": 208000 }, { "epoch": 612.06, "learning_rate": 2.158854849347933e-06, "loss": 0.087, "step": 208100 }, { "epoch": 612.35, "learning_rate": 2.1545334690067107e-06, "loss": 0.0852, "step": 208200 }, { "epoch": 612.65, "learning_rate": 2.1502152299755904e-06, "loss": 0.0899, "step": 208300 }, { "epoch": 612.94, "learning_rate": 2.1459001370217743e-06, "loss": 0.0866, "step": 208400 }, { "epoch": 613.24, "learning_rate": 2.1415881949089956e-06, "loss": 0.0895, "step": 208500 }, { "epoch": 613.53, "learning_rate": 2.1372794083975156e-06, "loss": 0.0863, "step": 208600 }, { "epoch": 613.82, "learning_rate": 2.133016822846251e-06, "loss": 0.0887, "step": 208700 }, { "epoch": 614.12, "learning_rate": 2.1287143301295543e-06, "loss": 0.0871, "step": 208800 }, { "epoch": 614.41, "learning_rate": 2.124415007226515e-06, "loss": 0.0883, "step": 208900 }, { "epoch": 614.71, "learning_rate": 2.120118858883457e-06, "loss": 0.084, "step": 209000 }, { "epoch": 614.71, "eval_cer": 0.0705723377359313, "eval_loss": 0.5603653192520142, "eval_runtime": 4.9708, "eval_samples_per_second": 72.222, "eval_steps_per_second": 2.414, "eval_wer": 0.26422698694180236, "step": 209000 }, { "epoch": 615.0, "learning_rate": 2.115825889843199e-06, "loss": 0.0854, "step": 209100 }, { "epoch": 615.29, "learning_rate": 2.111536104845055e-06, "loss": 0.0825, "step": 209200 }, { "epoch": 615.59, "learning_rate": 2.1072495086248112e-06, "loss": 0.0868, "step": 209300 }, { "epoch": 615.88, "learning_rate": 2.1029661059147488e-06, "loss": 0.0801, "step": 209400 }, { "epoch": 616.18, "learning_rate": 2.098685901443615e-06, "loss": 0.084, "step": 209500 }, { "epoch": 616.47, "learning_rate": 2.094408899936627e-06, "loss": 0.0847, "step": 209600 }, { "epoch": 616.76, "learning_rate": 2.0901351061154686e-06, "loss": 0.0809, "step": 209700 }, { "epoch": 617.06, "learning_rate": 2.085864524698275e-06, "loss": 0.0863, "step": 209800 }, { "epoch": 617.35, "learning_rate": 2.0815971603996466e-06, "loss": 0.0842, "step": 209900 }, { "epoch": 617.65, "learning_rate": 2.0773330179306243e-06, "loss": 0.0891, "step": 210000 }, { "epoch": 617.65, "eval_cer": 0.0699620766313587, "eval_loss": 0.5616000890731812, "eval_runtime": 5.1126, "eval_samples_per_second": 70.219, "eval_steps_per_second": 2.347, "eval_wer": 0.2632597130420764, "step": 210000 }, { "epoch": 617.94, "learning_rate": 2.073072101998694e-06, "loss": 0.0861, "step": 210100 }, { "epoch": 618.24, "learning_rate": 2.0688144173077814e-06, "loss": 0.0872, "step": 210200 }, { "epoch": 618.53, "learning_rate": 2.0645599685582372e-06, "loss": 0.0846, "step": 210300 }, { "epoch": 618.82, "learning_rate": 2.0603087604468527e-06, "loss": 0.0832, "step": 210400 }, { "epoch": 619.12, "learning_rate": 2.056060797666832e-06, "loss": 0.0834, "step": 210500 }, { "epoch": 619.41, "learning_rate": 2.051816084907799e-06, "loss": 0.085, "step": 210600 }, { "epoch": 619.71, "learning_rate": 2.0476170253101334e-06, "loss": 0.0829, "step": 210700 }, { "epoch": 620.0, "learning_rate": 2.0434211601942156e-06, "loss": 0.087, "step": 210800 }, { "epoch": 620.29, "learning_rate": 2.0391861602727887e-06, "loss": 0.0848, "step": 210900 }, { "epoch": 620.59, "learning_rate": 2.0349544290014495e-06, "loss": 0.0839, "step": 211000 }, { "epoch": 620.59, "eval_cer": 0.07061592781482935, "eval_loss": 0.564612865447998, "eval_runtime": 4.8577, "eval_samples_per_second": 73.903, "eval_steps_per_second": 2.47, "eval_wer": 0.2648718362082863, "step": 211000 }, { "epoch": 620.88, "learning_rate": 2.030725971051895e-06, "loss": 0.0888, "step": 211100 }, { "epoch": 621.18, "learning_rate": 2.026500791092223e-06, "loss": 0.0862, "step": 211200 }, { "epoch": 621.47, "learning_rate": 2.022278893786906e-06, "loss": 0.0774, "step": 211300 }, { "epoch": 621.76, "learning_rate": 2.018060283796786e-06, "loss": 0.0832, "step": 211400 }, { "epoch": 622.06, "learning_rate": 2.0138449657790904e-06, "loss": 0.0831, "step": 211500 }, { "epoch": 622.35, "learning_rate": 2.0096329443873976e-06, "loss": 0.0905, "step": 211600 }, { "epoch": 622.65, "learning_rate": 2.005424224271658e-06, "loss": 0.088, "step": 211700 }, { "epoch": 622.94, "learning_rate": 2.0012188100781738e-06, "loss": 0.0845, "step": 211800 }, { "epoch": 623.24, "learning_rate": 1.997016706449591e-06, "loss": 0.0834, "step": 211900 }, { "epoch": 623.53, "learning_rate": 1.992817918024914e-06, "loss": 0.085, "step": 212000 }, { "epoch": 623.53, "eval_cer": 0.07083387820931956, "eval_loss": 0.5574280023574829, "eval_runtime": 5.1804, "eval_samples_per_second": 69.3, "eval_steps_per_second": 2.316, "eval_wer": 0.2648718362082863, "step": 212000 }, { "epoch": 623.82, "learning_rate": 1.9886224494394724e-06, "loss": 0.0873, "step": 212100 }, { "epoch": 624.12, "learning_rate": 1.9844303053249453e-06, "loss": 0.0859, "step": 212200 }, { "epoch": 624.41, "learning_rate": 1.9802414903093293e-06, "loss": 0.0868, "step": 212300 }, { "epoch": 624.71, "learning_rate": 1.9760560090169512e-06, "loss": 0.0842, "step": 212400 }, { "epoch": 625.0, "learning_rate": 1.9718738660684627e-06, "loss": 0.0849, "step": 212500 }, { "epoch": 625.29, "learning_rate": 1.967695066080818e-06, "loss": 0.0862, "step": 212600 }, { "epoch": 625.59, "learning_rate": 1.9635196136672945e-06, "loss": 0.0838, "step": 212700 }, { "epoch": 625.88, "learning_rate": 1.959347513437461e-06, "loss": 0.082, "step": 212800 }, { "epoch": 626.18, "learning_rate": 1.955178769997193e-06, "loss": 0.0844, "step": 212900 }, { "epoch": 626.47, "learning_rate": 1.9510133879486625e-06, "loss": 0.0832, "step": 213000 }, { "epoch": 626.47, "eval_cer": 0.07044156749923718, "eval_loss": 0.5674094557762146, "eval_runtime": 4.8288, "eval_samples_per_second": 74.345, "eval_steps_per_second": 2.485, "eval_wer": 0.2650330485249073, "step": 213000 }, { "epoch": 626.76, "learning_rate": 1.946851371890321e-06, "loss": 0.0817, "step": 213100 }, { "epoch": 627.06, "learning_rate": 1.9426927264169165e-06, "loss": 0.0869, "step": 213200 }, { "epoch": 627.35, "learning_rate": 1.9385374561194643e-06, "loss": 0.0877, "step": 213300 }, { "epoch": 627.65, "learning_rate": 1.934385565585259e-06, "loss": 0.0783, "step": 213400 }, { "epoch": 627.94, "learning_rate": 1.930237059397868e-06, "loss": 0.0846, "step": 213500 }, { "epoch": 628.24, "learning_rate": 1.926091942137113e-06, "loss": 0.0881, "step": 213600 }, { "epoch": 628.53, "learning_rate": 1.9219502183790854e-06, "loss": 0.0902, "step": 213700 }, { "epoch": 628.82, "learning_rate": 1.9178118926961197e-06, "loss": 0.0904, "step": 213800 }, { "epoch": 629.12, "learning_rate": 1.9136769696568056e-06, "loss": 0.0844, "step": 213900 }, { "epoch": 629.41, "learning_rate": 1.909545453825975e-06, "loss": 0.0899, "step": 214000 }, { "epoch": 629.41, "eval_cer": 0.06991848655246066, "eval_loss": 0.5597048997879028, "eval_runtime": 5.3718, "eval_samples_per_second": 66.831, "eval_steps_per_second": 2.234, "eval_wer": 0.2624536514589715, "step": 214000 }, { "epoch": 629.71, "learning_rate": 1.905417349764696e-06, "loss": 0.0848, "step": 214100 }, { "epoch": 630.0, "learning_rate": 1.9012926620302774e-06, "loss": 0.0819, "step": 214200 }, { "epoch": 630.29, "learning_rate": 1.8971713951762444e-06, "loss": 0.0818, "step": 214300 }, { "epoch": 630.59, "learning_rate": 1.8930535537523598e-06, "loss": 0.0882, "step": 214400 }, { "epoch": 630.88, "learning_rate": 1.8889391423045917e-06, "loss": 0.0839, "step": 214500 }, { "epoch": 631.18, "learning_rate": 1.8848281653751282e-06, "loss": 0.0823, "step": 214600 }, { "epoch": 631.47, "learning_rate": 1.8807206275023704e-06, "loss": 0.0843, "step": 214700 }, { "epoch": 631.76, "learning_rate": 1.8766165332209101e-06, "loss": 0.0872, "step": 214800 }, { "epoch": 632.06, "learning_rate": 1.8725568764400725e-06, "loss": 0.0766, "step": 214900 }, { "epoch": 632.35, "learning_rate": 1.8684596483809147e-06, "loss": 0.0821, "step": 215000 }, { "epoch": 632.35, "eval_cer": 0.07052874765703326, "eval_loss": 0.5650409460067749, "eval_runtime": 4.9953, "eval_samples_per_second": 71.867, "eval_steps_per_second": 2.402, "eval_wer": 0.26632274705787523, "step": 215000 }, { "epoch": 632.65, "learning_rate": 1.8643658774488132e-06, "loss": 0.0836, "step": 215100 }, { "epoch": 632.94, "learning_rate": 1.860275568163169e-06, "loss": 0.0859, "step": 215200 }, { "epoch": 633.24, "learning_rate": 1.8561887250395604e-06, "loss": 0.0894, "step": 215300 }, { "epoch": 633.53, "learning_rate": 1.852105352589741e-06, "loss": 0.0862, "step": 215400 }, { "epoch": 633.82, "learning_rate": 1.848025455321632e-06, "loss": 0.0842, "step": 215500 }, { "epoch": 634.12, "learning_rate": 1.8439490377393176e-06, "loss": 0.0837, "step": 215600 }, { "epoch": 634.41, "learning_rate": 1.8398761043430419e-06, "loss": 0.0825, "step": 215700 }, { "epoch": 634.71, "learning_rate": 1.8358066596292034e-06, "loss": 0.0854, "step": 215800 }, { "epoch": 635.0, "learning_rate": 1.8317407080903416e-06, "loss": 0.0829, "step": 215900 }, { "epoch": 635.29, "learning_rate": 1.8276782542151516e-06, "loss": 0.0905, "step": 216000 }, { "epoch": 635.29, "eval_cer": 0.06930822544788806, "eval_loss": 0.5545493960380554, "eval_runtime": 5.1065, "eval_samples_per_second": 70.303, "eval_steps_per_second": 2.35, "eval_wer": 0.2616475898758665, "step": 216000 }, { "epoch": 635.59, "learning_rate": 1.823619302488459e-06, "loss": 0.0823, "step": 216100 }, { "epoch": 635.88, "learning_rate": 1.819563857391226e-06, "loss": 0.0843, "step": 216200 }, { "epoch": 636.18, "learning_rate": 1.815511923400544e-06, "loss": 0.0856, "step": 216300 }, { "epoch": 636.47, "learning_rate": 1.8114635049896224e-06, "loss": 0.0879, "step": 216400 }, { "epoch": 636.76, "learning_rate": 1.8074186066277988e-06, "loss": 0.0804, "step": 216500 }, { "epoch": 637.06, "learning_rate": 1.8033772327805188e-06, "loss": 0.0853, "step": 216600 }, { "epoch": 637.35, "learning_rate": 1.7993393879093385e-06, "loss": 0.0826, "step": 216700 }, { "epoch": 637.65, "learning_rate": 1.7953050764719204e-06, "loss": 0.087, "step": 216800 }, { "epoch": 637.94, "learning_rate": 1.7913145931303599e-06, "loss": 0.0849, "step": 216900 }, { "epoch": 638.24, "learning_rate": 1.7872873264724445e-06, "loss": 0.0815, "step": 217000 }, { "epoch": 638.24, "eval_cer": 0.07004925678915479, "eval_loss": 0.5678441524505615, "eval_runtime": 5.429, "eval_samples_per_second": 66.127, "eval_steps_per_second": 2.21, "eval_wer": 0.2634209253586974, "step": 217000 }, { "epoch": 638.53, "learning_rate": 1.7832636065534054e-06, "loss": 0.0839, "step": 217100 }, { "epoch": 638.82, "learning_rate": 1.7792434378153084e-06, "loss": 0.0829, "step": 217200 }, { "epoch": 639.12, "learning_rate": 1.7752268246963001e-06, "loss": 0.087, "step": 217300 }, { "epoch": 639.41, "learning_rate": 1.7712137716306022e-06, "loss": 0.0829, "step": 217400 }, { "epoch": 639.71, "learning_rate": 1.7672042830485047e-06, "loss": 0.0878, "step": 217500 }, { "epoch": 640.0, "learning_rate": 1.7631983633763632e-06, "loss": 0.0808, "step": 217600 }, { "epoch": 640.29, "learning_rate": 1.7591960170365947e-06, "loss": 0.0838, "step": 217700 }, { "epoch": 640.59, "learning_rate": 1.755197248447668e-06, "loss": 0.0769, "step": 217800 }, { "epoch": 640.88, "learning_rate": 1.751202062024106e-06, "loss": 0.085, "step": 217900 }, { "epoch": 641.18, "learning_rate": 1.7472104621764747e-06, "loss": 0.0853, "step": 218000 }, { "epoch": 641.18, "eval_cer": 0.07004925678915479, "eval_loss": 0.5571328401565552, "eval_runtime": 4.4749, "eval_samples_per_second": 80.226, "eval_steps_per_second": 2.682, "eval_wer": 0.2640657746251814, "step": 218000 }, { "epoch": 641.47, "learning_rate": 1.7432224533113807e-06, "loss": 0.0826, "step": 218100 }, { "epoch": 641.76, "learning_rate": 1.7392380398314668e-06, "loss": 0.0874, "step": 218200 }, { "epoch": 642.06, "learning_rate": 1.7352572261354073e-06, "loss": 0.0895, "step": 218300 }, { "epoch": 642.35, "learning_rate": 1.7312800166179012e-06, "loss": 0.0878, "step": 218400 }, { "epoch": 642.65, "learning_rate": 1.727306415669669e-06, "loss": 0.0837, "step": 218500 }, { "epoch": 642.94, "learning_rate": 1.7233364276774472e-06, "loss": 0.0833, "step": 218600 }, { "epoch": 643.24, "learning_rate": 1.7193700570239847e-06, "loss": 0.0801, "step": 218700 }, { "epoch": 643.53, "learning_rate": 1.7154073080880357e-06, "loss": 0.0774, "step": 218800 }, { "epoch": 643.82, "learning_rate": 1.7114481852443576e-06, "loss": 0.0864, "step": 218900 }, { "epoch": 644.12, "learning_rate": 1.7074926928637025e-06, "loss": 0.0853, "step": 219000 }, { "epoch": 644.12, "eval_cer": 0.06961335600017436, "eval_loss": 0.5619438290596008, "eval_runtime": 5.7032, "eval_samples_per_second": 62.947, "eval_steps_per_second": 2.104, "eval_wer": 0.26390456230856035, "step": 219000 }, { "epoch": 644.41, "learning_rate": 1.703540835312817e-06, "loss": 0.0853, "step": 219100 }, { "epoch": 644.71, "learning_rate": 1.6995926169544337e-06, "loss": 0.0814, "step": 219200 }, { "epoch": 645.0, "learning_rate": 1.6956480421472665e-06, "loss": 0.0854, "step": 219300 }, { "epoch": 645.29, "learning_rate": 1.6917071152460103e-06, "loss": 0.0863, "step": 219400 }, { "epoch": 645.59, "learning_rate": 1.6877698406013293e-06, "loss": 0.0819, "step": 219500 }, { "epoch": 645.88, "learning_rate": 1.6838362225598576e-06, "loss": 0.0848, "step": 219600 }, { "epoch": 646.18, "learning_rate": 1.6799062654641918e-06, "loss": 0.082, "step": 219700 }, { "epoch": 646.47, "learning_rate": 1.6759799736528881e-06, "loss": 0.0814, "step": 219800 }, { "epoch": 646.76, "learning_rate": 1.6720573514604543e-06, "loss": 0.0838, "step": 219900 }, { "epoch": 647.06, "learning_rate": 1.6681384032173487e-06, "loss": 0.0816, "step": 220000 }, { "epoch": 647.06, "eval_cer": 0.07044156749923718, "eval_loss": 0.5699228048324585, "eval_runtime": 4.8268, "eval_samples_per_second": 74.376, "eval_steps_per_second": 2.486, "eval_wer": 0.26551668547477025, "step": 220000 }, { "epoch": 647.35, "learning_rate": 1.6642622677279875e-06, "loss": 0.0861, "step": 220100 }, { "epoch": 647.65, "learning_rate": 1.6603506435113182e-06, "loss": 0.0821, "step": 220200 }, { "epoch": 647.94, "learning_rate": 1.6564427061678367e-06, "loss": 0.0828, "step": 220300 }, { "epoch": 648.24, "learning_rate": 1.6525384600117844e-06, "loss": 0.0842, "step": 220400 }, { "epoch": 648.53, "learning_rate": 1.6486379093533317e-06, "loss": 0.0847, "step": 220500 }, { "epoch": 648.82, "learning_rate": 1.6447410584985756e-06, "loss": 0.0896, "step": 220600 }, { "epoch": 649.12, "learning_rate": 1.6408479117495162e-06, "loss": 0.0837, "step": 220700 }, { "epoch": 649.41, "learning_rate": 1.6369584734040777e-06, "loss": 0.0854, "step": 220800 }, { "epoch": 649.71, "learning_rate": 1.6330727477560798e-06, "loss": 0.0869, "step": 220900 }, { "epoch": 650.0, "learning_rate": 1.6291907390952482e-06, "loss": 0.0856, "step": 221000 }, { "epoch": 650.0, "eval_cer": 0.07018002702584891, "eval_loss": 0.5630475878715515, "eval_runtime": 4.4033, "eval_samples_per_second": 81.53, "eval_steps_per_second": 2.725, "eval_wer": 0.26390456230856035, "step": 221000 }, { "epoch": 650.29, "learning_rate": 1.6253124517072055e-06, "loss": 0.0829, "step": 221100 }, { "epoch": 650.59, "learning_rate": 1.6214378898734629e-06, "loss": 0.0792, "step": 221200 }, { "epoch": 650.88, "learning_rate": 1.6175670578714258e-06, "loss": 0.0769, "step": 221300 }, { "epoch": 651.18, "learning_rate": 1.6136999599743726e-06, "loss": 0.0795, "step": 221400 }, { "epoch": 651.47, "learning_rate": 1.609836600451466e-06, "loss": 0.0857, "step": 221500 }, { "epoch": 651.76, "learning_rate": 1.6059769835677387e-06, "loss": 0.0903, "step": 221600 }, { "epoch": 652.06, "learning_rate": 1.6021211135840914e-06, "loss": 0.0827, "step": 221700 }, { "epoch": 652.35, "learning_rate": 1.5982689947572938e-06, "loss": 0.0875, "step": 221800 }, { "epoch": 652.65, "learning_rate": 1.5944206313399663e-06, "loss": 0.0855, "step": 221900 }, { "epoch": 652.94, "learning_rate": 1.5905760275805875e-06, "loss": 0.0801, "step": 222000 }, { "epoch": 652.94, "eval_cer": 0.06956976592127631, "eval_loss": 0.5596914291381836, "eval_runtime": 5.2656, "eval_samples_per_second": 68.178, "eval_steps_per_second": 2.279, "eval_wer": 0.26309850072545543, "step": 222000 }, { "epoch": 653.24, "learning_rate": 1.5867351877234865e-06, "loss": 0.0821, "step": 222100 }, { "epoch": 653.53, "learning_rate": 1.582898116008833e-06, "loss": 0.0774, "step": 222200 }, { "epoch": 653.82, "learning_rate": 1.5790648166726453e-06, "loss": 0.0818, "step": 222300 }, { "epoch": 654.12, "learning_rate": 1.5752352939467664e-06, "loss": 0.0795, "step": 222400 }, { "epoch": 654.41, "learning_rate": 1.5714095520588762e-06, "loss": 0.0936, "step": 222500 }, { "epoch": 654.71, "learning_rate": 1.5675875952324799e-06, "loss": 0.0829, "step": 222600 }, { "epoch": 655.0, "learning_rate": 1.5637694276869036e-06, "loss": 0.0824, "step": 222700 }, { "epoch": 655.29, "learning_rate": 1.5599550536372909e-06, "loss": 0.0811, "step": 222800 }, { "epoch": 655.59, "learning_rate": 1.556144477294596e-06, "loss": 0.0795, "step": 222900 }, { "epoch": 655.88, "learning_rate": 1.5523377028655818e-06, "loss": 0.0855, "step": 223000 }, { "epoch": 655.88, "eval_cer": 0.07061592781482935, "eval_loss": 0.5634012818336487, "eval_runtime": 4.6021, "eval_samples_per_second": 78.007, "eval_steps_per_second": 2.607, "eval_wer": 0.2651942608415283, "step": 223000 }, { "epoch": 656.18, "learning_rate": 1.548534734552814e-06, "loss": 0.0817, "step": 223100 }, { "epoch": 656.47, "learning_rate": 1.544735576554655e-06, "loss": 0.0865, "step": 223200 }, { "epoch": 656.76, "learning_rate": 1.540940233065263e-06, "loss": 0.0865, "step": 223300 }, { "epoch": 657.06, "learning_rate": 1.5371487082745828e-06, "loss": 0.0852, "step": 223400 }, { "epoch": 657.35, "learning_rate": 1.5333610063683456e-06, "loss": 0.0814, "step": 223500 }, { "epoch": 657.65, "learning_rate": 1.5295771315280612e-06, "loss": 0.0832, "step": 223600 }, { "epoch": 657.94, "learning_rate": 1.5257970879310135e-06, "loss": 0.0845, "step": 223700 }, { "epoch": 658.24, "learning_rate": 1.5220208797502584e-06, "loss": 0.0876, "step": 223800 }, { "epoch": 658.53, "learning_rate": 1.518248511154617e-06, "loss": 0.0747, "step": 223900 }, { "epoch": 658.82, "learning_rate": 1.5145176525169048e-06, "loss": 0.0826, "step": 224000 }, { "epoch": 658.82, "eval_cer": 0.06961335600017436, "eval_loss": 0.5628807544708252, "eval_runtime": 4.6717, "eval_samples_per_second": 76.846, "eval_steps_per_second": 2.569, "eval_wer": 0.2619700145091085, "step": 224000 }, { "epoch": 659.12, "learning_rate": 1.510752937081314e-06, "loss": 0.0802, "step": 224100 }, { "epoch": 659.41, "learning_rate": 1.5069920736703108e-06, "loss": 0.086, "step": 224200 }, { "epoch": 659.71, "learning_rate": 1.503235066435771e-06, "loss": 0.0843, "step": 224300 }, { "epoch": 660.0, "learning_rate": 1.4994819195253251e-06, "loss": 0.0874, "step": 224400 }, { "epoch": 660.29, "learning_rate": 1.4957326370823293e-06, "loss": 0.0853, "step": 224500 }, { "epoch": 660.59, "learning_rate": 1.4919872232458848e-06, "loss": 0.0862, "step": 224600 }, { "epoch": 660.88, "learning_rate": 1.4882456821508124e-06, "loss": 0.0812, "step": 224700 }, { "epoch": 661.18, "learning_rate": 1.4845080179276621e-06, "loss": 0.0777, "step": 224800 }, { "epoch": 661.47, "learning_rate": 1.4807742347027083e-06, "loss": 0.0897, "step": 224900 }, { "epoch": 661.76, "learning_rate": 1.4770443365979291e-06, "loss": 0.0885, "step": 225000 }, { "epoch": 661.76, "eval_cer": 0.0699620766313587, "eval_loss": 0.561669111251831, "eval_runtime": 4.6722, "eval_samples_per_second": 76.838, "eval_steps_per_second": 2.568, "eval_wer": 0.2634209253586974, "step": 225000 }, { "epoch": 662.06, "learning_rate": 1.4733183277310282e-06, "loss": 0.0888, "step": 225100 }, { "epoch": 662.35, "learning_rate": 1.4695962122154023e-06, "loss": 0.0855, "step": 225200 }, { "epoch": 662.65, "learning_rate": 1.465877994160156e-06, "loss": 0.0834, "step": 225300 }, { "epoch": 662.94, "learning_rate": 1.4621636776700965e-06, "loss": 0.0795, "step": 225400 }, { "epoch": 663.24, "learning_rate": 1.4584532668457113e-06, "loss": 0.0819, "step": 225500 }, { "epoch": 663.53, "learning_rate": 1.4547467657831893e-06, "loss": 0.0779, "step": 225600 }, { "epoch": 663.82, "learning_rate": 1.4510441785743935e-06, "loss": 0.0816, "step": 225700 }, { "epoch": 664.12, "learning_rate": 1.4473455093068683e-06, "loss": 0.0854, "step": 225800 }, { "epoch": 664.41, "learning_rate": 1.4436507620638395e-06, "loss": 0.0863, "step": 225900 }, { "epoch": 664.71, "learning_rate": 1.4399968296879947e-06, "loss": 0.0817, "step": 226000 }, { "epoch": 664.71, "eval_cer": 0.07009284686805282, "eval_loss": 0.5662137269973755, "eval_runtime": 5.0718, "eval_samples_per_second": 70.784, "eval_steps_per_second": 2.366, "eval_wer": 0.2624536514589715, "step": 226000 }, { "epoch": 665.0, "learning_rate": 1.436309899404354e-06, "loss": 0.0853, "step": 226100 }, { "epoch": 665.29, "learning_rate": 1.4326269033281902e-06, "loss": 0.0885, "step": 226200 }, { "epoch": 665.59, "learning_rate": 1.4289478455254213e-06, "loss": 0.0802, "step": 226300 }, { "epoch": 665.88, "learning_rate": 1.425272730057617e-06, "loss": 0.0875, "step": 226400 }, { "epoch": 666.18, "learning_rate": 1.4216015609819967e-06, "loss": 0.0812, "step": 226500 }, { "epoch": 666.47, "learning_rate": 1.4179343423514169e-06, "loss": 0.0812, "step": 226600 }, { "epoch": 666.76, "learning_rate": 1.414271078214382e-06, "loss": 0.0834, "step": 226700 }, { "epoch": 667.06, "learning_rate": 1.4106117726150247e-06, "loss": 0.0836, "step": 226800 }, { "epoch": 667.35, "learning_rate": 1.4069564295931093e-06, "loss": 0.0791, "step": 226900 }, { "epoch": 667.65, "learning_rate": 1.403305053184027e-06, "loss": 0.0823, "step": 227000 }, { "epoch": 667.65, "eval_cer": 0.0699620766313587, "eval_loss": 0.5672768950462341, "eval_runtime": 4.6733, "eval_samples_per_second": 76.819, "eval_steps_per_second": 2.568, "eval_wer": 0.26261486377559246, "step": 227000 }, { "epoch": 667.94, "learning_rate": 1.399657647418783e-06, "loss": 0.0858, "step": 227100 }, { "epoch": 668.24, "learning_rate": 1.3960142163240098e-06, "loss": 0.0833, "step": 227200 }, { "epoch": 668.53, "learning_rate": 1.3923747639219442e-06, "loss": 0.0878, "step": 227300 }, { "epoch": 668.82, "learning_rate": 1.388739294230434e-06, "loss": 0.0796, "step": 227400 }, { "epoch": 669.12, "learning_rate": 1.3851078112629302e-06, "loss": 0.0843, "step": 227500 }, { "epoch": 669.41, "learning_rate": 1.381480319028477e-06, "loss": 0.0833, "step": 227600 }, { "epoch": 669.71, "learning_rate": 1.3778568215317223e-06, "loss": 0.0881, "step": 227700 }, { "epoch": 670.0, "learning_rate": 1.3742373227728972e-06, "loss": 0.0839, "step": 227800 }, { "epoch": 670.29, "learning_rate": 1.3706218267478204e-06, "loss": 0.0814, "step": 227900 }, { "epoch": 670.59, "learning_rate": 1.3670103374478917e-06, "loss": 0.0805, "step": 228000 }, { "epoch": 670.59, "eval_cer": 0.0705723377359313, "eval_loss": 0.565666675567627, "eval_runtime": 4.6037, "eval_samples_per_second": 77.98, "eval_steps_per_second": 2.607, "eval_wer": 0.2648718362082863, "step": 228000 }, { "epoch": 670.88, "learning_rate": 1.3634028588600878e-06, "loss": 0.0811, "step": 228100 }, { "epoch": 671.18, "learning_rate": 1.359799394966957e-06, "loss": 0.0803, "step": 228200 }, { "epoch": 671.47, "learning_rate": 1.3561999497466155e-06, "loss": 0.0832, "step": 228300 }, { "epoch": 671.76, "learning_rate": 1.3526045271727439e-06, "loss": 0.0841, "step": 228400 }, { "epoch": 672.06, "learning_rate": 1.3490131312145816e-06, "loss": 0.0799, "step": 228500 }, { "epoch": 672.35, "learning_rate": 1.345425765836922e-06, "loss": 0.0794, "step": 228600 }, { "epoch": 672.65, "learning_rate": 1.3418424350001109e-06, "loss": 0.0792, "step": 228700 }, { "epoch": 672.94, "learning_rate": 1.338263142660034e-06, "loss": 0.0896, "step": 228800 }, { "epoch": 673.24, "learning_rate": 1.3346878927681278e-06, "loss": 0.0869, "step": 228900 }, { "epoch": 673.53, "learning_rate": 1.33111668927136e-06, "loss": 0.0899, "step": 229000 }, { "epoch": 673.53, "eval_cer": 0.07000566671025675, "eval_loss": 0.5663681626319885, "eval_runtime": 4.6501, "eval_samples_per_second": 77.202, "eval_steps_per_second": 2.581, "eval_wer": 0.26229243914235045, "step": 229000 }, { "epoch": 673.82, "learning_rate": 1.327549536112233e-06, "loss": 0.0784, "step": 229100 }, { "epoch": 674.12, "learning_rate": 1.3240220481360283e-06, "loss": 0.0815, "step": 229200 }, { "epoch": 674.41, "learning_rate": 1.3204629668602482e-06, "loss": 0.0821, "step": 229300 }, { "epoch": 674.71, "learning_rate": 1.3169079476835022e-06, "loss": 0.0837, "step": 229400 }, { "epoch": 675.0, "learning_rate": 1.3133569945304225e-06, "loss": 0.0862, "step": 229500 }, { "epoch": 675.29, "learning_rate": 1.3098101113211554e-06, "loss": 0.081, "step": 229600 }, { "epoch": 675.59, "learning_rate": 1.3062673019713551e-06, "loss": 0.0801, "step": 229700 }, { "epoch": 675.88, "learning_rate": 1.3027285703921772e-06, "loss": 0.0796, "step": 229800 }, { "epoch": 676.18, "learning_rate": 1.299193920490275e-06, "loss": 0.0807, "step": 229900 }, { "epoch": 676.47, "learning_rate": 1.2956633561677968e-06, "loss": 0.0793, "step": 230000 }, { "epoch": 676.47, "eval_cer": 0.06974412623686849, "eval_loss": 0.5635000467300415, "eval_runtime": 4.8465, "eval_samples_per_second": 74.073, "eval_steps_per_second": 2.476, "eval_wer": 0.26148637755924553, "step": 230000 }, { "epoch": 676.76, "learning_rate": 1.2921368813223807e-06, "loss": 0.0826, "step": 230100 }, { "epoch": 677.06, "learning_rate": 1.288614499847149e-06, "loss": 0.0847, "step": 230200 }, { "epoch": 677.35, "learning_rate": 1.2850962156307062e-06, "loss": 0.0801, "step": 230300 }, { "epoch": 677.65, "learning_rate": 1.2815820325571327e-06, "loss": 0.0805, "step": 230400 }, { "epoch": 677.94, "learning_rate": 1.2780719545059821e-06, "loss": 0.0779, "step": 230500 }, { "epoch": 678.24, "learning_rate": 1.274565985352275e-06, "loss": 0.0856, "step": 230600 }, { "epoch": 678.53, "learning_rate": 1.2710641289664977e-06, "loss": 0.0848, "step": 230700 }, { "epoch": 678.82, "learning_rate": 1.267566389214594e-06, "loss": 0.0854, "step": 230800 }, { "epoch": 679.12, "learning_rate": 1.2640727699579651e-06, "loss": 0.0838, "step": 230900 }, { "epoch": 679.41, "learning_rate": 1.2605832750534618e-06, "loss": 0.0818, "step": 231000 }, { "epoch": 679.41, "eval_cer": 0.06983130639466457, "eval_loss": 0.5645167827606201, "eval_runtime": 4.407, "eval_samples_per_second": 81.461, "eval_steps_per_second": 2.723, "eval_wer": 0.26438819925842333, "step": 231000 }, { "epoch": 679.71, "learning_rate": 1.2570979083533824e-06, "loss": 0.0812, "step": 231100 }, { "epoch": 680.0, "learning_rate": 1.2536166737054679e-06, "loss": 0.082, "step": 231200 }, { "epoch": 680.29, "learning_rate": 1.2501395749528971e-06, "loss": 0.0848, "step": 231300 }, { "epoch": 680.59, "learning_rate": 1.2466666159342839e-06, "loss": 0.0824, "step": 231400 }, { "epoch": 680.88, "learning_rate": 1.2431978004836703e-06, "loss": 0.0798, "step": 231500 }, { "epoch": 681.18, "learning_rate": 1.2397331324305255e-06, "loss": 0.087, "step": 231600 }, { "epoch": 681.47, "learning_rate": 1.2362726155997402e-06, "loss": 0.0814, "step": 231700 }, { "epoch": 681.76, "learning_rate": 1.2328162538116207e-06, "loss": 0.0796, "step": 231800 }, { "epoch": 682.06, "learning_rate": 1.2293640508818878e-06, "loss": 0.0869, "step": 231900 }, { "epoch": 682.35, "learning_rate": 1.22591601062167e-06, "loss": 0.0784, "step": 232000 }, { "epoch": 682.35, "eval_cer": 0.06948258576348024, "eval_loss": 0.5605387091636658, "eval_runtime": 4.8376, "eval_samples_per_second": 74.211, "eval_steps_per_second": 2.481, "eval_wer": 0.26293728840883446, "step": 232000 }, { "epoch": 682.65, "learning_rate": 1.2224721368375014e-06, "loss": 0.0781, "step": 232100 }, { "epoch": 682.94, "learning_rate": 1.2190324333313154e-06, "loss": 0.0837, "step": 232200 }, { "epoch": 683.24, "learning_rate": 1.2155969039004423e-06, "loss": 0.078, "step": 232300 }, { "epoch": 683.53, "learning_rate": 1.2121655523376036e-06, "loss": 0.0851, "step": 232400 }, { "epoch": 683.82, "learning_rate": 1.208738382430909e-06, "loss": 0.0844, "step": 232500 }, { "epoch": 684.12, "learning_rate": 1.2053153979638527e-06, "loss": 0.0816, "step": 232600 }, { "epoch": 684.41, "learning_rate": 1.2018966027153062e-06, "loss": 0.0808, "step": 232700 }, { "epoch": 684.71, "learning_rate": 1.1984820004595183e-06, "loss": 0.0838, "step": 232800 }, { "epoch": 685.0, "learning_rate": 1.1950715949661068e-06, "loss": 0.0871, "step": 232900 }, { "epoch": 685.29, "learning_rate": 1.1916653900000586e-06, "loss": 0.0809, "step": 233000 }, { "epoch": 685.29, "eval_cer": 0.06948258576348024, "eval_loss": 0.5701205730438232, "eval_runtime": 4.8603, "eval_samples_per_second": 73.863, "eval_steps_per_second": 2.469, "eval_wer": 0.26116395292600353, "step": 233000 }, { "epoch": 685.59, "learning_rate": 1.1882633893217222e-06, "loss": 0.077, "step": 233100 }, { "epoch": 685.88, "learning_rate": 1.184865596686804e-06, "loss": 0.0858, "step": 233200 }, { "epoch": 686.18, "learning_rate": 1.181472015846366e-06, "loss": 0.0798, "step": 233300 }, { "epoch": 686.47, "learning_rate": 1.1780826505468207e-06, "loss": 0.0833, "step": 233400 }, { "epoch": 686.76, "learning_rate": 1.1746975045299258e-06, "loss": 0.0831, "step": 233500 }, { "epoch": 687.06, "learning_rate": 1.171350369846545e-06, "loss": 0.0842, "step": 233600 }, { "epoch": 687.35, "learning_rate": 1.1680073777664342e-06, "loss": 0.0804, "step": 233700 }, { "epoch": 687.65, "learning_rate": 1.1646348273553372e-06, "loss": 0.0826, "step": 233800 }, { "epoch": 687.94, "learning_rate": 1.161266511072886e-06, "loss": 0.0797, "step": 233900 }, { "epoch": 688.24, "learning_rate": 1.1579024326376014e-06, "loss": 0.0851, "step": 234000 }, { "epoch": 688.24, "eval_cer": 0.0696569460790724, "eval_loss": 0.5669453740119934, "eval_runtime": 5.0116, "eval_samples_per_second": 71.633, "eval_steps_per_second": 2.394, "eval_wer": 0.26132516524262456, "step": 234000 }, { "epoch": 688.53, "learning_rate": 1.1545425957633266e-06, "loss": 0.082, "step": 234100 }, { "epoch": 688.82, "learning_rate": 1.1511870041592172e-06, "loss": 0.086, "step": 234200 }, { "epoch": 689.12, "learning_rate": 1.1478356615297498e-06, "loss": 0.0777, "step": 234300 }, { "epoch": 689.41, "learning_rate": 1.1444885715747057e-06, "loss": 0.0808, "step": 234400 }, { "epoch": 689.71, "learning_rate": 1.1411457379891722e-06, "loss": 0.0776, "step": 234500 }, { "epoch": 690.0, "learning_rate": 1.1378071644635397e-06, "loss": 0.0825, "step": 234600 }, { "epoch": 690.29, "learning_rate": 1.1344728546834881e-06, "loss": 0.0817, "step": 234700 }, { "epoch": 690.59, "learning_rate": 1.1311428123300016e-06, "loss": 0.0819, "step": 234800 }, { "epoch": 690.88, "learning_rate": 1.1278170410793455e-06, "loss": 0.0787, "step": 234900 }, { "epoch": 691.18, "learning_rate": 1.1244955446030715e-06, "loss": 0.0883, "step": 235000 }, { "epoch": 691.18, "eval_cer": 0.0696569460790724, "eval_loss": 0.5649272799491882, "eval_runtime": 5.4507, "eval_samples_per_second": 65.863, "eval_steps_per_second": 2.202, "eval_wer": 0.26309850072545543, "step": 235000 }, { "epoch": 691.47, "learning_rate": 1.1211783265680143e-06, "loss": 0.0801, "step": 235100 }, { "epoch": 691.76, "learning_rate": 1.1178653906362797e-06, "loss": 0.0814, "step": 235200 }, { "epoch": 692.06, "learning_rate": 1.1145567404652558e-06, "loss": 0.0868, "step": 235300 }, { "epoch": 692.35, "learning_rate": 1.111252379707587e-06, "loss": 0.0826, "step": 235400 }, { "epoch": 692.65, "learning_rate": 1.107952312011194e-06, "loss": 0.0756, "step": 235500 }, { "epoch": 692.94, "learning_rate": 1.1046565410192528e-06, "loss": 0.0822, "step": 235600 }, { "epoch": 693.24, "learning_rate": 1.1013650703701922e-06, "loss": 0.0824, "step": 235700 }, { "epoch": 693.53, "learning_rate": 1.0980779036977024e-06, "loss": 0.0784, "step": 235800 }, { "epoch": 693.82, "learning_rate": 1.0947950446307127e-06, "loss": 0.0798, "step": 235900 }, { "epoch": 694.12, "learning_rate": 1.0915164967934045e-06, "loss": 0.0803, "step": 236000 }, { "epoch": 694.12, "eval_cer": 0.06930822544788806, "eval_loss": 0.5643986463546753, "eval_runtime": 4.3472, "eval_samples_per_second": 82.582, "eval_steps_per_second": 2.76, "eval_wer": 0.2600354667096566, "step": 236000 }, { "epoch": 694.41, "learning_rate": 1.0882422638051977e-06, "loss": 0.0819, "step": 236100 }, { "epoch": 694.71, "learning_rate": 1.0849723492807435e-06, "loss": 0.0846, "step": 236200 }, { "epoch": 695.0, "learning_rate": 1.0817067568299344e-06, "loss": 0.0819, "step": 236300 }, { "epoch": 695.29, "learning_rate": 1.0784454900578834e-06, "loss": 0.0846, "step": 236400 }, { "epoch": 695.59, "learning_rate": 1.0751885525649336e-06, "loss": 0.0828, "step": 236500 }, { "epoch": 695.88, "learning_rate": 1.0719359479466484e-06, "loss": 0.0906, "step": 236600 }, { "epoch": 696.18, "learning_rate": 1.068687679793801e-06, "loss": 0.083, "step": 236700 }, { "epoch": 696.47, "learning_rate": 1.0654437516923893e-06, "loss": 0.0828, "step": 236800 }, { "epoch": 696.76, "learning_rate": 1.062204167223606e-06, "loss": 0.0849, "step": 236900 }, { "epoch": 697.06, "learning_rate": 1.0589689299638606e-06, "loss": 0.0859, "step": 237000 }, { "epoch": 697.06, "eval_cer": 0.06948258576348024, "eval_loss": 0.5633894205093384, "eval_runtime": 5.486, "eval_samples_per_second": 65.44, "eval_steps_per_second": 2.187, "eval_wer": 0.26019667902627763, "step": 237000 }, { "epoch": 697.35, "learning_rate": 1.0557703308014694e-06, "loss": 0.0832, "step": 237100 }, { "epoch": 697.65, "learning_rate": 1.0525437551086954e-06, "loss": 0.077, "step": 237200 }, { "epoch": 697.94, "learning_rate": 1.0493215372897642e-06, "loss": 0.0806, "step": 237300 }, { "epoch": 698.24, "learning_rate": 1.0461036809019087e-06, "loss": 0.0826, "step": 237400 }, { "epoch": 698.53, "learning_rate": 1.0428901894975458e-06, "loss": 0.0852, "step": 237500 }, { "epoch": 698.82, "learning_rate": 1.0396810666242736e-06, "loss": 0.0844, "step": 237600 }, { "epoch": 699.12, "learning_rate": 1.0364763158248685e-06, "loss": 0.0766, "step": 237700 }, { "epoch": 699.41, "learning_rate": 1.03327594063728e-06, "loss": 0.083, "step": 237800 }, { "epoch": 699.71, "learning_rate": 1.0300799445946264e-06, "loss": 0.0818, "step": 237900 }, { "epoch": 700.0, "learning_rate": 1.0268883312251915e-06, "loss": 0.0796, "step": 238000 }, { "epoch": 700.0, "eval_cer": 0.0696569460790724, "eval_loss": 0.558987021446228, "eval_runtime": 4.7414, "eval_samples_per_second": 75.716, "eval_steps_per_second": 2.531, "eval_wer": 0.26277607609221343, "step": 238000 }, { "epoch": 700.29, "learning_rate": 1.023701104052422e-06, "loss": 0.0837, "step": 238100 }, { "epoch": 700.59, "learning_rate": 1.020518266594921e-06, "loss": 0.0844, "step": 238200 }, { "epoch": 700.88, "learning_rate": 1.017339822366446e-06, "loss": 0.08, "step": 238300 }, { "epoch": 701.18, "learning_rate": 1.0141657748759048e-06, "loss": 0.0823, "step": 238400 }, { "epoch": 701.47, "learning_rate": 1.0109961276273511e-06, "loss": 0.0794, "step": 238500 }, { "epoch": 701.76, "learning_rate": 1.0078308841199807e-06, "loss": 0.0854, "step": 238600 }, { "epoch": 702.06, "learning_rate": 1.0046700478481281e-06, "loss": 0.0846, "step": 238700 }, { "epoch": 702.35, "learning_rate": 1.0015451647121965e-06, "loss": 0.0823, "step": 238800 }, { "epoch": 702.65, "learning_rate": 9.983931092155874e-07, "loss": 0.0795, "step": 238900 }, { "epoch": 702.94, "learning_rate": 9.952454713735167e-07, "loss": 0.0806, "step": 239000 }, { "epoch": 702.94, "eval_cer": 0.06974412623686849, "eval_loss": 0.5627612471580505, "eval_runtime": 4.8839, "eval_samples_per_second": 73.507, "eval_steps_per_second": 2.457, "eval_wer": 0.2616475898758665, "step": 239000 }, { "epoch": 703.24, "learning_rate": 9.921022546608861e-07, "loss": 0.0766, "step": 239100 }, { "epoch": 703.53, "learning_rate": 9.88963462547709e-07, "loss": 0.0834, "step": 239200 }, { "epoch": 703.82, "learning_rate": 9.858290984991197e-07, "loss": 0.0842, "step": 239300 }, { "epoch": 704.12, "learning_rate": 9.826991659753626e-07, "loss": 0.0799, "step": 239400 }, { "epoch": 704.41, "learning_rate": 9.79573668431788e-07, "loss": 0.079, "step": 239500 }, { "epoch": 704.71, "learning_rate": 9.764526093188565e-07, "loss": 0.0821, "step": 239600 }, { "epoch": 705.0, "learning_rate": 9.7333599208212e-07, "loss": 0.0829, "step": 239700 }, { "epoch": 705.29, "learning_rate": 9.70223820162232e-07, "loss": 0.0829, "step": 239800 }, { "epoch": 705.59, "learning_rate": 9.671160969949371e-07, "loss": 0.085, "step": 239900 }, { "epoch": 705.88, "learning_rate": 9.640128260110688e-07, "loss": 0.0846, "step": 240000 }, { "epoch": 705.88, "eval_cer": 0.0696569460790724, "eval_loss": 0.5651042461395264, "eval_runtime": 4.7198, "eval_samples_per_second": 76.063, "eval_steps_per_second": 2.543, "eval_wer": 0.26100274060938256, "step": 240000 }, { "epoch": 706.18, "learning_rate": 9.609140106365478e-07, "loss": 0.0811, "step": 240100 }, { "epoch": 706.47, "learning_rate": 9.578196542923713e-07, "loss": 0.08, "step": 240200 }, { "epoch": 706.76, "learning_rate": 9.54729760394617e-07, "loss": 0.0796, "step": 240300 }, { "epoch": 707.06, "learning_rate": 9.516443323544355e-07, "loss": 0.0857, "step": 240400 }, { "epoch": 707.35, "learning_rate": 9.485633735780475e-07, "loss": 0.0778, "step": 240500 }, { "epoch": 707.65, "learning_rate": 9.454868874667389e-07, "loss": 0.085, "step": 240600 }, { "epoch": 707.94, "learning_rate": 9.424148774168596e-07, "loss": 0.0845, "step": 240700 }, { "epoch": 708.24, "learning_rate": 9.393473468198155e-07, "loss": 0.0812, "step": 240800 }, { "epoch": 708.53, "learning_rate": 9.362842990620702e-07, "loss": 0.0816, "step": 240900 }, { "epoch": 708.82, "learning_rate": 9.332257375251364e-07, "loss": 0.079, "step": 241000 }, { "epoch": 708.82, "eval_cer": 0.06961335600017436, "eval_loss": 0.5604375600814819, "eval_runtime": 5.0667, "eval_samples_per_second": 70.855, "eval_steps_per_second": 2.368, "eval_wer": 0.2616475898758665, "step": 241000 }, { "epoch": 709.12, "learning_rate": 9.301716655855747e-07, "loss": 0.0836, "step": 241100 }, { "epoch": 709.41, "learning_rate": 9.271220866149882e-07, "loss": 0.081, "step": 241200 }, { "epoch": 709.71, "learning_rate": 9.241074325384697e-07, "loss": 0.0794, "step": 241300 }, { "epoch": 710.0, "learning_rate": 9.21066804587209e-07, "loss": 0.0787, "step": 241400 }, { "epoch": 710.29, "learning_rate": 9.180306796564203e-07, "loss": 0.0823, "step": 241500 }, { "epoch": 710.59, "learning_rate": 9.149990610978915e-07, "loss": 0.0829, "step": 241600 }, { "epoch": 710.88, "learning_rate": 9.119719522584436e-07, "loss": 0.0829, "step": 241700 }, { "epoch": 711.18, "learning_rate": 9.089493564799101e-07, "loss": 0.0786, "step": 241800 }, { "epoch": 711.47, "learning_rate": 9.059312770991496e-07, "loss": 0.0806, "step": 241900 }, { "epoch": 711.76, "learning_rate": 9.029177174480314e-07, "loss": 0.0793, "step": 242000 }, { "epoch": 711.76, "eval_cer": 0.06939540560568415, "eval_loss": 0.5705261826515198, "eval_runtime": 4.6246, "eval_samples_per_second": 77.628, "eval_steps_per_second": 2.595, "eval_wer": 0.26100274060938256, "step": 242000 }, { "epoch": 712.06, "learning_rate": 8.999086808534341e-07, "loss": 0.0795, "step": 242100 }, { "epoch": 712.35, "learning_rate": 8.969041706372461e-07, "loss": 0.0824, "step": 242200 }, { "epoch": 712.65, "learning_rate": 8.939041901163531e-07, "loss": 0.0808, "step": 242300 }, { "epoch": 712.94, "learning_rate": 8.909087426026492e-07, "loss": 0.0813, "step": 242400 }, { "epoch": 713.24, "learning_rate": 8.87917831403014e-07, "loss": 0.0786, "step": 242500 }, { "epoch": 713.53, "learning_rate": 8.849314598193282e-07, "loss": 0.0838, "step": 242600 }, { "epoch": 713.82, "learning_rate": 8.81949631148456e-07, "loss": 0.0787, "step": 242700 }, { "epoch": 714.12, "learning_rate": 8.789723486822443e-07, "loss": 0.0791, "step": 242800 }, { "epoch": 714.41, "learning_rate": 8.759996157075285e-07, "loss": 0.0844, "step": 242900 }, { "epoch": 714.71, "learning_rate": 8.730314355061126e-07, "loss": 0.0813, "step": 243000 }, { "epoch": 714.71, "eval_cer": 0.06926463536899002, "eval_loss": 0.5673476457595825, "eval_runtime": 5.3489, "eval_samples_per_second": 67.117, "eval_steps_per_second": 2.243, "eval_wer": 0.25906819280993065, "step": 243000 }, { "epoch": 715.0, "learning_rate": 8.700678113547822e-07, "loss": 0.0833, "step": 243100 }, { "epoch": 715.29, "learning_rate": 8.671087465252903e-07, "loss": 0.0805, "step": 243200 }, { "epoch": 715.59, "learning_rate": 8.641542442843526e-07, "loss": 0.0848, "step": 243300 }, { "epoch": 715.88, "learning_rate": 8.612043078936555e-07, "loss": 0.0796, "step": 243400 }, { "epoch": 716.18, "learning_rate": 8.582589406098357e-07, "loss": 0.0803, "step": 243500 }, { "epoch": 716.47, "learning_rate": 8.553181456844955e-07, "loss": 0.0822, "step": 243600 }, { "epoch": 716.76, "learning_rate": 8.523819263641841e-07, "loss": 0.0863, "step": 243700 }, { "epoch": 717.06, "learning_rate": 8.494795796192135e-07, "loss": 0.0813, "step": 243800 }, { "epoch": 717.35, "learning_rate": 8.465524753915627e-07, "loss": 0.0867, "step": 243900 }, { "epoch": 717.65, "learning_rate": 8.436299564459782e-07, "loss": 0.0803, "step": 244000 }, { "epoch": 717.65, "eval_cer": 0.06978771631576654, "eval_loss": 0.5662087202072144, "eval_runtime": 4.8974, "eval_samples_per_second": 73.304, "eval_steps_per_second": 2.45, "eval_wer": 0.2616475898758665, "step": 244000 }, { "epoch": 717.94, "learning_rate": 8.40712026008833e-07, "loss": 0.081, "step": 244100 }, { "epoch": 718.24, "learning_rate": 8.377986873014355e-07, "loss": 0.0802, "step": 244200 }, { "epoch": 718.53, "learning_rate": 8.348899435400249e-07, "loss": 0.0806, "step": 244300 }, { "epoch": 718.82, "learning_rate": 8.319857979357665e-07, "loss": 0.0783, "step": 244400 }, { "epoch": 719.12, "learning_rate": 8.290862536947514e-07, "loss": 0.0785, "step": 244500 }, { "epoch": 719.41, "learning_rate": 8.2619131401799e-07, "loss": 0.083, "step": 244600 }, { "epoch": 719.71, "learning_rate": 8.233009821014081e-07, "loss": 0.0873, "step": 244700 }, { "epoch": 720.0, "learning_rate": 8.204152611358468e-07, "loss": 0.0818, "step": 244800 }, { "epoch": 720.29, "learning_rate": 8.175341543070553e-07, "loss": 0.0802, "step": 244900 }, { "epoch": 720.59, "learning_rate": 8.146576647956905e-07, "loss": 0.079, "step": 245000 }, { "epoch": 720.59, "eval_cer": 0.06970053615797045, "eval_loss": 0.5707852840423584, "eval_runtime": 4.806, "eval_samples_per_second": 74.699, "eval_steps_per_second": 2.497, "eval_wer": 0.2603578913428986, "step": 245000 }, { "epoch": 720.88, "learning_rate": 8.117857957773096e-07, "loss": 0.0786, "step": 245100 }, { "epoch": 721.18, "learning_rate": 8.089185504223712e-07, "loss": 0.0819, "step": 245200 }, { "epoch": 721.47, "learning_rate": 8.060559318962285e-07, "loss": 0.0851, "step": 245300 }, { "epoch": 721.76, "learning_rate": 8.031979433591263e-07, "loss": 0.0834, "step": 245400 }, { "epoch": 722.06, "learning_rate": 8.003445879661992e-07, "loss": 0.0787, "step": 245500 }, { "epoch": 722.35, "learning_rate": 7.974958688674661e-07, "loss": 0.0825, "step": 245600 }, { "epoch": 722.65, "learning_rate": 7.946517892078281e-07, "loss": 0.0861, "step": 245700 }, { "epoch": 722.94, "learning_rate": 7.918123521270637e-07, "loss": 0.0819, "step": 245800 }, { "epoch": 723.24, "learning_rate": 7.889775607598276e-07, "loss": 0.0841, "step": 245900 }, { "epoch": 723.53, "learning_rate": 7.861474182356449e-07, "loss": 0.0792, "step": 246000 }, { "epoch": 723.53, "eval_cer": 0.06961335600017436, "eval_loss": 0.568951427936554, "eval_runtime": 4.8277, "eval_samples_per_second": 74.362, "eval_steps_per_second": 2.486, "eval_wer": 0.2600354667096566, "step": 246000 }, { "epoch": 723.82, "learning_rate": 7.833501595469872e-07, "loss": 0.0801, "step": 246100 }, { "epoch": 724.12, "learning_rate": 7.805292775106627e-07, "loss": 0.0805, "step": 246200 }, { "epoch": 724.41, "learning_rate": 7.777130536440419e-07, "loss": 0.0792, "step": 246300 }, { "epoch": 724.71, "learning_rate": 7.749014910561536e-07, "loss": 0.083, "step": 246400 }, { "epoch": 725.0, "learning_rate": 7.720945928508789e-07, "loss": 0.082, "step": 246500 }, { "epoch": 725.29, "learning_rate": 7.692923621269482e-07, "loss": 0.0778, "step": 246600 }, { "epoch": 725.59, "learning_rate": 7.664948019779444e-07, "loss": 0.0814, "step": 246700 }, { "epoch": 725.88, "learning_rate": 7.637019154922865e-07, "loss": 0.0849, "step": 246800 }, { "epoch": 726.18, "learning_rate": 7.60913705753239e-07, "loss": 0.0785, "step": 246900 }, { "epoch": 726.47, "learning_rate": 7.581301758389026e-07, "loss": 0.0731, "step": 247000 }, { "epoch": 726.47, "eval_cer": 0.06956976592127631, "eval_loss": 0.5695874691009521, "eval_runtime": 5.5665, "eval_samples_per_second": 64.492, "eval_steps_per_second": 2.156, "eval_wer": 0.2600354667096566, "step": 247000 }, { "epoch": 726.76, "learning_rate": 7.553513288222108e-07, "loss": 0.0777, "step": 247100 }, { "epoch": 727.06, "learning_rate": 7.525771677709276e-07, "loss": 0.0844, "step": 247200 }, { "epoch": 727.35, "learning_rate": 7.498076957476447e-07, "loss": 0.0797, "step": 247300 }, { "epoch": 727.65, "learning_rate": 7.470429158097758e-07, "loss": 0.084, "step": 247400 }, { "epoch": 727.94, "learning_rate": 7.442828310095562e-07, "loss": 0.0799, "step": 247500 }, { "epoch": 728.24, "learning_rate": 7.415274443940363e-07, "loss": 0.0826, "step": 247600 }, { "epoch": 728.53, "learning_rate": 7.387767590050809e-07, "loss": 0.0842, "step": 247700 }, { "epoch": 728.82, "learning_rate": 7.360307778793646e-07, "loss": 0.0789, "step": 247800 }, { "epoch": 729.12, "learning_rate": 7.332895040483689e-07, "loss": 0.078, "step": 247900 }, { "epoch": 729.41, "learning_rate": 7.305529405383776e-07, "loss": 0.0822, "step": 248000 }, { "epoch": 729.41, "eval_cer": 0.06987489647356261, "eval_loss": 0.5686177015304565, "eval_runtime": 4.9297, "eval_samples_per_second": 72.824, "eval_steps_per_second": 2.434, "eval_wer": 0.26293728840883446, "step": 248000 }, { "epoch": 729.71, "learning_rate": 7.278210903704763e-07, "loss": 0.0813, "step": 248100 }, { "epoch": 730.0, "learning_rate": 7.250939565605447e-07, "loss": 0.0878, "step": 248200 }, { "epoch": 730.29, "learning_rate": 7.223715421192573e-07, "loss": 0.0789, "step": 248300 }, { "epoch": 730.59, "learning_rate": 7.196538500520789e-07, "loss": 0.0767, "step": 248400 }, { "epoch": 730.88, "learning_rate": 7.169408833592606e-07, "loss": 0.0817, "step": 248500 }, { "epoch": 731.18, "learning_rate": 7.142326450358361e-07, "loss": 0.0814, "step": 248600 }, { "epoch": 731.47, "learning_rate": 7.115291380716194e-07, "loss": 0.0797, "step": 248700 }, { "epoch": 731.76, "learning_rate": 7.088303654512024e-07, "loss": 0.0835, "step": 248800 }, { "epoch": 732.06, "learning_rate": 7.061363301539486e-07, "loss": 0.0806, "step": 248900 }, { "epoch": 732.35, "learning_rate": 7.03447035153993e-07, "loss": 0.08, "step": 249000 }, { "epoch": 732.35, "eval_cer": 0.06952617584237827, "eval_loss": 0.5695518851280212, "eval_runtime": 4.6502, "eval_samples_per_second": 77.2, "eval_steps_per_second": 2.581, "eval_wer": 0.2621312268257295, "step": 249000 }, { "epoch": 732.65, "learning_rate": 7.00762483420237e-07, "loss": 0.0801, "step": 249100 }, { "epoch": 732.94, "learning_rate": 6.980826779163457e-07, "loss": 0.086, "step": 249200 }, { "epoch": 733.24, "learning_rate": 6.954076216007438e-07, "loss": 0.0809, "step": 249300 }, { "epoch": 733.53, "learning_rate": 6.927373174266139e-07, "loss": 0.0798, "step": 249400 }, { "epoch": 733.82, "learning_rate": 6.900717683418923e-07, "loss": 0.0821, "step": 249500 }, { "epoch": 734.12, "learning_rate": 6.874109772892651e-07, "loss": 0.0794, "step": 249600 }, { "epoch": 734.41, "learning_rate": 6.847549472061671e-07, "loss": 0.0817, "step": 249700 }, { "epoch": 734.71, "learning_rate": 6.821036810247755e-07, "loss": 0.0783, "step": 249800 }, { "epoch": 735.0, "learning_rate": 6.794571816720085e-07, "loss": 0.0798, "step": 249900 }, { "epoch": 735.29, "learning_rate": 6.768154520695241e-07, "loss": 0.082, "step": 250000 }, { "epoch": 735.29, "eval_cer": 0.06987489647356261, "eval_loss": 0.5729803442955017, "eval_runtime": 4.2644, "eval_samples_per_second": 84.185, "eval_steps_per_second": 2.814, "eval_wer": 0.2621312268257295, "step": 250000 }, { "epoch": 735.59, "learning_rate": 6.74178495133711e-07, "loss": 0.0774, "step": 250100 }, { "epoch": 735.88, "learning_rate": 6.715463137756923e-07, "loss": 0.0809, "step": 250200 }, { "epoch": 736.18, "learning_rate": 6.689189109013167e-07, "loss": 0.083, "step": 250300 }, { "epoch": 736.47, "learning_rate": 6.662962894111591e-07, "loss": 0.0831, "step": 250400 }, { "epoch": 736.76, "learning_rate": 6.636784522005152e-07, "loss": 0.088, "step": 250500 }, { "epoch": 737.06, "learning_rate": 6.610654021593993e-07, "loss": 0.0841, "step": 250600 }, { "epoch": 737.35, "learning_rate": 6.5845714217254e-07, "loss": 0.0807, "step": 250700 }, { "epoch": 737.65, "learning_rate": 6.55853675119379e-07, "loss": 0.0819, "step": 250800 }, { "epoch": 737.94, "learning_rate": 6.532550038740665e-07, "loss": 0.0881, "step": 250900 }, { "epoch": 738.24, "learning_rate": 6.506611313054567e-07, "loss": 0.0821, "step": 251000 }, { "epoch": 738.24, "eval_cer": 0.0696569460790724, "eval_loss": 0.5708038806915283, "eval_runtime": 5.0046, "eval_samples_per_second": 71.734, "eval_steps_per_second": 2.398, "eval_wer": 0.26180880219248753, "step": 251000 }, { "epoch": 738.53, "learning_rate": 6.48072060277109e-07, "loss": 0.0755, "step": 251100 }, { "epoch": 738.82, "learning_rate": 6.454877936472798e-07, "loss": 0.0852, "step": 251200 }, { "epoch": 739.12, "learning_rate": 6.429083342689224e-07, "loss": 0.0845, "step": 251300 }, { "epoch": 739.41, "learning_rate": 6.403336849896824e-07, "loss": 0.087, "step": 251400 }, { "epoch": 739.71, "learning_rate": 6.377638486518967e-07, "loss": 0.0781, "step": 251500 }, { "epoch": 740.0, "learning_rate": 6.351988280925874e-07, "loss": 0.0796, "step": 251600 }, { "epoch": 740.29, "learning_rate": 6.326386261434603e-07, "loss": 0.0832, "step": 251700 }, { "epoch": 740.59, "learning_rate": 6.300832456309036e-07, "loss": 0.0829, "step": 251800 }, { "epoch": 740.88, "learning_rate": 6.275326893759775e-07, "loss": 0.0798, "step": 251900 }, { "epoch": 741.18, "learning_rate": 6.249869601944236e-07, "loss": 0.079, "step": 252000 }, { "epoch": 741.18, "eval_cer": 0.06948258576348024, "eval_loss": 0.5701922178268433, "eval_runtime": 5.0097, "eval_samples_per_second": 71.661, "eval_steps_per_second": 2.395, "eval_wer": 0.26148637755924553, "step": 252000 }, { "epoch": 741.47, "learning_rate": 6.224460608966492e-07, "loss": 0.0847, "step": 252100 }, { "epoch": 741.76, "learning_rate": 6.199099942877318e-07, "loss": 0.0833, "step": 252200 }, { "epoch": 742.06, "learning_rate": 6.174040515337682e-07, "loss": 0.0784, "step": 252300 }, { "epoch": 742.35, "learning_rate": 6.148776102998055e-07, "loss": 0.0839, "step": 252400 }, { "epoch": 742.65, "learning_rate": 6.123560101100456e-07, "loss": 0.0819, "step": 252500 }, { "epoch": 742.94, "learning_rate": 6.098392537482562e-07, "loss": 0.084, "step": 252600 }, { "epoch": 743.24, "learning_rate": 6.073273439928623e-07, "loss": 0.0823, "step": 252700 }, { "epoch": 743.53, "learning_rate": 6.04820283616937e-07, "loss": 0.0781, "step": 252800 }, { "epoch": 743.82, "learning_rate": 6.023180753882008e-07, "loss": 0.0802, "step": 252900 }, { "epoch": 744.12, "learning_rate": 5.998207220690161e-07, "loss": 0.0867, "step": 253000 }, { "epoch": 744.12, "eval_cer": 0.0696569460790724, "eval_loss": 0.5710974335670471, "eval_runtime": 4.3252, "eval_samples_per_second": 83.003, "eval_steps_per_second": 2.774, "eval_wer": 0.26132516524262456, "step": 253000 }, { "epoch": 744.41, "learning_rate": 5.973282264163866e-07, "loss": 0.0813, "step": 253100 }, { "epoch": 744.71, "learning_rate": 5.948405911819538e-07, "loss": 0.0816, "step": 253200 }, { "epoch": 745.0, "learning_rate": 5.923578191119922e-07, "loss": 0.0733, "step": 253300 }, { "epoch": 745.29, "learning_rate": 5.898799129474076e-07, "loss": 0.0871, "step": 253400 }, { "epoch": 745.59, "learning_rate": 5.874068754237349e-07, "loss": 0.0823, "step": 253500 }, { "epoch": 745.88, "learning_rate": 5.849387092711339e-07, "loss": 0.0796, "step": 253600 }, { "epoch": 746.18, "learning_rate": 5.824754172143865e-07, "loss": 0.0801, "step": 253700 }, { "epoch": 746.47, "learning_rate": 5.800170019728929e-07, "loss": 0.0778, "step": 253800 }, { "epoch": 746.76, "learning_rate": 5.7756346626067e-07, "loss": 0.084, "step": 253900 }, { "epoch": 747.06, "learning_rate": 5.751148127863487e-07, "loss": 0.0825, "step": 254000 }, { "epoch": 747.06, "eval_cer": 0.0696569460790724, "eval_loss": 0.5694045424461365, "eval_runtime": 5.1895, "eval_samples_per_second": 69.178, "eval_steps_per_second": 2.312, "eval_wer": 0.2619700145091085, "step": 254000 }, { "epoch": 747.35, "learning_rate": 5.72671044253168e-07, "loss": 0.083, "step": 254100 }, { "epoch": 747.65, "learning_rate": 5.702321633589785e-07, "loss": 0.0792, "step": 254200 }, { "epoch": 747.94, "learning_rate": 5.67822488485888e-07, "loss": 0.0769, "step": 254300 }, { "epoch": 748.24, "learning_rate": 5.65393341998165e-07, "loss": 0.0792, "step": 254400 }, { "epoch": 748.53, "learning_rate": 5.629690911837949e-07, "loss": 0.083, "step": 254500 }, { "epoch": 748.82, "learning_rate": 5.605497387190828e-07, "loss": 0.0827, "step": 254600 }, { "epoch": 749.12, "learning_rate": 5.581352872749168e-07, "loss": 0.08, "step": 254700 }, { "epoch": 749.41, "learning_rate": 5.557257395167842e-07, "loss": 0.0814, "step": 254800 }, { "epoch": 749.71, "learning_rate": 5.533451202237355e-07, "loss": 0.0788, "step": 254900 }, { "epoch": 750.0, "learning_rate": 5.509453387093233e-07, "loss": 0.0834, "step": 255000 }, { "epoch": 750.0, "eval_cer": 0.0696569460790724, "eval_loss": 0.5699195265769958, "eval_runtime": 4.7379, "eval_samples_per_second": 75.771, "eval_steps_per_second": 2.533, "eval_wer": 0.26100274060938256, "step": 255000 }, { "epoch": 750.29, "learning_rate": 5.485743931961168e-07, "loss": 0.0805, "step": 255100 }, { "epoch": 750.59, "learning_rate": 5.461843884168661e-07, "loss": 0.0782, "step": 255200 }, { "epoch": 750.88, "learning_rate": 5.437993005170794e-07, "loss": 0.0808, "step": 255300 }, { "epoch": 751.18, "learning_rate": 5.414191321298273e-07, "loss": 0.081, "step": 255400 }, { "epoch": 751.47, "learning_rate": 5.390438858827412e-07, "loss": 0.0777, "step": 255500 }, { "epoch": 751.76, "learning_rate": 5.366735643980225e-07, "loss": 0.0813, "step": 255600 }, { "epoch": 752.06, "learning_rate": 5.343081702924374e-07, "loss": 0.0839, "step": 255700 }, { "epoch": 752.35, "learning_rate": 5.319477061773076e-07, "loss": 0.0833, "step": 255800 }, { "epoch": 752.65, "learning_rate": 5.296157055488105e-07, "loss": 0.0832, "step": 255900 }, { "epoch": 752.94, "learning_rate": 5.272650598619727e-07, "loss": 0.0832, "step": 256000 }, { "epoch": 752.94, "eval_cer": 0.06948258576348024, "eval_loss": 0.5696724057197571, "eval_runtime": 4.9457, "eval_samples_per_second": 72.589, "eval_steps_per_second": 2.426, "eval_wer": 0.2608415282927616, "step": 256000 }, { "epoch": 753.24, "learning_rate": 5.249193519409756e-07, "loss": 0.085, "step": 256100 }, { "epoch": 753.53, "learning_rate": 5.2257858437541e-07, "loss": 0.0806, "step": 256200 }, { "epoch": 753.82, "learning_rate": 5.202427597494153e-07, "loss": 0.0789, "step": 256300 }, { "epoch": 754.12, "learning_rate": 5.179118806416677e-07, "loss": 0.077, "step": 256400 }, { "epoch": 754.41, "learning_rate": 5.155859496253928e-07, "loss": 0.0791, "step": 256500 }, { "epoch": 754.71, "learning_rate": 5.132649692683472e-07, "loss": 0.083, "step": 256600 }, { "epoch": 755.0, "learning_rate": 5.109489421328234e-07, "loss": 0.0836, "step": 256700 }, { "epoch": 755.29, "learning_rate": 5.086378707756473e-07, "loss": 0.0783, "step": 256800 }, { "epoch": 755.59, "learning_rate": 5.063317577481718e-07, "loss": 0.0771, "step": 256900 }, { "epoch": 755.88, "learning_rate": 5.040306055962773e-07, "loss": 0.0818, "step": 257000 }, { "epoch": 755.88, "eval_cer": 0.07009284686805282, "eval_loss": 0.5731448531150818, "eval_runtime": 5.0204, "eval_samples_per_second": 71.508, "eval_steps_per_second": 2.39, "eval_wer": 0.26293728840883446, "step": 257000 }, { "epoch": 756.18, "learning_rate": 5.017344168603672e-07, "loss": 0.0777, "step": 257100 }, { "epoch": 756.47, "learning_rate": 4.994431940753647e-07, "loss": 0.0805, "step": 257200 }, { "epoch": 756.76, "learning_rate": 4.971569397707115e-07, "loss": 0.084, "step": 257300 }, { "epoch": 757.06, "learning_rate": 4.948756564703649e-07, "loss": 0.0813, "step": 257400 }, { "epoch": 757.35, "learning_rate": 4.925993466927925e-07, "loss": 0.0771, "step": 257500 }, { "epoch": 757.65, "learning_rate": 4.90328012950973e-07, "loss": 0.0761, "step": 257600 }, { "epoch": 757.94, "learning_rate": 4.880616577523911e-07, "loss": 0.0808, "step": 257700 }, { "epoch": 758.24, "learning_rate": 4.85800283599035e-07, "loss": 0.0815, "step": 257800 }, { "epoch": 758.53, "learning_rate": 4.835438929873937e-07, "loss": 0.076, "step": 257900 }, { "epoch": 758.82, "learning_rate": 4.812924884084569e-07, "loss": 0.0814, "step": 258000 }, { "epoch": 758.82, "eval_cer": 0.0696569460790724, "eval_loss": 0.5717082619667053, "eval_runtime": 5.3882, "eval_samples_per_second": 66.627, "eval_steps_per_second": 2.227, "eval_wer": 0.26229243914235045, "step": 258000 }, { "epoch": 759.12, "learning_rate": 4.790460723477053e-07, "loss": 0.0782, "step": 258100 }, { "epoch": 759.41, "learning_rate": 4.768046472851168e-07, "loss": 0.0824, "step": 258200 }, { "epoch": 759.71, "learning_rate": 4.745682156951581e-07, "loss": 0.0792, "step": 258300 }, { "epoch": 760.0, "learning_rate": 4.723367800467826e-07, "loss": 0.0804, "step": 258400 }, { "epoch": 760.29, "learning_rate": 4.701103428034287e-07, "loss": 0.0797, "step": 258500 }, { "epoch": 760.59, "learning_rate": 4.6788890642301523e-07, "loss": 0.0806, "step": 258600 }, { "epoch": 760.88, "learning_rate": 4.656724733579432e-07, "loss": 0.0782, "step": 258700 }, { "epoch": 761.18, "learning_rate": 4.6348313554157366e-07, "loss": 0.0771, "step": 258800 }, { "epoch": 761.47, "learning_rate": 4.6127666634818326e-07, "loss": 0.078, "step": 258900 }, { "epoch": 761.76, "learning_rate": 4.590752077698496e-07, "loss": 0.0803, "step": 259000 }, { "epoch": 761.76, "eval_cer": 0.0699620766313587, "eval_loss": 0.5720624327659607, "eval_runtime": 4.7445, "eval_samples_per_second": 75.667, "eval_steps_per_second": 2.529, "eval_wer": 0.2624536514589715, "step": 259000 }, { "epoch": 762.06, "learning_rate": 4.56878762236917e-07, "loss": 0.0821, "step": 259100 }, { "epoch": 762.35, "learning_rate": 4.5468733217419626e-07, "loss": 0.0828, "step": 259200 }, { "epoch": 762.65, "learning_rate": 4.5250092000096e-07, "loss": 0.0827, "step": 259300 }, { "epoch": 762.94, "learning_rate": 4.5031952813094246e-07, "loss": 0.078, "step": 259400 }, { "epoch": 763.24, "learning_rate": 4.4814315897233507e-07, "loss": 0.081, "step": 259500 }, { "epoch": 763.53, "learning_rate": 4.459718149277842e-07, "loss": 0.0785, "step": 259600 }, { "epoch": 763.82, "learning_rate": 4.438054983943896e-07, "loss": 0.0798, "step": 259700 }, { "epoch": 764.12, "learning_rate": 4.416442117636988e-07, "loss": 0.0811, "step": 259800 }, { "epoch": 764.41, "learning_rate": 4.3948795742170867e-07, "loss": 0.0797, "step": 259900 }, { "epoch": 764.71, "learning_rate": 4.3733673774885965e-07, "loss": 0.0825, "step": 260000 }, { "epoch": 764.71, "eval_cer": 0.06974412623686849, "eval_loss": 0.573108971118927, "eval_runtime": 4.5318, "eval_samples_per_second": 79.217, "eval_steps_per_second": 2.648, "eval_wer": 0.2603578913428986, "step": 260000 }, { "epoch": 765.0, "learning_rate": 4.3519055512003306e-07, "loss": 0.0815, "step": 260100 }, { "epoch": 765.29, "learning_rate": 4.3304941190455195e-07, "loss": 0.0779, "step": 260200 }, { "epoch": 765.59, "learning_rate": 4.309133104661728e-07, "loss": 0.0785, "step": 260300 }, { "epoch": 765.88, "learning_rate": 4.287822531630892e-07, "loss": 0.0813, "step": 260400 }, { "epoch": 766.18, "learning_rate": 4.2665624234792425e-07, "loss": 0.0765, "step": 260500 }, { "epoch": 766.47, "learning_rate": 4.245352803677305e-07, "loss": 0.0816, "step": 260600 }, { "epoch": 766.76, "learning_rate": 4.2241936956398665e-07, "loss": 0.082, "step": 260700 }, { "epoch": 767.06, "learning_rate": 4.203085122725953e-07, "loss": 0.0868, "step": 260800 }, { "epoch": 767.35, "learning_rate": 4.18202710823879e-07, "loss": 0.0798, "step": 260900 }, { "epoch": 767.65, "learning_rate": 4.1610196754258095e-07, "loss": 0.0776, "step": 261000 }, { "epoch": 767.65, "eval_cer": 0.06978771631576654, "eval_loss": 0.5764541029930115, "eval_runtime": 5.2048, "eval_samples_per_second": 68.974, "eval_steps_per_second": 2.306, "eval_wer": 0.26148637755924553, "step": 261000 }, { "epoch": 767.94, "learning_rate": 4.140062847478576e-07, "loss": 0.0765, "step": 261100 }, { "epoch": 768.24, "learning_rate": 4.119156647532818e-07, "loss": 0.0849, "step": 261200 }, { "epoch": 768.53, "learning_rate": 4.098301098668339e-07, "loss": 0.0767, "step": 261300 }, { "epoch": 768.82, "learning_rate": 4.0774962239090553e-07, "loss": 0.0869, "step": 261400 }, { "epoch": 769.12, "learning_rate": 4.0567420462229225e-07, "loss": 0.0747, "step": 261500 }, { "epoch": 769.41, "learning_rate": 4.0360385885219345e-07, "loss": 0.0817, "step": 261600 }, { "epoch": 769.71, "learning_rate": 4.0153858736620865e-07, "loss": 0.0824, "step": 261700 }, { "epoch": 770.0, "learning_rate": 3.994783924443368e-07, "loss": 0.0799, "step": 261800 }, { "epoch": 770.29, "learning_rate": 3.9742327636097034e-07, "loss": 0.0778, "step": 261900 }, { "epoch": 770.59, "learning_rate": 3.953732413848971e-07, "loss": 0.0805, "step": 262000 }, { "epoch": 770.59, "eval_cer": 0.0696569460790724, "eval_loss": 0.5757123827934265, "eval_runtime": 5.0402, "eval_samples_per_second": 71.227, "eval_steps_per_second": 2.381, "eval_wer": 0.26116395292600353, "step": 262000 }, { "epoch": 770.88, "learning_rate": 3.9332828977929395e-07, "loss": 0.0764, "step": 262100 }, { "epoch": 771.18, "learning_rate": 3.912884238017267e-07, "loss": 0.0782, "step": 262200 }, { "epoch": 771.47, "learning_rate": 3.892536457041468e-07, "loss": 0.078, "step": 262300 }, { "epoch": 771.76, "learning_rate": 3.872239577328879e-07, "loss": 0.0835, "step": 262400 }, { "epoch": 772.06, "learning_rate": 3.8519936212866483e-07, "loss": 0.0789, "step": 262500 }, { "epoch": 772.35, "learning_rate": 3.831798611265708e-07, "loss": 0.0807, "step": 262600 }, { "epoch": 772.65, "learning_rate": 3.811654569560752e-07, "loss": 0.0804, "step": 262700 }, { "epoch": 772.94, "learning_rate": 3.7915615184101973e-07, "loss": 0.0755, "step": 262800 }, { "epoch": 773.24, "learning_rate": 3.771519479996172e-07, "loss": 0.0802, "step": 262900 }, { "epoch": 773.53, "learning_rate": 3.751528476444488e-07, "loss": 0.0794, "step": 263000 }, { "epoch": 773.53, "eval_cer": 0.0699620766313587, "eval_loss": 0.5735283493995667, "eval_runtime": 4.7277, "eval_samples_per_second": 75.936, "eval_steps_per_second": 2.538, "eval_wer": 0.2619700145091085, "step": 263000 }, { "epoch": 773.82, "learning_rate": 3.7315885298246145e-07, "loss": 0.0781, "step": 263100 }, { "epoch": 774.12, "learning_rate": 3.7116996621496647e-07, "loss": 0.0834, "step": 263200 }, { "epoch": 774.41, "learning_rate": 3.6918618953763477e-07, "loss": 0.085, "step": 263300 }, { "epoch": 774.71, "learning_rate": 3.672075251404966e-07, "loss": 0.0768, "step": 263400 }, { "epoch": 775.0, "learning_rate": 3.6523397520793866e-07, "loss": 0.0799, "step": 263500 }, { "epoch": 775.29, "learning_rate": 3.632655419187009e-07, "loss": 0.0777, "step": 263600 }, { "epoch": 775.59, "learning_rate": 3.6130222744587493e-07, "loss": 0.078, "step": 263700 }, { "epoch": 775.88, "learning_rate": 3.5934403395690266e-07, "loss": 0.0777, "step": 263800 }, { "epoch": 776.18, "learning_rate": 3.5739096361356806e-07, "loss": 0.0825, "step": 263900 }, { "epoch": 776.47, "learning_rate": 3.554430185720054e-07, "loss": 0.0803, "step": 264000 }, { "epoch": 776.47, "eval_cer": 0.06961335600017436, "eval_loss": 0.5729749798774719, "eval_runtime": 4.7677, "eval_samples_per_second": 75.299, "eval_steps_per_second": 2.517, "eval_wer": 0.2605191036595196, "step": 264000 }, { "epoch": 776.76, "learning_rate": 3.535002009826871e-07, "loss": 0.0819, "step": 264100 }, { "epoch": 777.06, "learning_rate": 3.515625129904249e-07, "loss": 0.082, "step": 264200 }, { "epoch": 777.35, "learning_rate": 3.4962995673437083e-07, "loss": 0.081, "step": 264300 }, { "epoch": 777.65, "learning_rate": 3.47702534348005e-07, "loss": 0.0817, "step": 264400 }, { "epoch": 777.94, "learning_rate": 3.457802479591482e-07, "loss": 0.0803, "step": 264500 }, { "epoch": 778.24, "learning_rate": 3.438630996899461e-07, "loss": 0.0789, "step": 264600 }, { "epoch": 778.53, "learning_rate": 3.4195109165687246e-07, "loss": 0.0813, "step": 264700 }, { "epoch": 778.82, "learning_rate": 3.400442259707282e-07, "loss": 0.0788, "step": 264800 }, { "epoch": 779.12, "learning_rate": 3.3814250473663434e-07, "loss": 0.0763, "step": 264900 }, { "epoch": 779.41, "learning_rate": 3.362459300540355e-07, "loss": 0.0792, "step": 265000 }, { "epoch": 779.41, "eval_cer": 0.0699620766313587, "eval_loss": 0.5743491649627686, "eval_runtime": 4.8049, "eval_samples_per_second": 74.715, "eval_steps_per_second": 2.497, "eval_wer": 0.26180880219248753, "step": 265000 }, { "epoch": 779.71, "learning_rate": 3.34354504016694e-07, "loss": 0.0802, "step": 265100 }, { "epoch": 780.0, "learning_rate": 3.324682287126868e-07, "loss": 0.0815, "step": 265200 }, { "epoch": 780.29, "learning_rate": 3.305871062244065e-07, "loss": 0.0819, "step": 265300 }, { "epoch": 780.59, "learning_rate": 3.2871113862855407e-07, "loss": 0.0791, "step": 265400 }, { "epoch": 780.88, "learning_rate": 3.2684032799614463e-07, "loss": 0.0783, "step": 265500 }, { "epoch": 781.18, "learning_rate": 3.2497467639249437e-07, "loss": 0.081, "step": 265600 }, { "epoch": 781.47, "learning_rate": 3.231141858772291e-07, "loss": 0.0853, "step": 265700 }, { "epoch": 781.76, "learning_rate": 3.2125885850427476e-07, "loss": 0.0836, "step": 265800 }, { "epoch": 782.06, "learning_rate": 3.194086963218551e-07, "loss": 0.0812, "step": 265900 }, { "epoch": 782.35, "learning_rate": 3.175637013724975e-07, "loss": 0.0816, "step": 266000 }, { "epoch": 782.35, "eval_cer": 0.06961335600017436, "eval_loss": 0.5711695551872253, "eval_runtime": 4.7303, "eval_samples_per_second": 75.894, "eval_steps_per_second": 2.537, "eval_wer": 0.2605191036595196, "step": 266000 }, { "epoch": 782.65, "learning_rate": 3.1572387569301753e-07, "loss": 0.0772, "step": 266100 }, { "epoch": 782.94, "learning_rate": 3.1388922131453006e-07, "loss": 0.0852, "step": 266200 }, { "epoch": 783.24, "learning_rate": 3.120597402624398e-07, "loss": 0.0799, "step": 266300 }, { "epoch": 783.53, "learning_rate": 3.102354345564357e-07, "loss": 0.0778, "step": 266400 }, { "epoch": 783.82, "learning_rate": 3.0841630621050055e-07, "loss": 0.082, "step": 266500 }, { "epoch": 784.12, "learning_rate": 3.066023572328941e-07, "loss": 0.0835, "step": 266600 }, { "epoch": 784.41, "learning_rate": 3.04793589626165e-07, "loss": 0.0808, "step": 266700 }, { "epoch": 784.71, "learning_rate": 3.0299000538713816e-07, "loss": 0.0792, "step": 266800 }, { "epoch": 785.0, "learning_rate": 3.0119160650691424e-07, "loss": 0.0736, "step": 266900 }, { "epoch": 785.29, "learning_rate": 2.993983949708756e-07, "loss": 0.0773, "step": 267000 }, { "epoch": 785.29, "eval_cer": 0.06970053615797045, "eval_loss": 0.5727453827857971, "eval_runtime": 5.3818, "eval_samples_per_second": 66.707, "eval_steps_per_second": 2.23, "eval_wer": 0.26068031597614055, "step": 267000 }, { "epoch": 785.59, "learning_rate": 2.976282272871539e-07, "loss": 0.083, "step": 267100 }, { "epoch": 785.88, "learning_rate": 2.958453444499787e-07, "loss": 0.0826, "step": 267200 }, { "epoch": 786.18, "learning_rate": 2.9406765485910036e-07, "loss": 0.0746, "step": 267300 }, { "epoch": 786.47, "learning_rate": 2.922951604770352e-07, "loss": 0.0792, "step": 267400 }, { "epoch": 786.76, "learning_rate": 2.9052786326056457e-07, "loss": 0.0823, "step": 267500 }, { "epoch": 787.06, "learning_rate": 2.8876576516073117e-07, "loss": 0.077, "step": 267600 }, { "epoch": 787.35, "learning_rate": 2.870088681228389e-07, "loss": 0.0817, "step": 267700 }, { "epoch": 787.65, "learning_rate": 2.852746652656024e-07, "loss": 0.0784, "step": 267800 }, { "epoch": 787.94, "learning_rate": 2.8352812410562815e-07, "loss": 0.0807, "step": 267900 }, { "epoch": 788.24, "learning_rate": 2.8178678978979357e-07, "loss": 0.0803, "step": 268000 }, { "epoch": 788.24, "eval_cer": 0.06943899568458219, "eval_loss": 0.5726141333580017, "eval_runtime": 4.5444, "eval_samples_per_second": 78.998, "eval_steps_per_second": 2.641, "eval_wer": 0.2608415282927616, "step": 268000 }, { "epoch": 788.53, "learning_rate": 2.800506642404821e-07, "loss": 0.0822, "step": 268100 }, { "epoch": 788.82, "learning_rate": 2.783197493743217e-07, "loss": 0.0829, "step": 268200 }, { "epoch": 789.12, "learning_rate": 2.765940471021933e-07, "loss": 0.0817, "step": 268300 }, { "epoch": 789.41, "learning_rate": 2.74873559329219e-07, "loss": 0.0793, "step": 268400 }, { "epoch": 789.71, "learning_rate": 2.731582879547667e-07, "loss": 0.082, "step": 268500 }, { "epoch": 790.0, "learning_rate": 2.71448234872444e-07, "loss": 0.0829, "step": 268600 }, { "epoch": 790.29, "learning_rate": 2.69743401970099e-07, "loss": 0.0781, "step": 268700 }, { "epoch": 790.59, "learning_rate": 2.680437911298167e-07, "loss": 0.0856, "step": 268800 }, { "epoch": 790.88, "learning_rate": 2.6634940422791577e-07, "loss": 0.0824, "step": 268900 }, { "epoch": 791.18, "learning_rate": 2.646602431349504e-07, "loss": 0.0814, "step": 269000 }, { "epoch": 791.18, "eval_cer": 0.0696569460790724, "eval_loss": 0.5711923241615295, "eval_runtime": 4.6959, "eval_samples_per_second": 76.449, "eval_steps_per_second": 2.555, "eval_wer": 0.26116395292600353, "step": 269000 }, { "epoch": 791.47, "learning_rate": 2.6297630971570234e-07, "loss": 0.0795, "step": 269100 }, { "epoch": 791.76, "learning_rate": 2.6129760582918383e-07, "loss": 0.0809, "step": 269200 }, { "epoch": 792.06, "learning_rate": 2.5962413332863534e-07, "loss": 0.0837, "step": 269300 }, { "epoch": 792.35, "learning_rate": 2.5795589406151846e-07, "loss": 0.0817, "step": 269400 }, { "epoch": 792.65, "learning_rate": 2.5629288986952217e-07, "loss": 0.0823, "step": 269500 }, { "epoch": 792.94, "learning_rate": 2.5463512258855126e-07, "loss": 0.0754, "step": 269600 }, { "epoch": 793.24, "learning_rate": 2.5298259404873125e-07, "loss": 0.0828, "step": 269700 }, { "epoch": 793.53, "learning_rate": 2.513353060744067e-07, "loss": 0.0811, "step": 269800 }, { "epoch": 793.82, "learning_rate": 2.4969326048413124e-07, "loss": 0.0767, "step": 269900 }, { "epoch": 794.12, "learning_rate": 2.4805645909067697e-07, "loss": 0.0896, "step": 270000 }, { "epoch": 794.12, "eval_cer": 0.0696569460790724, "eval_loss": 0.5720658898353577, "eval_runtime": 4.9834, "eval_samples_per_second": 72.039, "eval_steps_per_second": 2.408, "eval_wer": 0.26180880219248753, "step": 270000 }, { "epoch": 794.41, "learning_rate": 2.4642490370102247e-07, "loss": 0.0785, "step": 270100 }, { "epoch": 794.71, "learning_rate": 2.447985961163546e-07, "loss": 0.0761, "step": 270200 }, { "epoch": 795.0, "learning_rate": 2.4317753813207165e-07, "loss": 0.0814, "step": 270300 }, { "epoch": 795.29, "learning_rate": 2.415617315377705e-07, "loss": 0.0803, "step": 270400 }, { "epoch": 795.59, "learning_rate": 2.399511781172553e-07, "loss": 0.0776, "step": 270500 }, { "epoch": 795.88, "learning_rate": 2.3834587964852773e-07, "loss": 0.0789, "step": 270600 }, { "epoch": 796.18, "learning_rate": 2.3674583790378957e-07, "loss": 0.0781, "step": 270700 }, { "epoch": 796.47, "learning_rate": 2.3515105464943956e-07, "loss": 0.0801, "step": 270800 }, { "epoch": 796.76, "learning_rate": 2.3356153164606933e-07, "loss": 0.0792, "step": 270900 }, { "epoch": 797.06, "learning_rate": 2.3197727064846798e-07, "loss": 0.0819, "step": 271000 }, { "epoch": 797.06, "eval_cer": 0.0699620766313587, "eval_loss": 0.5707818865776062, "eval_runtime": 4.6691, "eval_samples_per_second": 76.889, "eval_steps_per_second": 2.57, "eval_wer": 0.2619700145091085, "step": 271000 }, { "epoch": 797.35, "learning_rate": 2.3039827340560928e-07, "loss": 0.0757, "step": 271100 }, { "epoch": 797.65, "learning_rate": 2.288245416606605e-07, "loss": 0.0793, "step": 271200 }, { "epoch": 797.94, "learning_rate": 2.272560771509741e-07, "loss": 0.0822, "step": 271300 }, { "epoch": 798.24, "learning_rate": 2.2569288160808778e-07, "loss": 0.0775, "step": 271400 }, { "epoch": 798.53, "learning_rate": 2.241349567577239e-07, "loss": 0.0837, "step": 271500 }, { "epoch": 798.82, "learning_rate": 2.225823043197839e-07, "loss": 0.0814, "step": 271600 }, { "epoch": 799.12, "learning_rate": 2.210349260083494e-07, "loss": 0.0812, "step": 271700 }, { "epoch": 799.41, "learning_rate": 2.1949282353168122e-07, "loss": 0.0828, "step": 271800 }, { "epoch": 799.71, "learning_rate": 2.179559985922125e-07, "loss": 0.0833, "step": 271900 }, { "epoch": 800.0, "learning_rate": 2.16424452886555e-07, "loss": 0.0765, "step": 272000 }, { "epoch": 800.0, "eval_cer": 0.06983130639466457, "eval_loss": 0.5701684355735779, "eval_runtime": 4.6145, "eval_samples_per_second": 77.799, "eval_steps_per_second": 2.601, "eval_wer": 0.2616475898758665, "step": 272000 }, { "epoch": 800.29, "learning_rate": 2.1489818810548736e-07, "loss": 0.077, "step": 272100 }, { "epoch": 800.59, "learning_rate": 2.1337720593396004e-07, "loss": 0.0785, "step": 272200 }, { "epoch": 800.88, "learning_rate": 2.118615080510933e-07, "loss": 0.084, "step": 272300 }, { "epoch": 801.18, "learning_rate": 2.1035109613017134e-07, "loss": 0.0812, "step": 272400 }, { "epoch": 801.47, "learning_rate": 2.0884597183864374e-07, "loss": 0.0806, "step": 272500 }, { "epoch": 801.76, "learning_rate": 2.073461368381241e-07, "loss": 0.0802, "step": 272600 }, { "epoch": 802.06, "learning_rate": 2.0586651202931184e-07, "loss": 0.0814, "step": 272700 }, { "epoch": 802.35, "learning_rate": 2.0437720763816893e-07, "loss": 0.0786, "step": 272800 }, { "epoch": 802.65, "learning_rate": 2.02893197471416e-07, "loss": 0.0823, "step": 272900 }, { "epoch": 802.94, "learning_rate": 2.0141448316735424e-07, "loss": 0.079, "step": 273000 }, { "epoch": 802.94, "eval_cer": 0.06961335600017436, "eval_loss": 0.5719471573829651, "eval_runtime": 4.6624, "eval_samples_per_second": 76.999, "eval_steps_per_second": 2.574, "eval_wer": 0.26148637755924553, "step": 273000 }, { "epoch": 803.24, "learning_rate": 1.9994106635844225e-07, "loss": 0.0813, "step": 273100 }, { "epoch": 803.53, "learning_rate": 1.9847294867128608e-07, "loss": 0.0827, "step": 273200 }, { "epoch": 803.82, "learning_rate": 1.970101317266454e-07, "loss": 0.0794, "step": 273300 }, { "epoch": 804.12, "learning_rate": 1.955526171394262e-07, "loss": 0.0853, "step": 273400 }, { "epoch": 804.41, "learning_rate": 1.941004065186797e-07, "loss": 0.0801, "step": 273500 }, { "epoch": 804.71, "learning_rate": 1.9265350146760564e-07, "loss": 0.0825, "step": 273600 }, { "epoch": 805.0, "learning_rate": 1.9121190358354135e-07, "loss": 0.0815, "step": 273700 }, { "epoch": 805.29, "learning_rate": 1.8977561445796932e-07, "loss": 0.0749, "step": 273800 }, { "epoch": 805.59, "learning_rate": 1.8835891917292903e-07, "loss": 0.0795, "step": 273900 }, { "epoch": 805.88, "learning_rate": 1.8693319918830056e-07, "loss": 0.0825, "step": 274000 }, { "epoch": 805.88, "eval_cer": 0.0699620766313587, "eval_loss": 0.5727930665016174, "eval_runtime": 4.7385, "eval_samples_per_second": 75.762, "eval_steps_per_second": 2.532, "eval_wer": 0.26277607609221343, "step": 274000 }, { "epoch": 806.18, "learning_rate": 1.8551279268572586e-07, "loss": 0.0821, "step": 274100 }, { "epoch": 806.47, "learning_rate": 1.8409770123329118e-07, "loss": 0.0779, "step": 274200 }, { "epoch": 806.76, "learning_rate": 1.826879263932152e-07, "loss": 0.0799, "step": 274300 }, { "epoch": 807.06, "learning_rate": 1.8128346972184797e-07, "loss": 0.0765, "step": 274400 }, { "epoch": 807.35, "learning_rate": 1.7988433276966698e-07, "loss": 0.0759, "step": 274500 }, { "epoch": 807.65, "learning_rate": 1.784905170812784e-07, "loss": 0.0778, "step": 274600 }, { "epoch": 807.94, "learning_rate": 1.7710202419541246e-07, "loss": 0.0823, "step": 274700 }, { "epoch": 808.24, "learning_rate": 1.7571885564492407e-07, "loss": 0.0776, "step": 274800 }, { "epoch": 808.53, "learning_rate": 1.7434101295678963e-07, "loss": 0.0765, "step": 274900 }, { "epoch": 808.82, "learning_rate": 1.7296849765210731e-07, "loss": 0.0799, "step": 275000 }, { "epoch": 808.82, "eval_cer": 0.06948258576348024, "eval_loss": 0.5712651610374451, "eval_runtime": 5.286, "eval_samples_per_second": 67.915, "eval_steps_per_second": 2.27, "eval_wer": 0.26116395292600353, "step": 275000 }, { "epoch": 809.12, "learning_rate": 1.7160131124609237e-07, "loss": 0.0826, "step": 275100 }, { "epoch": 809.41, "learning_rate": 1.702394552480774e-07, "loss": 0.0836, "step": 275200 }, { "epoch": 809.71, "learning_rate": 1.68882931161512e-07, "loss": 0.0807, "step": 275300 }, { "epoch": 810.0, "learning_rate": 1.675317404839566e-07, "loss": 0.0782, "step": 275400 }, { "epoch": 810.29, "learning_rate": 1.6618588470708686e-07, "loss": 0.0838, "step": 275500 }, { "epoch": 810.59, "learning_rate": 1.648453653166865e-07, "loss": 0.0816, "step": 275600 }, { "epoch": 810.88, "learning_rate": 1.635101837926495e-07, "loss": 0.0805, "step": 275700 }, { "epoch": 811.18, "learning_rate": 1.6218034160897567e-07, "loss": 0.0778, "step": 275800 }, { "epoch": 811.47, "learning_rate": 1.6085584023377177e-07, "loss": 0.0808, "step": 275900 }, { "epoch": 811.76, "learning_rate": 1.5953668112924758e-07, "loss": 0.0781, "step": 276000 }, { "epoch": 811.76, "eval_cer": 0.06987489647356261, "eval_loss": 0.5731009244918823, "eval_runtime": 4.7801, "eval_samples_per_second": 75.102, "eval_steps_per_second": 2.51, "eval_wer": 0.2619700145091085, "step": 276000 }, { "epoch": 812.06, "learning_rate": 1.5822286575171486e-07, "loss": 0.0751, "step": 276100 }, { "epoch": 812.35, "learning_rate": 1.5691439555158783e-07, "loss": 0.0798, "step": 276200 }, { "epoch": 812.65, "learning_rate": 1.556242767386512e-07, "loss": 0.0819, "step": 276300 }, { "epoch": 812.94, "learning_rate": 1.5432644773326065e-07, "loss": 0.0791, "step": 276400 }, { "epoch": 813.24, "learning_rate": 1.5303396820680326e-07, "loss": 0.0795, "step": 276500 }, { "epoch": 813.53, "learning_rate": 1.517468395861388e-07, "loss": 0.0786, "step": 276600 }, { "epoch": 813.82, "learning_rate": 1.5046506329221833e-07, "loss": 0.0815, "step": 276700 }, { "epoch": 814.12, "learning_rate": 1.49188640740085e-07, "loss": 0.0795, "step": 276800 }, { "epoch": 814.41, "learning_rate": 1.4791757333887213e-07, "loss": 0.077, "step": 276900 }, { "epoch": 814.71, "learning_rate": 1.466518624917984e-07, "loss": 0.0827, "step": 277000 }, { "epoch": 814.71, "eval_cer": 0.06922104529009197, "eval_loss": 0.5720049738883972, "eval_runtime": 4.7084, "eval_samples_per_second": 76.247, "eval_steps_per_second": 2.549, "eval_wer": 0.2608415282927616, "step": 277000 }, { "epoch": 815.0, "learning_rate": 1.453915095961722e-07, "loss": 0.0804, "step": 277100 }, { "epoch": 815.29, "learning_rate": 1.441365160433844e-07, "loss": 0.0796, "step": 277200 }, { "epoch": 815.59, "learning_rate": 1.428868832189112e-07, "loss": 0.0825, "step": 277300 }, { "epoch": 815.88, "learning_rate": 1.4164261250231014e-07, "loss": 0.0797, "step": 277400 }, { "epoch": 816.18, "learning_rate": 1.4040370526721802e-07, "loss": 0.0785, "step": 277500 }, { "epoch": 816.47, "learning_rate": 1.391701628813519e-07, "loss": 0.0773, "step": 277600 }, { "epoch": 816.76, "learning_rate": 1.3794198670650572e-07, "loss": 0.0803, "step": 277700 }, { "epoch": 817.06, "learning_rate": 1.3671917809854996e-07, "loss": 0.0822, "step": 277800 }, { "epoch": 817.35, "learning_rate": 1.3550173840742753e-07, "loss": 0.0765, "step": 277900 }, { "epoch": 817.65, "learning_rate": 1.3428966897715667e-07, "loss": 0.0767, "step": 278000 }, { "epoch": 817.65, "eval_cer": 0.06952617584237827, "eval_loss": 0.5717321038246155, "eval_runtime": 5.4079, "eval_samples_per_second": 66.384, "eval_steps_per_second": 2.219, "eval_wer": 0.2616475898758665, "step": 278000 }, { "epoch": 817.94, "learning_rate": 1.3308297114582535e-07, "loss": 0.0783, "step": 278100 }, { "epoch": 818.24, "learning_rate": 1.3188164624559186e-07, "loss": 0.0811, "step": 278200 }, { "epoch": 818.53, "learning_rate": 1.3068569560268307e-07, "loss": 0.0802, "step": 278300 }, { "epoch": 818.82, "learning_rate": 1.2949512053739232e-07, "loss": 0.0773, "step": 278400 }, { "epoch": 819.12, "learning_rate": 1.2830992236408046e-07, "loss": 0.0809, "step": 278500 }, { "epoch": 819.41, "learning_rate": 1.2713010239116919e-07, "loss": 0.0787, "step": 278600 }, { "epoch": 819.71, "learning_rate": 1.259556619211455e-07, "loss": 0.0758, "step": 278700 }, { "epoch": 820.0, "learning_rate": 1.2478660225055616e-07, "loss": 0.0862, "step": 278800 }, { "epoch": 820.29, "learning_rate": 1.2362292467000882e-07, "loss": 0.082, "step": 278900 }, { "epoch": 820.59, "learning_rate": 1.2246463046416745e-07, "loss": 0.0772, "step": 279000 }, { "epoch": 820.59, "eval_cer": 0.06956976592127631, "eval_loss": 0.5717667937278748, "eval_runtime": 4.7601, "eval_samples_per_second": 75.419, "eval_steps_per_second": 2.521, "eval_wer": 0.26148637755924553, "step": 279000 }, { "epoch": 820.88, "learning_rate": 1.213117209117559e-07, "loss": 0.0759, "step": 279100 }, { "epoch": 821.18, "learning_rate": 1.2016419728555108e-07, "loss": 0.0848, "step": 279200 }, { "epoch": 821.47, "learning_rate": 1.1902206085238455e-07, "loss": 0.0821, "step": 279300 }, { "epoch": 821.76, "learning_rate": 1.1788531287314109e-07, "loss": 0.0835, "step": 279400 }, { "epoch": 822.06, "learning_rate": 1.1675395460275629e-07, "loss": 0.083, "step": 279500 }, { "epoch": 822.35, "learning_rate": 1.1562798729021662e-07, "loss": 0.0793, "step": 279600 }, { "epoch": 822.65, "learning_rate": 1.145074121785561e-07, "loss": 0.083, "step": 279700 }, { "epoch": 822.94, "learning_rate": 1.133922305048557e-07, "loss": 0.0792, "step": 279800 }, { "epoch": 823.24, "learning_rate": 1.1228244350024342e-07, "loss": 0.0836, "step": 279900 }, { "epoch": 823.53, "learning_rate": 1.1118906958730913e-07, "loss": 0.0755, "step": 280000 }, { "epoch": 823.53, "eval_cer": 0.06961335600017436, "eval_loss": 0.5713757872581482, "eval_runtime": 4.7516, "eval_samples_per_second": 75.554, "eval_steps_per_second": 2.525, "eval_wer": 0.26132516524262456, "step": 280000 }, { "epoch": 823.82, "learning_rate": 1.1009002161327942e-07, "loss": 0.0798, "step": 280100 }, { "epoch": 824.12, "learning_rate": 1.0899637195387892e-07, "loss": 0.0788, "step": 280200 }, { "epoch": 824.41, "learning_rate": 1.0790812181646183e-07, "loss": 0.0808, "step": 280300 }, { "epoch": 824.71, "learning_rate": 1.0682527240242435e-07, "loss": 0.082, "step": 280400 }, { "epoch": 825.0, "learning_rate": 1.0574782490720082e-07, "loss": 0.0784, "step": 280500 }, { "epoch": 825.29, "learning_rate": 1.0467578052026029e-07, "loss": 0.0791, "step": 280600 }, { "epoch": 825.59, "learning_rate": 1.0360914042510883e-07, "loss": 0.0805, "step": 280700 }, { "epoch": 825.88, "learning_rate": 1.0254790579928398e-07, "loss": 0.0806, "step": 280800 }, { "epoch": 826.18, "learning_rate": 1.0149207781435689e-07, "loss": 0.0811, "step": 280900 }, { "epoch": 826.47, "learning_rate": 1.0044165763593183e-07, "loss": 0.077, "step": 281000 }, { "epoch": 826.47, "eval_cer": 0.06956976592127631, "eval_loss": 0.5718855857849121, "eval_runtime": 4.6002, "eval_samples_per_second": 78.04, "eval_steps_per_second": 2.609, "eval_wer": 0.2616475898758665, "step": 281000 }, { "epoch": 826.76, "learning_rate": 9.940706975758773e-08, "loss": 0.084, "step": 281100 }, { "epoch": 827.06, "learning_rate": 9.836741455820143e-08, "loss": 0.0778, "step": 281200 }, { "epoch": 827.35, "learning_rate": 9.733317061485114e-08, "loss": 0.0797, "step": 281300 }, { "epoch": 827.65, "learning_rate": 9.630433906931135e-08, "loss": 0.079, "step": 281400 }, { "epoch": 827.94, "learning_rate": 9.528092105738129e-08, "loss": 0.0846, "step": 281500 }, { "epoch": 828.24, "learning_rate": 9.42629177088844e-08, "loss": 0.0845, "step": 281600 }, { "epoch": 828.53, "learning_rate": 9.325033014766505e-08, "loss": 0.0766, "step": 281700 }, { "epoch": 828.82, "learning_rate": 9.224315949158957e-08, "loss": 0.0807, "step": 281800 }, { "epoch": 829.12, "learning_rate": 9.124140685254579e-08, "loss": 0.0794, "step": 281900 }, { "epoch": 829.41, "learning_rate": 9.024507333643684e-08, "loss": 0.0866, "step": 282000 }, { "epoch": 829.41, "eval_cer": 0.06961335600017436, "eval_loss": 0.5701565742492676, "eval_runtime": 4.6728, "eval_samples_per_second": 76.828, "eval_steps_per_second": 2.568, "eval_wer": 0.26116395292600353, "step": 282000 }, { "epoch": 829.71, "learning_rate": 8.925416004318732e-08, "loss": 0.0794, "step": 282100 }, { "epoch": 830.0, "learning_rate": 8.826866806673329e-08, "loss": 0.0786, "step": 282200 }, { "epoch": 830.29, "learning_rate": 8.728859849503057e-08, "loss": 0.0817, "step": 282300 }, { "epoch": 830.59, "learning_rate": 8.631395241004592e-08, "loss": 0.078, "step": 282400 }, { "epoch": 830.88, "learning_rate": 8.534473088775919e-08, "loss": 0.0766, "step": 282500 }, { "epoch": 831.18, "learning_rate": 8.43809349981628e-08, "loss": 0.0789, "step": 282600 }, { "epoch": 831.47, "learning_rate": 8.342256580525842e-08, "loss": 0.0821, "step": 282700 }, { "epoch": 831.76, "learning_rate": 8.246962436705642e-08, "loss": 0.082, "step": 282800 }, { "epoch": 832.06, "learning_rate": 8.152211173557634e-08, "loss": 0.0807, "step": 282900 }, { "epoch": 832.35, "learning_rate": 8.05800289568437e-08, "loss": 0.0791, "step": 283000 }, { "epoch": 832.35, "eval_cer": 0.0696569460790724, "eval_loss": 0.5718459486961365, "eval_runtime": 4.5798, "eval_samples_per_second": 78.388, "eval_steps_per_second": 2.62, "eval_wer": 0.26132516524262456, "step": 283000 }, { "epoch": 832.65, "learning_rate": 7.964337707088987e-08, "loss": 0.0784, "step": 283100 }, { "epoch": 832.94, "learning_rate": 7.871215711174995e-08, "loss": 0.0832, "step": 283200 }, { "epoch": 833.24, "learning_rate": 7.778637010746437e-08, "loss": 0.0796, "step": 283300 }, { "epoch": 833.53, "learning_rate": 7.686601708007224e-08, "loss": 0.0785, "step": 283400 }, { "epoch": 833.82, "learning_rate": 7.595109904561748e-08, "loss": 0.0768, "step": 283500 }, { "epoch": 834.12, "learning_rate": 7.504161701414159e-08, "loss": 0.079, "step": 283600 }, { "epoch": 834.41, "learning_rate": 7.413757198968585e-08, "loss": 0.0769, "step": 283700 }, { "epoch": 834.71, "learning_rate": 7.32389649702897e-08, "loss": 0.0797, "step": 283800 }, { "epoch": 835.0, "learning_rate": 7.234579694798627e-08, "loss": 0.0799, "step": 283900 }, { "epoch": 835.29, "learning_rate": 7.145806890880846e-08, "loss": 0.0781, "step": 284000 }, { "epoch": 835.29, "eval_cer": 0.06974412623686849, "eval_loss": 0.5719029307365417, "eval_runtime": 4.7885, "eval_samples_per_second": 74.971, "eval_steps_per_second": 2.506, "eval_wer": 0.26132516524262456, "step": 284000 }, { "epoch": 835.59, "learning_rate": 7.057578183278069e-08, "loss": 0.082, "step": 284100 }, { "epoch": 835.88, "learning_rate": 6.969893669392213e-08, "loss": 0.0802, "step": 284200 }, { "epoch": 836.18, "learning_rate": 6.882753446024293e-08, "loss": 0.0807, "step": 284300 }, { "epoch": 836.47, "learning_rate": 6.79615760937452e-08, "loss": 0.0803, "step": 284400 }, { "epoch": 836.76, "learning_rate": 6.710106255042148e-08, "loss": 0.0816, "step": 284500 }, { "epoch": 837.06, "learning_rate": 6.624599478025295e-08, "loss": 0.08, "step": 284600 }, { "epoch": 837.35, "learning_rate": 6.539637372720897e-08, "loss": 0.0793, "step": 284700 }, { "epoch": 837.65, "learning_rate": 6.455220032924592e-08, "loss": 0.0759, "step": 284800 }, { "epoch": 837.94, "learning_rate": 6.371347551830498e-08, "loss": 0.0752, "step": 284900 }, { "epoch": 838.24, "learning_rate": 6.288020022031494e-08, "loss": 0.0821, "step": 285000 }, { "epoch": 838.24, "eval_cer": 0.06952617584237827, "eval_loss": 0.5715811252593994, "eval_runtime": 4.9425, "eval_samples_per_second": 72.635, "eval_steps_per_second": 2.428, "eval_wer": 0.26148637755924553, "step": 285000 }, { "epoch": 838.53, "learning_rate": 6.20523753551855e-08, "loss": 0.0799, "step": 285100 }, { "epoch": 838.82, "learning_rate": 6.123000183681116e-08, "loss": 0.0764, "step": 285200 }, { "epoch": 839.12, "learning_rate": 6.041308057306793e-08, "loss": 0.0788, "step": 285300 }, { "epoch": 839.41, "learning_rate": 5.96016124658122e-08, "loss": 0.0789, "step": 285400 }, { "epoch": 839.71, "learning_rate": 5.879559841088067e-08, "loss": 0.0771, "step": 285500 }, { "epoch": 840.0, "learning_rate": 5.799503929808825e-08, "loss": 0.076, "step": 285600 }, { "epoch": 840.29, "learning_rate": 5.7199936011229085e-08, "loss": 0.0809, "step": 285700 }, { "epoch": 840.59, "learning_rate": 5.6410289428073805e-08, "loss": 0.0825, "step": 285800 }, { "epoch": 840.88, "learning_rate": 5.5626100420367314e-08, "loss": 0.0801, "step": 285900 }, { "epoch": 841.18, "learning_rate": 5.484736985383155e-08, "loss": 0.0794, "step": 286000 }, { "epoch": 841.18, "eval_cer": 0.06943899568458219, "eval_loss": 0.5725530385971069, "eval_runtime": 4.3327, "eval_samples_per_second": 82.858, "eval_steps_per_second": 2.77, "eval_wer": 0.2616475898758665, "step": 286000 }, { "epoch": 841.47, "learning_rate": 5.407409858816215e-08, "loss": 0.0761, "step": 286100 }, { "epoch": 841.76, "learning_rate": 5.330628747702682e-08, "loss": 0.0813, "step": 286200 }, { "epoch": 842.06, "learning_rate": 5.254393736806696e-08, "loss": 0.0746, "step": 286300 }, { "epoch": 842.35, "learning_rate": 5.1787049102893226e-08, "loss": 0.0787, "step": 286400 }, { "epoch": 842.65, "learning_rate": 5.103562351708891e-08, "loss": 0.0804, "step": 286500 }, { "epoch": 842.94, "learning_rate": 5.0289661440203754e-08, "loss": 0.0821, "step": 286600 }, { "epoch": 843.24, "learning_rate": 4.954916369575957e-08, "loss": 0.077, "step": 286700 }, { "epoch": 843.53, "learning_rate": 4.8814131101243e-08, "loss": 0.0812, "step": 286800 }, { "epoch": 843.82, "learning_rate": 4.8084564468107163e-08, "loss": 0.0793, "step": 286900 }, { "epoch": 844.12, "learning_rate": 4.736046460177335e-08, "loss": 0.084, "step": 287000 }, { "epoch": 844.12, "eval_cer": 0.06943899568458219, "eval_loss": 0.572623610496521, "eval_runtime": 4.6704, "eval_samples_per_second": 76.867, "eval_steps_per_second": 2.569, "eval_wer": 0.26148637755924553, "step": 287000 }, { "epoch": 844.41, "learning_rate": 4.664899155756353e-08, "loss": 0.0819, "step": 287100 }, { "epoch": 844.71, "learning_rate": 4.5935772929447395e-08, "loss": 0.0836, "step": 287200 }, { "epoch": 845.0, "learning_rate": 4.5235073860416254e-08, "loss": 0.0758, "step": 287300 }, { "epoch": 845.29, "learning_rate": 4.453273958858917e-08, "loss": 0.0788, "step": 287400 }, { "epoch": 845.59, "learning_rate": 4.383587600467143e-08, "loss": 0.0818, "step": 287500 }, { "epoch": 845.88, "learning_rate": 4.314448387798098e-08, "loss": 0.0785, "step": 287600 }, { "epoch": 846.18, "learning_rate": 4.245856397179282e-08, "loss": 0.081, "step": 287700 }, { "epoch": 846.47, "learning_rate": 4.1778117043342894e-08, "loss": 0.0748, "step": 287800 }, { "epoch": 846.76, "learning_rate": 4.1103143843823635e-08, "loss": 0.0754, "step": 287900 }, { "epoch": 847.06, "learning_rate": 4.043364511838566e-08, "loss": 0.0821, "step": 288000 }, { "epoch": 847.06, "eval_cer": 0.06970053615797045, "eval_loss": 0.5727963447570801, "eval_runtime": 5.4197, "eval_samples_per_second": 66.24, "eval_steps_per_second": 2.214, "eval_wer": 0.2616475898758665, "step": 288000 }, { "epoch": 847.35, "learning_rate": 3.976962160613551e-08, "loss": 0.0784, "step": 288100 }, { "epoch": 847.65, "learning_rate": 3.911107404013459e-08, "loss": 0.0837, "step": 288200 }, { "epoch": 847.94, "learning_rate": 3.845800314740133e-08, "loss": 0.0825, "step": 288300 }, { "epoch": 848.24, "learning_rate": 3.78104096489057e-08, "loss": 0.0807, "step": 288400 }, { "epoch": 848.53, "learning_rate": 3.716829425957136e-08, "loss": 0.0752, "step": 288500 }, { "epoch": 848.82, "learning_rate": 3.65316576882746e-08, "loss": 0.0849, "step": 288600 }, { "epoch": 849.12, "learning_rate": 3.590050063784323e-08, "loss": 0.079, "step": 288700 }, { "epoch": 849.41, "learning_rate": 3.527482380505598e-08, "loss": 0.0771, "step": 288800 }, { "epoch": 849.71, "learning_rate": 3.4654627880641446e-08, "loss": 0.0837, "step": 288900 }, { "epoch": 850.0, "learning_rate": 3.403991354927694e-08, "loss": 0.0781, "step": 289000 }, { "epoch": 850.0, "eval_cer": 0.06926463536899002, "eval_loss": 0.5718810558319092, "eval_runtime": 4.9265, "eval_samples_per_second": 72.871, "eval_steps_per_second": 2.436, "eval_wer": 0.2605191036595196, "step": 289000 }, { "epoch": 850.29, "learning_rate": 3.343068148958906e-08, "loss": 0.0751, "step": 289100 }, { "epoch": 850.59, "learning_rate": 3.2826932374151464e-08, "loss": 0.0807, "step": 289200 }, { "epoch": 850.88, "learning_rate": 3.2228666869486e-08, "loss": 0.0819, "step": 289300 }, { "epoch": 851.18, "learning_rate": 3.163588563605935e-08, "loss": 0.0802, "step": 289400 }, { "epoch": 851.47, "learning_rate": 3.104858932828414e-08, "loss": 0.0805, "step": 289500 }, { "epoch": 851.76, "learning_rate": 3.046677859451841e-08, "loss": 0.0777, "step": 289600 }, { "epoch": 852.06, "learning_rate": 2.989045407706282e-08, "loss": 0.0806, "step": 289700 }, { "epoch": 852.35, "learning_rate": 2.9319616412163966e-08, "loss": 0.0825, "step": 289800 }, { "epoch": 852.65, "learning_rate": 2.8754266230008875e-08, "loss": 0.0834, "step": 289900 }, { "epoch": 852.94, "learning_rate": 2.819440415472663e-08, "loss": 0.0822, "step": 290000 }, { "epoch": 852.94, "eval_cer": 0.06930822544788806, "eval_loss": 0.572381854057312, "eval_runtime": 4.9827, "eval_samples_per_second": 72.05, "eval_steps_per_second": 2.408, "eval_wer": 0.26116395292600353, "step": 290000 }, { "epoch": 853.24, "learning_rate": 2.7640030804389485e-08, "loss": 0.0818, "step": 290100 }, { "epoch": 853.53, "learning_rate": 2.7091146791007883e-08, "loss": 0.0835, "step": 290200 }, { "epoch": 853.82, "learning_rate": 2.6547752720533782e-08, "loss": 0.0782, "step": 290300 }, { "epoch": 854.12, "learning_rate": 2.6009849192858428e-08, "loss": 0.0794, "step": 290400 }, { "epoch": 854.41, "learning_rate": 2.547743680181125e-08, "loss": 0.0743, "step": 290500 }, { "epoch": 854.71, "learning_rate": 2.4950516135159308e-08, "loss": 0.0772, "step": 290600 }, { "epoch": 855.0, "learning_rate": 2.442908777460673e-08, "loss": 0.08, "step": 290700 }, { "epoch": 855.29, "learning_rate": 2.391315229579638e-08, "loss": 0.0824, "step": 290800 }, { "epoch": 855.59, "learning_rate": 2.3402710268303762e-08, "loss": 0.083, "step": 290900 }, { "epoch": 855.88, "learning_rate": 2.2897762255643108e-08, "loss": 0.0797, "step": 291000 }, { "epoch": 855.88, "eval_cer": 0.06970053615797045, "eval_loss": 0.5726251006126404, "eval_runtime": 5.2315, "eval_samples_per_second": 68.623, "eval_steps_per_second": 2.294, "eval_wer": 0.2616475898758665, "step": 291000 }, { "epoch": 856.18, "learning_rate": 2.2398308815261283e-08, "loss": 0.0801, "step": 291100 }, { "epoch": 856.47, "learning_rate": 2.1904350498540562e-08, "loss": 0.0867, "step": 291200 }, { "epoch": 856.76, "learning_rate": 2.141588785079529e-08, "loss": 0.0829, "step": 291300 }, { "epoch": 857.06, "learning_rate": 2.093772386768278e-08, "loss": 0.0784, "step": 291400 }, { "epoch": 857.35, "learning_rate": 2.0460199199532904e-08, "loss": 0.0814, "step": 291500 }, { "epoch": 857.65, "learning_rate": 1.9988171794658728e-08, "loss": 0.0798, "step": 291600 }, { "epoch": 857.94, "learning_rate": 1.9521642174164522e-08, "loss": 0.0799, "step": 291700 }, { "epoch": 858.24, "learning_rate": 1.906061085308497e-08, "loss": 0.0761, "step": 291800 }, { "epoch": 858.53, "learning_rate": 1.8605078340385165e-08, "loss": 0.0898, "step": 291900 }, { "epoch": 858.82, "learning_rate": 1.8155045138959494e-08, "loss": 0.0765, "step": 292000 }, { "epoch": 858.82, "eval_cer": 0.06943899568458219, "eval_loss": 0.5725178122520447, "eval_runtime": 4.364, "eval_samples_per_second": 82.263, "eval_steps_per_second": 2.75, "eval_wer": 0.2616475898758665, "step": 292000 }, { "epoch": 859.12, "learning_rate": 1.7710511745630542e-08, "loss": 0.0812, "step": 292100 }, { "epoch": 859.41, "learning_rate": 1.72714786511502e-08, "loss": 0.0782, "step": 292200 }, { "epoch": 859.71, "learning_rate": 1.6837946340197976e-08, "loss": 0.0808, "step": 292300 }, { "epoch": 860.0, "learning_rate": 1.640991529138103e-08, "loss": 0.0757, "step": 292400 }, { "epoch": 860.29, "learning_rate": 1.5987385977231374e-08, "loss": 0.0787, "step": 292500 }, { "epoch": 860.59, "learning_rate": 1.5570358864210876e-08, "loss": 0.0807, "step": 292600 }, { "epoch": 860.88, "learning_rate": 1.5158834412703493e-08, "loss": 0.083, "step": 292700 }, { "epoch": 861.18, "learning_rate": 1.4756846048477047e-08, "loss": 0.0832, "step": 292800 }, { "epoch": 861.47, "learning_rate": 1.4356273239014007e-08, "loss": 0.0783, "step": 292900 }, { "epoch": 861.76, "learning_rate": 1.396120443137916e-08, "loss": 0.077, "step": 293000 }, { "epoch": 861.76, "eval_cer": 0.06939540560568415, "eval_loss": 0.5725964903831482, "eval_runtime": 5.0444, "eval_samples_per_second": 71.168, "eval_steps_per_second": 2.379, "eval_wer": 0.2619700145091085, "step": 293000 }, { "epoch": 862.06, "learning_rate": 1.3571640061716407e-08, "loss": 0.0802, "step": 293100 }, { "epoch": 862.35, "learning_rate": 1.3187580560092839e-08, "loss": 0.0801, "step": 293200 }, { "epoch": 862.65, "learning_rate": 1.2809026350498744e-08, "loss": 0.0786, "step": 293300 }, { "epoch": 862.94, "learning_rate": 1.2435977850847048e-08, "loss": 0.0799, "step": 293400 }, { "epoch": 863.24, "learning_rate": 1.2068435472972207e-08, "loss": 0.0804, "step": 293500 }, { "epoch": 863.53, "learning_rate": 1.1706399622629095e-08, "loss": 0.082, "step": 293600 }, { "epoch": 863.82, "learning_rate": 1.134987069949578e-08, "loss": 0.0772, "step": 293700 }, { "epoch": 864.12, "learning_rate": 1.0998849097169085e-08, "loss": 0.0767, "step": 293800 }, { "epoch": 864.41, "learning_rate": 1.0653335203165693e-08, "loss": 0.0787, "step": 293900 }, { "epoch": 864.71, "learning_rate": 1.0313329398923822e-08, "loss": 0.0803, "step": 294000 }, { "epoch": 864.71, "eval_cer": 0.06952617584237827, "eval_loss": 0.5726108551025391, "eval_runtime": 4.7362, "eval_samples_per_second": 75.799, "eval_steps_per_second": 2.534, "eval_wer": 0.26132516524262456, "step": 294000 }, { "epoch": 865.0, "learning_rate": 9.978832059798216e-09, "loss": 0.0795, "step": 294100 }, { "epoch": 865.29, "learning_rate": 9.649843555065708e-09, "loss": 0.0814, "step": 294200 }, { "epoch": 865.59, "learning_rate": 9.326364247918552e-09, "loss": 0.0837, "step": 294300 }, { "epoch": 865.88, "learning_rate": 9.00839449546831e-09, "loss": 0.0812, "step": 294400 }, { "epoch": 866.18, "learning_rate": 8.695934648744742e-09, "loss": 0.0783, "step": 294500 }, { "epoch": 866.47, "learning_rate": 8.392027271795777e-09, "loss": 0.0805, "step": 294600 }, { "epoch": 866.76, "learning_rate": 8.090533157728008e-09, "loss": 0.0813, "step": 294700 }, { "epoch": 867.06, "learning_rate": 7.794549962677479e-09, "loss": 0.0824, "step": 294800 }, { "epoch": 867.35, "learning_rate": 7.504078013402249e-09, "loss": 0.0781, "step": 294900 }, { "epoch": 867.65, "learning_rate": 7.219117630573036e-09, "loss": 0.0826, "step": 295000 }, { "epoch": 867.65, "eval_cer": 0.06952617584237827, "eval_loss": 0.5726599097251892, "eval_runtime": 4.9613, "eval_samples_per_second": 72.36, "eval_steps_per_second": 2.419, "eval_wer": 0.26148637755924553, "step": 295000 }, { "epoch": 867.94, "learning_rate": 6.9396691287787476e-09, "loss": 0.0856, "step": 295100 }, { "epoch": 868.24, "learning_rate": 6.6657328165214975e-09, "loss": 0.0786, "step": 295200 }, { "epoch": 868.53, "learning_rate": 6.397308996219375e-09, "loss": 0.0779, "step": 295300 }, { "epoch": 868.82, "learning_rate": 6.1343979642042305e-09, "loss": 0.0753, "step": 295400 }, { "epoch": 869.12, "learning_rate": 5.877000010721667e-09, "loss": 0.079, "step": 295500 }, { "epoch": 869.41, "learning_rate": 5.625115419931049e-09, "loss": 0.0804, "step": 295600 }, { "epoch": 869.71, "learning_rate": 5.3787444699060495e-09, "loss": 0.0796, "step": 295700 }, { "epoch": 870.0, "learning_rate": 5.137887432632438e-09, "loss": 0.075, "step": 295800 }, { "epoch": 870.29, "learning_rate": 4.9025445740097375e-09, "loss": 0.0784, "step": 295900 }, { "epoch": 870.59, "learning_rate": 4.672716153849011e-09, "loss": 0.078, "step": 296000 }, { "epoch": 870.59, "eval_cer": 0.06978771631576654, "eval_loss": 0.5726059079170227, "eval_runtime": 4.7666, "eval_samples_per_second": 75.316, "eval_steps_per_second": 2.518, "eval_wer": 0.2616475898758665, "step": 296000 }, { "epoch": 870.88, "learning_rate": 4.448402425873965e-09, "loss": 0.0806, "step": 296100 }, { "epoch": 871.18, "learning_rate": 4.229603637720403e-09, "loss": 0.0785, "step": 296200 }, { "epoch": 871.47, "learning_rate": 4.016320030935106e-09, "loss": 0.0823, "step": 296300 }, { "epoch": 871.76, "learning_rate": 3.808551840978058e-09, "loss": 0.0789, "step": 296400 }, { "epoch": 872.06, "learning_rate": 3.6062992972180076e-09, "loss": 0.0848, "step": 296500 }, { "epoch": 872.35, "learning_rate": 3.4095626229357914e-09, "loss": 0.0795, "step": 296600 }, { "epoch": 872.65, "learning_rate": 3.218342035323785e-09, "loss": 0.0794, "step": 296700 }, { "epoch": 872.94, "learning_rate": 3.0326377454825695e-09, "loss": 0.0772, "step": 296800 }, { "epoch": 873.24, "learning_rate": 2.852449958424819e-09, "loss": 0.0818, "step": 296900 }, { "epoch": 873.53, "learning_rate": 2.677778873072523e-09, "loss": 0.0795, "step": 297000 }, { "epoch": 873.53, "eval_cer": 0.06948258576348024, "eval_loss": 0.5727548599243164, "eval_runtime": 5.1786, "eval_samples_per_second": 69.324, "eval_steps_per_second": 2.317, "eval_wer": 0.26180880219248753, "step": 297000 }, { "epoch": 873.82, "learning_rate": 2.508624682256988e-09, "loss": 0.0838, "step": 297100 }, { "epoch": 874.12, "learning_rate": 2.3449875727199476e-09, "loss": 0.0769, "step": 297200 }, { "epoch": 874.41, "learning_rate": 2.1868677251113414e-09, "loss": 0.0778, "step": 297300 }, { "epoch": 874.71, "learning_rate": 2.0342653139904246e-09, "loss": 0.0827, "step": 297400 }, { "epoch": 875.0, "learning_rate": 1.88718050782688e-09, "loss": 0.0773, "step": 297500 }, { "epoch": 875.29, "learning_rate": 1.7456134689969317e-09, "loss": 0.0825, "step": 297600 }, { "epoch": 875.59, "learning_rate": 1.6095643537872296e-09, "loss": 0.0776, "step": 297700 }, { "epoch": 875.88, "learning_rate": 1.479033312390965e-09, "loss": 0.0765, "step": 297800 }, { "epoch": 876.18, "learning_rate": 1.3540204889106457e-09, "loss": 0.0739, "step": 297900 }, { "epoch": 876.47, "learning_rate": 1.235693649733194e-09, "loss": 0.0792, "step": 298000 }, { "epoch": 876.47, "eval_cer": 0.06943899568458219, "eval_loss": 0.5723451972007751, "eval_runtime": 5.0657, "eval_samples_per_second": 70.869, "eval_steps_per_second": 2.369, "eval_wer": 0.26148637755924553, "step": 298000 }, { "epoch": 876.76, "learning_rate": 1.1216624845133972e-09, "loss": 0.084, "step": 298100 }, { "epoch": 877.06, "learning_rate": 1.0131499317367344e-09, "loss": 0.0804, "step": 298200 }, { "epoch": 877.35, "learning_rate": 9.101561111979351e-10, "loss": 0.0799, "step": 298300 }, { "epoch": 877.65, "learning_rate": 8.126811365982701e-10, "loss": 0.0856, "step": 298400 }, { "epoch": 877.94, "learning_rate": 7.207251155483264e-10, "loss": 0.0837, "step": 298500 }, { "epoch": 878.24, "learning_rate": 6.342881495641217e-10, "loss": 0.0811, "step": 298600 }, { "epoch": 878.53, "learning_rate": 5.533703340693253e-10, "loss": 0.0792, "step": 298700 }, { "epoch": 878.82, "learning_rate": 4.77971758395257e-10, "loss": 0.0818, "step": 298800 }, { "epoch": 879.12, "learning_rate": 4.0809250577977797e-10, "loss": 0.0848, "step": 298900 }, { "epoch": 879.41, "learning_rate": 3.4373265336673514e-10, "loss": 0.083, "step": 299000 }, { "epoch": 879.41, "eval_cer": 0.06974412623686849, "eval_loss": 0.5728374123573303, "eval_runtime": 4.2557, "eval_samples_per_second": 84.357, "eval_steps_per_second": 2.82, "eval_wer": 0.2621312268257295, "step": 299000 }, { "epoch": 879.71, "learning_rate": 2.848922722081815e-10, "loss": 0.0856, "step": 299100 }, { "epoch": 880.0, "learning_rate": 2.315714272621561e-10, "loss": 0.0794, "step": 299200 }, { "epoch": 880.29, "learning_rate": 1.8377017739323876e-10, "loss": 0.0758, "step": 299300 }, { "epoch": 880.59, "learning_rate": 1.4148857537199522e-10, "loss": 0.0836, "step": 299400 }, { "epoch": 880.88, "learning_rate": 1.0472666787664232e-10, "loss": 0.0777, "step": 299500 }, { "epoch": 881.18, "learning_rate": 7.348449549082759e-11, "loss": 0.0828, "step": 299600 }, { "epoch": 881.47, "learning_rate": 4.7762092705294636e-11, "loss": 0.0778, "step": 299700 }, { "epoch": 881.76, "learning_rate": 2.7559487917327988e-11, "loss": 0.078, "step": 299800 }, { "epoch": 882.06, "learning_rate": 1.2876703428532644e-11, "loss": 0.0842, "step": 299900 }, { "epoch": 882.35, "learning_rate": 3.713755449830103e-12, "loss": 0.0753, "step": 300000 }, { "epoch": 882.35, "eval_cer": 0.0693518155267861, "eval_loss": 0.5725403428077698, "eval_runtime": 5.1749, "eval_samples_per_second": 69.373, "eval_steps_per_second": 2.319, "eval_wer": 0.26116395292600353, "step": 300000 } ], "max_steps": 300000, "num_train_epochs": 883, "total_flos": 4.30858254034925e+21, "trial_name": null, "trial_params": null }