diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,21016 @@ +{ + "best_metric": 1.0, + "best_model_checkpoint": "./wav2vec2-large-xlsr-am-readspeech/checkpoint-1000", + "epoch": 882.3529411764706, + "global_step": 300000, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.29, + "learning_rate": 9.600000000000001e-07, + "loss": 86.8013, + "step": 100 + }, + { + "epoch": 0.59, + "learning_rate": 1.9500000000000004e-06, + "loss": 89.2281, + "step": 200 + }, + { + "epoch": 0.88, + "learning_rate": 2.9400000000000002e-06, + "loss": 88.7762, + "step": 300 + }, + { + "epoch": 1.18, + "learning_rate": 3.920000000000001e-06, + "loss": 77.8155, + "step": 400 + }, + { + "epoch": 1.47, + "learning_rate": 4.92e-06, + "loss": 52.179, + "step": 500 + }, + { + "epoch": 1.76, + "learning_rate": 5.92e-06, + "loss": 35.7863, + "step": 600 + }, + { + "epoch": 2.06, + "learning_rate": 6.92e-06, + "loss": 26.2136, + "step": 700 + }, + { + "epoch": 2.35, + "learning_rate": 7.92e-06, + "loss": 20.6276, + "step": 800 + }, + { + "epoch": 2.65, + "learning_rate": 8.920000000000001e-06, + "loss": 15.9237, + "step": 900 + }, + { + "epoch": 2.94, + "learning_rate": 9.920000000000002e-06, + "loss": 11.6857, + "step": 1000 + }, + { + "epoch": 2.94, + "eval_cer": 1.0, + "eval_loss": 7.346815586090088, + "eval_runtime": 5.3, + "eval_samples_per_second": 67.735, + "eval_steps_per_second": 2.264, + "eval_wer": 1.0, + "step": 1000 + }, + { + "epoch": 3.24, + "learning_rate": 9.999997663999142e-06, + "loss": 9.1586, + "step": 1100 + }, + { + "epoch": 3.53, + "learning_rate": 9.999989825813658e-06, + "loss": 7.1107, + "step": 1200 + }, + { + "epoch": 3.82, + "learning_rate": 9.999976467788685e-06, + "loss": 5.7195, + "step": 1300 + }, + { + "epoch": 4.12, + "learning_rate": 9.999957589938964e-06, + "loss": 4.9527, + "step": 1400 + }, + { + "epoch": 4.41, + "learning_rate": 9.999933192285338e-06, + "loss": 4.5071, + "step": 1500 + }, + { + "epoch": 4.71, + "learning_rate": 9.999903274854741e-06, + "loss": 4.3014, + "step": 1600 + }, + { + "epoch": 5.0, + "learning_rate": 9.9998678376802e-06, + "loss": 4.1745, + "step": 1700 + }, + { + "epoch": 5.29, + "learning_rate": 9.999826880800839e-06, + "loss": 4.0713, + "step": 1800 + }, + { + "epoch": 5.59, + "learning_rate": 9.999780404261869e-06, + "loss": 4.0451, + "step": 1900 + }, + { + "epoch": 5.88, + "learning_rate": 9.999728408114603e-06, + "loss": 4.0204, + "step": 2000 + }, + { + "epoch": 5.88, + "eval_cer": 1.0, + "eval_loss": 3.9740476608276367, + "eval_runtime": 4.9396, + "eval_samples_per_second": 72.677, + "eval_steps_per_second": 2.429, + "eval_wer": 1.0, + "step": 2000 + }, + { + "epoch": 6.18, + "learning_rate": 9.99967089241644e-06, + "loss": 4.0045, + "step": 2100 + }, + { + "epoch": 6.47, + "learning_rate": 9.999607857230877e-06, + "loss": 3.9876, + "step": 2200 + }, + { + "epoch": 6.76, + "learning_rate": 9.999539302627506e-06, + "loss": 3.9874, + "step": 2300 + }, + { + "epoch": 7.06, + "learning_rate": 9.999465228682003e-06, + "loss": 3.9738, + "step": 2400 + }, + { + "epoch": 7.35, + "learning_rate": 9.999385635476149e-06, + "loss": 3.9781, + "step": 2500 + }, + { + "epoch": 7.65, + "learning_rate": 9.99930052309781e-06, + "loss": 3.9684, + "step": 2600 + }, + { + "epoch": 7.94, + "learning_rate": 9.999209891640947e-06, + "loss": 3.9763, + "step": 2700 + }, + { + "epoch": 8.24, + "learning_rate": 9.999113741205614e-06, + "loss": 3.9637, + "step": 2800 + }, + { + "epoch": 8.53, + "learning_rate": 9.99901207189796e-06, + "loss": 3.9731, + "step": 2900 + }, + { + "epoch": 8.82, + "learning_rate": 9.998904883830225e-06, + "loss": 3.9552, + "step": 3000 + }, + { + "epoch": 8.82, + "eval_cer": 1.0, + "eval_loss": 3.934492826461792, + "eval_runtime": 5.2265, + "eval_samples_per_second": 68.688, + "eval_steps_per_second": 2.296, + "eval_wer": 1.0, + "step": 3000 + }, + { + "epoch": 9.12, + "learning_rate": 9.99879217712074e-06, + "loss": 3.9658, + "step": 3100 + }, + { + "epoch": 9.41, + "learning_rate": 9.998673951893931e-06, + "loss": 3.9614, + "step": 3200 + }, + { + "epoch": 9.71, + "learning_rate": 9.998550208280315e-06, + "loss": 3.9444, + "step": 3300 + }, + { + "epoch": 10.0, + "learning_rate": 9.9984209464165e-06, + "loss": 3.9541, + "step": 3400 + }, + { + "epoch": 10.29, + "learning_rate": 9.998286166445188e-06, + "loss": 3.9426, + "step": 3500 + }, + { + "epoch": 10.59, + "learning_rate": 9.998145868515175e-06, + "loss": 3.9418, + "step": 3600 + }, + { + "epoch": 10.88, + "learning_rate": 9.99800005278134e-06, + "loss": 3.9312, + "step": 3700 + }, + { + "epoch": 11.18, + "learning_rate": 9.997848719404663e-06, + "loss": 3.996, + "step": 3800 + }, + { + "epoch": 11.47, + "learning_rate": 9.99769186855221e-06, + "loss": 3.933, + "step": 3900 + }, + { + "epoch": 11.76, + "learning_rate": 9.997529500397141e-06, + "loss": 3.9274, + "step": 4000 + }, + { + "epoch": 11.76, + "eval_cer": 1.0, + "eval_loss": 3.912527322769165, + "eval_runtime": 5.1053, + "eval_samples_per_second": 70.319, + "eval_steps_per_second": 2.35, + "eval_wer": 1.0, + "step": 4000 + }, + { + "epoch": 12.06, + "learning_rate": 9.997361615118704e-06, + "loss": 3.9269, + "step": 4100 + }, + { + "epoch": 12.35, + "learning_rate": 9.997188212902243e-06, + "loss": 3.9286, + "step": 4200 + }, + { + "epoch": 12.65, + "learning_rate": 9.997009293939183e-06, + "loss": 3.9162, + "step": 4300 + }, + { + "epoch": 12.94, + "learning_rate": 9.99682485842705e-06, + "loss": 3.9178, + "step": 4400 + }, + { + "epoch": 13.24, + "learning_rate": 9.996634906569453e-06, + "loss": 3.9131, + "step": 4500 + }, + { + "epoch": 13.53, + "learning_rate": 9.996439438576094e-06, + "loss": 3.9081, + "step": 4600 + }, + { + "epoch": 13.82, + "learning_rate": 9.996238454662763e-06, + "loss": 3.9048, + "step": 4700 + }, + { + "epoch": 14.12, + "learning_rate": 9.996031955051341e-06, + "loss": 3.9077, + "step": 4800 + }, + { + "epoch": 14.41, + "learning_rate": 9.995819939969797e-06, + "loss": 3.8908, + "step": 4900 + }, + { + "epoch": 14.71, + "learning_rate": 9.995602409652191e-06, + "loss": 3.8873, + "step": 5000 + }, + { + "epoch": 14.71, + "eval_cer": 1.0, + "eval_loss": 3.8573012351989746, + "eval_runtime": 4.9589, + "eval_samples_per_second": 72.395, + "eval_steps_per_second": 2.42, + "eval_wer": 1.0, + "step": 5000 + }, + { + "epoch": 15.0, + "learning_rate": 9.995379364338668e-06, + "loss": 3.8741, + "step": 5100 + }, + { + "epoch": 15.29, + "learning_rate": 9.995150804275463e-06, + "loss": 3.8651, + "step": 5200 + }, + { + "epoch": 15.59, + "learning_rate": 9.994916729714902e-06, + "loss": 3.8553, + "step": 5300 + }, + { + "epoch": 15.88, + "learning_rate": 9.994677140915393e-06, + "loss": 3.8397, + "step": 5400 + }, + { + "epoch": 16.18, + "learning_rate": 9.994432038141437e-06, + "loss": 3.828, + "step": 5500 + }, + { + "epoch": 16.47, + "learning_rate": 9.994181421663621e-06, + "loss": 3.802, + "step": 5600 + }, + { + "epoch": 16.76, + "learning_rate": 9.993925291758616e-06, + "loss": 3.7886, + "step": 5700 + }, + { + "epoch": 17.06, + "learning_rate": 9.993663648709183e-06, + "loss": 3.7534, + "step": 5800 + }, + { + "epoch": 17.35, + "learning_rate": 9.993396492804167e-06, + "loss": 3.7186, + "step": 5900 + }, + { + "epoch": 17.65, + "learning_rate": 9.993123824338502e-06, + "loss": 3.6704, + "step": 6000 + }, + { + "epoch": 17.65, + "eval_cer": 0.9529227147901138, + "eval_loss": 3.5608274936676025, + "eval_runtime": 5.4159, + "eval_samples_per_second": 66.286, + "eval_steps_per_second": 2.216, + "eval_wer": 0.9709817830082218, + "step": 6000 + }, + { + "epoch": 17.94, + "learning_rate": 9.992845643613204e-06, + "loss": 3.6186, + "step": 6100 + }, + { + "epoch": 18.24, + "learning_rate": 9.992561950935379e-06, + "loss": 3.5561, + "step": 6200 + }, + { + "epoch": 18.53, + "learning_rate": 9.99227274661821e-06, + "loss": 3.4841, + "step": 6300 + }, + { + "epoch": 18.82, + "learning_rate": 9.991978030980974e-06, + "loss": 3.3961, + "step": 6400 + }, + { + "epoch": 19.12, + "learning_rate": 9.99167780434903e-06, + "loss": 3.2749, + "step": 6500 + }, + { + "epoch": 19.41, + "learning_rate": 9.991372067053812e-06, + "loss": 3.1487, + "step": 6600 + }, + { + "epoch": 19.71, + "learning_rate": 9.991060819432854e-06, + "loss": 3.0266, + "step": 6700 + }, + { + "epoch": 20.0, + "learning_rate": 9.990744061829757e-06, + "loss": 2.8801, + "step": 6800 + }, + { + "epoch": 20.29, + "learning_rate": 9.990421794594216e-06, + "loss": 2.7497, + "step": 6900 + }, + { + "epoch": 20.59, + "learning_rate": 9.990094018082002e-06, + "loss": 2.6412, + "step": 7000 + }, + { + "epoch": 20.59, + "eval_cer": 0.5278322653764004, + "eval_loss": 2.214904546737671, + "eval_runtime": 5.2522, + "eval_samples_per_second": 68.352, + "eval_steps_per_second": 2.285, + "eval_wer": 0.9247138481379977, + "step": 7000 + }, + { + "epoch": 20.88, + "learning_rate": 9.989760732654972e-06, + "loss": 2.5238, + "step": 7100 + }, + { + "epoch": 21.18, + "learning_rate": 9.98942193868106e-06, + "loss": 2.4326, + "step": 7200 + }, + { + "epoch": 21.47, + "learning_rate": 9.98907763653429e-06, + "loss": 2.3556, + "step": 7300 + }, + { + "epoch": 21.76, + "learning_rate": 9.988727826594757e-06, + "loss": 2.2815, + "step": 7400 + }, + { + "epoch": 22.06, + "learning_rate": 9.988372509248643e-06, + "loss": 2.2246, + "step": 7500 + }, + { + "epoch": 22.35, + "learning_rate": 9.988011684888205e-06, + "loss": 2.1379, + "step": 7600 + }, + { + "epoch": 22.65, + "learning_rate": 9.987645353911787e-06, + "loss": 2.0879, + "step": 7700 + }, + { + "epoch": 22.94, + "learning_rate": 9.987273516723803e-06, + "loss": 2.0537, + "step": 7800 + }, + { + "epoch": 23.24, + "learning_rate": 9.986896173734752e-06, + "loss": 1.9776, + "step": 7900 + }, + { + "epoch": 23.53, + "learning_rate": 9.986513325361209e-06, + "loss": 1.952, + "step": 8000 + }, + { + "epoch": 23.53, + "eval_cer": 0.3740464670241053, + "eval_loss": 1.5460247993469238, + "eval_runtime": 4.7627, + "eval_samples_per_second": 75.378, + "eval_steps_per_second": 2.52, + "eval_wer": 0.8410446558117041, + "step": 8000 + }, + { + "epoch": 23.82, + "learning_rate": 9.986124972025826e-06, + "loss": 1.8922, + "step": 8100 + }, + { + "epoch": 24.12, + "learning_rate": 9.985731114157335e-06, + "loss": 1.8636, + "step": 8200 + }, + { + "epoch": 24.41, + "learning_rate": 9.985331752190543e-06, + "loss": 1.8044, + "step": 8300 + }, + { + "epoch": 24.71, + "learning_rate": 9.984926886566336e-06, + "loss": 1.79, + "step": 8400 + }, + { + "epoch": 25.0, + "learning_rate": 9.98451651773167e-06, + "loss": 1.7611, + "step": 8500 + }, + { + "epoch": 25.29, + "learning_rate": 9.98410064613958e-06, + "loss": 1.7184, + "step": 8600 + }, + { + "epoch": 25.59, + "learning_rate": 9.98367927224918e-06, + "loss": 1.6872, + "step": 8700 + }, + { + "epoch": 25.88, + "learning_rate": 9.983252396525649e-06, + "loss": 1.6614, + "step": 8800 + }, + { + "epoch": 26.18, + "learning_rate": 9.982820019440246e-06, + "loss": 1.638, + "step": 8900 + }, + { + "epoch": 26.47, + "learning_rate": 9.982382141470308e-06, + "loss": 1.6156, + "step": 9000 + }, + { + "epoch": 26.47, + "eval_cer": 0.30373566976156224, + "eval_loss": 1.222609519958496, + "eval_runtime": 5.389, + "eval_samples_per_second": 66.617, + "eval_steps_per_second": 2.227, + "eval_wer": 0.7757536675802031, + "step": 9000 + }, + { + "epoch": 26.76, + "learning_rate": 9.981938763099232e-06, + "loss": 1.5778, + "step": 9100 + }, + { + "epoch": 27.06, + "learning_rate": 9.981489884816498e-06, + "loss": 1.5274, + "step": 9200 + }, + { + "epoch": 27.35, + "learning_rate": 9.981035507117654e-06, + "loss": 1.514, + "step": 9300 + }, + { + "epoch": 27.65, + "learning_rate": 9.98057563050432e-06, + "loss": 1.4823, + "step": 9400 + }, + { + "epoch": 27.94, + "learning_rate": 9.980110255484182e-06, + "loss": 1.4603, + "step": 9500 + }, + { + "epoch": 28.24, + "learning_rate": 9.979639382571006e-06, + "loss": 1.4423, + "step": 9600 + }, + { + "epoch": 28.53, + "learning_rate": 9.979163012284619e-06, + "loss": 1.4232, + "step": 9700 + }, + { + "epoch": 28.82, + "learning_rate": 9.978681145150916e-06, + "loss": 1.4045, + "step": 9800 + }, + { + "epoch": 29.12, + "learning_rate": 9.97819378170187e-06, + "loss": 1.386, + "step": 9900 + }, + { + "epoch": 29.41, + "learning_rate": 9.977700922475513e-06, + "loss": 1.3531, + "step": 10000 + }, + { + "epoch": 29.41, + "eval_cer": 0.257660956366331, + "eval_loss": 0.9876303672790527, + "eval_runtime": 5.4057, + "eval_samples_per_second": 66.412, + "eval_steps_per_second": 2.22, + "eval_wer": 0.7182008705465097, + "step": 10000 + }, + { + "epoch": 29.71, + "learning_rate": 9.977202568015948e-06, + "loss": 1.3442, + "step": 10100 + }, + { + "epoch": 30.0, + "learning_rate": 9.97669871887334e-06, + "loss": 1.3231, + "step": 10200 + }, + { + "epoch": 30.29, + "learning_rate": 9.976189375603929e-06, + "loss": 1.2896, + "step": 10300 + }, + { + "epoch": 30.59, + "learning_rate": 9.97567453877001e-06, + "loss": 1.2658, + "step": 10400 + }, + { + "epoch": 30.88, + "learning_rate": 9.975154208939948e-06, + "loss": 1.2543, + "step": 10500 + }, + { + "epoch": 31.18, + "learning_rate": 9.974628386688175e-06, + "loss": 1.2248, + "step": 10600 + }, + { + "epoch": 31.47, + "learning_rate": 9.974097072595177e-06, + "loss": 1.2266, + "step": 10700 + }, + { + "epoch": 31.76, + "learning_rate": 9.973560267247515e-06, + "loss": 1.2195, + "step": 10800 + }, + { + "epoch": 32.06, + "learning_rate": 9.973017971237804e-06, + "loss": 1.1713, + "step": 10900 + }, + { + "epoch": 32.35, + "learning_rate": 9.972470185164722e-06, + "loss": 1.1879, + "step": 11000 + }, + { + "epoch": 32.35, + "eval_cer": 0.22592737892855586, + "eval_loss": 0.8309646844863892, + "eval_runtime": 4.5066, + "eval_samples_per_second": 79.661, + "eval_steps_per_second": 2.663, + "eval_wer": 0.6782202160245042, + "step": 11000 + }, + { + "epoch": 32.65, + "learning_rate": 9.971916909633008e-06, + "loss": 1.1622, + "step": 11100 + }, + { + "epoch": 32.94, + "learning_rate": 9.971358145253464e-06, + "loss": 1.1509, + "step": 11200 + }, + { + "epoch": 33.24, + "learning_rate": 9.970793892642948e-06, + "loss": 1.1338, + "step": 11300 + }, + { + "epoch": 33.53, + "learning_rate": 9.970224152424376e-06, + "loss": 1.1136, + "step": 11400 + }, + { + "epoch": 33.82, + "learning_rate": 9.969648925226726e-06, + "loss": 1.1073, + "step": 11500 + }, + { + "epoch": 34.12, + "learning_rate": 9.969068211685031e-06, + "loss": 1.0743, + "step": 11600 + }, + { + "epoch": 34.41, + "learning_rate": 9.968482012440383e-06, + "loss": 1.0671, + "step": 11700 + }, + { + "epoch": 34.71, + "learning_rate": 9.967890328139928e-06, + "loss": 1.0719, + "step": 11800 + }, + { + "epoch": 35.0, + "learning_rate": 9.967293159436865e-06, + "loss": 1.0557, + "step": 11900 + }, + { + "epoch": 35.29, + "learning_rate": 9.966690506990456e-06, + "loss": 1.0329, + "step": 12000 + }, + { + "epoch": 35.29, + "eval_cer": 0.19951179111634193, + "eval_loss": 0.7249646782875061, + "eval_runtime": 5.2152, + "eval_samples_per_second": 68.837, + "eval_steps_per_second": 2.301, + "eval_wer": 0.619700145091085, + "step": 12000 + }, + { + "epoch": 35.59, + "learning_rate": 9.966082371466006e-06, + "loss": 1.0479, + "step": 12100 + }, + { + "epoch": 35.88, + "learning_rate": 9.96546875353488e-06, + "loss": 1.0269, + "step": 12200 + }, + { + "epoch": 36.18, + "learning_rate": 9.964849653874494e-06, + "loss": 1.03, + "step": 12300 + }, + { + "epoch": 36.47, + "learning_rate": 9.964225073168317e-06, + "loss": 1.0069, + "step": 12400 + }, + { + "epoch": 36.76, + "learning_rate": 9.963595012105866e-06, + "loss": 0.9811, + "step": 12500 + }, + { + "epoch": 37.06, + "learning_rate": 9.96295947138271e-06, + "loss": 0.9897, + "step": 12600 + }, + { + "epoch": 37.35, + "learning_rate": 9.962318451700465e-06, + "loss": 0.9777, + "step": 12700 + }, + { + "epoch": 37.65, + "learning_rate": 9.961671953766802e-06, + "loss": 0.9655, + "step": 12800 + }, + { + "epoch": 37.94, + "learning_rate": 9.961019978295433e-06, + "loss": 0.9528, + "step": 12900 + }, + { + "epoch": 38.24, + "learning_rate": 9.960362526006118e-06, + "loss": 0.9425, + "step": 13000 + }, + { + "epoch": 38.24, + "eval_cer": 0.18373218255525042, + "eval_loss": 0.6471496820449829, + "eval_runtime": 5.0928, + "eval_samples_per_second": 70.492, + "eval_steps_per_second": 2.356, + "eval_wer": 0.588102531033371, + "step": 13000 + }, + { + "epoch": 38.53, + "learning_rate": 9.959699597624666e-06, + "loss": 0.9307, + "step": 13100 + }, + { + "epoch": 38.82, + "learning_rate": 9.95903119388293e-06, + "loss": 0.9336, + "step": 13200 + }, + { + "epoch": 39.12, + "learning_rate": 9.958357315518809e-06, + "loss": 0.9246, + "step": 13300 + }, + { + "epoch": 39.41, + "learning_rate": 9.957677963276242e-06, + "loss": 0.9039, + "step": 13400 + }, + { + "epoch": 39.71, + "learning_rate": 9.956993137905216e-06, + "loss": 0.9019, + "step": 13500 + }, + { + "epoch": 40.0, + "learning_rate": 9.956302840161757e-06, + "loss": 0.9067, + "step": 13600 + }, + { + "epoch": 40.29, + "learning_rate": 9.955607070807934e-06, + "loss": 0.8912, + "step": 13700 + }, + { + "epoch": 40.59, + "learning_rate": 9.954905830611852e-06, + "loss": 0.8837, + "step": 13800 + }, + { + "epoch": 40.88, + "learning_rate": 9.954199120347664e-06, + "loss": 0.8715, + "step": 13900 + }, + { + "epoch": 41.18, + "learning_rate": 9.953486940795553e-06, + "loss": 0.8704, + "step": 14000 + }, + { + "epoch": 41.18, + "eval_cer": 0.17021925809685715, + "eval_loss": 0.5903766751289368, + "eval_runtime": 4.8914, + "eval_samples_per_second": 73.395, + "eval_steps_per_second": 2.453, + "eval_wer": 0.556504916975657, + "step": 14000 + }, + { + "epoch": 41.47, + "learning_rate": 9.952769292741748e-06, + "loss": 0.8592, + "step": 14100 + }, + { + "epoch": 41.76, + "learning_rate": 9.952046176978508e-06, + "loss": 0.8599, + "step": 14200 + }, + { + "epoch": 42.06, + "learning_rate": 9.951317594304132e-06, + "loss": 0.8541, + "step": 14300 + }, + { + "epoch": 42.35, + "learning_rate": 9.950583545522953e-06, + "loss": 0.8308, + "step": 14400 + }, + { + "epoch": 42.65, + "learning_rate": 9.94984403144534e-06, + "loss": 0.8349, + "step": 14500 + }, + { + "epoch": 42.94, + "learning_rate": 9.949099052887694e-06, + "loss": 0.8297, + "step": 14600 + }, + { + "epoch": 43.24, + "learning_rate": 9.948356142136993e-06, + "loss": 0.8316, + "step": 14700 + }, + { + "epoch": 43.53, + "learning_rate": 9.947600291716784e-06, + "loss": 0.8122, + "step": 14800 + }, + { + "epoch": 43.82, + "learning_rate": 9.946838979293566e-06, + "loss": 0.8249, + "step": 14900 + }, + { + "epoch": 44.12, + "learning_rate": 9.946072205707802e-06, + "loss": 0.8113, + "step": 15000 + }, + { + "epoch": 44.12, + "eval_cer": 0.16285253476308792, + "eval_loss": 0.5454097986221313, + "eval_runtime": 5.4231, + "eval_samples_per_second": 66.199, + "eval_steps_per_second": 2.213, + "eval_wer": 0.5442527809124618, + "step": 15000 + }, + { + "epoch": 44.41, + "learning_rate": 9.945299971805988e-06, + "loss": 0.7922, + "step": 15100 + }, + { + "epoch": 44.71, + "learning_rate": 9.944522278440648e-06, + "loss": 0.7931, + "step": 15200 + }, + { + "epoch": 45.0, + "learning_rate": 9.943739126470331e-06, + "loss": 0.7999, + "step": 15300 + }, + { + "epoch": 45.29, + "learning_rate": 9.942950516759613e-06, + "loss": 0.7875, + "step": 15400 + }, + { + "epoch": 45.59, + "learning_rate": 9.942156450179096e-06, + "loss": 0.7786, + "step": 15500 + }, + { + "epoch": 45.88, + "learning_rate": 9.941356927605407e-06, + "loss": 0.7762, + "step": 15600 + }, + { + "epoch": 46.18, + "learning_rate": 9.940551949921196e-06, + "loss": 0.7804, + "step": 15700 + }, + { + "epoch": 46.47, + "learning_rate": 9.939741518015131e-06, + "loss": 0.7618, + "step": 15800 + }, + { + "epoch": 46.76, + "learning_rate": 9.938925632781907e-06, + "loss": 0.7633, + "step": 15900 + }, + { + "epoch": 47.06, + "learning_rate": 9.938104295122233e-06, + "loss": 0.751, + "step": 16000 + }, + { + "epoch": 47.06, + "eval_cer": 0.15430887929907153, + "eval_loss": 0.5159721970558167, + "eval_runtime": 5.2316, + "eval_samples_per_second": 68.622, + "eval_steps_per_second": 2.294, + "eval_wer": 0.524907302917943, + "step": 16000 + }, + { + "epoch": 47.35, + "learning_rate": 9.937277505942848e-06, + "loss": 0.7442, + "step": 16100 + }, + { + "epoch": 47.65, + "learning_rate": 9.936445266156499e-06, + "loss": 0.747, + "step": 16200 + }, + { + "epoch": 47.94, + "learning_rate": 9.935607576681951e-06, + "loss": 0.7361, + "step": 16300 + }, + { + "epoch": 48.24, + "learning_rate": 9.934764438443993e-06, + "loss": 0.7332, + "step": 16400 + }, + { + "epoch": 48.53, + "learning_rate": 9.933915852373421e-06, + "loss": 0.7431, + "step": 16500 + }, + { + "epoch": 48.82, + "learning_rate": 9.933061819407052e-06, + "loss": 0.7295, + "step": 16600 + }, + { + "epoch": 49.12, + "learning_rate": 9.93220234048771e-06, + "loss": 0.72, + "step": 16700 + }, + { + "epoch": 49.41, + "learning_rate": 9.931337416564234e-06, + "loss": 0.7169, + "step": 16800 + }, + { + "epoch": 49.71, + "learning_rate": 9.930467048591479e-06, + "loss": 0.7173, + "step": 16900 + }, + { + "epoch": 50.0, + "learning_rate": 9.929591237530298e-06, + "loss": 0.7202, + "step": 17000 + }, + { + "epoch": 50.0, + "eval_cer": 0.14737805675428273, + "eval_loss": 0.4853704273700714, + "eval_runtime": 4.7551, + "eval_samples_per_second": 75.498, + "eval_steps_per_second": 2.524, + "eval_wer": 0.5070127357730131, + "step": 17000 + }, + { + "epoch": 50.29, + "learning_rate": 9.928709984347566e-06, + "loss": 0.6911, + "step": 17100 + }, + { + "epoch": 50.59, + "learning_rate": 9.927823290016156e-06, + "loss": 0.7064, + "step": 17200 + }, + { + "epoch": 50.88, + "learning_rate": 9.926940103785579e-06, + "loss": 0.7016, + "step": 17300 + }, + { + "epoch": 51.18, + "learning_rate": 9.926042584486431e-06, + "loss": 0.7164, + "step": 17400 + }, + { + "epoch": 51.47, + "learning_rate": 9.925139626983336e-06, + "loss": 0.6982, + "step": 17500 + }, + { + "epoch": 51.76, + "learning_rate": 9.924231232273133e-06, + "loss": 0.6939, + "step": 17600 + }, + { + "epoch": 52.06, + "learning_rate": 9.923317401358663e-06, + "loss": 0.6864, + "step": 17700 + }, + { + "epoch": 52.35, + "learning_rate": 9.922398135248766e-06, + "loss": 0.6765, + "step": 17800 + }, + { + "epoch": 52.65, + "learning_rate": 9.921473434958289e-06, + "loss": 0.6748, + "step": 17900 + }, + { + "epoch": 52.94, + "learning_rate": 9.920543301508068e-06, + "loss": 0.6876, + "step": 18000 + }, + { + "epoch": 52.94, + "eval_cer": 0.14423957107362365, + "eval_loss": 0.46753910183906555, + "eval_runtime": 4.6127, + "eval_samples_per_second": 77.829, + "eval_steps_per_second": 2.602, + "eval_wer": 0.5110430436885378, + "step": 18000 + }, + { + "epoch": 53.24, + "learning_rate": 9.919607735924945e-06, + "loss": 0.6811, + "step": 18100 + }, + { + "epoch": 53.53, + "learning_rate": 9.918666739241758e-06, + "loss": 0.6627, + "step": 18200 + }, + { + "epoch": 53.82, + "learning_rate": 9.917720312497337e-06, + "loss": 0.6605, + "step": 18300 + }, + { + "epoch": 54.12, + "learning_rate": 9.91676845673651e-06, + "loss": 0.67, + "step": 18400 + }, + { + "epoch": 54.41, + "learning_rate": 9.915811173010097e-06, + "loss": 0.649, + "step": 18500 + }, + { + "epoch": 54.71, + "learning_rate": 9.914848462374911e-06, + "loss": 0.6546, + "step": 18600 + }, + { + "epoch": 55.0, + "learning_rate": 9.913880325893755e-06, + "loss": 0.6598, + "step": 18700 + }, + { + "epoch": 55.29, + "learning_rate": 9.912906764635423e-06, + "loss": 0.6558, + "step": 18800 + }, + { + "epoch": 55.59, + "learning_rate": 9.911927779674696e-06, + "loss": 0.6528, + "step": 18900 + }, + { + "epoch": 55.88, + "learning_rate": 9.910943372092349e-06, + "loss": 0.6503, + "step": 19000 + }, + { + "epoch": 55.88, + "eval_cer": 0.13796259971230548, + "eval_loss": 0.4472251534461975, + "eval_runtime": 5.2128, + "eval_samples_per_second": 68.869, + "eval_steps_per_second": 2.302, + "eval_wer": 0.4826696759632436, + "step": 19000 + }, + { + "epoch": 56.18, + "learning_rate": 9.909953542975134e-06, + "loss": 0.6274, + "step": 19100 + }, + { + "epoch": 56.47, + "learning_rate": 9.908958293415795e-06, + "loss": 0.6333, + "step": 19200 + }, + { + "epoch": 56.76, + "learning_rate": 9.907957624513058e-06, + "loss": 0.6317, + "step": 19300 + }, + { + "epoch": 57.06, + "learning_rate": 9.90695153737163e-06, + "loss": 0.6302, + "step": 19400 + }, + { + "epoch": 57.35, + "learning_rate": 9.905950174956017e-06, + "loss": 0.6387, + "step": 19500 + }, + { + "epoch": 57.65, + "learning_rate": 9.904933308829825e-06, + "loss": 0.6304, + "step": 19600 + }, + { + "epoch": 57.94, + "learning_rate": 9.903911027803696e-06, + "loss": 0.6136, + "step": 19700 + }, + { + "epoch": 58.24, + "learning_rate": 9.902883333006202e-06, + "loss": 0.6128, + "step": 19800 + }, + { + "epoch": 58.53, + "learning_rate": 9.901850225571881e-06, + "loss": 0.6113, + "step": 19900 + }, + { + "epoch": 58.82, + "learning_rate": 9.900811706641256e-06, + "loss": 0.629, + "step": 20000 + }, + { + "epoch": 58.82, + "eval_cer": 0.13430103308486988, + "eval_loss": 0.43461212515830994, + "eval_runtime": 4.8127, + "eval_samples_per_second": 74.594, + "eval_steps_per_second": 2.493, + "eval_wer": 0.46912784136708047, + "step": 20000 + }, + { + "epoch": 59.12, + "learning_rate": 9.89976777736082e-06, + "loss": 0.6202, + "step": 20100 + }, + { + "epoch": 59.41, + "learning_rate": 9.898718438883044e-06, + "loss": 0.6079, + "step": 20200 + }, + { + "epoch": 59.71, + "learning_rate": 9.89766369236636e-06, + "loss": 0.6134, + "step": 20300 + }, + { + "epoch": 60.0, + "learning_rate": 9.89660353897518e-06, + "loss": 0.6198, + "step": 20400 + }, + { + "epoch": 60.29, + "learning_rate": 9.895537979879882e-06, + "loss": 0.6029, + "step": 20500 + }, + { + "epoch": 60.59, + "learning_rate": 9.89446701625681e-06, + "loss": 0.6027, + "step": 20600 + }, + { + "epoch": 60.88, + "learning_rate": 9.893390649288274e-06, + "loss": 0.6029, + "step": 20700 + }, + { + "epoch": 61.18, + "learning_rate": 9.892308880162558e-06, + "loss": 0.5978, + "step": 20800 + }, + { + "epoch": 61.47, + "learning_rate": 9.891221710073895e-06, + "loss": 0.5906, + "step": 20900 + }, + { + "epoch": 61.76, + "learning_rate": 9.890129140222492e-06, + "loss": 0.5847, + "step": 21000 + }, + { + "epoch": 61.76, + "eval_cer": 0.13168562835098732, + "eval_loss": 0.421942800283432, + "eval_runtime": 4.6895, + "eval_samples_per_second": 76.554, + "eval_steps_per_second": 2.559, + "eval_wer": 0.47573754634854104, + "step": 21000 + }, + { + "epoch": 62.06, + "learning_rate": 9.889031171814516e-06, + "loss": 0.5831, + "step": 21100 + }, + { + "epoch": 62.35, + "learning_rate": 9.887927806062085e-06, + "loss": 0.5945, + "step": 21200 + }, + { + "epoch": 62.65, + "learning_rate": 9.886819044183287e-06, + "loss": 0.5786, + "step": 21300 + }, + { + "epoch": 62.94, + "learning_rate": 9.885704887402158e-06, + "loss": 0.5858, + "step": 21400 + }, + { + "epoch": 63.24, + "learning_rate": 9.8845853369487e-06, + "loss": 0.5825, + "step": 21500 + }, + { + "epoch": 63.53, + "learning_rate": 9.883460394058857e-06, + "loss": 0.5805, + "step": 21600 + }, + { + "epoch": 63.82, + "learning_rate": 9.882330059974536e-06, + "loss": 0.58, + "step": 21700 + }, + { + "epoch": 64.12, + "learning_rate": 9.881194335943589e-06, + "loss": 0.5717, + "step": 21800 + }, + { + "epoch": 64.41, + "learning_rate": 9.880053223219826e-06, + "loss": 0.5771, + "step": 21900 + }, + { + "epoch": 64.71, + "learning_rate": 9.878906723062995e-06, + "loss": 0.5777, + "step": 22000 + }, + { + "epoch": 64.71, + "eval_cer": 0.12732662046118304, + "eval_loss": 0.4089703857898712, + "eval_runtime": 4.8857, + "eval_samples_per_second": 73.48, + "eval_steps_per_second": 2.456, + "eval_wer": 0.4549411575044333, + "step": 22000 + }, + { + "epoch": 65.0, + "learning_rate": 9.877754836738805e-06, + "loss": 0.565, + "step": 22100 + }, + { + "epoch": 65.29, + "learning_rate": 9.876597565518899e-06, + "loss": 0.5735, + "step": 22200 + }, + { + "epoch": 65.59, + "learning_rate": 9.875434910680871e-06, + "loss": 0.5607, + "step": 22300 + }, + { + "epoch": 65.88, + "learning_rate": 9.87426687350826e-06, + "loss": 0.5723, + "step": 22400 + }, + { + "epoch": 66.18, + "learning_rate": 9.87309345529054e-06, + "loss": 0.5574, + "step": 22500 + }, + { + "epoch": 66.47, + "learning_rate": 9.871914657323133e-06, + "loss": 0.5535, + "step": 22600 + }, + { + "epoch": 66.76, + "learning_rate": 9.870730480907395e-06, + "loss": 0.5475, + "step": 22700 + }, + { + "epoch": 67.06, + "learning_rate": 9.869540927350623e-06, + "loss": 0.5536, + "step": 22800 + }, + { + "epoch": 67.35, + "learning_rate": 9.868345997966044e-06, + "loss": 0.5532, + "step": 22900 + }, + { + "epoch": 67.65, + "learning_rate": 9.867157723711235e-06, + "loss": 0.5609, + "step": 23000 + }, + { + "epoch": 67.65, + "eval_cer": 0.12440608517501417, + "eval_loss": 0.40106838941574097, + "eval_runtime": 5.3761, + "eval_samples_per_second": 66.777, + "eval_steps_per_second": 2.232, + "eval_wer": 0.45010478800580367, + "step": 23000 + }, + { + "epoch": 67.94, + "learning_rate": 9.86595210035974e-06, + "loss": 0.5303, + "step": 23100 + }, + { + "epoch": 68.24, + "learning_rate": 9.864741105142399e-06, + "loss": 0.536, + "step": 23200 + }, + { + "epoch": 68.53, + "learning_rate": 9.863524739396117e-06, + "loss": 0.5378, + "step": 23300 + }, + { + "epoch": 68.82, + "learning_rate": 9.86230300446372e-06, + "loss": 0.55, + "step": 23400 + }, + { + "epoch": 69.12, + "learning_rate": 9.861075901693973e-06, + "loss": 0.5482, + "step": 23500 + }, + { + "epoch": 69.41, + "learning_rate": 9.859843432441557e-06, + "loss": 0.539, + "step": 23600 + }, + { + "epoch": 69.71, + "learning_rate": 9.858605598067082e-06, + "loss": 0.5286, + "step": 23700 + }, + { + "epoch": 70.0, + "learning_rate": 9.857362399937081e-06, + "loss": 0.5451, + "step": 23800 + }, + { + "epoch": 70.29, + "learning_rate": 9.856113839424007e-06, + "loss": 0.5403, + "step": 23900 + }, + { + "epoch": 70.59, + "learning_rate": 9.854859917906234e-06, + "loss": 0.5287, + "step": 24000 + }, + { + "epoch": 70.59, + "eval_cer": 0.1208752887842727, + "eval_loss": 0.39059486985206604, + "eval_runtime": 5.0091, + "eval_samples_per_second": 71.669, + "eval_steps_per_second": 2.396, + "eval_wer": 0.4380138642592294, + "step": 24000 + }, + { + "epoch": 70.88, + "learning_rate": 9.853600636768053e-06, + "loss": 0.5235, + "step": 24100 + }, + { + "epoch": 71.18, + "learning_rate": 9.852335997399674e-06, + "loss": 0.5141, + "step": 24200 + }, + { + "epoch": 71.47, + "learning_rate": 9.85106600119722e-06, + "loss": 0.5232, + "step": 24300 + }, + { + "epoch": 71.76, + "learning_rate": 9.84979064956273e-06, + "loss": 0.514, + "step": 24400 + }, + { + "epoch": 72.06, + "learning_rate": 9.848509943904152e-06, + "loss": 0.5304, + "step": 24500 + }, + { + "epoch": 72.35, + "learning_rate": 9.84722388563535e-06, + "loss": 0.5154, + "step": 24600 + }, + { + "epoch": 72.65, + "learning_rate": 9.845932476176093e-06, + "loss": 0.5131, + "step": 24700 + }, + { + "epoch": 72.94, + "learning_rate": 9.844635716952054e-06, + "loss": 0.5105, + "step": 24800 + }, + { + "epoch": 73.24, + "learning_rate": 9.843333609394823e-06, + "loss": 0.5116, + "step": 24900 + }, + { + "epoch": 73.53, + "learning_rate": 9.842026154941883e-06, + "loss": 0.5048, + "step": 25000 + }, + { + "epoch": 73.53, + "eval_cer": 0.1172137221568371, + "eval_loss": 0.38722869753837585, + "eval_runtime": 5.2278, + "eval_samples_per_second": 68.671, + "eval_steps_per_second": 2.295, + "eval_wer": 0.42237626954699337, + "step": 25000 + }, + { + "epoch": 73.82, + "learning_rate": 9.840713355036629e-06, + "loss": 0.5126, + "step": 25100 + }, + { + "epoch": 74.12, + "learning_rate": 9.839395211128352e-06, + "loss": 0.5006, + "step": 25200 + }, + { + "epoch": 74.41, + "learning_rate": 9.838071724672239e-06, + "loss": 0.5051, + "step": 25300 + }, + { + "epoch": 74.71, + "learning_rate": 9.836742897129383e-06, + "loss": 0.507, + "step": 25400 + }, + { + "epoch": 75.0, + "learning_rate": 9.835422098064685e-06, + "loss": 0.5031, + "step": 25500 + }, + { + "epoch": 75.29, + "learning_rate": 9.834082646129353e-06, + "loss": 0.4998, + "step": 25600 + }, + { + "epoch": 75.59, + "learning_rate": 9.832737857511103e-06, + "loss": 0.4934, + "step": 25700 + }, + { + "epoch": 75.88, + "learning_rate": 9.83138773369454e-06, + "loss": 0.5012, + "step": 25800 + }, + { + "epoch": 76.18, + "learning_rate": 9.830032276170158e-06, + "loss": 0.4894, + "step": 25900 + }, + { + "epoch": 76.47, + "learning_rate": 9.828671486434347e-06, + "loss": 0.481, + "step": 26000 + }, + { + "epoch": 76.47, + "eval_cer": 0.11594960986879387, + "eval_loss": 0.38624435663223267, + "eval_runtime": 4.6342, + "eval_samples_per_second": 77.468, + "eval_steps_per_second": 2.589, + "eval_wer": 0.4201192971142995, + "step": 26000 + }, + { + "epoch": 76.76, + "learning_rate": 9.827305365989374e-06, + "loss": 0.4965, + "step": 26100 + }, + { + "epoch": 77.06, + "learning_rate": 9.825933916343396e-06, + "loss": 0.4878, + "step": 26200 + }, + { + "epoch": 77.35, + "learning_rate": 9.824557139010453e-06, + "loss": 0.4873, + "step": 26300 + }, + { + "epoch": 77.65, + "learning_rate": 9.823175035510463e-06, + "loss": 0.4824, + "step": 26400 + }, + { + "epoch": 77.94, + "learning_rate": 9.821787607369233e-06, + "loss": 0.4853, + "step": 26500 + }, + { + "epoch": 78.24, + "learning_rate": 9.820394856118438e-06, + "loss": 0.4765, + "step": 26600 + }, + { + "epoch": 78.53, + "learning_rate": 9.818996783295635e-06, + "loss": 0.4826, + "step": 26700 + }, + { + "epoch": 78.82, + "learning_rate": 9.817593390444255e-06, + "loss": 0.4766, + "step": 26800 + }, + { + "epoch": 79.12, + "learning_rate": 9.816184679113603e-06, + "loss": 0.4784, + "step": 26900 + }, + { + "epoch": 79.41, + "learning_rate": 9.814770650858849e-06, + "loss": 0.4762, + "step": 27000 + }, + { + "epoch": 79.41, + "eval_cer": 0.11289830434593087, + "eval_loss": 0.3742750585079193, + "eval_runtime": 4.6829, + "eval_samples_per_second": 76.661, + "eval_steps_per_second": 2.562, + "eval_wer": 0.4112526197001451, + "step": 27000 + }, + { + "epoch": 79.71, + "learning_rate": 9.813351307241043e-06, + "loss": 0.481, + "step": 27100 + }, + { + "epoch": 80.0, + "learning_rate": 9.811926649827097e-06, + "loss": 0.4865, + "step": 27200 + }, + { + "epoch": 80.29, + "learning_rate": 9.810496680189789e-06, + "loss": 0.4767, + "step": 27300 + }, + { + "epoch": 80.59, + "learning_rate": 9.809061399907764e-06, + "loss": 0.4693, + "step": 27400 + }, + { + "epoch": 80.88, + "learning_rate": 9.807620810565528e-06, + "loss": 0.4666, + "step": 27500 + }, + { + "epoch": 81.18, + "learning_rate": 9.806174913753448e-06, + "loss": 0.4701, + "step": 27600 + }, + { + "epoch": 81.47, + "learning_rate": 9.804723711067753e-06, + "loss": 0.4746, + "step": 27700 + }, + { + "epoch": 81.76, + "learning_rate": 9.803267204110525e-06, + "loss": 0.469, + "step": 27800 + }, + { + "epoch": 82.06, + "learning_rate": 9.801805394489707e-06, + "loss": 0.4672, + "step": 27900 + }, + { + "epoch": 82.35, + "learning_rate": 9.80033828381909e-06, + "loss": 0.457, + "step": 28000 + }, + { + "epoch": 82.35, + "eval_cer": 0.11137265158449937, + "eval_loss": 0.3707512617111206, + "eval_runtime": 4.6031, + "eval_samples_per_second": 77.991, + "eval_steps_per_second": 2.607, + "eval_wer": 0.4064162502015154, + "step": 28000 + }, + { + "epoch": 82.65, + "learning_rate": 9.798865873718322e-06, + "loss": 0.4656, + "step": 28100 + }, + { + "epoch": 82.94, + "learning_rate": 9.7973881658129e-06, + "loss": 0.459, + "step": 28200 + }, + { + "epoch": 83.24, + "learning_rate": 9.79590516173417e-06, + "loss": 0.4512, + "step": 28300 + }, + { + "epoch": 83.53, + "learning_rate": 9.794416863119322e-06, + "loss": 0.4469, + "step": 28400 + }, + { + "epoch": 83.82, + "learning_rate": 9.792923271611394e-06, + "loss": 0.4683, + "step": 28500 + }, + { + "epoch": 84.12, + "learning_rate": 9.791424388859268e-06, + "loss": 0.4602, + "step": 28600 + }, + { + "epoch": 84.41, + "learning_rate": 9.789920216517665e-06, + "loss": 0.4606, + "step": 28700 + }, + { + "epoch": 84.71, + "learning_rate": 9.788410756247145e-06, + "loss": 0.45, + "step": 28800 + }, + { + "epoch": 85.0, + "learning_rate": 9.78689600971411e-06, + "loss": 0.4629, + "step": 28900 + }, + { + "epoch": 85.29, + "learning_rate": 9.785375978590792e-06, + "loss": 0.4471, + "step": 29000 + }, + { + "epoch": 85.29, + "eval_cer": 0.10819057582494224, + "eval_loss": 0.36229872703552246, + "eval_runtime": 4.7496, + "eval_samples_per_second": 75.585, + "eval_steps_per_second": 2.527, + "eval_wer": 0.3954538126712881, + "step": 29000 + }, + { + "epoch": 85.59, + "learning_rate": 9.783850664555262e-06, + "loss": 0.4499, + "step": 29100 + }, + { + "epoch": 85.88, + "learning_rate": 9.782320069291418e-06, + "loss": 0.4433, + "step": 29200 + }, + { + "epoch": 86.18, + "learning_rate": 9.780784194488996e-06, + "loss": 0.4469, + "step": 29300 + }, + { + "epoch": 86.47, + "learning_rate": 9.779243041843552e-06, + "loss": 0.4439, + "step": 29400 + }, + { + "epoch": 86.76, + "learning_rate": 9.777696613056476e-06, + "loss": 0.4418, + "step": 29500 + }, + { + "epoch": 87.06, + "learning_rate": 9.776144909834977e-06, + "loss": 0.4423, + "step": 29600 + }, + { + "epoch": 87.35, + "learning_rate": 9.77460352974585e-06, + "loss": 0.432, + "step": 29700 + }, + { + "epoch": 87.65, + "learning_rate": 9.773041335501925e-06, + "loss": 0.4438, + "step": 29800 + }, + { + "epoch": 87.94, + "learning_rate": 9.771473871962867e-06, + "loss": 0.4341, + "step": 29900 + }, + { + "epoch": 88.24, + "learning_rate": 9.769901140859106e-06, + "loss": 0.4398, + "step": 30000 + }, + { + "epoch": 88.24, + "eval_cer": 0.10762390479926769, + "eval_loss": 0.35913577675819397, + "eval_runtime": 4.6645, + "eval_samples_per_second": 76.965, + "eval_steps_per_second": 2.573, + "eval_wer": 0.3954538126712881, + "step": 30000 + }, + { + "epoch": 88.53, + "learning_rate": 9.768323143926892e-06, + "loss": 0.4313, + "step": 30100 + }, + { + "epoch": 88.82, + "learning_rate": 9.766739882908285e-06, + "loss": 0.4258, + "step": 30200 + }, + { + "epoch": 89.12, + "learning_rate": 9.765151359551158e-06, + "loss": 0.4304, + "step": 30300 + }, + { + "epoch": 89.41, + "learning_rate": 9.763557575609193e-06, + "loss": 0.4465, + "step": 30400 + }, + { + "epoch": 89.71, + "learning_rate": 9.761958532841882e-06, + "loss": 0.4321, + "step": 30500 + }, + { + "epoch": 90.0, + "learning_rate": 9.760354233014517e-06, + "loss": 0.4274, + "step": 30600 + }, + { + "epoch": 90.29, + "learning_rate": 9.758744677898202e-06, + "loss": 0.4369, + "step": 30700 + }, + { + "epoch": 90.59, + "learning_rate": 9.757129869269835e-06, + "loss": 0.4213, + "step": 30800 + }, + { + "epoch": 90.88, + "learning_rate": 9.755509808912114e-06, + "loss": 0.4364, + "step": 30900 + }, + { + "epoch": 91.18, + "learning_rate": 9.753884498613542e-06, + "loss": 0.4254, + "step": 31000 + }, + { + "epoch": 91.18, + "eval_cer": 0.10474695959199685, + "eval_loss": 0.3557164967060089, + "eval_runtime": 4.7708, + "eval_samples_per_second": 75.249, + "eval_steps_per_second": 2.515, + "eval_wer": 0.37901015637594715, + "step": 31000 + }, + { + "epoch": 91.47, + "learning_rate": 9.75225394016841e-06, + "loss": 0.412, + "step": 31100 + }, + { + "epoch": 91.76, + "learning_rate": 9.750618135376806e-06, + "loss": 0.421, + "step": 31200 + }, + { + "epoch": 92.06, + "learning_rate": 9.74897708604461e-06, + "loss": 0.4324, + "step": 31300 + }, + { + "epoch": 92.35, + "learning_rate": 9.747330793983493e-06, + "loss": 0.415, + "step": 31400 + }, + { + "epoch": 92.65, + "learning_rate": 9.745679261010912e-06, + "loss": 0.422, + "step": 31500 + }, + { + "epoch": 92.94, + "learning_rate": 9.74402248895011e-06, + "loss": 0.4192, + "step": 31600 + }, + { + "epoch": 93.24, + "learning_rate": 9.74236047963011e-06, + "loss": 0.4083, + "step": 31700 + }, + { + "epoch": 93.53, + "learning_rate": 9.740709933242481e-06, + "loss": 0.4127, + "step": 31800 + }, + { + "epoch": 93.82, + "learning_rate": 9.739037507241007e-06, + "loss": 0.4061, + "step": 31900 + }, + { + "epoch": 94.12, + "learning_rate": 9.737359849483607e-06, + "loss": 0.4166, + "step": 32000 + }, + { + "epoch": 94.12, + "eval_cer": 0.1032648969094634, + "eval_loss": 0.3532021641731262, + "eval_runtime": 5.0385, + "eval_samples_per_second": 71.251, + "eval_steps_per_second": 2.382, + "eval_wer": 0.3785265194260842, + "step": 32000 + }, + { + "epoch": 94.41, + "learning_rate": 9.73567696182237e-06, + "loss": 0.4109, + "step": 32100 + }, + { + "epoch": 94.71, + "learning_rate": 9.733988846115149e-06, + "loss": 0.4132, + "step": 32200 + }, + { + "epoch": 95.0, + "learning_rate": 9.732295504225576e-06, + "loss": 0.4151, + "step": 32300 + }, + { + "epoch": 95.29, + "learning_rate": 9.73059693802305e-06, + "loss": 0.4015, + "step": 32400 + }, + { + "epoch": 95.59, + "learning_rate": 9.728893149382734e-06, + "loss": 0.4102, + "step": 32500 + }, + { + "epoch": 95.88, + "learning_rate": 9.727184140185564e-06, + "loss": 0.4153, + "step": 32600 + }, + { + "epoch": 96.18, + "learning_rate": 9.725469912318232e-06, + "loss": 0.4144, + "step": 32700 + }, + { + "epoch": 96.47, + "learning_rate": 9.723750467673199e-06, + "loss": 0.4073, + "step": 32800 + }, + { + "epoch": 96.76, + "learning_rate": 9.722025808148674e-06, + "loss": 0.3992, + "step": 32900 + }, + { + "epoch": 97.06, + "learning_rate": 9.720295935648633e-06, + "loss": 0.4, + "step": 33000 + }, + { + "epoch": 97.06, + "eval_cer": 0.10322130683056537, + "eval_loss": 0.34583190083503723, + "eval_runtime": 4.6042, + "eval_samples_per_second": 77.972, + "eval_steps_per_second": 2.606, + "eval_wer": 0.3833628889247139, + "step": 33000 + }, + { + "epoch": 97.35, + "learning_rate": 9.718560852082806e-06, + "loss": 0.401, + "step": 33100 + }, + { + "epoch": 97.65, + "learning_rate": 9.716820559366672e-06, + "loss": 0.4072, + "step": 33200 + }, + { + "epoch": 97.94, + "learning_rate": 9.715075059421456e-06, + "loss": 0.4067, + "step": 33300 + }, + { + "epoch": 98.24, + "learning_rate": 9.713324354174148e-06, + "loss": 0.4008, + "step": 33400 + }, + { + "epoch": 98.53, + "learning_rate": 9.711568445557466e-06, + "loss": 0.4097, + "step": 33500 + }, + { + "epoch": 98.82, + "learning_rate": 9.709807335509887e-06, + "loss": 0.3962, + "step": 33600 + }, + { + "epoch": 99.12, + "learning_rate": 9.70804102597562e-06, + "loss": 0.3883, + "step": 33700 + }, + { + "epoch": 99.41, + "learning_rate": 9.706269518904619e-06, + "loss": 0.3923, + "step": 33800 + }, + { + "epoch": 99.71, + "learning_rate": 9.704510608990784e-06, + "loss": 0.395, + "step": 33900 + }, + { + "epoch": 100.0, + "learning_rate": 9.702728764645592e-06, + "loss": 0.4022, + "step": 34000 + }, + { + "epoch": 100.0, + "eval_cer": 0.10160847391133777, + "eval_loss": 0.34906402230262756, + "eval_runtime": 4.8096, + "eval_samples_per_second": 74.642, + "eval_steps_per_second": 2.495, + "eval_wer": 0.3683701434789618, + "step": 34000 + }, + { + "epoch": 100.29, + "learning_rate": 9.700941728628244e-06, + "loss": 0.3898, + "step": 34100 + }, + { + "epoch": 100.59, + "learning_rate": 9.699149502911573e-06, + "loss": 0.3897, + "step": 34200 + }, + { + "epoch": 100.88, + "learning_rate": 9.697352089474145e-06, + "loss": 0.3872, + "step": 34300 + }, + { + "epoch": 101.18, + "learning_rate": 9.69554949030025e-06, + "loss": 0.3732, + "step": 34400 + }, + { + "epoch": 101.47, + "learning_rate": 9.693741707379902e-06, + "loss": 0.3864, + "step": 34500 + }, + { + "epoch": 101.76, + "learning_rate": 9.691928742708842e-06, + "loss": 0.3826, + "step": 34600 + }, + { + "epoch": 102.06, + "learning_rate": 9.690110598288529e-06, + "loss": 0.3873, + "step": 34700 + }, + { + "epoch": 102.35, + "learning_rate": 9.688287276126135e-06, + "loss": 0.385, + "step": 34800 + }, + { + "epoch": 102.65, + "learning_rate": 9.686458778234561e-06, + "loss": 0.3854, + "step": 34900 + }, + { + "epoch": 102.94, + "learning_rate": 9.684625106632409e-06, + "loss": 0.3896, + "step": 35000 + }, + { + "epoch": 102.94, + "eval_cer": 0.10012641122880432, + "eval_loss": 0.3409387767314911, + "eval_runtime": 58.5958, + "eval_samples_per_second": 6.127, + "eval_steps_per_second": 0.205, + "eval_wer": 0.3688537804288248, + "step": 35000 + }, + { + "epoch": 103.24, + "learning_rate": 9.682786263343997e-06, + "loss": 0.3738, + "step": 35100 + }, + { + "epoch": 103.53, + "learning_rate": 9.680942250399357e-06, + "loss": 0.3861, + "step": 35200 + }, + { + "epoch": 103.82, + "learning_rate": 9.679093069834222e-06, + "loss": 0.3821, + "step": 35300 + }, + { + "epoch": 104.12, + "learning_rate": 9.677238723690032e-06, + "loss": 0.3817, + "step": 35400 + }, + { + "epoch": 104.41, + "learning_rate": 9.67537921401393e-06, + "loss": 0.3838, + "step": 35500 + }, + { + "epoch": 104.71, + "learning_rate": 9.67351454285876e-06, + "loss": 0.3896, + "step": 35600 + }, + { + "epoch": 105.0, + "learning_rate": 9.671644712283061e-06, + "loss": 0.3829, + "step": 35700 + }, + { + "epoch": 105.29, + "learning_rate": 9.669769724351072e-06, + "loss": 0.3738, + "step": 35800 + }, + { + "epoch": 105.59, + "learning_rate": 9.667889581132725e-06, + "loss": 0.3801, + "step": 35900 + }, + { + "epoch": 105.88, + "learning_rate": 9.666004284703638e-06, + "loss": 0.3816, + "step": 36000 + }, + { + "epoch": 105.88, + "eval_cer": 0.09733664617932958, + "eval_loss": 0.3380275368690491, + "eval_runtime": 34.8574, + "eval_samples_per_second": 10.299, + "eval_steps_per_second": 0.344, + "eval_wer": 0.35563437046590357, + "step": 36000 + }, + { + "epoch": 106.18, + "learning_rate": 9.664132767111955e-06, + "loss": 0.3751, + "step": 36100 + }, + { + "epoch": 106.47, + "learning_rate": 9.66223722199109e-06, + "loss": 0.3835, + "step": 36200 + }, + { + "epoch": 106.76, + "learning_rate": 9.66033652989952e-06, + "loss": 0.379, + "step": 36300 + }, + { + "epoch": 107.06, + "learning_rate": 9.658430692935558e-06, + "loss": 0.3625, + "step": 36400 + }, + { + "epoch": 107.35, + "learning_rate": 9.656519713203187e-06, + "loss": 0.3571, + "step": 36500 + }, + { + "epoch": 107.65, + "learning_rate": 9.654603592812074e-06, + "loss": 0.3687, + "step": 36600 + }, + { + "epoch": 107.94, + "learning_rate": 9.652682333877558e-06, + "loss": 0.3668, + "step": 36700 + }, + { + "epoch": 108.24, + "learning_rate": 9.65075593852065e-06, + "loss": 0.3718, + "step": 36800 + }, + { + "epoch": 108.53, + "learning_rate": 9.648824408868035e-06, + "loss": 0.3668, + "step": 36900 + }, + { + "epoch": 108.82, + "learning_rate": 9.646887747052065e-06, + "loss": 0.3647, + "step": 37000 + }, + { + "epoch": 108.82, + "eval_cer": 0.09681356523255306, + "eval_loss": 0.33798158168792725, + "eval_runtime": 35.9194, + "eval_samples_per_second": 9.995, + "eval_steps_per_second": 0.334, + "eval_wer": 0.3541834596163147, + "step": 37000 + }, + { + "epoch": 109.12, + "learning_rate": 9.644945955210753e-06, + "loss": 0.3667, + "step": 37100 + }, + { + "epoch": 109.41, + "learning_rate": 9.642999035487783e-06, + "loss": 0.3653, + "step": 37200 + }, + { + "epoch": 109.71, + "learning_rate": 9.641046990032494e-06, + "loss": 0.3671, + "step": 37300 + }, + { + "epoch": 110.0, + "learning_rate": 9.639089820999886e-06, + "loss": 0.3664, + "step": 37400 + }, + { + "epoch": 110.29, + "learning_rate": 9.637127530550618e-06, + "loss": 0.3663, + "step": 37500 + }, + { + "epoch": 110.59, + "learning_rate": 9.635160120850996e-06, + "loss": 0.3561, + "step": 37600 + }, + { + "epoch": 110.88, + "learning_rate": 9.633187594072984e-06, + "loss": 0.3648, + "step": 37700 + }, + { + "epoch": 111.18, + "learning_rate": 9.631209952394191e-06, + "loss": 0.3632, + "step": 37800 + }, + { + "epoch": 111.47, + "learning_rate": 9.629227197997876e-06, + "loss": 0.3618, + "step": 37900 + }, + { + "epoch": 111.76, + "learning_rate": 9.62723933307294e-06, + "loss": 0.3607, + "step": 38000 + }, + { + "epoch": 111.76, + "eval_cer": 0.09485201168214115, + "eval_loss": 0.33785539865493774, + "eval_runtime": 22.4984, + "eval_samples_per_second": 15.957, + "eval_steps_per_second": 0.533, + "eval_wer": 0.3478961792680961, + "step": 38000 + }, + { + "epoch": 112.06, + "learning_rate": 9.625246359813927e-06, + "loss": 0.3587, + "step": 38100 + }, + { + "epoch": 112.35, + "learning_rate": 9.62324828042102e-06, + "loss": 0.3528, + "step": 38200 + }, + { + "epoch": 112.65, + "learning_rate": 9.621245097100039e-06, + "loss": 0.3506, + "step": 38300 + }, + { + "epoch": 112.94, + "learning_rate": 9.619236812062436e-06, + "loss": 0.3573, + "step": 38400 + }, + { + "epoch": 113.24, + "learning_rate": 9.617223427525302e-06, + "loss": 0.3528, + "step": 38500 + }, + { + "epoch": 113.53, + "learning_rate": 9.615204945711349e-06, + "loss": 0.3503, + "step": 38600 + }, + { + "epoch": 113.82, + "learning_rate": 9.613181368848924e-06, + "loss": 0.3521, + "step": 38700 + }, + { + "epoch": 114.12, + "learning_rate": 9.611173011070848e-06, + "loss": 0.3508, + "step": 38800 + }, + { + "epoch": 114.41, + "learning_rate": 9.60913930171365e-06, + "loss": 0.3445, + "step": 38900 + }, + { + "epoch": 114.71, + "learning_rate": 9.607100504004268e-06, + "loss": 0.3561, + "step": 39000 + }, + { + "epoch": 114.71, + "eval_cer": 0.09432893073536464, + "eval_loss": 0.33478814363479614, + "eval_runtime": 23.7686, + "eval_samples_per_second": 15.104, + "eval_steps_per_second": 0.505, + "eval_wer": 0.349347090117685, + "step": 39000 + }, + { + "epoch": 115.0, + "learning_rate": 9.605056620193475e-06, + "loss": 0.3502, + "step": 39100 + }, + { + "epoch": 115.29, + "learning_rate": 9.603007652537659e-06, + "loss": 0.351, + "step": 39200 + }, + { + "epoch": 115.59, + "learning_rate": 9.600953603298815e-06, + "loss": 0.3366, + "step": 39300 + }, + { + "epoch": 115.88, + "learning_rate": 9.598894474744556e-06, + "loss": 0.344, + "step": 39400 + }, + { + "epoch": 116.18, + "learning_rate": 9.596830269148097e-06, + "loss": 0.3349, + "step": 39500 + }, + { + "epoch": 116.47, + "learning_rate": 9.594760988788259e-06, + "loss": 0.3499, + "step": 39600 + }, + { + "epoch": 116.76, + "learning_rate": 9.592686635949466e-06, + "loss": 0.337, + "step": 39700 + }, + { + "epoch": 117.06, + "learning_rate": 9.590607212921742e-06, + "loss": 0.3441, + "step": 39800 + }, + { + "epoch": 117.35, + "learning_rate": 9.588522722000706e-06, + "loss": 0.3356, + "step": 39900 + }, + { + "epoch": 117.65, + "learning_rate": 9.586433165487577e-06, + "loss": 0.344, + "step": 40000 + }, + { + "epoch": 117.65, + "eval_cer": 0.0920622466326664, + "eval_loss": 0.33385178446769714, + "eval_runtime": 22.867, + "eval_samples_per_second": 15.699, + "eval_steps_per_second": 0.525, + "eval_wer": 0.3417701112364985, + "step": 40000 + }, + { + "epoch": 117.94, + "learning_rate": 9.584359516942819e-06, + "loss": 0.3554, + "step": 40100 + }, + { + "epoch": 118.24, + "learning_rate": 9.582259886769778e-06, + "loss": 0.3421, + "step": 40200 + }, + { + "epoch": 118.53, + "learning_rate": 9.580155197918625e-06, + "loss": 0.3341, + "step": 40300 + }, + { + "epoch": 118.82, + "learning_rate": 9.578045452712876e-06, + "loss": 0.3332, + "step": 40400 + }, + { + "epoch": 119.12, + "learning_rate": 9.575930653481624e-06, + "loss": 0.3365, + "step": 40500 + }, + { + "epoch": 119.41, + "learning_rate": 9.573810802559544e-06, + "loss": 0.338, + "step": 40600 + }, + { + "epoch": 119.71, + "learning_rate": 9.571685902286891e-06, + "loss": 0.3389, + "step": 40700 + }, + { + "epoch": 120.0, + "learning_rate": 9.569555955009488e-06, + "loss": 0.3331, + "step": 40800 + }, + { + "epoch": 120.29, + "learning_rate": 9.567420963078737e-06, + "loss": 0.3195, + "step": 40900 + }, + { + "epoch": 120.59, + "learning_rate": 9.565280928851602e-06, + "loss": 0.337, + "step": 41000 + }, + { + "epoch": 120.59, + "eval_cer": 0.09219301686936053, + "eval_loss": 0.33047986030578613, + "eval_runtime": 4.9286, + "eval_samples_per_second": 72.84, + "eval_steps_per_second": 2.435, + "eval_wer": 0.3414476866032565, + "step": 41000 + }, + { + "epoch": 120.88, + "learning_rate": 9.563135854690617e-06, + "loss": 0.3345, + "step": 41100 + }, + { + "epoch": 121.18, + "learning_rate": 9.560985742963882e-06, + "loss": 0.3337, + "step": 41200 + }, + { + "epoch": 121.47, + "learning_rate": 9.558830596045055e-06, + "loss": 0.3205, + "step": 41300 + }, + { + "epoch": 121.76, + "learning_rate": 9.556670416313354e-06, + "loss": 0.3442, + "step": 41400 + }, + { + "epoch": 122.06, + "learning_rate": 9.554505206153552e-06, + "loss": 0.3381, + "step": 41500 + }, + { + "epoch": 122.35, + "learning_rate": 9.552334967955979e-06, + "loss": 0.3314, + "step": 41600 + }, + { + "epoch": 122.65, + "learning_rate": 9.55015970411651e-06, + "loss": 0.3291, + "step": 41700 + }, + { + "epoch": 122.94, + "learning_rate": 9.547979417036575e-06, + "loss": 0.3297, + "step": 41800 + }, + { + "epoch": 123.24, + "learning_rate": 9.54579410912314e-06, + "loss": 0.3262, + "step": 41900 + }, + { + "epoch": 123.53, + "learning_rate": 9.543603782788727e-06, + "loss": 0.3297, + "step": 42000 + }, + { + "epoch": 123.53, + "eval_cer": 0.09036223355564274, + "eval_loss": 0.33064666390419006, + "eval_runtime": 4.4896, + "eval_samples_per_second": 79.963, + "eval_steps_per_second": 2.673, + "eval_wer": 0.3311300983395131, + "step": 42000 + }, + { + "epoch": 123.82, + "learning_rate": 9.541408440451385e-06, + "loss": 0.3193, + "step": 42100 + }, + { + "epoch": 124.12, + "learning_rate": 9.539208084534708e-06, + "loss": 0.324, + "step": 42200 + }, + { + "epoch": 124.41, + "learning_rate": 9.537002717467826e-06, + "loss": 0.3244, + "step": 42300 + }, + { + "epoch": 124.71, + "learning_rate": 9.534792341685395e-06, + "loss": 0.3289, + "step": 42400 + }, + { + "epoch": 125.0, + "learning_rate": 9.532576959627604e-06, + "loss": 0.3297, + "step": 42500 + }, + { + "epoch": 125.29, + "learning_rate": 9.530356573740171e-06, + "loss": 0.3193, + "step": 42600 + }, + { + "epoch": 125.59, + "learning_rate": 9.528131186474335e-06, + "loss": 0.3198, + "step": 42700 + }, + { + "epoch": 125.88, + "learning_rate": 9.525900800286855e-06, + "loss": 0.3172, + "step": 42800 + }, + { + "epoch": 126.18, + "learning_rate": 9.523665417640016e-06, + "loss": 0.3288, + "step": 42900 + }, + { + "epoch": 126.47, + "learning_rate": 9.521425041001606e-06, + "loss": 0.3229, + "step": 43000 + }, + { + "epoch": 126.47, + "eval_cer": 0.09123403513360359, + "eval_loss": 0.33507028222084045, + "eval_runtime": 4.4014, + "eval_samples_per_second": 81.566, + "eval_steps_per_second": 2.726, + "eval_wer": 0.33548283088827985, + "step": 43000 + }, + { + "epoch": 126.76, + "learning_rate": 9.519179672844941e-06, + "loss": 0.3121, + "step": 43100 + }, + { + "epoch": 127.06, + "learning_rate": 9.516929315648835e-06, + "loss": 0.3136, + "step": 43200 + }, + { + "epoch": 127.35, + "learning_rate": 9.51467397189762e-06, + "loss": 0.3205, + "step": 43300 + }, + { + "epoch": 127.65, + "learning_rate": 9.512413644081122e-06, + "loss": 0.322, + "step": 43400 + }, + { + "epoch": 127.94, + "learning_rate": 9.510148334694681e-06, + "loss": 0.3181, + "step": 43500 + }, + { + "epoch": 128.24, + "learning_rate": 9.50787804623913e-06, + "loss": 0.3117, + "step": 43600 + }, + { + "epoch": 128.53, + "learning_rate": 9.505602781220798e-06, + "loss": 0.3191, + "step": 43700 + }, + { + "epoch": 128.82, + "learning_rate": 9.503322542151511e-06, + "loss": 0.3155, + "step": 43800 + }, + { + "epoch": 129.12, + "learning_rate": 9.501037331548584e-06, + "loss": 0.3125, + "step": 43900 + }, + { + "epoch": 129.41, + "learning_rate": 9.49874715193482e-06, + "loss": 0.3099, + "step": 44000 + }, + { + "epoch": 129.41, + "eval_cer": 0.08870581055751711, + "eval_loss": 0.3309319317340851, + "eval_runtime": 4.8326, + "eval_samples_per_second": 74.288, + "eval_steps_per_second": 2.483, + "eval_wer": 0.3283894889569563, + "step": 44000 + }, + { + "epoch": 129.71, + "learning_rate": 9.496452005838512e-06, + "loss": 0.314, + "step": 44100 + }, + { + "epoch": 130.0, + "learning_rate": 9.494151895793431e-06, + "loss": 0.3089, + "step": 44200 + }, + { + "epoch": 130.29, + "learning_rate": 9.491846824338831e-06, + "loss": 0.3162, + "step": 44300 + }, + { + "epoch": 130.59, + "learning_rate": 9.48953679401944e-06, + "loss": 0.3042, + "step": 44400 + }, + { + "epoch": 130.88, + "learning_rate": 9.487221807385463e-06, + "loss": 0.3177, + "step": 44500 + }, + { + "epoch": 131.18, + "learning_rate": 9.484901866992578e-06, + "loss": 0.3209, + "step": 44600 + }, + { + "epoch": 131.47, + "learning_rate": 9.48260024881784e-06, + "loss": 0.3126, + "step": 44700 + }, + { + "epoch": 131.76, + "learning_rate": 9.480270458069627e-06, + "loss": 0.2984, + "step": 44800 + }, + { + "epoch": 132.06, + "learning_rate": 9.477935721236585e-06, + "loss": 0.3085, + "step": 44900 + }, + { + "epoch": 132.35, + "learning_rate": 9.475596040896196e-06, + "loss": 0.3123, + "step": 45000 + }, + { + "epoch": 132.35, + "eval_cer": 0.09040582363454078, + "eval_loss": 0.33625489473342896, + "eval_runtime": 5.2006, + "eval_samples_per_second": 69.03, + "eval_steps_per_second": 2.307, + "eval_wer": 0.3364501047880058, + "step": 45000 + }, + { + "epoch": 132.65, + "learning_rate": 9.473251419631397e-06, + "loss": 0.3057, + "step": 45100 + }, + { + "epoch": 132.94, + "learning_rate": 9.47090186003058e-06, + "loss": 0.302, + "step": 45200 + }, + { + "epoch": 133.24, + "learning_rate": 9.468547364687589e-06, + "loss": 0.3071, + "step": 45300 + }, + { + "epoch": 133.53, + "learning_rate": 9.466187936201714e-06, + "loss": 0.2985, + "step": 45400 + }, + { + "epoch": 133.82, + "learning_rate": 9.463823577177698e-06, + "loss": 0.3045, + "step": 45500 + }, + { + "epoch": 134.12, + "learning_rate": 9.461454290225717e-06, + "loss": 0.31, + "step": 45600 + }, + { + "epoch": 134.41, + "learning_rate": 9.4590800779614e-06, + "loss": 0.3005, + "step": 45700 + }, + { + "epoch": 134.71, + "learning_rate": 9.4567009430058e-06, + "loss": 0.2996, + "step": 45800 + }, + { + "epoch": 135.0, + "learning_rate": 9.454316887985417e-06, + "loss": 0.2984, + "step": 45900 + }, + { + "epoch": 135.29, + "learning_rate": 9.45192791553217e-06, + "loss": 0.3057, + "step": 46000 + }, + { + "epoch": 135.29, + "eval_cer": 0.0899263327666623, + "eval_loss": 0.329167902469635, + "eval_runtime": 5.0924, + "eval_samples_per_second": 70.498, + "eval_steps_per_second": 2.356, + "eval_wer": 0.3359664678381428, + "step": 46000 + }, + { + "epoch": 135.59, + "learning_rate": 9.44953402828342e-06, + "loss": 0.3065, + "step": 46100 + }, + { + "epoch": 135.88, + "learning_rate": 9.447135228881942e-06, + "loss": 0.2978, + "step": 46200 + }, + { + "epoch": 136.18, + "learning_rate": 9.44473151997594e-06, + "loss": 0.2965, + "step": 46300 + }, + { + "epoch": 136.47, + "learning_rate": 9.44232290421904e-06, + "loss": 0.2928, + "step": 46400 + }, + { + "epoch": 136.76, + "learning_rate": 9.439909384270277e-06, + "loss": 0.3002, + "step": 46500 + }, + { + "epoch": 137.06, + "learning_rate": 9.437490962794108e-06, + "loss": 0.3014, + "step": 46600 + }, + { + "epoch": 137.35, + "learning_rate": 9.435067642460396e-06, + "loss": 0.2988, + "step": 46700 + }, + { + "epoch": 137.65, + "learning_rate": 9.432639425944417e-06, + "loss": 0.2897, + "step": 46800 + }, + { + "epoch": 137.94, + "learning_rate": 9.430206315926848e-06, + "loss": 0.301, + "step": 46900 + }, + { + "epoch": 138.24, + "learning_rate": 9.427768315093772e-06, + "loss": 0.304, + "step": 47000 + }, + { + "epoch": 138.24, + "eval_cer": 0.08805195937404647, + "eval_loss": 0.32851627469062805, + "eval_runtime": 5.1462, + "eval_samples_per_second": 69.76, + "eval_steps_per_second": 2.332, + "eval_wer": 0.3300016121231662, + "step": 47000 + }, + { + "epoch": 138.53, + "learning_rate": 9.425325426136666e-06, + "loss": 0.3, + "step": 47100 + }, + { + "epoch": 138.82, + "learning_rate": 9.422877651752406e-06, + "loss": 0.3031, + "step": 47200 + }, + { + "epoch": 139.12, + "learning_rate": 9.42044954537496e-06, + "loss": 0.2905, + "step": 47300 + }, + { + "epoch": 139.41, + "learning_rate": 9.417992057035348e-06, + "loss": 0.2997, + "step": 47400 + }, + { + "epoch": 139.71, + "learning_rate": 9.415529691364405e-06, + "loss": 0.3007, + "step": 47500 + }, + { + "epoch": 140.0, + "learning_rate": 9.413062451080509e-06, + "loss": 0.2976, + "step": 47600 + }, + { + "epoch": 140.29, + "learning_rate": 9.410590338907417e-06, + "loss": 0.2914, + "step": 47700 + }, + { + "epoch": 140.59, + "learning_rate": 9.40811335757427e-06, + "loss": 0.2941, + "step": 47800 + }, + { + "epoch": 140.88, + "learning_rate": 9.405631509815582e-06, + "loss": 0.3046, + "step": 47900 + }, + { + "epoch": 141.18, + "learning_rate": 9.403144798371238e-06, + "loss": 0.2888, + "step": 48000 + }, + { + "epoch": 141.18, + "eval_cer": 0.0869622074015954, + "eval_loss": 0.3325551450252533, + "eval_runtime": 4.8817, + "eval_samples_per_second": 73.54, + "eval_steps_per_second": 2.458, + "eval_wer": 0.3282282766403353, + "step": 48000 + }, + { + "epoch": 141.47, + "learning_rate": 9.40065322598649e-06, + "loss": 0.2881, + "step": 48100 + }, + { + "epoch": 141.76, + "learning_rate": 9.398156795411963e-06, + "loss": 0.2817, + "step": 48200 + }, + { + "epoch": 142.06, + "learning_rate": 9.395680546289059e-06, + "loss": 0.2959, + "step": 48300 + }, + { + "epoch": 142.35, + "learning_rate": 9.393174456121325e-06, + "loss": 0.2927, + "step": 48400 + }, + { + "epoch": 142.65, + "learning_rate": 9.390663516020151e-06, + "loss": 0.2758, + "step": 48500 + }, + { + "epoch": 142.94, + "learning_rate": 9.388147728757537e-06, + "loss": 0.2924, + "step": 48600 + }, + { + "epoch": 143.24, + "learning_rate": 9.385627097110841e-06, + "loss": 0.2873, + "step": 48700 + }, + { + "epoch": 143.53, + "learning_rate": 9.38310162386276e-06, + "loss": 0.2857, + "step": 48800 + }, + { + "epoch": 143.82, + "learning_rate": 9.380571311801346e-06, + "loss": 0.2893, + "step": 48900 + }, + { + "epoch": 144.12, + "learning_rate": 9.378036163719985e-06, + "loss": 0.2832, + "step": 49000 + }, + { + "epoch": 144.12, + "eval_cer": 0.0869622074015954, + "eval_loss": 0.33355438709259033, + "eval_runtime": 5.3667, + "eval_samples_per_second": 66.894, + "eval_steps_per_second": 2.236, + "eval_wer": 0.3266161534741254, + "step": 49000 + }, + { + "epoch": 144.41, + "learning_rate": 9.375496182417404e-06, + "loss": 0.2903, + "step": 49100 + }, + { + "epoch": 144.71, + "learning_rate": 9.372951370697672e-06, + "loss": 0.2803, + "step": 49200 + }, + { + "epoch": 145.0, + "learning_rate": 9.370401731370179e-06, + "loss": 0.2853, + "step": 49300 + }, + { + "epoch": 145.29, + "learning_rate": 9.367847267249653e-06, + "loss": 0.287, + "step": 49400 + }, + { + "epoch": 145.59, + "learning_rate": 9.365287981156147e-06, + "loss": 0.2842, + "step": 49500 + }, + { + "epoch": 145.88, + "learning_rate": 9.362723875915033e-06, + "loss": 0.2797, + "step": 49600 + }, + { + "epoch": 146.18, + "learning_rate": 9.360154954357012e-06, + "loss": 0.2833, + "step": 49700 + }, + { + "epoch": 146.47, + "learning_rate": 9.357581219318092e-06, + "loss": 0.2881, + "step": 49800 + }, + { + "epoch": 146.76, + "learning_rate": 9.355002673639604e-06, + "loss": 0.2759, + "step": 49900 + }, + { + "epoch": 147.06, + "learning_rate": 9.352419320168182e-06, + "loss": 0.2812, + "step": 50000 + }, + { + "epoch": 147.06, + "eval_cer": 0.08652630661261497, + "eval_loss": 0.3421614170074463, + "eval_runtime": 5.2345, + "eval_samples_per_second": 68.583, + "eval_steps_per_second": 2.292, + "eval_wer": 0.32210220860873773, + "step": 50000 + }, + { + "epoch": 147.35, + "learning_rate": 9.34983116175577e-06, + "loss": 0.2795, + "step": 50100 + }, + { + "epoch": 147.65, + "learning_rate": 9.347238201259622e-06, + "loss": 0.2813, + "step": 50200 + }, + { + "epoch": 147.94, + "learning_rate": 9.344640441542285e-06, + "loss": 0.2888, + "step": 50300 + }, + { + "epoch": 148.24, + "learning_rate": 9.342037885471612e-06, + "loss": 0.2841, + "step": 50400 + }, + { + "epoch": 148.53, + "learning_rate": 9.339430535920744e-06, + "loss": 0.2747, + "step": 50500 + }, + { + "epoch": 148.82, + "learning_rate": 9.336818395768117e-06, + "loss": 0.2747, + "step": 50600 + }, + { + "epoch": 149.12, + "learning_rate": 9.334201467897458e-06, + "loss": 0.2762, + "step": 50700 + }, + { + "epoch": 149.41, + "learning_rate": 9.331579755197777e-06, + "loss": 0.2795, + "step": 50800 + }, + { + "epoch": 149.71, + "learning_rate": 9.32897954917077e-06, + "loss": 0.2718, + "step": 50900 + }, + { + "epoch": 150.0, + "learning_rate": 9.32634832327718e-06, + "loss": 0.2809, + "step": 51000 + }, + { + "epoch": 150.0, + "eval_cer": 0.0866570768493091, + "eval_loss": 0.3332664370536804, + "eval_runtime": 4.6401, + "eval_samples_per_second": 77.369, + "eval_steps_per_second": 2.586, + "eval_wer": 0.32532645494115753, + "step": 51000 + }, + { + "epoch": 150.29, + "learning_rate": 9.323712321224206e-06, + "loss": 0.2733, + "step": 51100 + }, + { + "epoch": 150.59, + "learning_rate": 9.321071545921912e-06, + "loss": 0.2667, + "step": 51200 + }, + { + "epoch": 150.88, + "learning_rate": 9.318426000285638e-06, + "loss": 0.285, + "step": 51300 + }, + { + "epoch": 151.18, + "learning_rate": 9.315775687235985e-06, + "loss": 0.2748, + "step": 51400 + }, + { + "epoch": 151.47, + "learning_rate": 9.313120609698822e-06, + "loss": 0.2712, + "step": 51500 + }, + { + "epoch": 151.76, + "learning_rate": 9.310460770605275e-06, + "loss": 0.27, + "step": 51600 + }, + { + "epoch": 152.06, + "learning_rate": 9.307796172891725e-06, + "loss": 0.278, + "step": 51700 + }, + { + "epoch": 152.35, + "learning_rate": 9.30512681949981e-06, + "loss": 0.2729, + "step": 51800 + }, + { + "epoch": 152.65, + "learning_rate": 9.302452713376417e-06, + "loss": 0.2729, + "step": 51900 + }, + { + "epoch": 152.94, + "learning_rate": 9.299773857473677e-06, + "loss": 0.2714, + "step": 52000 + }, + { + "epoch": 152.94, + "eval_cer": 0.08609040582363454, + "eval_loss": 0.32614585757255554, + "eval_runtime": 4.6598, + "eval_samples_per_second": 77.042, + "eval_steps_per_second": 2.575, + "eval_wer": 0.3238755440915686, + "step": 52000 + }, + { + "epoch": 153.24, + "learning_rate": 9.297090254748968e-06, + "loss": 0.2639, + "step": 52100 + }, + { + "epoch": 153.53, + "learning_rate": 9.294401908164907e-06, + "loss": 0.2636, + "step": 52200 + }, + { + "epoch": 153.82, + "learning_rate": 9.291708820689352e-06, + "loss": 0.274, + "step": 52300 + }, + { + "epoch": 154.12, + "learning_rate": 9.289010995295385e-06, + "loss": 0.2677, + "step": 52400 + }, + { + "epoch": 154.41, + "learning_rate": 9.286308434961327e-06, + "loss": 0.2707, + "step": 52500 + }, + { + "epoch": 154.71, + "learning_rate": 9.283601142670726e-06, + "loss": 0.2779, + "step": 52600 + }, + { + "epoch": 155.0, + "learning_rate": 9.28088912141235e-06, + "loss": 0.2754, + "step": 52700 + }, + { + "epoch": 155.29, + "learning_rate": 9.278172374180191e-06, + "loss": 0.2692, + "step": 52800 + }, + { + "epoch": 155.59, + "learning_rate": 9.275450903973456e-06, + "loss": 0.2626, + "step": 52900 + }, + { + "epoch": 155.88, + "learning_rate": 9.272724713796566e-06, + "loss": 0.2672, + "step": 53000 + }, + { + "epoch": 155.88, + "eval_cer": 0.08548014471906194, + "eval_loss": 0.3363560140132904, + "eval_runtime": 5.1126, + "eval_samples_per_second": 70.218, + "eval_steps_per_second": 2.347, + "eval_wer": 0.3203288731259068, + "step": 53000 + }, + { + "epoch": 156.18, + "learning_rate": 9.269993806659154e-06, + "loss": 0.2577, + "step": 53100 + }, + { + "epoch": 156.47, + "learning_rate": 9.26725818557606e-06, + "loss": 0.2576, + "step": 53200 + }, + { + "epoch": 156.76, + "learning_rate": 9.26451785356733e-06, + "loss": 0.2611, + "step": 53300 + }, + { + "epoch": 157.06, + "learning_rate": 9.261772813658206e-06, + "loss": 0.2618, + "step": 53400 + }, + { + "epoch": 157.35, + "learning_rate": 9.259023068879129e-06, + "loss": 0.2622, + "step": 53500 + }, + { + "epoch": 157.65, + "learning_rate": 9.25626862226574e-06, + "loss": 0.2703, + "step": 53600 + }, + { + "epoch": 157.94, + "learning_rate": 9.253509476858861e-06, + "loss": 0.2649, + "step": 53700 + }, + { + "epoch": 158.24, + "learning_rate": 9.25074563570451e-06, + "loss": 0.2642, + "step": 53800 + }, + { + "epoch": 158.53, + "learning_rate": 9.247977101853883e-06, + "loss": 0.2607, + "step": 53900 + }, + { + "epoch": 158.82, + "learning_rate": 9.245203878363358e-06, + "loss": 0.2697, + "step": 54000 + }, + { + "epoch": 158.82, + "eval_cer": 0.08343141101085393, + "eval_loss": 0.3369295001029968, + "eval_runtime": 5.4163, + "eval_samples_per_second": 66.282, + "eval_steps_per_second": 2.216, + "eval_wer": 0.3117846203449944, + "step": 54000 + }, + { + "epoch": 159.12, + "learning_rate": 9.242425968294492e-06, + "loss": 0.2545, + "step": 54100 + }, + { + "epoch": 159.41, + "learning_rate": 9.239643374714014e-06, + "loss": 0.2519, + "step": 54200 + }, + { + "epoch": 159.71, + "learning_rate": 9.236856100693828e-06, + "loss": 0.2657, + "step": 54300 + }, + { + "epoch": 160.0, + "learning_rate": 9.234064149310995e-06, + "loss": 0.2644, + "step": 54400 + }, + { + "epoch": 160.29, + "learning_rate": 9.23126752364775e-06, + "loss": 0.2577, + "step": 54500 + }, + { + "epoch": 160.59, + "learning_rate": 9.228466226791484e-06, + "loss": 0.2632, + "step": 54600 + }, + { + "epoch": 160.88, + "learning_rate": 9.225660261834746e-06, + "loss": 0.2579, + "step": 54700 + }, + { + "epoch": 161.18, + "learning_rate": 9.222849631875233e-06, + "loss": 0.2599, + "step": 54800 + }, + { + "epoch": 161.47, + "learning_rate": 9.220034340015803e-06, + "loss": 0.2576, + "step": 54900 + }, + { + "epoch": 161.76, + "learning_rate": 9.217214389364448e-06, + "loss": 0.2557, + "step": 55000 + }, + { + "epoch": 161.76, + "eval_cer": 0.08504424393008152, + "eval_loss": 0.33482369780540466, + "eval_runtime": 4.9338, + "eval_samples_per_second": 72.764, + "eval_steps_per_second": 2.432, + "eval_wer": 0.31678220216024505, + "step": 55000 + }, + { + "epoch": 162.06, + "learning_rate": 9.214418052132991e-06, + "loss": 0.2633, + "step": 55100 + }, + { + "epoch": 162.35, + "learning_rate": 9.211588839752508e-06, + "loss": 0.2735, + "step": 55200 + }, + { + "epoch": 162.65, + "learning_rate": 9.208754977903685e-06, + "loss": 0.2596, + "step": 55300 + }, + { + "epoch": 162.94, + "learning_rate": 9.205916469715018e-06, + "loss": 0.2607, + "step": 55400 + }, + { + "epoch": 163.24, + "learning_rate": 9.203073318320138e-06, + "loss": 0.2635, + "step": 55500 + }, + { + "epoch": 163.53, + "learning_rate": 9.200225526857794e-06, + "loss": 0.2498, + "step": 55600 + }, + { + "epoch": 163.82, + "learning_rate": 9.197373098471868e-06, + "loss": 0.2624, + "step": 55700 + }, + { + "epoch": 164.12, + "learning_rate": 9.194516036311354e-06, + "loss": 0.2563, + "step": 55800 + }, + { + "epoch": 164.41, + "learning_rate": 9.191654343530363e-06, + "loss": 0.2477, + "step": 55900 + }, + { + "epoch": 164.71, + "learning_rate": 9.188788023288119e-06, + "loss": 0.2481, + "step": 56000 + }, + { + "epoch": 164.71, + "eval_cer": 0.084521162983305, + "eval_loss": 0.3317776620388031, + "eval_runtime": 4.9296, + "eval_samples_per_second": 72.825, + "eval_steps_per_second": 2.434, + "eval_wer": 0.3143640174109302, + "step": 56000 + }, + { + "epoch": 165.0, + "learning_rate": 9.185917078748954e-06, + "loss": 0.2539, + "step": 56100 + }, + { + "epoch": 165.29, + "learning_rate": 9.183041513082305e-06, + "loss": 0.2472, + "step": 56200 + }, + { + "epoch": 165.59, + "learning_rate": 9.180161329462708e-06, + "loss": 0.2495, + "step": 56300 + }, + { + "epoch": 165.88, + "learning_rate": 9.177276531069804e-06, + "loss": 0.2523, + "step": 56400 + }, + { + "epoch": 166.18, + "learning_rate": 9.174387121088321e-06, + "loss": 0.2498, + "step": 56500 + }, + { + "epoch": 166.47, + "learning_rate": 9.171493102708084e-06, + "loss": 0.2514, + "step": 56600 + }, + { + "epoch": 166.76, + "learning_rate": 9.168594479124003e-06, + "loss": 0.2484, + "step": 56700 + }, + { + "epoch": 167.06, + "learning_rate": 9.165691253536068e-06, + "loss": 0.2464, + "step": 56800 + }, + { + "epoch": 167.35, + "learning_rate": 9.162783429149358e-06, + "loss": 0.2405, + "step": 56900 + }, + { + "epoch": 167.65, + "learning_rate": 9.15987100917402e-06, + "loss": 0.254, + "step": 57000 + }, + { + "epoch": 167.65, + "eval_cer": 0.08356218124754806, + "eval_loss": 0.3432825803756714, + "eval_runtime": 4.4479, + "eval_samples_per_second": 80.713, + "eval_steps_per_second": 2.698, + "eval_wer": 0.3121070449782363, + "step": 57000 + }, + { + "epoch": 167.94, + "learning_rate": 9.156953996825281e-06, + "loss": 0.2475, + "step": 57100 + }, + { + "epoch": 168.24, + "learning_rate": 9.154032395323438e-06, + "loss": 0.254, + "step": 57200 + }, + { + "epoch": 168.53, + "learning_rate": 9.151106207893846e-06, + "loss": 0.2501, + "step": 57300 + }, + { + "epoch": 168.82, + "learning_rate": 9.148175437766935e-06, + "loss": 0.2431, + "step": 57400 + }, + { + "epoch": 169.12, + "learning_rate": 9.145240088178183e-06, + "loss": 0.2534, + "step": 57500 + }, + { + "epoch": 169.41, + "learning_rate": 9.142329584267872e-06, + "loss": 0.2476, + "step": 57600 + }, + { + "epoch": 169.71, + "learning_rate": 9.139385131195785e-06, + "loss": 0.2359, + "step": 57700 + }, + { + "epoch": 170.0, + "learning_rate": 9.136436108366091e-06, + "loss": 0.2545, + "step": 57800 + }, + { + "epoch": 170.29, + "learning_rate": 9.133482519034428e-06, + "loss": 0.2479, + "step": 57900 + }, + { + "epoch": 170.59, + "learning_rate": 9.13052436646147e-06, + "loss": 0.2454, + "step": 58000 + }, + { + "epoch": 170.59, + "eval_cer": 0.08212370864391265, + "eval_loss": 0.3390425443649292, + "eval_runtime": 4.4296, + "eval_samples_per_second": 81.045, + "eval_steps_per_second": 2.709, + "eval_wer": 0.3088827986458165, + "step": 58000 + }, + { + "epoch": 170.88, + "learning_rate": 9.127561653912929e-06, + "loss": 0.2439, + "step": 58100 + }, + { + "epoch": 171.18, + "learning_rate": 9.12459438465955e-06, + "loss": 0.2415, + "step": 58200 + }, + { + "epoch": 171.47, + "learning_rate": 9.121622561977108e-06, + "loss": 0.251, + "step": 58300 + }, + { + "epoch": 171.76, + "learning_rate": 9.118646189146411e-06, + "loss": 0.2406, + "step": 58400 + }, + { + "epoch": 172.06, + "learning_rate": 9.115665269453284e-06, + "loss": 0.2458, + "step": 58500 + }, + { + "epoch": 172.35, + "learning_rate": 9.11267980618857e-06, + "loss": 0.2376, + "step": 58600 + }, + { + "epoch": 172.65, + "learning_rate": 9.109689802648138e-06, + "loss": 0.2432, + "step": 58700 + }, + { + "epoch": 172.94, + "learning_rate": 9.106695262132857e-06, + "loss": 0.2409, + "step": 58800 + }, + { + "epoch": 173.24, + "learning_rate": 9.10369618794861e-06, + "loss": 0.2432, + "step": 58900 + }, + { + "epoch": 173.53, + "learning_rate": 9.10069258340629e-06, + "loss": 0.239, + "step": 59000 + }, + { + "epoch": 173.53, + "eval_cer": 0.08295192014297546, + "eval_loss": 0.34216058254241943, + "eval_runtime": 5.0698, + "eval_samples_per_second": 70.811, + "eval_steps_per_second": 2.367, + "eval_wer": 0.3133967435112043, + "step": 59000 + }, + { + "epoch": 173.82, + "learning_rate": 9.097684451821783e-06, + "loss": 0.237, + "step": 59100 + }, + { + "epoch": 174.12, + "learning_rate": 9.094671796515979e-06, + "loss": 0.2288, + "step": 59200 + }, + { + "epoch": 174.41, + "learning_rate": 9.091654620814756e-06, + "loss": 0.2372, + "step": 59300 + }, + { + "epoch": 174.71, + "learning_rate": 9.088632928048988e-06, + "loss": 0.2379, + "step": 59400 + }, + { + "epoch": 175.0, + "learning_rate": 9.085606721554536e-06, + "loss": 0.2377, + "step": 59500 + }, + { + "epoch": 175.29, + "learning_rate": 9.082576004672238e-06, + "loss": 0.2292, + "step": 59600 + }, + { + "epoch": 175.59, + "learning_rate": 9.079540780747916e-06, + "loss": 0.2307, + "step": 59700 + }, + { + "epoch": 175.88, + "learning_rate": 9.076501053132367e-06, + "loss": 0.2442, + "step": 59800 + }, + { + "epoch": 176.18, + "learning_rate": 9.07345682518136e-06, + "loss": 0.2385, + "step": 59900 + }, + { + "epoch": 176.47, + "learning_rate": 9.070408100255632e-06, + "loss": 0.2358, + "step": 60000 + }, + { + "epoch": 176.47, + "eval_cer": 0.08247242927509699, + "eval_loss": 0.34609493613243103, + "eval_runtime": 5.0633, + "eval_samples_per_second": 70.902, + "eval_steps_per_second": 2.37, + "eval_wer": 0.31194583266161535, + "step": 60000 + }, + { + "epoch": 176.76, + "learning_rate": 9.067354881720881e-06, + "loss": 0.2394, + "step": 60100 + }, + { + "epoch": 177.06, + "learning_rate": 9.064297172947772e-06, + "loss": 0.2336, + "step": 60200 + }, + { + "epoch": 177.35, + "learning_rate": 9.061265621467159e-06, + "loss": 0.2455, + "step": 60300 + }, + { + "epoch": 177.65, + "learning_rate": 9.058198987167215e-06, + "loss": 0.2339, + "step": 60400 + }, + { + "epoch": 177.94, + "learning_rate": 9.05512787273675e-06, + "loss": 0.2365, + "step": 60500 + }, + { + "epoch": 178.24, + "learning_rate": 9.052052281566177e-06, + "loss": 0.2398, + "step": 60600 + }, + { + "epoch": 178.53, + "learning_rate": 9.04897221705086e-06, + "loss": 0.2351, + "step": 60700 + }, + { + "epoch": 178.82, + "learning_rate": 9.045887682591096e-06, + "loss": 0.2369, + "step": 60800 + }, + { + "epoch": 179.12, + "learning_rate": 9.042798681592122e-06, + "loss": 0.2355, + "step": 60900 + }, + { + "epoch": 179.41, + "learning_rate": 9.039705217464103e-06, + "loss": 0.2321, + "step": 61000 + }, + { + "epoch": 179.41, + "eval_cer": 0.08168780785493222, + "eval_loss": 0.3485713005065918, + "eval_runtime": 4.9102, + "eval_samples_per_second": 73.113, + "eval_steps_per_second": 2.444, + "eval_wer": 0.3075931001128486, + "step": 61000 + }, + { + "epoch": 179.71, + "learning_rate": 9.036607293622126e-06, + "loss": 0.24, + "step": 61100 + }, + { + "epoch": 180.0, + "learning_rate": 9.033504913486213e-06, + "loss": 0.2412, + "step": 61200 + }, + { + "epoch": 180.29, + "learning_rate": 9.030398080481293e-06, + "loss": 0.2303, + "step": 61300 + }, + { + "epoch": 180.59, + "learning_rate": 9.027286798037222e-06, + "loss": 0.2324, + "step": 61400 + }, + { + "epoch": 180.88, + "learning_rate": 9.024171069588759e-06, + "loss": 0.2271, + "step": 61500 + }, + { + "epoch": 181.18, + "learning_rate": 9.0210821222651e-06, + "loss": 0.2296, + "step": 61600 + }, + { + "epoch": 181.47, + "learning_rate": 9.01795755650591e-06, + "loss": 0.2331, + "step": 61700 + }, + { + "epoch": 181.76, + "learning_rate": 9.014828555041533e-06, + "loss": 0.233, + "step": 61800 + }, + { + "epoch": 182.06, + "learning_rate": 9.011695121326294e-06, + "loss": 0.2292, + "step": 61900 + }, + { + "epoch": 182.35, + "learning_rate": 9.008557258819412e-06, + "loss": 0.2254, + "step": 62000 + }, + { + "epoch": 182.35, + "eval_cer": 0.08125190706595178, + "eval_loss": 0.3570455014705658, + "eval_runtime": 4.4496, + "eval_samples_per_second": 80.681, + "eval_steps_per_second": 2.697, + "eval_wer": 0.3048524907302918, + "step": 62000 + }, + { + "epoch": 182.65, + "learning_rate": 9.005414970984991e-06, + "loss": 0.2275, + "step": 62100 + }, + { + "epoch": 182.94, + "learning_rate": 9.002268261292025e-06, + "loss": 0.2326, + "step": 62200 + }, + { + "epoch": 183.24, + "learning_rate": 8.999117133214384e-06, + "loss": 0.2203, + "step": 62300 + }, + { + "epoch": 183.53, + "learning_rate": 8.995961590230823e-06, + "loss": 0.2262, + "step": 62400 + }, + { + "epoch": 183.82, + "learning_rate": 8.992801635824966e-06, + "loss": 0.2349, + "step": 62500 + }, + { + "epoch": 184.12, + "learning_rate": 8.989637273485308e-06, + "loss": 0.2266, + "step": 62600 + }, + { + "epoch": 184.41, + "learning_rate": 8.986468506705211e-06, + "loss": 0.2297, + "step": 62700 + }, + { + "epoch": 184.71, + "learning_rate": 8.983295338982898e-06, + "loss": 0.2277, + "step": 62800 + }, + { + "epoch": 185.0, + "learning_rate": 8.980117773821452e-06, + "loss": 0.2191, + "step": 62900 + }, + { + "epoch": 185.29, + "learning_rate": 8.976935814728811e-06, + "loss": 0.2243, + "step": 63000 + }, + { + "epoch": 185.29, + "eval_cer": 0.081469857460442, + "eval_loss": 0.3529977798461914, + "eval_runtime": 5.5886, + "eval_samples_per_second": 64.238, + "eval_steps_per_second": 2.147, + "eval_wer": 0.30146703208125103, + "step": 63000 + }, + { + "epoch": 185.59, + "learning_rate": 8.973749465217761e-06, + "loss": 0.2322, + "step": 63100 + }, + { + "epoch": 185.88, + "learning_rate": 8.970558728805939e-06, + "loss": 0.2267, + "step": 63200 + }, + { + "epoch": 186.18, + "learning_rate": 8.96736360901582e-06, + "loss": 0.2199, + "step": 63300 + }, + { + "epoch": 186.47, + "learning_rate": 8.964164109374725e-06, + "loss": 0.2243, + "step": 63400 + }, + { + "epoch": 186.76, + "learning_rate": 8.9609602334148e-06, + "loss": 0.2279, + "step": 63500 + }, + { + "epoch": 187.06, + "learning_rate": 8.957751984673035e-06, + "loss": 0.2254, + "step": 63600 + }, + { + "epoch": 187.35, + "learning_rate": 8.954539366691238e-06, + "loss": 0.2284, + "step": 63700 + }, + { + "epoch": 187.65, + "learning_rate": 8.951354574451317e-06, + "loss": 0.225, + "step": 63800 + }, + { + "epoch": 187.94, + "learning_rate": 8.948133272238002e-06, + "loss": 0.2196, + "step": 63900 + }, + { + "epoch": 188.24, + "learning_rate": 8.944907611403423e-06, + "loss": 0.2238, + "step": 64000 + }, + { + "epoch": 188.24, + "eval_cer": 0.08094677651366548, + "eval_loss": 0.35666173696517944, + "eval_runtime": 5.2701, + "eval_samples_per_second": 68.12, + "eval_steps_per_second": 2.277, + "eval_wer": 0.2988876350153152, + "step": 64000 + }, + { + "epoch": 188.53, + "learning_rate": 8.941677595508617e-06, + "loss": 0.2272, + "step": 64100 + }, + { + "epoch": 188.82, + "learning_rate": 8.938443228119427e-06, + "loss": 0.23, + "step": 64200 + }, + { + "epoch": 189.12, + "learning_rate": 8.935204512806494e-06, + "loss": 0.2261, + "step": 64300 + }, + { + "epoch": 189.41, + "learning_rate": 8.931993905234649e-06, + "loss": 0.2222, + "step": 64400 + }, + { + "epoch": 189.71, + "learning_rate": 8.928746548195306e-06, + "loss": 0.2331, + "step": 64500 + }, + { + "epoch": 190.0, + "learning_rate": 8.925494853937067e-06, + "loss": 0.2166, + "step": 64600 + }, + { + "epoch": 190.29, + "learning_rate": 8.922238826049705e-06, + "loss": 0.2224, + "step": 64700 + }, + { + "epoch": 190.59, + "learning_rate": 8.918978468127777e-06, + "loss": 0.213, + "step": 64800 + }, + { + "epoch": 190.88, + "learning_rate": 8.915713783770622e-06, + "loss": 0.2186, + "step": 64900 + }, + { + "epoch": 191.18, + "learning_rate": 8.912444776582354e-06, + "loss": 0.2143, + "step": 65000 + }, + { + "epoch": 191.18, + "eval_cer": 0.08016215509350072, + "eval_loss": 0.3535269796848297, + "eval_runtime": 4.4256, + "eval_samples_per_second": 81.12, + "eval_steps_per_second": 2.712, + "eval_wer": 0.3001773335482831, + "step": 65000 + }, + { + "epoch": 191.47, + "learning_rate": 8.909171450171858e-06, + "loss": 0.2201, + "step": 65100 + }, + { + "epoch": 191.76, + "learning_rate": 8.90589380815279e-06, + "loss": 0.215, + "step": 65200 + }, + { + "epoch": 192.06, + "learning_rate": 8.902611854143569e-06, + "loss": 0.218, + "step": 65300 + }, + { + "epoch": 192.35, + "learning_rate": 8.899325591767371e-06, + "loss": 0.2169, + "step": 65400 + }, + { + "epoch": 192.65, + "learning_rate": 8.896035024652135e-06, + "loss": 0.218, + "step": 65500 + }, + { + "epoch": 192.94, + "learning_rate": 8.892740156430548e-06, + "loss": 0.2225, + "step": 65600 + }, + { + "epoch": 193.24, + "learning_rate": 8.889440990740048e-06, + "loss": 0.2191, + "step": 65700 + }, + { + "epoch": 193.53, + "learning_rate": 8.886137531222812e-06, + "loss": 0.2262, + "step": 65800 + }, + { + "epoch": 193.82, + "learning_rate": 8.882829781525762e-06, + "loss": 0.219, + "step": 65900 + }, + { + "epoch": 194.12, + "learning_rate": 8.879517745300557e-06, + "loss": 0.2068, + "step": 66000 + }, + { + "epoch": 194.12, + "eval_cer": 0.0793339435944379, + "eval_loss": 0.35546955466270447, + "eval_runtime": 4.9742, + "eval_samples_per_second": 72.173, + "eval_steps_per_second": 2.412, + "eval_wer": 0.2992100596485571, + "step": 66000 + }, + { + "epoch": 194.41, + "learning_rate": 8.876201426203583e-06, + "loss": 0.2166, + "step": 66100 + }, + { + "epoch": 194.71, + "learning_rate": 8.872880827895957e-06, + "loss": 0.2128, + "step": 66200 + }, + { + "epoch": 195.0, + "learning_rate": 8.869555954043525e-06, + "loss": 0.2172, + "step": 66300 + }, + { + "epoch": 195.29, + "learning_rate": 8.866226808316844e-06, + "loss": 0.2199, + "step": 66400 + }, + { + "epoch": 195.59, + "learning_rate": 8.862893394391192e-06, + "loss": 0.2214, + "step": 66500 + }, + { + "epoch": 195.88, + "learning_rate": 8.859555715946561e-06, + "loss": 0.2143, + "step": 66600 + }, + { + "epoch": 196.18, + "learning_rate": 8.856213776667646e-06, + "loss": 0.2128, + "step": 66700 + }, + { + "epoch": 196.47, + "learning_rate": 8.85286758024385e-06, + "loss": 0.2083, + "step": 66800 + }, + { + "epoch": 196.76, + "learning_rate": 8.84951713036927e-06, + "loss": 0.2139, + "step": 66900 + }, + { + "epoch": 197.06, + "learning_rate": 8.846162430742708e-06, + "loss": 0.2177, + "step": 67000 + }, + { + "epoch": 197.06, + "eval_cer": 0.0796390741467242, + "eval_loss": 0.3596145808696747, + "eval_runtime": 4.9633, + "eval_samples_per_second": 72.331, + "eval_steps_per_second": 2.418, + "eval_wer": 0.300822182814767, + "step": 67000 + }, + { + "epoch": 197.35, + "learning_rate": 8.842803485067648e-06, + "loss": 0.2133, + "step": 67100 + }, + { + "epoch": 197.65, + "learning_rate": 8.839440297052269e-06, + "loss": 0.2151, + "step": 67200 + }, + { + "epoch": 197.94, + "learning_rate": 8.836072870409429e-06, + "loss": 0.229, + "step": 67300 + }, + { + "epoch": 198.24, + "learning_rate": 8.832701208856665e-06, + "loss": 0.2118, + "step": 67400 + }, + { + "epoch": 198.53, + "learning_rate": 8.829325316116191e-06, + "loss": 0.2137, + "step": 67500 + }, + { + "epoch": 198.82, + "learning_rate": 8.825945195914893e-06, + "loss": 0.2113, + "step": 67600 + }, + { + "epoch": 199.12, + "learning_rate": 8.822560851984324e-06, + "loss": 0.2267, + "step": 67700 + }, + { + "epoch": 199.41, + "learning_rate": 8.819172288060696e-06, + "loss": 0.2123, + "step": 67800 + }, + { + "epoch": 199.71, + "learning_rate": 8.815779507884882e-06, + "loss": 0.2234, + "step": 67900 + }, + { + "epoch": 200.0, + "learning_rate": 8.812382515202413e-06, + "loss": 0.214, + "step": 68000 + }, + { + "epoch": 200.0, + "eval_cer": 0.08020574517239876, + "eval_loss": 0.3504684865474701, + "eval_runtime": 4.4424, + "eval_samples_per_second": 80.812, + "eval_steps_per_second": 2.701, + "eval_wer": 0.3000161212316621, + "step": 68000 + }, + { + "epoch": 200.29, + "learning_rate": 8.808981313763467e-06, + "loss": 0.2106, + "step": 68100 + }, + { + "epoch": 200.59, + "learning_rate": 8.805575907322868e-06, + "loss": 0.2152, + "step": 68200 + }, + { + "epoch": 200.88, + "learning_rate": 8.80216629964008e-06, + "loss": 0.221, + "step": 68300 + }, + { + "epoch": 201.18, + "learning_rate": 8.798752494479213e-06, + "loss": 0.2061, + "step": 68400 + }, + { + "epoch": 201.47, + "learning_rate": 8.795334495609003e-06, + "loss": 0.2031, + "step": 68500 + }, + { + "epoch": 201.76, + "learning_rate": 8.79191230680282e-06, + "loss": 0.2065, + "step": 68600 + }, + { + "epoch": 202.06, + "learning_rate": 8.78848593183866e-06, + "loss": 0.2109, + "step": 68700 + }, + { + "epoch": 202.35, + "learning_rate": 8.785055374499135e-06, + "loss": 0.2076, + "step": 68800 + }, + { + "epoch": 202.65, + "learning_rate": 8.781620638571478e-06, + "loss": 0.2059, + "step": 68900 + }, + { + "epoch": 202.94, + "learning_rate": 8.778181727847537e-06, + "loss": 0.2027, + "step": 69000 + }, + { + "epoch": 202.94, + "eval_cer": 0.0793339435944379, + "eval_loss": 0.3646654784679413, + "eval_runtime": 4.806, + "eval_samples_per_second": 74.698, + "eval_steps_per_second": 2.497, + "eval_wer": 0.2956633886828954, + "step": 69000 + }, + { + "epoch": 203.24, + "learning_rate": 8.774738646123767e-06, + "loss": 0.1986, + "step": 69100 + }, + { + "epoch": 203.53, + "learning_rate": 8.771291397201227e-06, + "loss": 0.206, + "step": 69200 + }, + { + "epoch": 203.82, + "learning_rate": 8.76787451960502e-06, + "loss": 0.2011, + "step": 69300 + }, + { + "epoch": 204.12, + "learning_rate": 8.764418989283467e-06, + "loss": 0.2044, + "step": 69400 + }, + { + "epoch": 204.41, + "learning_rate": 8.760959303155737e-06, + "loss": 0.2121, + "step": 69500 + }, + { + "epoch": 204.71, + "learning_rate": 8.757495465041219e-06, + "loss": 0.2046, + "step": 69600 + }, + { + "epoch": 205.0, + "learning_rate": 8.75402747876389e-06, + "loss": 0.2066, + "step": 69700 + }, + { + "epoch": 205.29, + "learning_rate": 8.750555348152299e-06, + "loss": 0.2158, + "step": 69800 + }, + { + "epoch": 205.59, + "learning_rate": 8.747079077039577e-06, + "loss": 0.1984, + "step": 69900 + }, + { + "epoch": 205.88, + "learning_rate": 8.743598669263422e-06, + "loss": 0.2062, + "step": 70000 + }, + { + "epoch": 205.88, + "eval_cer": 0.0796390741467242, + "eval_loss": 0.3702377378940582, + "eval_runtime": 4.7589, + "eval_samples_per_second": 75.438, + "eval_steps_per_second": 2.522, + "eval_wer": 0.2975979364823472, + "step": 70000 + }, + { + "epoch": 206.18, + "learning_rate": 8.740114128666103e-06, + "loss": 0.2108, + "step": 70100 + }, + { + "epoch": 206.47, + "learning_rate": 8.736625459094445e-06, + "loss": 0.2085, + "step": 70200 + }, + { + "epoch": 206.76, + "learning_rate": 8.733132664399839e-06, + "loss": 0.2036, + "step": 70300 + }, + { + "epoch": 207.06, + "learning_rate": 8.729635748438225e-06, + "loss": 0.2005, + "step": 70400 + }, + { + "epoch": 207.35, + "learning_rate": 8.726134715070092e-06, + "loss": 0.207, + "step": 70500 + }, + { + "epoch": 207.65, + "learning_rate": 8.722629568160476e-06, + "loss": 0.2073, + "step": 70600 + }, + { + "epoch": 207.94, + "learning_rate": 8.71912031157896e-06, + "loss": 0.2015, + "step": 70700 + }, + { + "epoch": 208.24, + "learning_rate": 8.71560694919965e-06, + "loss": 0.1977, + "step": 70800 + }, + { + "epoch": 208.53, + "learning_rate": 8.712089484901201e-06, + "loss": 0.2027, + "step": 70900 + }, + { + "epoch": 208.82, + "learning_rate": 8.708567922566781e-06, + "loss": 0.2097, + "step": 71000 + }, + { + "epoch": 208.82, + "eval_cer": 0.07981343446231638, + "eval_loss": 0.3614213764667511, + "eval_runtime": 4.5359, + "eval_samples_per_second": 79.147, + "eval_steps_per_second": 2.646, + "eval_wer": 0.2972755118491053, + "step": 71000 + }, + { + "epoch": 209.12, + "learning_rate": 8.705042266084098e-06, + "loss": 0.2017, + "step": 71100 + }, + { + "epoch": 209.41, + "learning_rate": 8.701512519345366e-06, + "loss": 0.202, + "step": 71200 + }, + { + "epoch": 209.71, + "learning_rate": 8.69797868624732e-06, + "loss": 0.2067, + "step": 71300 + }, + { + "epoch": 210.0, + "learning_rate": 8.69444077069121e-06, + "loss": 0.2098, + "step": 71400 + }, + { + "epoch": 210.29, + "learning_rate": 8.690898776582786e-06, + "loss": 0.2027, + "step": 71500 + }, + { + "epoch": 210.59, + "learning_rate": 8.687352707832303e-06, + "loss": 0.1998, + "step": 71600 + }, + { + "epoch": 210.88, + "learning_rate": 8.683802568354519e-06, + "loss": 0.2014, + "step": 71700 + }, + { + "epoch": 211.18, + "learning_rate": 8.680248362068677e-06, + "loss": 0.1935, + "step": 71800 + }, + { + "epoch": 211.47, + "learning_rate": 8.676690092898518e-06, + "loss": 0.2037, + "step": 71900 + }, + { + "epoch": 211.76, + "learning_rate": 8.673127764772264e-06, + "loss": 0.2041, + "step": 72000 + }, + { + "epoch": 211.76, + "eval_cer": 0.0793339435944379, + "eval_loss": 0.3621172606945038, + "eval_runtime": 4.7752, + "eval_samples_per_second": 75.18, + "eval_steps_per_second": 2.513, + "eval_wer": 0.2964694502660003, + "step": 72000 + }, + { + "epoch": 212.06, + "learning_rate": 8.66956138162262e-06, + "loss": 0.2003, + "step": 72100 + }, + { + "epoch": 212.35, + "learning_rate": 8.665990947386765e-06, + "loss": 0.1893, + "step": 72200 + }, + { + "epoch": 212.65, + "learning_rate": 8.662416466006352e-06, + "loss": 0.1984, + "step": 72300 + }, + { + "epoch": 212.94, + "learning_rate": 8.658837941427502e-06, + "loss": 0.2038, + "step": 72400 + }, + { + "epoch": 213.24, + "learning_rate": 8.655255377600802e-06, + "loss": 0.2029, + "step": 72500 + }, + { + "epoch": 213.53, + "learning_rate": 8.65166877848129e-06, + "loss": 0.2029, + "step": 72600 + }, + { + "epoch": 213.82, + "learning_rate": 8.648078148028466e-06, + "loss": 0.1899, + "step": 72700 + }, + { + "epoch": 214.12, + "learning_rate": 8.644483490206283e-06, + "loss": 0.1949, + "step": 72800 + }, + { + "epoch": 214.41, + "learning_rate": 8.640920815698158e-06, + "loss": 0.2023, + "step": 72900 + }, + { + "epoch": 214.71, + "learning_rate": 8.637318155221476e-06, + "loss": 0.2099, + "step": 73000 + }, + { + "epoch": 214.71, + "eval_cer": 0.07837496185868097, + "eval_loss": 0.3655032813549042, + "eval_runtime": 5.0092, + "eval_samples_per_second": 71.667, + "eval_steps_per_second": 2.396, + "eval_wer": 0.29614702563275835, + "step": 73000 + }, + { + "epoch": 215.0, + "learning_rate": 8.633711479254145e-06, + "loss": 0.1991, + "step": 73100 + }, + { + "epoch": 215.29, + "learning_rate": 8.630100791777824e-06, + "loss": 0.1907, + "step": 73200 + }, + { + "epoch": 215.59, + "learning_rate": 8.626486096778608e-06, + "loss": 0.1894, + "step": 73300 + }, + { + "epoch": 215.88, + "learning_rate": 8.622867398247007e-06, + "loss": 0.193, + "step": 73400 + }, + { + "epoch": 216.18, + "learning_rate": 8.619244700177962e-06, + "loss": 0.1929, + "step": 73500 + }, + { + "epoch": 216.47, + "learning_rate": 8.615618006570818e-06, + "loss": 0.192, + "step": 73600 + }, + { + "epoch": 216.76, + "learning_rate": 8.611987321429341e-06, + "loss": 0.1951, + "step": 73700 + }, + { + "epoch": 217.06, + "learning_rate": 8.608352648761697e-06, + "loss": 0.1962, + "step": 73800 + }, + { + "epoch": 217.35, + "learning_rate": 8.604713992580456e-06, + "loss": 0.1981, + "step": 73900 + }, + { + "epoch": 217.65, + "learning_rate": 8.601071356902584e-06, + "loss": 0.2009, + "step": 74000 + }, + { + "epoch": 217.65, + "eval_cer": 0.07854932217427314, + "eval_loss": 0.36690473556518555, + "eval_runtime": 4.8416, + "eval_samples_per_second": 74.149, + "eval_steps_per_second": 2.479, + "eval_wer": 0.2948573270997904, + "step": 74000 + }, + { + "epoch": 217.94, + "learning_rate": 8.597424745749446e-06, + "loss": 0.1953, + "step": 74100 + }, + { + "epoch": 218.24, + "learning_rate": 8.59377416314679e-06, + "loss": 0.1933, + "step": 74200 + }, + { + "epoch": 218.53, + "learning_rate": 8.59011961312475e-06, + "loss": 0.1988, + "step": 74300 + }, + { + "epoch": 218.82, + "learning_rate": 8.58646109971784e-06, + "loss": 0.1955, + "step": 74400 + }, + { + "epoch": 219.12, + "learning_rate": 8.58279862696495e-06, + "loss": 0.1873, + "step": 74500 + }, + { + "epoch": 219.41, + "learning_rate": 8.57913219890934e-06, + "loss": 0.1928, + "step": 74600 + }, + { + "epoch": 219.71, + "learning_rate": 8.575461819598637e-06, + "loss": 0.1936, + "step": 74700 + }, + { + "epoch": 220.0, + "learning_rate": 8.57178749308483e-06, + "loss": 0.1883, + "step": 74800 + }, + { + "epoch": 220.29, + "learning_rate": 8.568109223424269e-06, + "loss": 0.1984, + "step": 74900 + }, + { + "epoch": 220.59, + "learning_rate": 8.56442701467765e-06, + "loss": 0.188, + "step": 75000 + }, + { + "epoch": 220.59, + "eval_cer": 0.07911599319994769, + "eval_loss": 0.3651310205459595, + "eval_runtime": 4.7688, + "eval_samples_per_second": 75.282, + "eval_steps_per_second": 2.516, + "eval_wer": 0.2963082379493793, + "step": 75000 + }, + { + "epoch": 220.88, + "learning_rate": 8.560740870910022e-06, + "loss": 0.1876, + "step": 75100 + }, + { + "epoch": 221.18, + "learning_rate": 8.55705079619078e-06, + "loss": 0.188, + "step": 75200 + }, + { + "epoch": 221.47, + "learning_rate": 8.553356794593654e-06, + "loss": 0.1815, + "step": 75300 + }, + { + "epoch": 221.76, + "learning_rate": 8.549658870196714e-06, + "loss": 0.1993, + "step": 75400 + }, + { + "epoch": 222.06, + "learning_rate": 8.545957027082354e-06, + "loss": 0.1927, + "step": 75500 + }, + { + "epoch": 222.35, + "learning_rate": 8.542251269337301e-06, + "loss": 0.1961, + "step": 75600 + }, + { + "epoch": 222.65, + "learning_rate": 8.538541601052601e-06, + "loss": 0.1909, + "step": 75700 + }, + { + "epoch": 222.94, + "learning_rate": 8.534828026323619e-06, + "loss": 0.1906, + "step": 75800 + }, + { + "epoch": 223.24, + "learning_rate": 8.531110549250025e-06, + "loss": 0.1893, + "step": 75900 + }, + { + "epoch": 223.53, + "learning_rate": 8.527389173935807e-06, + "loss": 0.1904, + "step": 76000 + }, + { + "epoch": 223.53, + "eval_cer": 0.07854932217427314, + "eval_loss": 0.3699847459793091, + "eval_runtime": 4.7309, + "eval_samples_per_second": 75.884, + "eval_steps_per_second": 2.537, + "eval_wer": 0.2943736901499275, + "step": 76000 + }, + { + "epoch": 223.82, + "learning_rate": 8.523663904489252e-06, + "loss": 0.1924, + "step": 76100 + }, + { + "epoch": 224.12, + "learning_rate": 8.519934745022946e-06, + "loss": 0.1919, + "step": 76200 + }, + { + "epoch": 224.41, + "learning_rate": 8.516201699653767e-06, + "loss": 0.1839, + "step": 76300 + }, + { + "epoch": 224.71, + "learning_rate": 8.51246477250289e-06, + "loss": 0.1907, + "step": 76400 + }, + { + "epoch": 225.0, + "learning_rate": 8.50876139492468e-06, + "loss": 0.1808, + "step": 76500 + }, + { + "epoch": 225.29, + "learning_rate": 8.50501675530586e-06, + "loss": 0.1896, + "step": 76600 + }, + { + "epoch": 225.59, + "learning_rate": 8.501268246253185e-06, + "loss": 0.1865, + "step": 76700 + }, + { + "epoch": 225.88, + "learning_rate": 8.497515871904896e-06, + "loss": 0.1868, + "step": 76800 + }, + { + "epoch": 226.18, + "learning_rate": 8.493759636403502e-06, + "loss": 0.1851, + "step": 76900 + }, + { + "epoch": 226.47, + "learning_rate": 8.489999543895777e-06, + "loss": 0.1901, + "step": 77000 + }, + { + "epoch": 226.47, + "eval_cer": 0.07850573209537509, + "eval_loss": 0.37494558095932007, + "eval_runtime": 4.7868, + "eval_samples_per_second": 74.998, + "eval_steps_per_second": 2.507, + "eval_wer": 0.2937288408834435, + "step": 77000 + }, + { + "epoch": 226.76, + "learning_rate": 8.486235598532748e-06, + "loss": 0.1895, + "step": 77100 + }, + { + "epoch": 227.06, + "learning_rate": 8.482467804469701e-06, + "loss": 0.1884, + "step": 77200 + }, + { + "epoch": 227.35, + "learning_rate": 8.478696165866164e-06, + "loss": 0.1808, + "step": 77300 + }, + { + "epoch": 227.65, + "learning_rate": 8.474920686885921e-06, + "loss": 0.1905, + "step": 77400 + }, + { + "epoch": 227.94, + "learning_rate": 8.471141371696981e-06, + "loss": 0.187, + "step": 77500 + }, + { + "epoch": 228.24, + "learning_rate": 8.467358224471598e-06, + "loss": 0.1942, + "step": 77600 + }, + { + "epoch": 228.53, + "learning_rate": 8.463571249386255e-06, + "loss": 0.187, + "step": 77700 + }, + { + "epoch": 228.82, + "learning_rate": 8.459780450621655e-06, + "loss": 0.1821, + "step": 77800 + }, + { + "epoch": 229.12, + "learning_rate": 8.45598583236273e-06, + "loss": 0.1905, + "step": 77900 + }, + { + "epoch": 229.41, + "learning_rate": 8.452187398798625e-06, + "loss": 0.1857, + "step": 78000 + }, + { + "epoch": 229.41, + "eval_cer": 0.07802624122749661, + "eval_loss": 0.3787274658679962, + "eval_runtime": 4.6442, + "eval_samples_per_second": 77.301, + "eval_steps_per_second": 2.584, + "eval_wer": 0.29098823150088665, + "step": 78000 + }, + { + "epoch": 229.71, + "learning_rate": 8.448385154122697e-06, + "loss": 0.1909, + "step": 78100 + }, + { + "epoch": 230.0, + "learning_rate": 8.444579102532511e-06, + "loss": 0.178, + "step": 78200 + }, + { + "epoch": 230.29, + "learning_rate": 8.440769248229831e-06, + "loss": 0.1833, + "step": 78300 + }, + { + "epoch": 230.59, + "learning_rate": 8.436955595420629e-06, + "loss": 0.1824, + "step": 78400 + }, + { + "epoch": 230.88, + "learning_rate": 8.433138148315059e-06, + "loss": 0.1811, + "step": 78500 + }, + { + "epoch": 231.18, + "learning_rate": 8.429316911127469e-06, + "loss": 0.1839, + "step": 78600 + }, + { + "epoch": 231.47, + "learning_rate": 8.42549188807639e-06, + "loss": 0.1871, + "step": 78700 + }, + { + "epoch": 231.76, + "learning_rate": 8.421663083384539e-06, + "loss": 0.1796, + "step": 78800 + }, + { + "epoch": 232.06, + "learning_rate": 8.417830501278794e-06, + "loss": 0.1853, + "step": 78900 + }, + { + "epoch": 232.35, + "learning_rate": 8.413994145990216e-06, + "loss": 0.1796, + "step": 79000 + }, + { + "epoch": 232.35, + "eval_cer": 0.078418551937579, + "eval_loss": 0.3776050806045532, + "eval_runtime": 4.6833, + "eval_samples_per_second": 76.656, + "eval_steps_per_second": 2.562, + "eval_wer": 0.2943736901499275, + "step": 79000 + }, + { + "epoch": 232.65, + "learning_rate": 8.410154021754026e-06, + "loss": 0.1848, + "step": 79100 + }, + { + "epoch": 232.94, + "learning_rate": 8.406310132809604e-06, + "loss": 0.182, + "step": 79200 + }, + { + "epoch": 233.24, + "learning_rate": 8.402462483400494e-06, + "loss": 0.1849, + "step": 79300 + }, + { + "epoch": 233.53, + "learning_rate": 8.398611077774382e-06, + "loss": 0.1856, + "step": 79400 + }, + { + "epoch": 233.82, + "learning_rate": 8.394755920183107e-06, + "loss": 0.1754, + "step": 79500 + }, + { + "epoch": 234.12, + "learning_rate": 8.390897014882645e-06, + "loss": 0.1732, + "step": 79600 + }, + { + "epoch": 234.41, + "learning_rate": 8.387034366133113e-06, + "loss": 0.1879, + "step": 79700 + }, + { + "epoch": 234.71, + "learning_rate": 8.383167978198762e-06, + "loss": 0.1751, + "step": 79800 + }, + { + "epoch": 235.0, + "learning_rate": 8.379297855347966e-06, + "loss": 0.1849, + "step": 79900 + }, + { + "epoch": 235.29, + "learning_rate": 8.37542400185323e-06, + "loss": 0.1836, + "step": 80000 + }, + { + "epoch": 235.29, + "eval_cer": 0.078418551937579, + "eval_loss": 0.38717299699783325, + "eval_runtime": 4.8192, + "eval_samples_per_second": 74.494, + "eval_steps_per_second": 2.49, + "eval_wer": 0.2930839916169595, + "step": 80000 + }, + { + "epoch": 235.59, + "learning_rate": 8.371546421991167e-06, + "loss": 0.1776, + "step": 80100 + }, + { + "epoch": 235.88, + "learning_rate": 8.367665120042513e-06, + "loss": 0.179, + "step": 80200 + }, + { + "epoch": 236.18, + "learning_rate": 8.363780100292104e-06, + "loss": 0.1853, + "step": 80300 + }, + { + "epoch": 236.47, + "learning_rate": 8.359891367028895e-06, + "loss": 0.1792, + "step": 80400 + }, + { + "epoch": 236.76, + "learning_rate": 8.356037867317286e-06, + "loss": 0.1834, + "step": 80500 + }, + { + "epoch": 237.06, + "learning_rate": 8.352141756939638e-06, + "loss": 0.1799, + "step": 80600 + }, + { + "epoch": 237.35, + "learning_rate": 8.348241945897569e-06, + "loss": 0.1832, + "step": 80700 + }, + { + "epoch": 237.65, + "learning_rate": 8.344338438496354e-06, + "loss": 0.1799, + "step": 80800 + }, + { + "epoch": 237.94, + "learning_rate": 8.340431239045348e-06, + "loss": 0.1772, + "step": 80900 + }, + { + "epoch": 238.24, + "learning_rate": 8.336520351857981e-06, + "loss": 0.1833, + "step": 81000 + }, + { + "epoch": 238.24, + "eval_cer": 0.07889804280545748, + "eval_loss": 0.3830723762512207, + "eval_runtime": 4.9874, + "eval_samples_per_second": 71.981, + "eval_steps_per_second": 2.406, + "eval_wer": 0.2930839916169595, + "step": 81000 + }, + { + "epoch": 238.53, + "learning_rate": 8.33260578125176e-06, + "loss": 0.1729, + "step": 81100 + }, + { + "epoch": 238.82, + "learning_rate": 8.32868753154825e-06, + "loss": 0.1789, + "step": 81200 + }, + { + "epoch": 239.12, + "learning_rate": 8.324765607073083e-06, + "loss": 0.1753, + "step": 81300 + }, + { + "epoch": 239.41, + "learning_rate": 8.320840012155949e-06, + "loss": 0.1704, + "step": 81400 + }, + { + "epoch": 239.71, + "learning_rate": 8.316910751130583e-06, + "loss": 0.1784, + "step": 81500 + }, + { + "epoch": 240.0, + "learning_rate": 8.312977828334777e-06, + "loss": 0.1784, + "step": 81600 + }, + { + "epoch": 240.29, + "learning_rate": 8.309041248110355e-06, + "loss": 0.178, + "step": 81700 + }, + { + "epoch": 240.59, + "learning_rate": 8.305101014803185e-06, + "loss": 0.1754, + "step": 81800 + }, + { + "epoch": 240.88, + "learning_rate": 8.301157132763172e-06, + "loss": 0.1795, + "step": 81900 + }, + { + "epoch": 241.18, + "learning_rate": 8.297209606344238e-06, + "loss": 0.1702, + "step": 82000 + }, + { + "epoch": 241.18, + "eval_cer": 0.07824419162198684, + "eval_loss": 0.3892400562763214, + "eval_runtime": 4.742, + "eval_samples_per_second": 75.706, + "eval_steps_per_second": 2.531, + "eval_wer": 0.2914718684507496, + "step": 82000 + }, + { + "epoch": 241.47, + "learning_rate": 8.29325843990434e-06, + "loss": 0.1775, + "step": 82100 + }, + { + "epoch": 241.76, + "learning_rate": 8.289303637805442e-06, + "loss": 0.1759, + "step": 82200 + }, + { + "epoch": 242.06, + "learning_rate": 8.285345204413531e-06, + "loss": 0.1819, + "step": 82300 + }, + { + "epoch": 242.35, + "learning_rate": 8.281383144098599e-06, + "loss": 0.1693, + "step": 82400 + }, + { + "epoch": 242.65, + "learning_rate": 8.277417461234639e-06, + "loss": 0.1743, + "step": 82500 + }, + { + "epoch": 242.94, + "learning_rate": 8.27344816019965e-06, + "loss": 0.1764, + "step": 82600 + }, + { + "epoch": 243.24, + "learning_rate": 8.269475245375624e-06, + "loss": 0.1715, + "step": 82700 + }, + { + "epoch": 243.53, + "learning_rate": 8.265498721148536e-06, + "loss": 0.1747, + "step": 82800 + }, + { + "epoch": 243.82, + "learning_rate": 8.261598229793867e-06, + "loss": 0.1758, + "step": 82900 + }, + { + "epoch": 244.12, + "learning_rate": 8.257614571903827e-06, + "loss": 0.1782, + "step": 83000 + }, + { + "epoch": 244.12, + "eval_cer": 0.07833137177978292, + "eval_loss": 0.38854503631591797, + "eval_runtime": 4.6398, + "eval_samples_per_second": 77.374, + "eval_steps_per_second": 2.586, + "eval_wer": 0.29340641625020153, + "step": 83000 + }, + { + "epoch": 244.41, + "learning_rate": 8.253627317704554e-06, + "loss": 0.1749, + "step": 83100 + }, + { + "epoch": 244.71, + "learning_rate": 8.24963647159786e-06, + "loss": 0.1746, + "step": 83200 + }, + { + "epoch": 245.0, + "learning_rate": 8.245642037989519e-06, + "loss": 0.1728, + "step": 83300 + }, + { + "epoch": 245.29, + "learning_rate": 8.241644021289268e-06, + "loss": 0.1726, + "step": 83400 + }, + { + "epoch": 245.59, + "learning_rate": 8.237642425910796e-06, + "loss": 0.1696, + "step": 83500 + }, + { + "epoch": 245.88, + "learning_rate": 8.233637256271744e-06, + "loss": 0.1729, + "step": 83600 + }, + { + "epoch": 246.18, + "learning_rate": 8.229628516793703e-06, + "loss": 0.172, + "step": 83700 + }, + { + "epoch": 246.47, + "learning_rate": 8.2256162119022e-06, + "loss": 0.1728, + "step": 83800 + }, + { + "epoch": 246.76, + "learning_rate": 8.2216003460267e-06, + "loss": 0.1773, + "step": 83900 + }, + { + "epoch": 247.06, + "learning_rate": 8.217580923600598e-06, + "loss": 0.1701, + "step": 84000 + }, + { + "epoch": 247.06, + "eval_cer": 0.07737239004402598, + "eval_loss": 0.3914085924625397, + "eval_runtime": 4.7341, + "eval_samples_per_second": 75.833, + "eval_steps_per_second": 2.535, + "eval_wer": 0.2895373206512978, + "step": 84000 + }, + { + "epoch": 247.35, + "learning_rate": 8.21355794906122e-06, + "loss": 0.1728, + "step": 84100 + }, + { + "epoch": 247.65, + "learning_rate": 8.209531426849805e-06, + "loss": 0.1745, + "step": 84200 + }, + { + "epoch": 247.94, + "learning_rate": 8.205501361411516e-06, + "loss": 0.1684, + "step": 84300 + }, + { + "epoch": 248.24, + "learning_rate": 8.201467757195422e-06, + "loss": 0.17, + "step": 84400 + }, + { + "epoch": 248.53, + "learning_rate": 8.197430618654507e-06, + "loss": 0.1723, + "step": 84500 + }, + { + "epoch": 248.82, + "learning_rate": 8.193389950245647e-06, + "loss": 0.1755, + "step": 84600 + }, + { + "epoch": 249.12, + "learning_rate": 8.18934575642962e-06, + "loss": 0.1714, + "step": 84700 + }, + { + "epoch": 249.41, + "learning_rate": 8.185298041671098e-06, + "loss": 0.167, + "step": 84800 + }, + { + "epoch": 249.71, + "learning_rate": 8.181246810438635e-06, + "loss": 0.1716, + "step": 84900 + }, + { + "epoch": 250.0, + "learning_rate": 8.177192067204668e-06, + "loss": 0.1694, + "step": 85000 + }, + { + "epoch": 250.0, + "eval_cer": 0.07815701146419075, + "eval_loss": 0.3912142217159271, + "eval_runtime": 4.7431, + "eval_samples_per_second": 75.689, + "eval_steps_per_second": 2.53, + "eval_wer": 0.2903433822344027, + "step": 85000 + }, + { + "epoch": 250.29, + "learning_rate": 8.173174416300648e-06, + "loss": 0.1667, + "step": 85100 + }, + { + "epoch": 250.59, + "learning_rate": 8.169112697504755e-06, + "loss": 0.1663, + "step": 85200 + }, + { + "epoch": 250.88, + "learning_rate": 8.16504748010306e-06, + "loss": 0.1759, + "step": 85300 + }, + { + "epoch": 251.18, + "learning_rate": 8.160978768583436e-06, + "loss": 0.1643, + "step": 85400 + }, + { + "epoch": 251.47, + "learning_rate": 8.156906567437623e-06, + "loss": 0.1659, + "step": 85500 + }, + { + "epoch": 251.76, + "learning_rate": 8.15283088116121e-06, + "loss": 0.1669, + "step": 85600 + }, + { + "epoch": 252.06, + "learning_rate": 8.148751714253633e-06, + "loss": 0.168, + "step": 85700 + }, + { + "epoch": 252.35, + "learning_rate": 8.14466907121817e-06, + "loss": 0.1734, + "step": 85800 + }, + { + "epoch": 252.65, + "learning_rate": 8.140582956561936e-06, + "loss": 0.1641, + "step": 85900 + }, + { + "epoch": 252.94, + "learning_rate": 8.13649337479588e-06, + "loss": 0.17, + "step": 86000 + }, + { + "epoch": 252.94, + "eval_cer": 0.07772111067521033, + "eval_loss": 0.404951274394989, + "eval_runtime": 4.4459, + "eval_samples_per_second": 80.749, + "eval_steps_per_second": 2.699, + "eval_wer": 0.29131065613412865, + "step": 86000 + }, + { + "epoch": 253.24, + "learning_rate": 8.132400330434778e-06, + "loss": 0.1724, + "step": 86100 + }, + { + "epoch": 253.53, + "learning_rate": 8.128303827997228e-06, + "loss": 0.1713, + "step": 86200 + }, + { + "epoch": 253.82, + "learning_rate": 8.12420387200565e-06, + "loss": 0.1699, + "step": 86300 + }, + { + "epoch": 254.12, + "learning_rate": 8.120100466986268e-06, + "loss": 0.163, + "step": 86400 + }, + { + "epoch": 254.41, + "learning_rate": 8.115993617469121e-06, + "loss": 0.1714, + "step": 86500 + }, + { + "epoch": 254.71, + "learning_rate": 8.11188332798805e-06, + "loss": 0.1717, + "step": 86600 + }, + { + "epoch": 255.0, + "learning_rate": 8.10776960308069e-06, + "loss": 0.1671, + "step": 86700 + }, + { + "epoch": 255.29, + "learning_rate": 8.10365244728847e-06, + "loss": 0.1674, + "step": 86800 + }, + { + "epoch": 255.59, + "learning_rate": 8.099531865156609e-06, + "loss": 0.1612, + "step": 86900 + }, + { + "epoch": 255.88, + "learning_rate": 8.095407861234105e-06, + "loss": 0.1654, + "step": 87000 + }, + { + "epoch": 255.88, + "eval_cer": 0.07676212893945338, + "eval_loss": 0.3947739899158478, + "eval_runtime": 4.6602, + "eval_samples_per_second": 77.036, + "eval_steps_per_second": 2.575, + "eval_wer": 0.2882476221183298, + "step": 87000 + }, + { + "epoch": 256.18, + "learning_rate": 8.091280440073735e-06, + "loss": 0.1648, + "step": 87100 + }, + { + "epoch": 256.47, + "learning_rate": 8.08714960623205e-06, + "loss": 0.1632, + "step": 87200 + }, + { + "epoch": 256.76, + "learning_rate": 8.083015364269366e-06, + "loss": 0.1645, + "step": 87300 + }, + { + "epoch": 257.06, + "learning_rate": 8.078877718749765e-06, + "loss": 0.162, + "step": 87400 + }, + { + "epoch": 257.35, + "learning_rate": 8.07473667424108e-06, + "loss": 0.1624, + "step": 87500 + }, + { + "epoch": 257.65, + "learning_rate": 8.070592235314904e-06, + "loss": 0.1625, + "step": 87600 + }, + { + "epoch": 257.94, + "learning_rate": 8.066444406546573e-06, + "loss": 0.1648, + "step": 87700 + }, + { + "epoch": 258.24, + "learning_rate": 8.062293192515168e-06, + "loss": 0.17, + "step": 87800 + }, + { + "epoch": 258.53, + "learning_rate": 8.0581385978035e-06, + "loss": 0.1681, + "step": 87900 + }, + { + "epoch": 258.82, + "learning_rate": 8.053980626998121e-06, + "loss": 0.1638, + "step": 88000 + }, + { + "epoch": 258.82, + "eval_cer": 0.0775031602807201, + "eval_loss": 0.40064844489097595, + "eval_runtime": 4.8954, + "eval_samples_per_second": 73.334, + "eval_steps_per_second": 2.451, + "eval_wer": 0.29098823150088665, + "step": 88000 + }, + { + "epoch": 259.12, + "learning_rate": 8.049819284689309e-06, + "loss": 0.1636, + "step": 88100 + }, + { + "epoch": 259.41, + "learning_rate": 8.045654575471056e-06, + "loss": 0.1604, + "step": 88200 + }, + { + "epoch": 259.71, + "learning_rate": 8.041486503941082e-06, + "loss": 0.1713, + "step": 88300 + }, + { + "epoch": 260.0, + "learning_rate": 8.037315074700811e-06, + "loss": 0.1648, + "step": 88400 + }, + { + "epoch": 260.29, + "learning_rate": 8.033140292355377e-06, + "loss": 0.1635, + "step": 88500 + }, + { + "epoch": 260.59, + "learning_rate": 8.028962161513614e-06, + "loss": 0.1645, + "step": 88600 + }, + { + "epoch": 260.88, + "learning_rate": 8.024780686788054e-06, + "loss": 0.1615, + "step": 88700 + }, + { + "epoch": 261.18, + "learning_rate": 8.020595872794921e-06, + "loss": 0.1629, + "step": 88800 + }, + { + "epoch": 261.47, + "learning_rate": 8.016407724154126e-06, + "loss": 0.1644, + "step": 88900 + }, + { + "epoch": 261.76, + "learning_rate": 8.012216245489255e-06, + "loss": 0.1599, + "step": 89000 + }, + { + "epoch": 261.76, + "eval_cer": 0.07654417854496316, + "eval_loss": 0.40178772807121277, + "eval_runtime": 4.5847, + "eval_samples_per_second": 78.303, + "eval_steps_per_second": 2.617, + "eval_wer": 0.286313074318878, + "step": 89000 + }, + { + "epoch": 262.06, + "learning_rate": 8.00806340591371e-06, + "loss": 0.1659, + "step": 89100 + }, + { + "epoch": 262.35, + "learning_rate": 8.003865314270893e-06, + "loss": 0.1621, + "step": 89200 + }, + { + "epoch": 262.65, + "learning_rate": 7.99966390645045e-06, + "loss": 0.1645, + "step": 89300 + }, + { + "epoch": 262.94, + "learning_rate": 7.995459187090606e-06, + "loss": 0.1664, + "step": 89400 + }, + { + "epoch": 263.24, + "learning_rate": 7.99125116083325e-06, + "loss": 0.1548, + "step": 89500 + }, + { + "epoch": 263.53, + "learning_rate": 7.98703983232392e-06, + "loss": 0.1647, + "step": 89600 + }, + { + "epoch": 263.82, + "learning_rate": 7.98282520621179e-06, + "loss": 0.159, + "step": 89700 + }, + { + "epoch": 264.12, + "learning_rate": 7.978607287149686e-06, + "loss": 0.1754, + "step": 89800 + }, + { + "epoch": 264.41, + "learning_rate": 7.974386079794062e-06, + "loss": 0.1626, + "step": 89900 + }, + { + "epoch": 264.71, + "learning_rate": 7.970203849953575e-06, + "loss": 0.1627, + "step": 90000 + }, + { + "epoch": 264.71, + "eval_cer": 0.07684930909724946, + "eval_loss": 0.39812856912612915, + "eval_runtime": 5.3822, + "eval_samples_per_second": 66.701, + "eval_steps_per_second": 2.23, + "eval_wer": 0.28453973883604705, + "step": 90000 + }, + { + "epoch": 265.0, + "learning_rate": 7.9659761127614e-06, + "loss": 0.1689, + "step": 90100 + }, + { + "epoch": 265.29, + "learning_rate": 7.961745101220146e-06, + "loss": 0.1623, + "step": 90200 + }, + { + "epoch": 265.59, + "learning_rate": 7.957510820000723e-06, + "loss": 0.1558, + "step": 90300 + }, + { + "epoch": 265.88, + "learning_rate": 7.95327327377765e-06, + "loss": 0.1607, + "step": 90400 + }, + { + "epoch": 266.18, + "learning_rate": 7.949032467229056e-06, + "loss": 0.1588, + "step": 90500 + }, + { + "epoch": 266.47, + "learning_rate": 7.94478840503666e-06, + "loss": 0.1731, + "step": 90600 + }, + { + "epoch": 266.76, + "learning_rate": 7.94054109188578e-06, + "loss": 0.164, + "step": 90700 + }, + { + "epoch": 267.06, + "learning_rate": 7.936290532465327e-06, + "loss": 0.1632, + "step": 90800 + }, + { + "epoch": 267.35, + "learning_rate": 7.932036731467787e-06, + "loss": 0.1602, + "step": 90900 + }, + { + "epoch": 267.65, + "learning_rate": 7.927779693589236e-06, + "loss": 0.1624, + "step": 91000 + }, + { + "epoch": 267.65, + "eval_cer": 0.07645699838716707, + "eval_loss": 0.40907594561576843, + "eval_runtime": 5.3309, + "eval_samples_per_second": 67.344, + "eval_steps_per_second": 2.251, + "eval_wer": 0.28776398516846685, + "step": 91000 + }, + { + "epoch": 267.94, + "learning_rate": 7.923519423529306e-06, + "loss": 0.1629, + "step": 91100 + }, + { + "epoch": 268.24, + "learning_rate": 7.919255925991218e-06, + "loss": 0.1559, + "step": 91200 + }, + { + "epoch": 268.53, + "learning_rate": 7.91498920568174e-06, + "loss": 0.1572, + "step": 91300 + }, + { + "epoch": 268.82, + "learning_rate": 7.910719267311208e-06, + "loss": 0.1595, + "step": 91400 + }, + { + "epoch": 269.12, + "learning_rate": 7.906446115593504e-06, + "loss": 0.1653, + "step": 91500 + }, + { + "epoch": 269.41, + "learning_rate": 7.90216975524606e-06, + "loss": 0.1601, + "step": 91600 + }, + { + "epoch": 269.71, + "learning_rate": 7.897890190989852e-06, + "loss": 0.1628, + "step": 91700 + }, + { + "epoch": 270.0, + "learning_rate": 7.893607427549386e-06, + "loss": 0.1616, + "step": 91800 + }, + { + "epoch": 270.29, + "learning_rate": 7.889321469652712e-06, + "loss": 0.1594, + "step": 91900 + }, + { + "epoch": 270.59, + "learning_rate": 7.885032322031397e-06, + "loss": 0.1612, + "step": 92000 + }, + { + "epoch": 270.59, + "eval_cer": 0.07641340830826904, + "eval_loss": 0.4112890660762787, + "eval_runtime": 4.7995, + "eval_samples_per_second": 74.799, + "eval_steps_per_second": 2.5, + "eval_wer": 0.2887312590681928, + "step": 92000 + }, + { + "epoch": 270.88, + "learning_rate": 7.880739989420528e-06, + "loss": 0.1572, + "step": 92100 + }, + { + "epoch": 271.18, + "learning_rate": 7.876444476558717e-06, + "loss": 0.1645, + "step": 92200 + }, + { + "epoch": 271.47, + "learning_rate": 7.87214578818808e-06, + "loss": 0.1638, + "step": 92300 + }, + { + "epoch": 271.76, + "learning_rate": 7.86784392905424e-06, + "loss": 0.1569, + "step": 92400 + }, + { + "epoch": 272.06, + "learning_rate": 7.863538903906323e-06, + "loss": 0.1581, + "step": 92500 + }, + { + "epoch": 272.35, + "learning_rate": 7.859230717496947e-06, + "loss": 0.1641, + "step": 92600 + }, + { + "epoch": 272.65, + "learning_rate": 7.854919374582222e-06, + "loss": 0.1574, + "step": 92700 + }, + { + "epoch": 272.94, + "learning_rate": 7.850604879921739e-06, + "loss": 0.1504, + "step": 92800 + }, + { + "epoch": 273.24, + "learning_rate": 7.846287238278573e-06, + "loss": 0.1584, + "step": 92900 + }, + { + "epoch": 273.53, + "learning_rate": 7.841966454419276e-06, + "loss": 0.1559, + "step": 93000 + }, + { + "epoch": 273.53, + "eval_cer": 0.07702366941284164, + "eval_loss": 0.41579774022102356, + "eval_runtime": 4.6321, + "eval_samples_per_second": 77.503, + "eval_steps_per_second": 2.591, + "eval_wer": 0.28776398516846685, + "step": 93000 + }, + { + "epoch": 273.82, + "learning_rate": 7.837642533113857e-06, + "loss": 0.1609, + "step": 93100 + }, + { + "epoch": 274.12, + "learning_rate": 7.8333154791358e-06, + "loss": 0.1566, + "step": 93200 + }, + { + "epoch": 274.41, + "learning_rate": 7.828985297262043e-06, + "loss": 0.1611, + "step": 93300 + }, + { + "epoch": 274.71, + "learning_rate": 7.824651992272978e-06, + "loss": 0.1665, + "step": 93400 + }, + { + "epoch": 275.0, + "learning_rate": 7.820315568952442e-06, + "loss": 0.1487, + "step": 93500 + }, + { + "epoch": 275.29, + "learning_rate": 7.81597603208772e-06, + "loss": 0.1605, + "step": 93600 + }, + { + "epoch": 275.59, + "learning_rate": 7.811633386469528e-06, + "loss": 0.164, + "step": 93700 + }, + { + "epoch": 275.88, + "learning_rate": 7.80728763689202e-06, + "loss": 0.1566, + "step": 93800 + }, + { + "epoch": 276.18, + "learning_rate": 7.80293878815277e-06, + "loss": 0.1577, + "step": 93900 + }, + { + "epoch": 276.47, + "learning_rate": 7.798630379785097e-06, + "loss": 0.155, + "step": 94000 + }, + { + "epoch": 276.47, + "eval_cer": 0.0757595571247984, + "eval_loss": 0.41765499114990234, + "eval_runtime": 4.7179, + "eval_samples_per_second": 76.093, + "eval_steps_per_second": 2.543, + "eval_wer": 0.2843785265194261, + "step": 94000 + }, + { + "epoch": 276.76, + "learning_rate": 7.794275378000553e-06, + "loss": 0.158, + "step": 94100 + }, + { + "epoch": 277.06, + "learning_rate": 7.789917291419415e-06, + "loss": 0.1537, + "step": 94200 + }, + { + "epoch": 277.35, + "learning_rate": 7.785556124852882e-06, + "loss": 0.1545, + "step": 94300 + }, + { + "epoch": 277.65, + "learning_rate": 7.78119188311555e-06, + "loss": 0.1583, + "step": 94400 + }, + { + "epoch": 277.94, + "learning_rate": 7.776824571025409e-06, + "loss": 0.1493, + "step": 94500 + }, + { + "epoch": 278.24, + "learning_rate": 7.772454193403844e-06, + "loss": 0.156, + "step": 94600 + }, + { + "epoch": 278.53, + "learning_rate": 7.768080755075625e-06, + "loss": 0.1642, + "step": 94700 + }, + { + "epoch": 278.82, + "learning_rate": 7.76370426086889e-06, + "loss": 0.1466, + "step": 94800 + }, + { + "epoch": 279.12, + "learning_rate": 7.759324715615161e-06, + "loss": 0.1542, + "step": 94900 + }, + { + "epoch": 279.41, + "learning_rate": 7.754942124149329e-06, + "loss": 0.162, + "step": 95000 + }, + { + "epoch": 279.41, + "eval_cer": 0.07510570594132776, + "eval_loss": 0.41507747769355774, + "eval_runtime": 4.8011, + "eval_samples_per_second": 74.775, + "eval_steps_per_second": 2.499, + "eval_wer": 0.2838948895695631, + "step": 95000 + }, + { + "epoch": 279.71, + "learning_rate": 7.750556491309638e-06, + "loss": 0.1493, + "step": 95100 + }, + { + "epoch": 280.0, + "learning_rate": 7.7461678219377e-06, + "loss": 0.1503, + "step": 95200 + }, + { + "epoch": 280.29, + "learning_rate": 7.741776120878473e-06, + "loss": 0.1486, + "step": 95300 + }, + { + "epoch": 280.59, + "learning_rate": 7.737381392980263e-06, + "loss": 0.1515, + "step": 95400 + }, + { + "epoch": 280.88, + "learning_rate": 7.732983643094722e-06, + "loss": 0.1532, + "step": 95500 + }, + { + "epoch": 281.18, + "learning_rate": 7.728582876076831e-06, + "loss": 0.1558, + "step": 95600 + }, + { + "epoch": 281.47, + "learning_rate": 7.724179096784907e-06, + "loss": 0.1523, + "step": 95700 + }, + { + "epoch": 281.76, + "learning_rate": 7.719772310080592e-06, + "loss": 0.1518, + "step": 95800 + }, + { + "epoch": 282.06, + "learning_rate": 7.715362520828843e-06, + "loss": 0.1553, + "step": 95900 + }, + { + "epoch": 282.35, + "learning_rate": 7.71094973389794e-06, + "loss": 0.1483, + "step": 96000 + }, + { + "epoch": 282.35, + "eval_cer": 0.07619545791377882, + "eval_loss": 0.4204952120780945, + "eval_runtime": 4.5847, + "eval_samples_per_second": 78.304, + "eval_steps_per_second": 2.617, + "eval_wer": 0.28453973883604705, + "step": 96000 + }, + { + "epoch": 282.65, + "learning_rate": 7.706533954159466e-06, + "loss": 0.1479, + "step": 96100 + }, + { + "epoch": 282.94, + "learning_rate": 7.702115186488308e-06, + "loss": 0.1518, + "step": 96200 + }, + { + "epoch": 283.24, + "learning_rate": 7.697693435762656e-06, + "loss": 0.1515, + "step": 96300 + }, + { + "epoch": 283.53, + "learning_rate": 7.693268706863994e-06, + "loss": 0.1527, + "step": 96400 + }, + { + "epoch": 283.82, + "learning_rate": 7.688841004677086e-06, + "loss": 0.145, + "step": 96500 + }, + { + "epoch": 284.12, + "learning_rate": 7.684410334089984e-06, + "loss": 0.1493, + "step": 96600 + }, + { + "epoch": 284.41, + "learning_rate": 7.679976699994016e-06, + "loss": 0.1547, + "step": 96700 + }, + { + "epoch": 284.71, + "learning_rate": 7.675540107283781e-06, + "loss": 0.1471, + "step": 96800 + }, + { + "epoch": 285.0, + "learning_rate": 7.671100560857147e-06, + "loss": 0.1592, + "step": 96900 + }, + { + "epoch": 285.29, + "learning_rate": 7.666702505148194e-06, + "loss": 0.1566, + "step": 97000 + }, + { + "epoch": 285.29, + "eval_cer": 0.07549801665141014, + "eval_loss": 0.424325555562973, + "eval_runtime": 5.013, + "eval_samples_per_second": 71.614, + "eval_steps_per_second": 2.394, + "eval_wer": 0.2843785265194261, + "step": 97000 + }, + { + "epoch": 285.59, + "learning_rate": 7.662257095410217e-06, + "loss": 0.1477, + "step": 97100 + }, + { + "epoch": 285.88, + "learning_rate": 7.657808746619888e-06, + "loss": 0.1592, + "step": 97200 + }, + { + "epoch": 286.18, + "learning_rate": 7.65335746368805e-06, + "loss": 0.1451, + "step": 97300 + }, + { + "epoch": 286.47, + "learning_rate": 7.64890325152879e-06, + "loss": 0.1537, + "step": 97400 + }, + { + "epoch": 286.76, + "learning_rate": 7.644446115059424e-06, + "loss": 0.151, + "step": 97500 + }, + { + "epoch": 287.06, + "learning_rate": 7.6400306741939e-06, + "loss": 0.1557, + "step": 97600 + }, + { + "epoch": 287.35, + "learning_rate": 7.635567732989454e-06, + "loss": 0.1524, + "step": 97700 + }, + { + "epoch": 287.65, + "learning_rate": 7.631101882196917e-06, + "loss": 0.1494, + "step": 97800 + }, + { + "epoch": 287.94, + "learning_rate": 7.626633126746452e-06, + "loss": 0.1485, + "step": 97900 + }, + { + "epoch": 288.24, + "learning_rate": 7.622161471571434e-06, + "loss": 0.143, + "step": 98000 + }, + { + "epoch": 288.24, + "eval_cer": 0.07684930909724946, + "eval_loss": 0.4253920018672943, + "eval_runtime": 4.609, + "eval_samples_per_second": 77.891, + "eval_steps_per_second": 2.604, + "eval_wer": 0.29018216991778173, + "step": 98000 + }, + { + "epoch": 288.53, + "learning_rate": 7.617686921608436e-06, + "loss": 0.1556, + "step": 98100 + }, + { + "epoch": 288.82, + "learning_rate": 7.613209481797228e-06, + "loss": 0.1475, + "step": 98200 + }, + { + "epoch": 289.12, + "learning_rate": 7.60872915708077e-06, + "loss": 0.1514, + "step": 98300 + }, + { + "epoch": 289.41, + "learning_rate": 7.604245952405205e-06, + "loss": 0.1576, + "step": 98400 + }, + { + "epoch": 289.71, + "learning_rate": 7.599759872719859e-06, + "loss": 0.142, + "step": 98500 + }, + { + "epoch": 290.0, + "learning_rate": 7.595270922977229e-06, + "loss": 0.1549, + "step": 98600 + }, + { + "epoch": 290.29, + "learning_rate": 7.590779108132982e-06, + "loss": 0.1465, + "step": 98700 + }, + { + "epoch": 290.59, + "learning_rate": 7.5862844331459475e-06, + "loss": 0.1434, + "step": 98800 + }, + { + "epoch": 290.88, + "learning_rate": 7.581786902978113e-06, + "loss": 0.1414, + "step": 98900 + }, + { + "epoch": 291.18, + "learning_rate": 7.577286522594618e-06, + "loss": 0.1463, + "step": 99000 + }, + { + "epoch": 291.18, + "eval_cer": 0.07532365633581797, + "eval_loss": 0.4343777000904083, + "eval_runtime": 4.7592, + "eval_samples_per_second": 75.433, + "eval_steps_per_second": 2.521, + "eval_wer": 0.2826051910365952, + "step": 99000 + }, + { + "epoch": 291.47, + "learning_rate": 7.572783296963745e-06, + "loss": 0.1457, + "step": 99100 + }, + { + "epoch": 291.76, + "learning_rate": 7.568277231056922e-06, + "loss": 0.1504, + "step": 99200 + }, + { + "epoch": 292.06, + "learning_rate": 7.563768329848713e-06, + "loss": 0.1503, + "step": 99300 + }, + { + "epoch": 292.35, + "learning_rate": 7.559256598316809e-06, + "loss": 0.1444, + "step": 99400 + }, + { + "epoch": 292.65, + "learning_rate": 7.5547420414420294e-06, + "loss": 0.1469, + "step": 99500 + }, + { + "epoch": 292.94, + "learning_rate": 7.5502246642083056e-06, + "loss": 0.1487, + "step": 99600 + }, + { + "epoch": 293.24, + "learning_rate": 7.545704471602689e-06, + "loss": 0.1445, + "step": 99700 + }, + { + "epoch": 293.53, + "learning_rate": 7.541226712540208e-06, + "loss": 0.146, + "step": 99800 + }, + { + "epoch": 293.82, + "learning_rate": 7.5367009321935426e-06, + "loss": 0.1479, + "step": 99900 + }, + { + "epoch": 294.12, + "learning_rate": 7.53217235140478e-06, + "loss": 0.149, + "step": 100000 + }, + { + "epoch": 294.12, + "eval_cer": 0.07610827775598274, + "eval_loss": 0.4314731955528259, + "eval_runtime": 4.9571, + "eval_samples_per_second": 72.421, + "eval_steps_per_second": 2.421, + "eval_wer": 0.2847009511526681, + "step": 100000 + }, + { + "epoch": 294.41, + "learning_rate": 7.527640975173338e-06, + "loss": 0.1434, + "step": 100100 + }, + { + "epoch": 294.71, + "learning_rate": 7.523106808501723e-06, + "loss": 0.1478, + "step": 100200 + }, + { + "epoch": 295.0, + "learning_rate": 7.5185698563955214e-06, + "loss": 0.1441, + "step": 100300 + }, + { + "epoch": 295.29, + "learning_rate": 7.514030123863388e-06, + "loss": 0.1417, + "step": 100400 + }, + { + "epoch": 295.59, + "learning_rate": 7.509487615917055e-06, + "loss": 0.1458, + "step": 100500 + }, + { + "epoch": 295.88, + "learning_rate": 7.504942337571315e-06, + "loss": 0.1491, + "step": 100600 + }, + { + "epoch": 296.18, + "learning_rate": 7.500394293844018e-06, + "loss": 0.1427, + "step": 100700 + }, + { + "epoch": 296.47, + "learning_rate": 7.495843489756072e-06, + "loss": 0.153, + "step": 100800 + }, + { + "epoch": 296.76, + "learning_rate": 7.491289930331425e-06, + "loss": 0.1457, + "step": 100900 + }, + { + "epoch": 297.06, + "learning_rate": 7.486733620597073e-06, + "loss": 0.144, + "step": 101000 + }, + { + "epoch": 297.06, + "eval_cer": 0.07554160673030819, + "eval_loss": 0.4298832416534424, + "eval_runtime": 5.3958, + "eval_samples_per_second": 66.533, + "eval_steps_per_second": 2.224, + "eval_wer": 0.2834112526197001, + "step": 101000 + }, + { + "epoch": 297.35, + "learning_rate": 7.482174565583045e-06, + "loss": 0.138, + "step": 101100 + }, + { + "epoch": 297.65, + "learning_rate": 7.4776127703224025e-06, + "loss": 0.1473, + "step": 101200 + }, + { + "epoch": 297.94, + "learning_rate": 7.4730482398512305e-06, + "loss": 0.1439, + "step": 101300 + }, + { + "epoch": 298.24, + "learning_rate": 7.468480979208635e-06, + "loss": 0.1396, + "step": 101400 + }, + { + "epoch": 298.53, + "learning_rate": 7.463910993436735e-06, + "loss": 0.1436, + "step": 101500 + }, + { + "epoch": 298.82, + "learning_rate": 7.4593382875806576e-06, + "loss": 0.147, + "step": 101600 + }, + { + "epoch": 299.12, + "learning_rate": 7.454762866688535e-06, + "loss": 0.1414, + "step": 101700 + }, + { + "epoch": 299.41, + "learning_rate": 7.4501847358114945e-06, + "loss": 0.1399, + "step": 101800 + }, + { + "epoch": 299.71, + "learning_rate": 7.445603900003656e-06, + "loss": 0.1494, + "step": 101900 + }, + { + "epoch": 300.0, + "learning_rate": 7.441020364322124e-06, + "loss": 0.1415, + "step": 102000 + }, + { + "epoch": 300.0, + "eval_cer": 0.07610827775598274, + "eval_loss": 0.4383721649646759, + "eval_runtime": 5.4378, + "eval_samples_per_second": 66.019, + "eval_steps_per_second": 2.207, + "eval_wer": 0.28518458810253106, + "step": 102000 + }, + { + "epoch": 300.29, + "learning_rate": 7.4364341338269885e-06, + "loss": 0.1471, + "step": 102100 + }, + { + "epoch": 300.59, + "learning_rate": 7.431845213581309e-06, + "loss": 0.145, + "step": 102200 + }, + { + "epoch": 300.88, + "learning_rate": 7.427253608651116e-06, + "loss": 0.1422, + "step": 102300 + }, + { + "epoch": 301.18, + "learning_rate": 7.422659324105404e-06, + "loss": 0.1493, + "step": 102400 + }, + { + "epoch": 301.47, + "learning_rate": 7.4180623650161274e-06, + "loss": 0.1512, + "step": 102500 + }, + { + "epoch": 301.76, + "learning_rate": 7.413462736458192e-06, + "loss": 0.1461, + "step": 102600 + }, + { + "epoch": 302.06, + "learning_rate": 7.408860443509448e-06, + "loss": 0.1468, + "step": 102700 + }, + { + "epoch": 302.35, + "learning_rate": 7.404255491250691e-06, + "loss": 0.1334, + "step": 102800 + }, + { + "epoch": 302.65, + "learning_rate": 7.3996478847656525e-06, + "loss": 0.1459, + "step": 102900 + }, + { + "epoch": 302.94, + "learning_rate": 7.39503762914099e-06, + "loss": 0.1456, + "step": 103000 + }, + { + "epoch": 302.94, + "eval_cer": 0.0748441654679395, + "eval_loss": 0.4347250163555145, + "eval_runtime": 4.8036, + "eval_samples_per_second": 74.735, + "eval_steps_per_second": 2.498, + "eval_wer": 0.2801870062872803, + "step": 103000 + }, + { + "epoch": 303.24, + "learning_rate": 7.390424729466288e-06, + "loss": 0.1469, + "step": 103100 + }, + { + "epoch": 303.53, + "learning_rate": 7.3858091908340515e-06, + "loss": 0.14, + "step": 103200 + }, + { + "epoch": 303.82, + "learning_rate": 7.381191018339697e-06, + "loss": 0.1417, + "step": 103300 + }, + { + "epoch": 304.12, + "learning_rate": 7.376570217081548e-06, + "loss": 0.1355, + "step": 103400 + }, + { + "epoch": 304.41, + "learning_rate": 7.371946792160831e-06, + "loss": 0.1428, + "step": 103500 + }, + { + "epoch": 304.71, + "learning_rate": 7.367320748681672e-06, + "loss": 0.1422, + "step": 103600 + }, + { + "epoch": 305.0, + "learning_rate": 7.362692091751083e-06, + "loss": 0.1432, + "step": 103700 + }, + { + "epoch": 305.29, + "learning_rate": 7.3580608264789614e-06, + "loss": 0.1523, + "step": 103800 + }, + { + "epoch": 305.59, + "learning_rate": 7.353426957978087e-06, + "loss": 0.1367, + "step": 103900 + }, + { + "epoch": 305.88, + "learning_rate": 7.348790491364114e-06, + "loss": 0.1442, + "step": 104000 + }, + { + "epoch": 305.88, + "eval_cer": 0.07562878688810427, + "eval_loss": 0.4230651557445526, + "eval_runtime": 4.398, + "eval_samples_per_second": 81.628, + "eval_steps_per_second": 2.729, + "eval_wer": 0.28244397871997423, + "step": 104000 + }, + { + "epoch": 306.18, + "learning_rate": 7.3441514317555615e-06, + "loss": 0.1306, + "step": 104100 + }, + { + "epoch": 306.47, + "learning_rate": 7.339509784273812e-06, + "loss": 0.1443, + "step": 104200 + }, + { + "epoch": 306.76, + "learning_rate": 7.334865554043108e-06, + "loss": 0.1424, + "step": 104300 + }, + { + "epoch": 307.06, + "learning_rate": 7.33021874619054e-06, + "loss": 0.1352, + "step": 104400 + }, + { + "epoch": 307.35, + "learning_rate": 7.325569365846044e-06, + "loss": 0.1362, + "step": 104500 + }, + { + "epoch": 307.65, + "learning_rate": 7.320917418142398e-06, + "loss": 0.143, + "step": 104600 + }, + { + "epoch": 307.94, + "learning_rate": 7.3162629082152136e-06, + "loss": 0.1449, + "step": 104700 + }, + { + "epoch": 308.24, + "learning_rate": 7.311605841202931e-06, + "loss": 0.142, + "step": 104800 + }, + { + "epoch": 308.53, + "learning_rate": 7.306946222246813e-06, + "loss": 0.151, + "step": 104900 + }, + { + "epoch": 308.82, + "learning_rate": 7.302284056490938e-06, + "loss": 0.1357, + "step": 105000 + }, + { + "epoch": 308.82, + "eval_cer": 0.07510570594132776, + "eval_loss": 0.44283321499824524, + "eval_runtime": 4.9758, + "eval_samples_per_second": 72.149, + "eval_steps_per_second": 2.412, + "eval_wer": 0.28131549250362725, + "step": 105000 + }, + { + "epoch": 309.12, + "learning_rate": 7.297619349082201e-06, + "loss": 0.1349, + "step": 105100 + }, + { + "epoch": 309.41, + "learning_rate": 7.292952105170298e-06, + "loss": 0.1374, + "step": 105200 + }, + { + "epoch": 309.71, + "learning_rate": 7.288282329907726e-06, + "loss": 0.143, + "step": 105300 + }, + { + "epoch": 310.0, + "learning_rate": 7.28361002844978e-06, + "loss": 0.1453, + "step": 105400 + }, + { + "epoch": 310.29, + "learning_rate": 7.27893520595454e-06, + "loss": 0.142, + "step": 105500 + }, + { + "epoch": 310.59, + "learning_rate": 7.274257867582868e-06, + "loss": 0.135, + "step": 105600 + }, + { + "epoch": 310.88, + "learning_rate": 7.269578018498409e-06, + "loss": 0.1452, + "step": 105700 + }, + { + "epoch": 311.18, + "learning_rate": 7.264942499799369e-06, + "loss": 0.1379, + "step": 105800 + }, + { + "epoch": 311.47, + "learning_rate": 7.260257669769517e-06, + "loss": 0.1339, + "step": 105900 + }, + { + "epoch": 311.76, + "learning_rate": 7.255570344482677e-06, + "loss": 0.1446, + "step": 106000 + }, + { + "epoch": 311.76, + "eval_cer": 0.07532365633581797, + "eval_loss": 0.44697633385658264, + "eval_runtime": 5.0129, + "eval_samples_per_second": 71.616, + "eval_steps_per_second": 2.394, + "eval_wer": 0.2842173142028051, + "step": 106000 + }, + { + "epoch": 312.06, + "learning_rate": 7.250880529113518e-06, + "loss": 0.1406, + "step": 106100 + }, + { + "epoch": 312.35, + "learning_rate": 7.246188228839456e-06, + "loss": 0.1378, + "step": 106200 + }, + { + "epoch": 312.65, + "learning_rate": 7.241493448840649e-06, + "loss": 0.1446, + "step": 106300 + }, + { + "epoch": 312.94, + "learning_rate": 7.236796194299992e-06, + "loss": 0.1424, + "step": 106400 + }, + { + "epoch": 313.24, + "learning_rate": 7.232096470403117e-06, + "loss": 0.1387, + "step": 106500 + }, + { + "epoch": 313.53, + "learning_rate": 7.227394282338378e-06, + "loss": 0.1411, + "step": 106600 + }, + { + "epoch": 313.82, + "learning_rate": 7.222689635296852e-06, + "loss": 0.1337, + "step": 106700 + }, + { + "epoch": 314.12, + "learning_rate": 7.217982534472326e-06, + "loss": 0.1403, + "step": 106800 + }, + { + "epoch": 314.41, + "learning_rate": 7.213320092658842e-06, + "loss": 0.1401, + "step": 106900 + }, + { + "epoch": 314.71, + "learning_rate": 7.208608124268647e-06, + "loss": 0.1345, + "step": 107000 + }, + { + "epoch": 314.71, + "eval_cer": 0.07471339523124537, + "eval_loss": 0.457571417093277, + "eval_runtime": 4.9987, + "eval_samples_per_second": 71.818, + "eval_steps_per_second": 2.401, + "eval_wer": 0.28083185555376433, + "step": 107000 + }, + { + "epoch": 315.0, + "learning_rate": 7.20389371764102e-06, + "loss": 0.1436, + "step": 107100 + }, + { + "epoch": 315.29, + "learning_rate": 7.199176877980525e-06, + "loss": 0.1302, + "step": 107200 + }, + { + "epoch": 315.59, + "learning_rate": 7.194457610494413e-06, + "loss": 0.1348, + "step": 107300 + }, + { + "epoch": 315.88, + "learning_rate": 7.189735920392614e-06, + "loss": 0.1376, + "step": 107400 + }, + { + "epoch": 316.18, + "learning_rate": 7.185011812887735e-06, + "loss": 0.1341, + "step": 107500 + }, + { + "epoch": 316.47, + "learning_rate": 7.180285293195048e-06, + "loss": 0.1361, + "step": 107600 + }, + { + "epoch": 316.76, + "learning_rate": 7.1755563665324905e-06, + "loss": 0.1361, + "step": 107700 + }, + { + "epoch": 317.06, + "learning_rate": 7.170825038120654e-06, + "loss": 0.1341, + "step": 107800 + }, + { + "epoch": 317.35, + "learning_rate": 7.1660913131827855e-06, + "loss": 0.1393, + "step": 107900 + }, + { + "epoch": 317.65, + "learning_rate": 7.161355196944777e-06, + "loss": 0.137, + "step": 108000 + }, + { + "epoch": 317.65, + "eval_cer": 0.07562878688810427, + "eval_loss": 0.45369425415992737, + "eval_runtime": 4.9175, + "eval_samples_per_second": 73.004, + "eval_steps_per_second": 2.44, + "eval_wer": 0.285990649685636, + "step": 108000 + }, + { + "epoch": 317.94, + "learning_rate": 7.156616694635158e-06, + "loss": 0.1378, + "step": 108100 + }, + { + "epoch": 318.24, + "learning_rate": 7.151875811485094e-06, + "loss": 0.1325, + "step": 108200 + }, + { + "epoch": 318.53, + "learning_rate": 7.147132552728379e-06, + "loss": 0.1417, + "step": 108300 + }, + { + "epoch": 318.82, + "learning_rate": 7.142386923601428e-06, + "loss": 0.1339, + "step": 108400 + }, + { + "epoch": 319.12, + "learning_rate": 7.137638929343274e-06, + "loss": 0.143, + "step": 108500 + }, + { + "epoch": 319.41, + "learning_rate": 7.132888575195561e-06, + "loss": 0.1337, + "step": 108600 + }, + { + "epoch": 319.71, + "learning_rate": 7.128135866402539e-06, + "loss": 0.1351, + "step": 108700 + }, + { + "epoch": 320.0, + "learning_rate": 7.123380808211055e-06, + "loss": 0.1378, + "step": 108800 + }, + { + "epoch": 320.29, + "learning_rate": 7.118623405870554e-06, + "loss": 0.135, + "step": 108900 + }, + { + "epoch": 320.59, + "learning_rate": 7.113863664633064e-06, + "loss": 0.1318, + "step": 109000 + }, + { + "epoch": 320.59, + "eval_cer": 0.07523647617802189, + "eval_loss": 0.4415852725505829, + "eval_runtime": 5.3729, + "eval_samples_per_second": 66.817, + "eval_steps_per_second": 2.233, + "eval_wer": 0.28163791713686925, + "step": 109000 + }, + { + "epoch": 320.88, + "learning_rate": 7.109101589753197e-06, + "loss": 0.1359, + "step": 109100 + }, + { + "epoch": 321.18, + "learning_rate": 7.1043371864881424e-06, + "loss": 0.13, + "step": 109200 + }, + { + "epoch": 321.47, + "learning_rate": 7.099570460097659e-06, + "loss": 0.1373, + "step": 109300 + }, + { + "epoch": 321.76, + "learning_rate": 7.094849117742743e-06, + "loss": 0.1411, + "step": 109400 + }, + { + "epoch": 322.06, + "learning_rate": 7.090077783990845e-06, + "loss": 0.1401, + "step": 109500 + }, + { + "epoch": 322.35, + "learning_rate": 7.0853041428554725e-06, + "loss": 0.1341, + "step": 109600 + }, + { + "epoch": 322.65, + "learning_rate": 7.080528199606582e-06, + "loss": 0.1352, + "step": 109700 + }, + { + "epoch": 322.94, + "learning_rate": 7.075749959516676e-06, + "loss": 0.1343, + "step": 109800 + }, + { + "epoch": 323.24, + "learning_rate": 7.0709694278607836e-06, + "loss": 0.142, + "step": 109900 + }, + { + "epoch": 323.53, + "learning_rate": 7.066186609916472e-06, + "loss": 0.137, + "step": 110000 + }, + { + "epoch": 323.53, + "eval_cer": 0.07414672420557081, + "eval_loss": 0.4473969638347626, + "eval_runtime": 4.4522, + "eval_samples_per_second": 80.635, + "eval_steps_per_second": 2.695, + "eval_wer": 0.27760760922134453, + "step": 110000 + }, + { + "epoch": 323.82, + "learning_rate": 7.06140151096383e-06, + "loss": 0.1354, + "step": 110100 + }, + { + "epoch": 324.12, + "learning_rate": 7.056614136285462e-06, + "loss": 0.1351, + "step": 110200 + }, + { + "epoch": 324.41, + "learning_rate": 7.051824491166489e-06, + "loss": 0.1303, + "step": 110300 + }, + { + "epoch": 324.71, + "learning_rate": 7.047032580894535e-06, + "loss": 0.1328, + "step": 110400 + }, + { + "epoch": 325.0, + "learning_rate": 7.042238410759725e-06, + "loss": 0.129, + "step": 110500 + }, + { + "epoch": 325.29, + "learning_rate": 7.0374419860546804e-06, + "loss": 0.1365, + "step": 110600 + }, + { + "epoch": 325.59, + "learning_rate": 7.032643312074512e-06, + "loss": 0.1309, + "step": 110700 + }, + { + "epoch": 325.88, + "learning_rate": 7.027842394116812e-06, + "loss": 0.1313, + "step": 110800 + }, + { + "epoch": 326.18, + "learning_rate": 7.02303923748165e-06, + "loss": 0.1343, + "step": 110900 + }, + { + "epoch": 326.47, + "learning_rate": 7.018233847471566e-06, + "loss": 0.1351, + "step": 111000 + }, + { + "epoch": 326.47, + "eval_cer": 0.07571596704590035, + "eval_loss": 0.45716190338134766, + "eval_runtime": 4.8972, + "eval_samples_per_second": 73.307, + "eval_steps_per_second": 2.45, + "eval_wer": 0.28357246493632116, + "step": 111000 + }, + { + "epoch": 326.76, + "learning_rate": 7.0134262293915704e-06, + "loss": 0.1296, + "step": 111100 + }, + { + "epoch": 327.06, + "learning_rate": 7.008616388549128e-06, + "loss": 0.1242, + "step": 111200 + }, + { + "epoch": 327.35, + "learning_rate": 7.003804330254161e-06, + "loss": 0.1326, + "step": 111300 + }, + { + "epoch": 327.65, + "learning_rate": 6.998990059819037e-06, + "loss": 0.1379, + "step": 111400 + }, + { + "epoch": 327.94, + "learning_rate": 6.994173582558566e-06, + "loss": 0.1339, + "step": 111500 + }, + { + "epoch": 328.24, + "learning_rate": 6.989354903789993e-06, + "loss": 0.139, + "step": 111600 + }, + { + "epoch": 328.53, + "learning_rate": 6.984534028833002e-06, + "loss": 0.1295, + "step": 111700 + }, + { + "epoch": 328.82, + "learning_rate": 6.97971096300969e-06, + "loss": 0.1318, + "step": 111800 + }, + { + "epoch": 329.12, + "learning_rate": 6.974885711644581e-06, + "loss": 0.1331, + "step": 111900 + }, + { + "epoch": 329.41, + "learning_rate": 6.9700582800646064e-06, + "loss": 0.1357, + "step": 112000 + }, + { + "epoch": 329.41, + "eval_cer": 0.0754544265725121, + "eval_loss": 0.4541434347629547, + "eval_runtime": 4.8992, + "eval_samples_per_second": 73.277, + "eval_steps_per_second": 2.449, + "eval_wer": 0.28212155408673223, + "step": 112000 + }, + { + "epoch": 329.71, + "learning_rate": 6.965228673599105e-06, + "loss": 0.1317, + "step": 112100 + }, + { + "epoch": 330.0, + "learning_rate": 6.960396897579821e-06, + "loss": 0.1278, + "step": 112200 + }, + { + "epoch": 330.29, + "learning_rate": 6.9555629573408886e-06, + "loss": 0.1307, + "step": 112300 + }, + { + "epoch": 330.59, + "learning_rate": 6.950726858218837e-06, + "loss": 0.1302, + "step": 112400 + }, + { + "epoch": 330.88, + "learning_rate": 6.945888605552571e-06, + "loss": 0.1333, + "step": 112500 + }, + { + "epoch": 331.18, + "learning_rate": 6.94104820468338e-06, + "loss": 0.1276, + "step": 112600 + }, + { + "epoch": 331.47, + "learning_rate": 6.93620566095492e-06, + "loss": 0.1303, + "step": 112700 + }, + { + "epoch": 331.76, + "learning_rate": 6.931360979713216e-06, + "loss": 0.1302, + "step": 112800 + }, + { + "epoch": 332.06, + "learning_rate": 6.926514166306653e-06, + "loss": 0.1292, + "step": 112900 + }, + { + "epoch": 332.35, + "learning_rate": 6.921665226085965e-06, + "loss": 0.1362, + "step": 113000 + }, + { + "epoch": 332.35, + "eval_cer": 0.0760646876770847, + "eval_loss": 0.44597867131233215, + "eval_runtime": 5.0068, + "eval_samples_per_second": 71.703, + "eval_steps_per_second": 2.397, + "eval_wer": 0.2866354989521199, + "step": 113000 + }, + { + "epoch": 332.65, + "learning_rate": 6.9168141644042386e-06, + "loss": 0.1331, + "step": 113100 + }, + { + "epoch": 332.94, + "learning_rate": 6.9119609866169e-06, + "loss": 0.1309, + "step": 113200 + }, + { + "epoch": 333.24, + "learning_rate": 6.907105698081715e-06, + "loss": 0.1275, + "step": 113300 + }, + { + "epoch": 333.53, + "learning_rate": 6.9022483041587785e-06, + "loss": 0.1323, + "step": 113400 + }, + { + "epoch": 333.82, + "learning_rate": 6.897486020635022e-06, + "loss": 0.129, + "step": 113500 + }, + { + "epoch": 334.12, + "learning_rate": 6.892624473866769e-06, + "loss": 0.1377, + "step": 113600 + }, + { + "epoch": 334.41, + "learning_rate": 6.8877608376976024e-06, + "loss": 0.1258, + "step": 113700 + }, + { + "epoch": 334.71, + "learning_rate": 6.88289511749683e-06, + "loss": 0.1307, + "step": 113800 + }, + { + "epoch": 335.0, + "learning_rate": 6.878027318636063e-06, + "loss": 0.1331, + "step": 113900 + }, + { + "epoch": 335.29, + "learning_rate": 6.873157446489203e-06, + "loss": 0.1279, + "step": 114000 + }, + { + "epoch": 335.29, + "eval_cer": 0.07371082341659038, + "eval_loss": 0.4529751241207123, + "eval_runtime": 4.2881, + "eval_samples_per_second": 83.72, + "eval_steps_per_second": 2.798, + "eval_wer": 0.2758342737385136, + "step": 114000 + }, + { + "epoch": 335.59, + "learning_rate": 6.868285506432445e-06, + "loss": 0.1319, + "step": 114100 + }, + { + "epoch": 335.88, + "learning_rate": 6.863411503844266e-06, + "loss": 0.1291, + "step": 114200 + }, + { + "epoch": 336.18, + "learning_rate": 6.858535444105418e-06, + "loss": 0.1266, + "step": 114300 + }, + { + "epoch": 336.47, + "learning_rate": 6.8536573325989285e-06, + "loss": 0.1277, + "step": 114400 + }, + { + "epoch": 336.76, + "learning_rate": 6.848777174710084e-06, + "loss": 0.1297, + "step": 114500 + }, + { + "epoch": 337.06, + "learning_rate": 6.843894975826434e-06, + "loss": 0.1306, + "step": 114600 + }, + { + "epoch": 337.35, + "learning_rate": 6.839010741337779e-06, + "loss": 0.1285, + "step": 114700 + }, + { + "epoch": 337.65, + "learning_rate": 6.834124476636171e-06, + "loss": 0.1291, + "step": 114800 + }, + { + "epoch": 337.94, + "learning_rate": 6.829236187115898e-06, + "loss": 0.1378, + "step": 114900 + }, + { + "epoch": 338.24, + "learning_rate": 6.8243458781734866e-06, + "loss": 0.1345, + "step": 115000 + }, + { + "epoch": 338.24, + "eval_cer": 0.07427749444226495, + "eval_loss": 0.47045978903770447, + "eval_runtime": 5.4296, + "eval_samples_per_second": 66.119, + "eval_steps_per_second": 2.21, + "eval_wer": 0.27873609543769146, + "step": 115000 + }, + { + "epoch": 338.53, + "learning_rate": 6.81945355520769e-06, + "loss": 0.1245, + "step": 115100 + }, + { + "epoch": 338.82, + "learning_rate": 6.81455922361949e-06, + "loss": 0.1318, + "step": 115200 + }, + { + "epoch": 339.12, + "learning_rate": 6.8096628888120795e-06, + "loss": 0.1235, + "step": 115300 + }, + { + "epoch": 339.41, + "learning_rate": 6.804764556190868e-06, + "loss": 0.1266, + "step": 115400 + }, + { + "epoch": 339.71, + "learning_rate": 6.7998642311634675e-06, + "loss": 0.1291, + "step": 115500 + }, + { + "epoch": 340.0, + "learning_rate": 6.794961919139691e-06, + "loss": 0.1256, + "step": 115600 + }, + { + "epoch": 340.29, + "learning_rate": 6.790057625531546e-06, + "loss": 0.1342, + "step": 115700 + }, + { + "epoch": 340.59, + "learning_rate": 6.785151355753222e-06, + "loss": 0.1247, + "step": 115800 + }, + { + "epoch": 340.88, + "learning_rate": 6.780243115221098e-06, + "loss": 0.1296, + "step": 115900 + }, + { + "epoch": 341.18, + "learning_rate": 6.775332909353724e-06, + "loss": 0.132, + "step": 116000 + }, + { + "epoch": 341.18, + "eval_cer": 0.07466980515234732, + "eval_loss": 0.4567488431930542, + "eval_runtime": 5.3257, + "eval_samples_per_second": 67.409, + "eval_steps_per_second": 2.253, + "eval_wer": 0.27841367080444945, + "step": 116000 + }, + { + "epoch": 341.47, + "learning_rate": 6.770420743571821e-06, + "loss": 0.1232, + "step": 116100 + }, + { + "epoch": 341.76, + "learning_rate": 6.765506623298272e-06, + "loss": 0.1265, + "step": 116200 + }, + { + "epoch": 342.06, + "learning_rate": 6.760590553958122e-06, + "loss": 0.1267, + "step": 116300 + }, + { + "epoch": 342.35, + "learning_rate": 6.755672540978561e-06, + "loss": 0.126, + "step": 116400 + }, + { + "epoch": 342.65, + "learning_rate": 6.750752589788931e-06, + "loss": 0.1285, + "step": 116500 + }, + { + "epoch": 342.94, + "learning_rate": 6.74583070582071e-06, + "loss": 0.1268, + "step": 116600 + }, + { + "epoch": 343.24, + "learning_rate": 6.740906894507514e-06, + "loss": 0.1268, + "step": 116700 + }, + { + "epoch": 343.53, + "learning_rate": 6.735981161285079e-06, + "loss": 0.1222, + "step": 116800 + }, + { + "epoch": 343.82, + "learning_rate": 6.73105351159127e-06, + "loss": 0.1282, + "step": 116900 + }, + { + "epoch": 344.12, + "learning_rate": 6.7261239508660655e-06, + "loss": 0.1282, + "step": 117000 + }, + { + "epoch": 344.12, + "eval_cer": 0.07462621507344928, + "eval_loss": 0.45933759212493896, + "eval_runtime": 4.7882, + "eval_samples_per_second": 74.976, + "eval_steps_per_second": 2.506, + "eval_wer": 0.28002579397065935, + "step": 117000 + }, + { + "epoch": 344.41, + "learning_rate": 6.721192484551554e-06, + "loss": 0.1233, + "step": 117100 + }, + { + "epoch": 344.71, + "learning_rate": 6.716259118091923e-06, + "loss": 0.1296, + "step": 117200 + }, + { + "epoch": 345.0, + "learning_rate": 6.711323856933466e-06, + "loss": 0.1248, + "step": 117300 + }, + { + "epoch": 345.29, + "learning_rate": 6.706386706524562e-06, + "loss": 0.1272, + "step": 117400 + }, + { + "epoch": 345.59, + "learning_rate": 6.701447672315678e-06, + "loss": 0.1314, + "step": 117500 + }, + { + "epoch": 345.88, + "learning_rate": 6.696506759759362e-06, + "loss": 0.1268, + "step": 117600 + }, + { + "epoch": 346.18, + "learning_rate": 6.691563974310231e-06, + "loss": 0.1285, + "step": 117700 + }, + { + "epoch": 346.47, + "learning_rate": 6.686619321424976e-06, + "loss": 0.1218, + "step": 117800 + }, + { + "epoch": 346.76, + "learning_rate": 6.681672806562342e-06, + "loss": 0.1261, + "step": 117900 + }, + { + "epoch": 347.06, + "learning_rate": 6.676724435183138e-06, + "loss": 0.1297, + "step": 118000 + }, + { + "epoch": 347.06, + "eval_cer": 0.07497493570463362, + "eval_loss": 0.4662339687347412, + "eval_runtime": 4.4705, + "eval_samples_per_second": 80.304, + "eval_steps_per_second": 2.684, + "eval_wer": 0.28034821860390136, + "step": 118000 + }, + { + "epoch": 347.35, + "learning_rate": 6.671774212750215e-06, + "loss": 0.1214, + "step": 118100 + }, + { + "epoch": 347.65, + "learning_rate": 6.666822144728472e-06, + "loss": 0.1347, + "step": 118200 + }, + { + "epoch": 347.94, + "learning_rate": 6.661868236584843e-06, + "loss": 0.1279, + "step": 118300 + }, + { + "epoch": 348.24, + "learning_rate": 6.656912493788296e-06, + "loss": 0.1223, + "step": 118400 + }, + { + "epoch": 348.53, + "learning_rate": 6.651954921809825e-06, + "loss": 0.1335, + "step": 118500 + }, + { + "epoch": 348.82, + "learning_rate": 6.64699552612244e-06, + "loss": 0.1201, + "step": 118600 + }, + { + "epoch": 349.12, + "learning_rate": 6.642034312201164e-06, + "loss": 0.1347, + "step": 118700 + }, + { + "epoch": 349.41, + "learning_rate": 6.637071285523029e-06, + "loss": 0.1183, + "step": 118800 + }, + { + "epoch": 349.71, + "learning_rate": 6.6321561088346606e-06, + "loss": 0.1266, + "step": 118900 + }, + { + "epoch": 350.0, + "learning_rate": 6.627189491072736e-06, + "loss": 0.1237, + "step": 119000 + }, + { + "epoch": 350.0, + "eval_cer": 0.07458262499455125, + "eval_loss": 0.4724867343902588, + "eval_runtime": 4.6268, + "eval_samples_per_second": 77.592, + "eval_steps_per_second": 2.594, + "eval_wer": 0.2817991294534902, + "step": 119000 + }, + { + "epoch": 350.29, + "learning_rate": 6.622221076942194e-06, + "loss": 0.1275, + "step": 119100 + }, + { + "epoch": 350.59, + "learning_rate": 6.617250871928014e-06, + "loss": 0.1247, + "step": 119200 + }, + { + "epoch": 350.88, + "learning_rate": 6.612278881517154e-06, + "loss": 0.1222, + "step": 119300 + }, + { + "epoch": 351.18, + "learning_rate": 6.607354857694247e-06, + "loss": 0.1243, + "step": 119400 + }, + { + "epoch": 351.47, + "learning_rate": 6.602379330675764e-06, + "loss": 0.1328, + "step": 119500 + }, + { + "epoch": 351.76, + "learning_rate": 6.5974020346783354e-06, + "loss": 0.1303, + "step": 119600 + }, + { + "epoch": 352.06, + "learning_rate": 6.592422975196755e-06, + "loss": 0.1245, + "step": 119700 + }, + { + "epoch": 352.35, + "learning_rate": 6.5874421577277505e-06, + "loss": 0.1286, + "step": 119800 + }, + { + "epoch": 352.65, + "learning_rate": 6.582459587769996e-06, + "loss": 0.1287, + "step": 119900 + }, + { + "epoch": 352.94, + "learning_rate": 6.577475270824101e-06, + "loss": 0.1278, + "step": 120000 + }, + { + "epoch": 352.94, + "eval_cer": 0.07379800357438647, + "eval_loss": 0.46413475275039673, + "eval_runtime": 4.9638, + "eval_samples_per_second": 72.324, + "eval_steps_per_second": 2.418, + "eval_wer": 0.2769627599548605, + "step": 120000 + }, + { + "epoch": 353.24, + "learning_rate": 6.572489212392604e-06, + "loss": 0.1223, + "step": 120100 + }, + { + "epoch": 353.53, + "learning_rate": 6.567501417979963e-06, + "loss": 0.1258, + "step": 120200 + }, + { + "epoch": 353.82, + "learning_rate": 6.562511893092552e-06, + "loss": 0.1242, + "step": 120300 + }, + { + "epoch": 354.12, + "learning_rate": 6.557520643238662e-06, + "loss": 0.1243, + "step": 120400 + }, + { + "epoch": 354.41, + "learning_rate": 6.552527673928481e-06, + "loss": 0.1278, + "step": 120500 + }, + { + "epoch": 354.71, + "learning_rate": 6.547532990674099e-06, + "loss": 0.1259, + "step": 120600 + }, + { + "epoch": 355.0, + "learning_rate": 6.5425365989894976e-06, + "loss": 0.122, + "step": 120700 + }, + { + "epoch": 355.29, + "learning_rate": 6.537538504390543e-06, + "loss": 0.1225, + "step": 120800 + }, + { + "epoch": 355.59, + "learning_rate": 6.532538712394982e-06, + "loss": 0.1256, + "step": 120900 + }, + { + "epoch": 355.88, + "learning_rate": 6.527537228522437e-06, + "loss": 0.1294, + "step": 121000 + }, + { + "epoch": 355.88, + "eval_cer": 0.07419031428446886, + "eval_loss": 0.4756881296634674, + "eval_runtime": 4.9381, + "eval_samples_per_second": 72.7, + "eval_steps_per_second": 2.43, + "eval_wer": 0.2790585200709334, + "step": 121000 + }, + { + "epoch": 356.18, + "learning_rate": 6.522534058294396e-06, + "loss": 0.1159, + "step": 121100 + }, + { + "epoch": 356.47, + "learning_rate": 6.51752920723421e-06, + "loss": 0.1259, + "step": 121200 + }, + { + "epoch": 356.76, + "learning_rate": 6.5125226808670865e-06, + "loss": 0.1215, + "step": 121300 + }, + { + "epoch": 357.06, + "learning_rate": 6.5075144847200775e-06, + "loss": 0.122, + "step": 121400 + }, + { + "epoch": 357.35, + "learning_rate": 6.502504624322086e-06, + "loss": 0.1248, + "step": 121500 + }, + { + "epoch": 357.65, + "learning_rate": 6.497493105203845e-06, + "loss": 0.1208, + "step": 121600 + }, + { + "epoch": 357.94, + "learning_rate": 6.492479932897925e-06, + "loss": 0.1218, + "step": 121700 + }, + { + "epoch": 358.24, + "learning_rate": 6.487515269276015e-06, + "loss": 0.1193, + "step": 121800 + }, + { + "epoch": 358.53, + "learning_rate": 6.482498823593491e-06, + "loss": 0.1177, + "step": 121900 + }, + { + "epoch": 358.82, + "learning_rate": 6.477480741276527e-06, + "loss": 0.1238, + "step": 122000 + }, + { + "epoch": 358.82, + "eval_cer": 0.07449544483675516, + "eval_loss": 0.48461535573005676, + "eval_runtime": 4.649, + "eval_samples_per_second": 77.221, + "eval_steps_per_second": 2.581, + "eval_wer": 0.2774463969047235, + "step": 122000 + }, + { + "epoch": 359.12, + "learning_rate": 6.472461027864931e-06, + "loss": 0.1186, + "step": 122100 + }, + { + "epoch": 359.41, + "learning_rate": 6.467439688900324e-06, + "loss": 0.1233, + "step": 122200 + }, + { + "epoch": 359.71, + "learning_rate": 6.46241672992611e-06, + "loss": 0.1199, + "step": 122300 + }, + { + "epoch": 360.0, + "learning_rate": 6.457392156487486e-06, + "loss": 0.1133, + "step": 122400 + }, + { + "epoch": 360.29, + "learning_rate": 6.452365974131434e-06, + "loss": 0.1211, + "step": 122500 + }, + { + "epoch": 360.59, + "learning_rate": 6.447338188406705e-06, + "loss": 0.1204, + "step": 122600 + }, + { + "epoch": 360.88, + "learning_rate": 6.442308804863825e-06, + "loss": 0.1291, + "step": 122700 + }, + { + "epoch": 361.18, + "learning_rate": 6.437277829055086e-06, + "loss": 0.1222, + "step": 122800 + }, + { + "epoch": 361.47, + "learning_rate": 6.432245266534533e-06, + "loss": 0.122, + "step": 122900 + }, + { + "epoch": 361.76, + "learning_rate": 6.4272111228579685e-06, + "loss": 0.1259, + "step": 123000 + }, + { + "epoch": 361.76, + "eval_cer": 0.07388518373218256, + "eval_loss": 0.47283557057380676, + "eval_runtime": 5.3824, + "eval_samples_per_second": 66.699, + "eval_steps_per_second": 2.23, + "eval_wer": 0.2774463969047235, + "step": 123000 + }, + { + "epoch": 362.06, + "learning_rate": 6.4221754035829305e-06, + "loss": 0.1164, + "step": 123100 + }, + { + "epoch": 362.35, + "learning_rate": 6.417138114268706e-06, + "loss": 0.1214, + "step": 123200 + }, + { + "epoch": 362.65, + "learning_rate": 6.412099260476314e-06, + "loss": 0.1232, + "step": 123300 + }, + { + "epoch": 362.94, + "learning_rate": 6.4070588477684956e-06, + "loss": 0.1279, + "step": 123400 + }, + { + "epoch": 363.24, + "learning_rate": 6.4020168817097175e-06, + "loss": 0.1245, + "step": 123500 + }, + { + "epoch": 363.53, + "learning_rate": 6.396973367866159e-06, + "loss": 0.1182, + "step": 123600 + }, + { + "epoch": 363.82, + "learning_rate": 6.391928311805709e-06, + "loss": 0.1142, + "step": 123700 + }, + { + "epoch": 364.12, + "learning_rate": 6.386881719097959e-06, + "loss": 0.1221, + "step": 123800 + }, + { + "epoch": 364.41, + "learning_rate": 6.3818335953141955e-06, + "loss": 0.1157, + "step": 123900 + }, + { + "epoch": 364.71, + "learning_rate": 6.376783946027399e-06, + "loss": 0.1188, + "step": 124000 + }, + { + "epoch": 364.71, + "eval_cer": 0.07558519680920622, + "eval_loss": 0.4801531732082367, + "eval_runtime": 4.7837, + "eval_samples_per_second": 75.046, + "eval_steps_per_second": 2.509, + "eval_wer": 0.2809930678703853, + "step": 124000 + }, + { + "epoch": 365.0, + "learning_rate": 6.37173277681223e-06, + "loss": 0.1251, + "step": 124100 + }, + { + "epoch": 365.29, + "learning_rate": 6.366680093245028e-06, + "loss": 0.1198, + "step": 124200 + }, + { + "epoch": 365.59, + "learning_rate": 6.361625900903804e-06, + "loss": 0.1168, + "step": 124300 + }, + { + "epoch": 365.88, + "learning_rate": 6.356570205368238e-06, + "loss": 0.1275, + "step": 124400 + }, + { + "epoch": 366.18, + "learning_rate": 6.3515130122196656e-06, + "loss": 0.121, + "step": 124500 + }, + { + "epoch": 366.47, + "learning_rate": 6.346454327041079e-06, + "loss": 0.1218, + "step": 124600 + }, + { + "epoch": 366.76, + "learning_rate": 6.341394155417111e-06, + "loss": 0.1177, + "step": 124700 + }, + { + "epoch": 367.06, + "learning_rate": 6.336332502934044e-06, + "loss": 0.1193, + "step": 124800 + }, + { + "epoch": 367.35, + "learning_rate": 6.331269375179788e-06, + "loss": 0.115, + "step": 124900 + }, + { + "epoch": 367.65, + "learning_rate": 6.3262047777438884e-06, + "loss": 0.1203, + "step": 125000 + }, + { + "epoch": 367.65, + "eval_cer": 0.07405954404777472, + "eval_loss": 0.4863865375518799, + "eval_runtime": 5.4102, + "eval_samples_per_second": 66.357, + "eval_steps_per_second": 2.218, + "eval_wer": 0.2761566983717556, + "step": 125000 + }, + { + "epoch": 367.94, + "learning_rate": 6.321138716217509e-06, + "loss": 0.1207, + "step": 125100 + }, + { + "epoch": 368.24, + "learning_rate": 6.31607119619343e-06, + "loss": 0.1183, + "step": 125200 + }, + { + "epoch": 368.53, + "learning_rate": 6.31100222326604e-06, + "loss": 0.1204, + "step": 125300 + }, + { + "epoch": 368.82, + "learning_rate": 6.305931803031335e-06, + "loss": 0.1168, + "step": 125400 + }, + { + "epoch": 369.12, + "learning_rate": 6.3008599410869085e-06, + "loss": 0.1181, + "step": 125500 + }, + { + "epoch": 369.41, + "learning_rate": 6.295786643031946e-06, + "loss": 0.1203, + "step": 125600 + }, + { + "epoch": 369.71, + "learning_rate": 6.290711914467214e-06, + "loss": 0.1233, + "step": 125700 + }, + { + "epoch": 370.0, + "learning_rate": 6.285635760995063e-06, + "loss": 0.1258, + "step": 125800 + }, + { + "epoch": 370.29, + "learning_rate": 6.280608970954318e-06, + "loss": 0.1191, + "step": 125900 + }, + { + "epoch": 370.59, + "learning_rate": 6.275529998589889e-06, + "loss": 0.1203, + "step": 126000 + }, + { + "epoch": 370.59, + "eval_cer": 0.07401595396887668, + "eval_loss": 0.4892123341560364, + "eval_runtime": 4.6022, + "eval_samples_per_second": 78.006, + "eval_steps_per_second": 2.607, + "eval_wer": 0.2769627599548605, + "step": 126000 + }, + { + "epoch": 370.88, + "learning_rate": 6.270449618078422e-06, + "loss": 0.1201, + "step": 126100 + }, + { + "epoch": 371.18, + "learning_rate": 6.2653678350285066e-06, + "loss": 0.1213, + "step": 126200 + }, + { + "epoch": 371.47, + "learning_rate": 6.260284655050277e-06, + "loss": 0.1264, + "step": 126300 + }, + { + "epoch": 371.76, + "learning_rate": 6.255200083755416e-06, + "loss": 0.1181, + "step": 126400 + }, + { + "epoch": 372.06, + "learning_rate": 6.250114126757135e-06, + "loss": 0.1226, + "step": 126500 + }, + { + "epoch": 372.35, + "learning_rate": 6.245026789670181e-06, + "loss": 0.1249, + "step": 126600 + }, + { + "epoch": 372.65, + "learning_rate": 6.239938078110822e-06, + "loss": 0.1211, + "step": 126700 + }, + { + "epoch": 372.94, + "learning_rate": 6.2348479976968425e-06, + "loss": 0.1227, + "step": 126800 + }, + { + "epoch": 373.24, + "learning_rate": 6.22975655404754e-06, + "loss": 0.1192, + "step": 126900 + }, + { + "epoch": 373.53, + "learning_rate": 6.224714687498088e-06, + "loss": 0.1167, + "step": 127000 + }, + { + "epoch": 373.53, + "eval_cer": 0.07475698531014341, + "eval_loss": 0.49567899107933044, + "eval_runtime": 5.3774, + "eval_samples_per_second": 66.761, + "eval_steps_per_second": 2.232, + "eval_wer": 0.28163791713686925, + "step": 127000 + }, + { + "epoch": 373.82, + "learning_rate": 6.21962054773413e-06, + "loss": 0.1229, + "step": 127100 + }, + { + "epoch": 374.12, + "learning_rate": 6.2145250615455e-06, + "loss": 0.1165, + "step": 127200 + }, + { + "epoch": 374.41, + "learning_rate": 6.209428234557462e-06, + "loss": 0.1258, + "step": 127300 + }, + { + "epoch": 374.71, + "learning_rate": 6.204330072396759e-06, + "loss": 0.1203, + "step": 127400 + }, + { + "epoch": 375.0, + "learning_rate": 6.199230580691613e-06, + "loss": 0.1226, + "step": 127500 + }, + { + "epoch": 375.29, + "learning_rate": 6.194129765071708e-06, + "loss": 0.1153, + "step": 127600 + }, + { + "epoch": 375.59, + "learning_rate": 6.189027631168194e-06, + "loss": 0.1205, + "step": 127700 + }, + { + "epoch": 375.88, + "learning_rate": 6.183924184613672e-06, + "loss": 0.1221, + "step": 127800 + }, + { + "epoch": 376.18, + "learning_rate": 6.178819431042198e-06, + "loss": 0.1199, + "step": 127900 + }, + { + "epoch": 376.47, + "learning_rate": 6.1737133760892655e-06, + "loss": 0.1173, + "step": 128000 + }, + { + "epoch": 376.47, + "eval_cer": 0.07462621507344928, + "eval_loss": 0.4890415072441101, + "eval_runtime": 4.8418, + "eval_samples_per_second": 74.147, + "eval_steps_per_second": 2.478, + "eval_wer": 0.2801870062872803, + "step": 128000 + }, + { + "epoch": 376.76, + "learning_rate": 6.168606025391807e-06, + "loss": 0.1158, + "step": 128100 + }, + { + "epoch": 377.06, + "learning_rate": 6.163497384588187e-06, + "loss": 0.1153, + "step": 128200 + }, + { + "epoch": 377.35, + "learning_rate": 6.158387459318186e-06, + "loss": 0.1216, + "step": 128300 + }, + { + "epoch": 377.65, + "learning_rate": 6.153276255223016e-06, + "loss": 0.1168, + "step": 128400 + }, + { + "epoch": 377.94, + "learning_rate": 6.148163777945292e-06, + "loss": 0.118, + "step": 128500 + }, + { + "epoch": 378.24, + "learning_rate": 6.143050033129035e-06, + "loss": 0.115, + "step": 128600 + }, + { + "epoch": 378.53, + "learning_rate": 6.137935026419669e-06, + "loss": 0.1152, + "step": 128700 + }, + { + "epoch": 378.82, + "learning_rate": 6.132818763464003e-06, + "loss": 0.1227, + "step": 128800 + }, + { + "epoch": 379.12, + "learning_rate": 6.127701249910245e-06, + "loss": 0.1223, + "step": 128900 + }, + { + "epoch": 379.41, + "learning_rate": 6.122582491407975e-06, + "loss": 0.1184, + "step": 129000 + }, + { + "epoch": 379.41, + "eval_cer": 0.07388518373218256, + "eval_loss": 0.4918311536312103, + "eval_runtime": 4.5282, + "eval_samples_per_second": 79.281, + "eval_steps_per_second": 2.65, + "eval_wer": 0.2737385136224408, + "step": 129000 + }, + { + "epoch": 379.71, + "learning_rate": 6.117462493608148e-06, + "loss": 0.1195, + "step": 129100 + }, + { + "epoch": 380.0, + "learning_rate": 6.112341262163092e-06, + "loss": 0.1158, + "step": 129200 + }, + { + "epoch": 380.29, + "learning_rate": 6.10721880272649e-06, + "loss": 0.1154, + "step": 129300 + }, + { + "epoch": 380.59, + "learning_rate": 6.102095120953385e-06, + "loss": 0.1211, + "step": 129400 + }, + { + "epoch": 380.88, + "learning_rate": 6.09697022250017e-06, + "loss": 0.1211, + "step": 129500 + }, + { + "epoch": 381.18, + "learning_rate": 6.091844113024581e-06, + "loss": 0.1209, + "step": 129600 + }, + { + "epoch": 381.47, + "learning_rate": 6.086716798185686e-06, + "loss": 0.1197, + "step": 129700 + }, + { + "epoch": 381.76, + "learning_rate": 6.081588283643892e-06, + "loss": 0.1169, + "step": 129800 + }, + { + "epoch": 382.06, + "learning_rate": 6.0764585750609215e-06, + "loss": 0.1198, + "step": 129900 + }, + { + "epoch": 382.35, + "learning_rate": 6.071327678099823e-06, + "loss": 0.1142, + "step": 130000 + }, + { + "epoch": 382.35, + "eval_cer": 0.07401595396887668, + "eval_loss": 0.4911036491394043, + "eval_runtime": 5.3976, + "eval_samples_per_second": 66.51, + "eval_steps_per_second": 2.223, + "eval_wer": 0.2774463969047235, + "step": 130000 + }, + { + "epoch": 382.65, + "learning_rate": 6.066195598424953e-06, + "loss": 0.1159, + "step": 130100 + }, + { + "epoch": 382.94, + "learning_rate": 6.0610623417019734e-06, + "loss": 0.1172, + "step": 130200 + }, + { + "epoch": 383.24, + "learning_rate": 6.055927913597847e-06, + "loss": 0.1167, + "step": 130300 + }, + { + "epoch": 383.53, + "learning_rate": 6.0507923197808275e-06, + "loss": 0.1167, + "step": 130400 + }, + { + "epoch": 383.82, + "learning_rate": 6.045655565920457e-06, + "loss": 0.1305, + "step": 130500 + }, + { + "epoch": 384.12, + "learning_rate": 6.040517657687562e-06, + "loss": 0.1127, + "step": 130600 + }, + { + "epoch": 384.41, + "learning_rate": 6.035378600754237e-06, + "loss": 0.1232, + "step": 130700 + }, + { + "epoch": 384.71, + "learning_rate": 6.030238400793849e-06, + "loss": 0.1166, + "step": 130800 + }, + { + "epoch": 385.0, + "learning_rate": 6.025097063481024e-06, + "loss": 0.1152, + "step": 130900 + }, + { + "epoch": 385.29, + "learning_rate": 6.019954594491645e-06, + "loss": 0.1118, + "step": 131000 + }, + { + "epoch": 385.29, + "eval_cer": 0.07610827775598274, + "eval_loss": 0.49062150716781616, + "eval_runtime": 4.4732, + "eval_samples_per_second": 80.256, + "eval_steps_per_second": 2.683, + "eval_wer": 0.2847009511526681, + "step": 131000 + }, + { + "epoch": 385.59, + "learning_rate": 6.014810999502842e-06, + "loss": 0.1142, + "step": 131100 + }, + { + "epoch": 385.88, + "learning_rate": 6.009666284192995e-06, + "loss": 0.1225, + "step": 131200 + }, + { + "epoch": 386.18, + "learning_rate": 6.004571918040052e-06, + "loss": 0.1195, + "step": 131300 + }, + { + "epoch": 386.47, + "learning_rate": 5.99942499018966e-06, + "loss": 0.1158, + "step": 131400 + }, + { + "epoch": 386.76, + "learning_rate": 5.994276959003917e-06, + "loss": 0.1169, + "step": 131500 + }, + { + "epoch": 387.06, + "learning_rate": 5.989127830166097e-06, + "loss": 0.1152, + "step": 131600 + }, + { + "epoch": 387.35, + "learning_rate": 5.983977609360683e-06, + "loss": 0.1156, + "step": 131700 + }, + { + "epoch": 387.65, + "learning_rate": 5.978826302273363e-06, + "loss": 0.1097, + "step": 131800 + }, + { + "epoch": 387.94, + "learning_rate": 5.973673914591029e-06, + "loss": 0.115, + "step": 131900 + }, + { + "epoch": 388.24, + "learning_rate": 5.968520452001762e-06, + "loss": 0.1156, + "step": 132000 + }, + { + "epoch": 388.24, + "eval_cer": 0.07462621507344928, + "eval_loss": 0.49032217264175415, + "eval_runtime": 4.9494, + "eval_samples_per_second": 72.533, + "eval_steps_per_second": 2.425, + "eval_wer": 0.2793809447041754, + "step": 132000 + }, + { + "epoch": 388.53, + "learning_rate": 5.963365920194832e-06, + "loss": 0.111, + "step": 132100 + }, + { + "epoch": 388.82, + "learning_rate": 5.958210324860687e-06, + "loss": 0.1128, + "step": 132200 + }, + { + "epoch": 389.12, + "learning_rate": 5.953053671690952e-06, + "loss": 0.1155, + "step": 132300 + }, + { + "epoch": 389.41, + "learning_rate": 5.947947548620953e-06, + "loss": 0.1136, + "step": 132400 + }, + { + "epoch": 389.71, + "learning_rate": 5.9427888072958684e-06, + "loss": 0.1123, + "step": 132500 + }, + { + "epoch": 390.0, + "learning_rate": 5.937629025160088e-06, + "loss": 0.12, + "step": 132600 + }, + { + "epoch": 390.29, + "learning_rate": 5.9324682079098565e-06, + "loss": 0.1158, + "step": 132700 + }, + { + "epoch": 390.59, + "learning_rate": 5.927306361242563e-06, + "loss": 0.1151, + "step": 132800 + }, + { + "epoch": 390.88, + "learning_rate": 5.922143490856731e-06, + "loss": 0.1119, + "step": 132900 + }, + { + "epoch": 391.18, + "learning_rate": 5.9169796024520155e-06, + "loss": 0.1102, + "step": 133000 + }, + { + "epoch": 391.18, + "eval_cer": 0.07471339523124537, + "eval_loss": 0.5015389919281006, + "eval_runtime": 4.6902, + "eval_samples_per_second": 76.543, + "eval_steps_per_second": 2.559, + "eval_wer": 0.27889730775431243, + "step": 133000 + }, + { + "epoch": 391.47, + "learning_rate": 5.911814701729196e-06, + "loss": 0.1132, + "step": 133100 + }, + { + "epoch": 391.76, + "learning_rate": 5.906648794390167e-06, + "loss": 0.1146, + "step": 133200 + }, + { + "epoch": 392.06, + "learning_rate": 5.9014818861379375e-06, + "loss": 0.112, + "step": 133300 + }, + { + "epoch": 392.35, + "learning_rate": 5.89631398267662e-06, + "loss": 0.1116, + "step": 133400 + }, + { + "epoch": 392.65, + "learning_rate": 5.891145089711425e-06, + "loss": 0.1121, + "step": 133500 + }, + { + "epoch": 392.94, + "learning_rate": 5.885975212948656e-06, + "loss": 0.1157, + "step": 133600 + }, + { + "epoch": 393.24, + "learning_rate": 5.880804358095702e-06, + "loss": 0.1101, + "step": 133700 + }, + { + "epoch": 393.53, + "learning_rate": 5.875632530861034e-06, + "loss": 0.1167, + "step": 133800 + }, + { + "epoch": 393.82, + "learning_rate": 5.870511469659539e-06, + "loss": 0.1119, + "step": 133900 + }, + { + "epoch": 394.12, + "learning_rate": 5.8653377243724815e-06, + "loss": 0.1191, + "step": 134000 + }, + { + "epoch": 394.12, + "eval_cer": 0.07475698531014341, + "eval_loss": 0.5096559524536133, + "eval_runtime": 5.1149, + "eval_samples_per_second": 70.188, + "eval_steps_per_second": 2.346, + "eval_wer": 0.2779300338545865, + "step": 134000 + }, + { + "epoch": 394.41, + "learning_rate": 5.86016302377841e-06, + "loss": 0.1136, + "step": 134100 + }, + { + "epoch": 394.71, + "learning_rate": 5.854987373590043e-06, + "loss": 0.1159, + "step": 134200 + }, + { + "epoch": 395.0, + "learning_rate": 5.8498107795211376e-06, + "loss": 0.1145, + "step": 134300 + }, + { + "epoch": 395.29, + "learning_rate": 5.8446332472865054e-06, + "loss": 0.1102, + "step": 134400 + }, + { + "epoch": 395.59, + "learning_rate": 5.839454782601983e-06, + "loss": 0.1104, + "step": 134500 + }, + { + "epoch": 395.88, + "learning_rate": 5.834275391184444e-06, + "loss": 0.1101, + "step": 134600 + }, + { + "epoch": 396.18, + "learning_rate": 5.829095078751781e-06, + "loss": 0.1105, + "step": 134700 + }, + { + "epoch": 396.47, + "learning_rate": 5.823913851022901e-06, + "loss": 0.1167, + "step": 134800 + }, + { + "epoch": 396.76, + "learning_rate": 5.818731713717729e-06, + "loss": 0.1175, + "step": 134900 + }, + { + "epoch": 397.06, + "learning_rate": 5.813548672557189e-06, + "loss": 0.1129, + "step": 135000 + }, + { + "epoch": 397.06, + "eval_cer": 0.07366723333769234, + "eval_loss": 0.5002287030220032, + "eval_runtime": 5.5456, + "eval_samples_per_second": 64.736, + "eval_steps_per_second": 2.164, + "eval_wer": 0.2763179106883766, + "step": 135000 + }, + { + "epoch": 397.35, + "learning_rate": 5.808364733263202e-06, + "loss": 0.1121, + "step": 135100 + }, + { + "epoch": 397.65, + "learning_rate": 5.803179901558684e-06, + "loss": 0.1149, + "step": 135200 + }, + { + "epoch": 397.94, + "learning_rate": 5.797994183167534e-06, + "loss": 0.1112, + "step": 135300 + }, + { + "epoch": 398.24, + "learning_rate": 5.792807583814628e-06, + "loss": 0.1118, + "step": 135400 + }, + { + "epoch": 398.53, + "learning_rate": 5.787620109225819e-06, + "loss": 0.1175, + "step": 135500 + }, + { + "epoch": 398.82, + "learning_rate": 5.782431765127925e-06, + "loss": 0.1092, + "step": 135600 + }, + { + "epoch": 399.12, + "learning_rate": 5.777242557248722e-06, + "loss": 0.1143, + "step": 135700 + }, + { + "epoch": 399.41, + "learning_rate": 5.772052491316941e-06, + "loss": 0.1126, + "step": 135800 + }, + { + "epoch": 399.71, + "learning_rate": 5.766861573062257e-06, + "loss": 0.1176, + "step": 135900 + }, + { + "epoch": 400.0, + "learning_rate": 5.761669808215291e-06, + "loss": 0.1097, + "step": 136000 + }, + { + "epoch": 400.0, + "eval_cer": 0.07488775554683753, + "eval_loss": 0.5063867568969727, + "eval_runtime": 4.6813, + "eval_samples_per_second": 76.689, + "eval_steps_per_second": 2.563, + "eval_wer": 0.2809930678703853, + "step": 136000 + }, + { + "epoch": 400.29, + "learning_rate": 5.756477202507598e-06, + "loss": 0.1192, + "step": 136100 + }, + { + "epoch": 400.59, + "learning_rate": 5.751283761671659e-06, + "loss": 0.1035, + "step": 136200 + }, + { + "epoch": 400.88, + "learning_rate": 5.746089491440875e-06, + "loss": 0.1048, + "step": 136300 + }, + { + "epoch": 401.18, + "learning_rate": 5.740894397549567e-06, + "loss": 0.106, + "step": 136400 + }, + { + "epoch": 401.47, + "learning_rate": 5.735698485732963e-06, + "loss": 0.1065, + "step": 136500 + }, + { + "epoch": 401.76, + "learning_rate": 5.730501761727196e-06, + "loss": 0.1117, + "step": 136600 + }, + { + "epoch": 402.06, + "learning_rate": 5.725304231269293e-06, + "loss": 0.1157, + "step": 136700 + }, + { + "epoch": 402.35, + "learning_rate": 5.720105900097174e-06, + "loss": 0.1119, + "step": 136800 + }, + { + "epoch": 402.65, + "learning_rate": 5.7149067739496375e-06, + "loss": 0.1088, + "step": 136900 + }, + { + "epoch": 402.94, + "learning_rate": 5.709706858566368e-06, + "loss": 0.1049, + "step": 137000 + }, + { + "epoch": 402.94, + "eval_cer": 0.07288261191752757, + "eval_loss": 0.497284859418869, + "eval_runtime": 4.9493, + "eval_samples_per_second": 72.535, + "eval_steps_per_second": 2.425, + "eval_wer": 0.2732548766725778, + "step": 137000 + }, + { + "epoch": 403.24, + "learning_rate": 5.704506159687914e-06, + "loss": 0.1091, + "step": 137100 + }, + { + "epoch": 403.53, + "learning_rate": 5.699304683055693e-06, + "loss": 0.1183, + "step": 137200 + }, + { + "epoch": 403.82, + "learning_rate": 5.69410243441198e-06, + "loss": 0.1084, + "step": 137300 + }, + { + "epoch": 404.12, + "learning_rate": 5.6888994194999015e-06, + "loss": 0.1108, + "step": 137400 + }, + { + "epoch": 404.41, + "learning_rate": 5.683695644063432e-06, + "loss": 0.1056, + "step": 137500 + }, + { + "epoch": 404.71, + "learning_rate": 5.6784911138473804e-06, + "loss": 0.1134, + "step": 137600 + }, + { + "epoch": 405.0, + "learning_rate": 5.6732858345973975e-06, + "loss": 0.113, + "step": 137700 + }, + { + "epoch": 405.29, + "learning_rate": 5.6680798120599556e-06, + "loss": 0.1164, + "step": 137800 + }, + { + "epoch": 405.59, + "learning_rate": 5.662873051982345e-06, + "loss": 0.117, + "step": 137900 + }, + { + "epoch": 405.88, + "learning_rate": 5.657665560112675e-06, + "loss": 0.117, + "step": 138000 + }, + { + "epoch": 405.88, + "eval_cer": 0.0742339043633669, + "eval_loss": 0.5041438341140747, + "eval_runtime": 5.2679, + "eval_samples_per_second": 68.149, + "eval_steps_per_second": 2.278, + "eval_wer": 0.2790585200709334, + "step": 138000 + }, + { + "epoch": 406.18, + "learning_rate": 5.652457342199862e-06, + "loss": 0.1129, + "step": 138100 + }, + { + "epoch": 406.47, + "learning_rate": 5.647248403993621e-06, + "loss": 0.1138, + "step": 138200 + }, + { + "epoch": 406.76, + "learning_rate": 5.642038751244467e-06, + "loss": 0.1099, + "step": 138300 + }, + { + "epoch": 407.06, + "learning_rate": 5.636828389703699e-06, + "loss": 0.1094, + "step": 138400 + }, + { + "epoch": 407.35, + "learning_rate": 5.631617325123402e-06, + "loss": 0.1055, + "step": 138500 + }, + { + "epoch": 407.65, + "learning_rate": 5.626405563256434e-06, + "loss": 0.1122, + "step": 138600 + }, + { + "epoch": 407.94, + "learning_rate": 5.62124523779462e-06, + "loss": 0.1102, + "step": 138700 + }, + { + "epoch": 408.24, + "learning_rate": 5.616032105445265e-06, + "loss": 0.1095, + "step": 138800 + }, + { + "epoch": 408.53, + "learning_rate": 5.610818293014856e-06, + "loss": 0.1117, + "step": 138900 + }, + { + "epoch": 408.82, + "learning_rate": 5.605603806259288e-06, + "loss": 0.1082, + "step": 139000 + }, + { + "epoch": 408.82, + "eval_cer": 0.07218517065515889, + "eval_loss": 0.5032652616500854, + "eval_runtime": 4.4402, + "eval_samples_per_second": 80.853, + "eval_steps_per_second": 2.703, + "eval_wer": 0.2713203288731259, + "step": 139000 + }, + { + "epoch": 409.12, + "learning_rate": 5.600388650935198e-06, + "loss": 0.1117, + "step": 139100 + }, + { + "epoch": 409.41, + "learning_rate": 5.595172832799962e-06, + "loss": 0.1055, + "step": 139200 + }, + { + "epoch": 409.71, + "learning_rate": 5.589956357611688e-06, + "loss": 0.1079, + "step": 139300 + }, + { + "epoch": 410.0, + "learning_rate": 5.584739231129208e-06, + "loss": 0.1094, + "step": 139400 + }, + { + "epoch": 410.29, + "learning_rate": 5.579521459112074e-06, + "loss": 0.1046, + "step": 139500 + }, + { + "epoch": 410.59, + "learning_rate": 5.574303047320551e-06, + "loss": 0.1145, + "step": 139600 + }, + { + "epoch": 410.88, + "learning_rate": 5.569136195093107e-06, + "loss": 0.1112, + "step": 139700 + }, + { + "epoch": 411.18, + "learning_rate": 5.563916527290414e-06, + "loss": 0.1119, + "step": 139800 + }, + { + "epoch": 411.47, + "learning_rate": 5.558696236940708e-06, + "loss": 0.1083, + "step": 139900 + }, + { + "epoch": 411.76, + "learning_rate": 5.553475329807039e-06, + "loss": 0.1119, + "step": 140000 + }, + { + "epoch": 411.76, + "eval_cer": 0.073318512706508, + "eval_loss": 0.5045868754386902, + "eval_runtime": 4.7184, + "eval_samples_per_second": 76.085, + "eval_steps_per_second": 2.543, + "eval_wer": 0.27518942447202965, + "step": 140000 + }, + { + "epoch": 412.06, + "learning_rate": 5.548253811653128e-06, + "loss": 0.1071, + "step": 140100 + }, + { + "epoch": 412.35, + "learning_rate": 5.543031688243378e-06, + "loss": 0.1126, + "step": 140200 + }, + { + "epoch": 412.65, + "learning_rate": 5.537808965342856e-06, + "loss": 0.1018, + "step": 140300 + }, + { + "epoch": 412.94, + "learning_rate": 5.5325856487172936e-06, + "loss": 0.1087, + "step": 140400 + }, + { + "epoch": 413.24, + "learning_rate": 5.527361744133073e-06, + "loss": 0.1081, + "step": 140500 + }, + { + "epoch": 413.53, + "learning_rate": 5.522137257357233e-06, + "loss": 0.108, + "step": 140600 + }, + { + "epoch": 413.82, + "learning_rate": 5.516912194157449e-06, + "loss": 0.1138, + "step": 140700 + }, + { + "epoch": 414.12, + "learning_rate": 5.5116865603020355e-06, + "loss": 0.1073, + "step": 140800 + }, + { + "epoch": 414.41, + "learning_rate": 5.5064603615599364e-06, + "loss": 0.1084, + "step": 140900 + }, + { + "epoch": 414.71, + "learning_rate": 5.5012336037007165e-06, + "loss": 0.113, + "step": 141000 + }, + { + "epoch": 414.71, + "eval_cer": 0.0739287738110806, + "eval_loss": 0.5068278908729553, + "eval_runtime": 4.4954, + "eval_samples_per_second": 79.86, + "eval_steps_per_second": 2.669, + "eval_wer": 0.27712397227148156, + "step": 141000 + }, + { + "epoch": 415.0, + "learning_rate": 5.496006292494563e-06, + "loss": 0.1068, + "step": 141100 + }, + { + "epoch": 415.29, + "learning_rate": 5.490778433712272e-06, + "loss": 0.1119, + "step": 141200 + }, + { + "epoch": 415.59, + "learning_rate": 5.485550033125242e-06, + "loss": 0.1073, + "step": 141300 + }, + { + "epoch": 415.88, + "learning_rate": 5.480321096505472e-06, + "loss": 0.1052, + "step": 141400 + }, + { + "epoch": 416.18, + "learning_rate": 5.475091629625551e-06, + "loss": 0.1095, + "step": 141500 + }, + { + "epoch": 416.47, + "learning_rate": 5.469861638258653e-06, + "loss": 0.1113, + "step": 141600 + }, + { + "epoch": 416.76, + "learning_rate": 5.4646311281785355e-06, + "loss": 0.1081, + "step": 141700 + }, + { + "epoch": 417.06, + "learning_rate": 5.459400105159525e-06, + "loss": 0.1029, + "step": 141800 + }, + { + "epoch": 417.35, + "learning_rate": 5.454168574976514e-06, + "loss": 0.1133, + "step": 141900 + }, + { + "epoch": 417.65, + "learning_rate": 5.4489365434049535e-06, + "loss": 0.1091, + "step": 142000 + }, + { + "epoch": 417.65, + "eval_cer": 0.07275184168083344, + "eval_loss": 0.5030051469802856, + "eval_runtime": 5.6004, + "eval_samples_per_second": 64.103, + "eval_steps_per_second": 2.143, + "eval_wer": 0.2748669998387877, + "step": 142000 + }, + { + "epoch": 417.94, + "learning_rate": 5.443704016220852e-06, + "loss": 0.1109, + "step": 142100 + }, + { + "epoch": 418.24, + "learning_rate": 5.438470999200765e-06, + "loss": 0.1039, + "step": 142200 + }, + { + "epoch": 418.53, + "learning_rate": 5.433237498121785e-06, + "loss": 0.1073, + "step": 142300 + }, + { + "epoch": 418.82, + "learning_rate": 5.428003518761542e-06, + "loss": 0.1132, + "step": 142400 + }, + { + "epoch": 419.12, + "learning_rate": 5.422769066898191e-06, + "loss": 0.1089, + "step": 142500 + }, + { + "epoch": 419.41, + "learning_rate": 5.417534148310413e-06, + "loss": 0.1145, + "step": 142600 + }, + { + "epoch": 419.71, + "learning_rate": 5.412298768777399e-06, + "loss": 0.1076, + "step": 142700 + }, + { + "epoch": 420.0, + "learning_rate": 5.407062934078855e-06, + "loss": 0.106, + "step": 142800 + }, + { + "epoch": 420.29, + "learning_rate": 5.401826649994986e-06, + "loss": 0.1088, + "step": 142900 + }, + { + "epoch": 420.59, + "learning_rate": 5.39658992230649e-06, + "loss": 0.1079, + "step": 143000 + }, + { + "epoch": 420.59, + "eval_cer": 0.0736236432587943, + "eval_loss": 0.5185303688049316, + "eval_runtime": 4.7112, + "eval_samples_per_second": 76.202, + "eval_steps_per_second": 2.547, + "eval_wer": 0.27551184910527166, + "step": 143000 + }, + { + "epoch": 420.88, + "learning_rate": 5.39135275679456e-06, + "loss": 0.1097, + "step": 143100 + }, + { + "epoch": 421.18, + "learning_rate": 5.38611515924087e-06, + "loss": 0.108, + "step": 143200 + }, + { + "epoch": 421.47, + "learning_rate": 5.380877135427571e-06, + "loss": 0.107, + "step": 143300 + }, + { + "epoch": 421.76, + "learning_rate": 5.3756386911372885e-06, + "loss": 0.1098, + "step": 143400 + }, + { + "epoch": 422.06, + "learning_rate": 5.370399832153105e-06, + "loss": 0.1081, + "step": 143500 + }, + { + "epoch": 422.35, + "learning_rate": 5.365160564258564e-06, + "loss": 0.1028, + "step": 143600 + }, + { + "epoch": 422.65, + "learning_rate": 5.359920893237661e-06, + "loss": 0.1014, + "step": 143700 + }, + { + "epoch": 422.94, + "learning_rate": 5.354680824874838e-06, + "loss": 0.1069, + "step": 143800 + }, + { + "epoch": 423.24, + "learning_rate": 5.349440364954974e-06, + "loss": 0.1084, + "step": 143900 + }, + { + "epoch": 423.53, + "learning_rate": 5.34419951926338e-06, + "loss": 0.1076, + "step": 144000 + }, + { + "epoch": 423.53, + "eval_cer": 0.07405954404777472, + "eval_loss": 0.5147412419319153, + "eval_runtime": 4.5037, + "eval_samples_per_second": 79.712, + "eval_steps_per_second": 2.664, + "eval_wer": 0.2785748831210704, + "step": 144000 + }, + { + "epoch": 423.82, + "learning_rate": 5.338958293585792e-06, + "loss": 0.1043, + "step": 144100 + }, + { + "epoch": 424.12, + "learning_rate": 5.33376911154043e-06, + "loss": 0.1108, + "step": 144200 + }, + { + "epoch": 424.41, + "learning_rate": 5.328527146905228e-06, + "loss": 0.1142, + "step": 144300 + }, + { + "epoch": 424.71, + "learning_rate": 5.3232848195858635e-06, + "loss": 0.1071, + "step": 144400 + }, + { + "epoch": 425.0, + "learning_rate": 5.3180421353697085e-06, + "loss": 0.1034, + "step": 144500 + }, + { + "epoch": 425.29, + "learning_rate": 5.312799100044533e-06, + "loss": 0.1069, + "step": 144600 + }, + { + "epoch": 425.59, + "learning_rate": 5.3075557193984864e-06, + "loss": 0.1037, + "step": 144700 + }, + { + "epoch": 425.88, + "learning_rate": 5.302311999220111e-06, + "loss": 0.108, + "step": 144800 + }, + { + "epoch": 426.18, + "learning_rate": 5.297067945298313e-06, + "loss": 0.1121, + "step": 144900 + }, + { + "epoch": 426.47, + "learning_rate": 5.291823563422372e-06, + "loss": 0.107, + "step": 145000 + }, + { + "epoch": 426.47, + "eval_cer": 0.07292620199642562, + "eval_loss": 0.5176792740821838, + "eval_runtime": 4.7997, + "eval_samples_per_second": 74.796, + "eval_steps_per_second": 2.5, + "eval_wer": 0.2737385136224408, + "step": 145000 + }, + { + "epoch": 426.76, + "learning_rate": 5.28657885938193e-06, + "loss": 0.1021, + "step": 145100 + }, + { + "epoch": 427.06, + "learning_rate": 5.281333838966982e-06, + "loss": 0.1001, + "step": 145200 + }, + { + "epoch": 427.35, + "learning_rate": 5.276088507967876e-06, + "loss": 0.1103, + "step": 145300 + }, + { + "epoch": 427.65, + "learning_rate": 5.2708428721752995e-06, + "loss": 0.1074, + "step": 145400 + }, + { + "epoch": 427.94, + "learning_rate": 5.265596937380277e-06, + "loss": 0.1005, + "step": 145500 + }, + { + "epoch": 428.24, + "learning_rate": 5.260350709374167e-06, + "loss": 0.1044, + "step": 145600 + }, + { + "epoch": 428.53, + "learning_rate": 5.255104193948646e-06, + "loss": 0.1069, + "step": 145700 + }, + { + "epoch": 428.82, + "learning_rate": 5.24985739689571e-06, + "loss": 0.1122, + "step": 145800 + }, + { + "epoch": 429.12, + "learning_rate": 5.2446103240076685e-06, + "loss": 0.1052, + "step": 145900 + }, + { + "epoch": 429.41, + "learning_rate": 5.239362981077132e-06, + "loss": 0.1082, + "step": 146000 + }, + { + "epoch": 429.41, + "eval_cer": 0.07344928294320213, + "eval_loss": 0.51496821641922, + "eval_runtime": 4.8758, + "eval_samples_per_second": 73.63, + "eval_steps_per_second": 2.461, + "eval_wer": 0.2764791230049976, + "step": 146000 + }, + { + "epoch": 429.71, + "learning_rate": 5.23411537389701e-06, + "loss": 0.1047, + "step": 146100 + }, + { + "epoch": 430.0, + "learning_rate": 5.2288675082605045e-06, + "loss": 0.1101, + "step": 146200 + }, + { + "epoch": 430.29, + "learning_rate": 5.223619389961103e-06, + "loss": 0.1032, + "step": 146300 + }, + { + "epoch": 430.59, + "learning_rate": 5.218371024792572e-06, + "loss": 0.0983, + "step": 146400 + }, + { + "epoch": 430.88, + "learning_rate": 5.213122418548948e-06, + "loss": 0.1118, + "step": 146500 + }, + { + "epoch": 431.18, + "learning_rate": 5.2078735770245385e-06, + "loss": 0.1063, + "step": 146600 + }, + { + "epoch": 431.47, + "learning_rate": 5.202624506013904e-06, + "loss": 0.1084, + "step": 146700 + }, + { + "epoch": 431.76, + "learning_rate": 5.197375211311864e-06, + "loss": 0.1056, + "step": 146800 + }, + { + "epoch": 432.06, + "learning_rate": 5.192178194899027e-06, + "loss": 0.1106, + "step": 146900 + }, + { + "epoch": 432.35, + "learning_rate": 5.186928472291934e-06, + "loss": 0.1018, + "step": 147000 + }, + { + "epoch": 432.35, + "eval_cer": 0.07375441349548843, + "eval_loss": 0.5148587822914124, + "eval_runtime": 5.1845, + "eval_samples_per_second": 69.245, + "eval_steps_per_second": 2.315, + "eval_wer": 0.2742221505723037, + "step": 147000 + }, + { + "epoch": 432.65, + "learning_rate": 5.181678543321391e-06, + "loss": 0.1075, + "step": 147100 + }, + { + "epoch": 432.94, + "learning_rate": 5.176428413783156e-06, + "loss": 0.1031, + "step": 147200 + }, + { + "epoch": 433.24, + "learning_rate": 5.171178089473222e-06, + "loss": 0.1064, + "step": 147300 + }, + { + "epoch": 433.53, + "learning_rate": 5.165927576187788e-06, + "loss": 0.1091, + "step": 147400 + }, + { + "epoch": 433.82, + "learning_rate": 5.160676879723263e-06, + "loss": 0.1027, + "step": 147500 + }, + { + "epoch": 434.12, + "learning_rate": 5.155426005876261e-06, + "loss": 0.1088, + "step": 147600 + }, + { + "epoch": 434.41, + "learning_rate": 5.150174960443588e-06, + "loss": 0.1016, + "step": 147700 + }, + { + "epoch": 434.71, + "learning_rate": 5.14492374922224e-06, + "loss": 0.1046, + "step": 147800 + }, + { + "epoch": 435.0, + "learning_rate": 5.139672378009402e-06, + "loss": 0.1044, + "step": 147900 + }, + { + "epoch": 435.29, + "learning_rate": 5.134420852602428e-06, + "loss": 0.1028, + "step": 148000 + }, + { + "epoch": 435.29, + "eval_cer": 0.07292620199642562, + "eval_loss": 0.5164076685905457, + "eval_runtime": 5.4, + "eval_samples_per_second": 66.482, + "eval_steps_per_second": 2.222, + "eval_wer": 0.2748669998387877, + "step": 148000 + }, + { + "epoch": 435.59, + "learning_rate": 5.129169178798846e-06, + "loss": 0.1016, + "step": 148100 + }, + { + "epoch": 435.88, + "learning_rate": 5.1239173623963465e-06, + "loss": 0.1081, + "step": 148200 + }, + { + "epoch": 436.18, + "learning_rate": 5.118665409192778e-06, + "loss": 0.1082, + "step": 148300 + }, + { + "epoch": 436.47, + "learning_rate": 5.113465846457636e-06, + "loss": 0.0973, + "step": 148400 + }, + { + "epoch": 436.76, + "learning_rate": 5.108213638269423e-06, + "loss": 0.1, + "step": 148500 + }, + { + "epoch": 437.06, + "learning_rate": 5.102961310616583e-06, + "loss": 0.1126, + "step": 148600 + }, + { + "epoch": 437.35, + "learning_rate": 5.09770886929753e-06, + "loss": 0.096, + "step": 148700 + }, + { + "epoch": 437.65, + "learning_rate": 5.092456320110802e-06, + "loss": 0.1005, + "step": 148800 + }, + { + "epoch": 437.94, + "learning_rate": 5.087203668855059e-06, + "loss": 0.1019, + "step": 148900 + }, + { + "epoch": 438.24, + "learning_rate": 5.081950921329067e-06, + "loss": 0.1031, + "step": 149000 + }, + { + "epoch": 438.24, + "eval_cer": 0.07318774246981387, + "eval_loss": 0.5136764049530029, + "eval_runtime": 5.3659, + "eval_samples_per_second": 66.903, + "eval_steps_per_second": 2.236, + "eval_wer": 0.2747057875221667, + "step": 149000 + }, + { + "epoch": 438.53, + "learning_rate": 5.076698083331706e-06, + "loss": 0.1097, + "step": 149100 + }, + { + "epoch": 438.82, + "learning_rate": 5.07144516066195e-06, + "loss": 0.1034, + "step": 149200 + }, + { + "epoch": 439.12, + "learning_rate": 5.066192159118869e-06, + "loss": 0.1075, + "step": 149300 + }, + { + "epoch": 439.41, + "learning_rate": 5.060939084501621e-06, + "loss": 0.1065, + "step": 149400 + }, + { + "epoch": 439.71, + "learning_rate": 5.055685942609444e-06, + "loss": 0.1049, + "step": 149500 + }, + { + "epoch": 440.0, + "learning_rate": 5.050432739241649e-06, + "loss": 0.1031, + "step": 149600 + }, + { + "epoch": 440.29, + "learning_rate": 5.045179480197614e-06, + "loss": 0.1079, + "step": 149700 + }, + { + "epoch": 440.59, + "learning_rate": 5.039926171276781e-06, + "loss": 0.1001, + "step": 149800 + }, + { + "epoch": 440.88, + "learning_rate": 5.03467281827865e-06, + "loss": 0.1063, + "step": 149900 + }, + { + "epoch": 441.18, + "learning_rate": 5.02941942700276e-06, + "loss": 0.1101, + "step": 150000 + }, + { + "epoch": 441.18, + "eval_cer": 0.0720979904973628, + "eval_loss": 0.5085006356239319, + "eval_runtime": 4.5834, + "eval_samples_per_second": 78.325, + "eval_steps_per_second": 2.618, + "eval_wer": 0.27035305497339995, + "step": 150000 + }, + { + "epoch": 441.47, + "learning_rate": 5.024166003248703e-06, + "loss": 0.1019, + "step": 150100 + }, + { + "epoch": 441.76, + "learning_rate": 5.018912552816099e-06, + "loss": 0.1026, + "step": 150200 + }, + { + "epoch": 442.06, + "learning_rate": 5.0136590815046005e-06, + "loss": 0.1031, + "step": 150300 + }, + { + "epoch": 442.35, + "learning_rate": 5.008405595113883e-06, + "loss": 0.1048, + "step": 150400 + }, + { + "epoch": 442.65, + "learning_rate": 5.003152099443643e-06, + "loss": 0.1062, + "step": 150500 + }, + { + "epoch": 442.94, + "learning_rate": 4.997898600293576e-06, + "loss": 0.1024, + "step": 150600 + }, + { + "epoch": 443.24, + "learning_rate": 4.992645103463394e-06, + "loss": 0.106, + "step": 150700 + }, + { + "epoch": 443.53, + "learning_rate": 4.9873916147527965e-06, + "loss": 0.1097, + "step": 150800 + }, + { + "epoch": 443.82, + "learning_rate": 4.9821381399614795e-06, + "loss": 0.1016, + "step": 150900 + }, + { + "epoch": 444.12, + "learning_rate": 4.976937219323197e-06, + "loss": 0.1037, + "step": 151000 + }, + { + "epoch": 444.12, + "eval_cer": 0.07188004010287259, + "eval_loss": 0.5222977995872498, + "eval_runtime": 5.3886, + "eval_samples_per_second": 66.622, + "eval_steps_per_second": 2.227, + "eval_wer": 0.2709979042398839, + "step": 151000 + }, + { + "epoch": 444.41, + "learning_rate": 4.971683789485565e-06, + "loss": 0.1015, + "step": 151100 + }, + { + "epoch": 444.71, + "learning_rate": 4.966430390908183e-06, + "loss": 0.1074, + "step": 151200 + }, + { + "epoch": 445.0, + "learning_rate": 4.961177029390647e-06, + "loss": 0.0986, + "step": 151300 + }, + { + "epoch": 445.29, + "learning_rate": 4.955923710732511e-06, + "loss": 0.1052, + "step": 151400 + }, + { + "epoch": 445.59, + "learning_rate": 4.950670440733284e-06, + "loss": 0.1072, + "step": 151500 + }, + { + "epoch": 445.88, + "learning_rate": 4.945417225192419e-06, + "loss": 0.1041, + "step": 151600 + }, + { + "epoch": 446.18, + "learning_rate": 4.940164069909305e-06, + "loss": 0.101, + "step": 151700 + }, + { + "epoch": 446.47, + "learning_rate": 4.934910980683273e-06, + "loss": 0.105, + "step": 151800 + }, + { + "epoch": 446.76, + "learning_rate": 4.929657963313573e-06, + "loss": 0.1043, + "step": 151900 + }, + { + "epoch": 447.06, + "learning_rate": 4.924405023599384e-06, + "loss": 0.101, + "step": 152000 + }, + { + "epoch": 447.06, + "eval_cer": 0.07257748136524127, + "eval_loss": 0.5275741815567017, + "eval_runtime": 4.7697, + "eval_samples_per_second": 75.267, + "eval_steps_per_second": 2.516, + "eval_wer": 0.2745445752055457, + "step": 152000 + }, + { + "epoch": 447.35, + "learning_rate": 4.919152167339793e-06, + "loss": 0.1, + "step": 152100 + }, + { + "epoch": 447.65, + "learning_rate": 4.913899400333793e-06, + "loss": 0.1068, + "step": 152200 + }, + { + "epoch": 447.94, + "learning_rate": 4.908646728380285e-06, + "loss": 0.1072, + "step": 152300 + }, + { + "epoch": 448.24, + "learning_rate": 4.90339415727806e-06, + "loss": 0.0946, + "step": 152400 + }, + { + "epoch": 448.53, + "learning_rate": 4.898141692825804e-06, + "loss": 0.1033, + "step": 152500 + }, + { + "epoch": 448.82, + "learning_rate": 4.892889340822079e-06, + "loss": 0.1096, + "step": 152600 + }, + { + "epoch": 449.12, + "learning_rate": 4.88763710706532e-06, + "loss": 0.0976, + "step": 152700 + }, + { + "epoch": 449.41, + "learning_rate": 4.882384997353843e-06, + "loss": 0.1001, + "step": 152800 + }, + { + "epoch": 449.71, + "learning_rate": 4.877133017485817e-06, + "loss": 0.1071, + "step": 152900 + }, + { + "epoch": 450.0, + "learning_rate": 4.871881173259271e-06, + "loss": 0.11, + "step": 153000 + }, + { + "epoch": 450.0, + "eval_cer": 0.07144413931389215, + "eval_loss": 0.5202327370643616, + "eval_runtime": 4.6964, + "eval_samples_per_second": 76.442, + "eval_steps_per_second": 2.555, + "eval_wer": 0.2680960825407061, + "step": 153000 + }, + { + "epoch": 450.29, + "learning_rate": 4.866629470472086e-06, + "loss": 0.0997, + "step": 153100 + }, + { + "epoch": 450.59, + "learning_rate": 4.861377914921982e-06, + "loss": 0.1028, + "step": 153200 + }, + { + "epoch": 450.88, + "learning_rate": 4.856126512406523e-06, + "loss": 0.1034, + "step": 153300 + }, + { + "epoch": 451.18, + "learning_rate": 4.850875268723097e-06, + "loss": 0.0986, + "step": 153400 + }, + { + "epoch": 451.47, + "learning_rate": 4.845624189668923e-06, + "loss": 0.0993, + "step": 153500 + }, + { + "epoch": 451.76, + "learning_rate": 4.8403732810410364e-06, + "loss": 0.1028, + "step": 153600 + }, + { + "epoch": 452.06, + "learning_rate": 4.835122548636279e-06, + "loss": 0.1034, + "step": 153700 + }, + { + "epoch": 452.35, + "learning_rate": 4.829871998251308e-06, + "loss": 0.1045, + "step": 153800 + }, + { + "epoch": 452.65, + "learning_rate": 4.82462163568257e-06, + "loss": 0.0997, + "step": 153900 + }, + { + "epoch": 452.94, + "learning_rate": 4.819371466726311e-06, + "loss": 0.101, + "step": 154000 + }, + { + "epoch": 452.94, + "eval_cer": 0.07235953097075105, + "eval_loss": 0.5265692472457886, + "eval_runtime": 5.2446, + "eval_samples_per_second": 68.452, + "eval_steps_per_second": 2.288, + "eval_wer": 0.27067547960664196, + "step": 154000 + }, + { + "epoch": 453.24, + "learning_rate": 4.814121497178561e-06, + "loss": 0.1029, + "step": 154100 + }, + { + "epoch": 453.53, + "learning_rate": 4.808871732835127e-06, + "loss": 0.1099, + "step": 154200 + }, + { + "epoch": 453.82, + "learning_rate": 4.803622179491595e-06, + "loss": 0.1007, + "step": 154300 + }, + { + "epoch": 454.12, + "learning_rate": 4.798372842943313e-06, + "loss": 0.1024, + "step": 154400 + }, + { + "epoch": 454.41, + "learning_rate": 4.793123728985394e-06, + "loss": 0.1029, + "step": 154500 + }, + { + "epoch": 454.71, + "learning_rate": 4.787874843412701e-06, + "loss": 0.1021, + "step": 154600 + }, + { + "epoch": 455.0, + "learning_rate": 4.782626192019848e-06, + "loss": 0.1064, + "step": 154700 + }, + { + "epoch": 455.29, + "learning_rate": 4.77737778060119e-06, + "loss": 0.106, + "step": 154800 + }, + { + "epoch": 455.59, + "learning_rate": 4.7721296149508145e-06, + "loss": 0.1033, + "step": 154900 + }, + { + "epoch": 455.88, + "learning_rate": 4.766881700862543e-06, + "loss": 0.0996, + "step": 155000 + }, + { + "epoch": 455.88, + "eval_cer": 0.0717928599450765, + "eval_loss": 0.5203773975372314, + "eval_runtime": 4.9467, + "eval_samples_per_second": 72.574, + "eval_steps_per_second": 2.426, + "eval_wer": 0.26777365790746416, + "step": 155000 + }, + { + "epoch": 456.18, + "learning_rate": 4.7616340441299125e-06, + "loss": 0.0956, + "step": 155100 + }, + { + "epoch": 456.47, + "learning_rate": 4.75638665054618e-06, + "loss": 0.1047, + "step": 155200 + }, + { + "epoch": 456.76, + "learning_rate": 4.751139525904315e-06, + "loss": 0.1088, + "step": 155300 + }, + { + "epoch": 457.06, + "learning_rate": 4.745892675996981e-06, + "loss": 0.1061, + "step": 155400 + }, + { + "epoch": 457.35, + "learning_rate": 4.740646106616548e-06, + "loss": 0.0984, + "step": 155500 + }, + { + "epoch": 457.65, + "learning_rate": 4.7353998235550695e-06, + "loss": 0.0978, + "step": 155600 + }, + { + "epoch": 457.94, + "learning_rate": 4.7301538326042854e-06, + "loss": 0.1028, + "step": 155700 + }, + { + "epoch": 458.24, + "learning_rate": 4.724908139555617e-06, + "loss": 0.1034, + "step": 155800 + }, + { + "epoch": 458.53, + "learning_rate": 4.719662750200145e-06, + "loss": 0.0987, + "step": 155900 + }, + { + "epoch": 458.82, + "learning_rate": 4.714522568855664e-06, + "loss": 0.1012, + "step": 156000 + }, + { + "epoch": 458.82, + "eval_cer": 0.07161849962948433, + "eval_loss": 0.5153563618659973, + "eval_runtime": 5.0809, + "eval_samples_per_second": 70.657, + "eval_steps_per_second": 2.362, + "eval_wer": 0.26954699339029503, + "step": 156000 + }, + { + "epoch": 459.12, + "learning_rate": 4.709277797896285e-06, + "loss": 0.0998, + "step": 156100 + }, + { + "epoch": 459.41, + "learning_rate": 4.704033347885536e-06, + "loss": 0.0976, + "step": 156200 + }, + { + "epoch": 459.71, + "learning_rate": 4.698789224613135e-06, + "loss": 0.103, + "step": 156300 + }, + { + "epoch": 460.0, + "learning_rate": 4.6935454338684375e-06, + "loss": 0.1093, + "step": 156400 + }, + { + "epoch": 460.29, + "learning_rate": 4.68830198144043e-06, + "loss": 0.1001, + "step": 156500 + }, + { + "epoch": 460.59, + "learning_rate": 4.683058873117732e-06, + "loss": 0.098, + "step": 156600 + }, + { + "epoch": 460.88, + "learning_rate": 4.677816114688576e-06, + "loss": 0.0984, + "step": 156700 + }, + { + "epoch": 461.18, + "learning_rate": 4.672573711940808e-06, + "loss": 0.0993, + "step": 156800 + }, + { + "epoch": 461.47, + "learning_rate": 4.6673316706618886e-06, + "loss": 0.1009, + "step": 156900 + }, + { + "epoch": 461.76, + "learning_rate": 4.662089996638871e-06, + "loss": 0.1033, + "step": 157000 + }, + { + "epoch": 461.76, + "eval_cer": 0.07192363018177063, + "eval_loss": 0.5216103792190552, + "eval_runtime": 4.9964, + "eval_samples_per_second": 71.851, + "eval_steps_per_second": 2.402, + "eval_wer": 0.269708205706916, + "step": 157000 + }, + { + "epoch": 462.06, + "learning_rate": 4.656848695658411e-06, + "loss": 0.1007, + "step": 157100 + }, + { + "epoch": 462.35, + "learning_rate": 4.651607773506746e-06, + "loss": 0.0969, + "step": 157200 + }, + { + "epoch": 462.65, + "learning_rate": 4.646367235969696e-06, + "loss": 0.0991, + "step": 157300 + }, + { + "epoch": 462.94, + "learning_rate": 4.641127088832661e-06, + "loss": 0.0989, + "step": 157400 + }, + { + "epoch": 463.24, + "learning_rate": 4.635887337880604e-06, + "loss": 0.1087, + "step": 157500 + }, + { + "epoch": 463.53, + "learning_rate": 4.630647988898058e-06, + "loss": 0.0969, + "step": 157600 + }, + { + "epoch": 463.82, + "learning_rate": 4.625409047669106e-06, + "loss": 0.1004, + "step": 157700 + }, + { + "epoch": 464.12, + "learning_rate": 4.620170519977379e-06, + "loss": 0.0976, + "step": 157800 + }, + { + "epoch": 464.41, + "learning_rate": 4.614932411606059e-06, + "loss": 0.0994, + "step": 157900 + }, + { + "epoch": 464.71, + "learning_rate": 4.6096947283378616e-06, + "loss": 0.1053, + "step": 158000 + }, + { + "epoch": 464.71, + "eval_cer": 0.07188004010287259, + "eval_loss": 0.516394317150116, + "eval_runtime": 4.9144, + "eval_samples_per_second": 73.051, + "eval_steps_per_second": 2.442, + "eval_wer": 0.270030630340158, + "step": 158000 + }, + { + "epoch": 465.0, + "learning_rate": 4.60445747595503e-06, + "loss": 0.1061, + "step": 158100 + }, + { + "epoch": 465.29, + "learning_rate": 4.599273026216009e-06, + "loss": 0.1009, + "step": 158200 + }, + { + "epoch": 465.59, + "learning_rate": 4.594036648495641e-06, + "loss": 0.0989, + "step": 158300 + }, + { + "epoch": 465.88, + "learning_rate": 4.5888007189466934e-06, + "loss": 0.0972, + "step": 158400 + }, + { + "epoch": 466.18, + "learning_rate": 4.583565243349476e-06, + "loss": 0.0979, + "step": 158500 + }, + { + "epoch": 466.47, + "learning_rate": 4.578330227483797e-06, + "loss": 0.1039, + "step": 158600 + }, + { + "epoch": 466.76, + "learning_rate": 4.573095677128959e-06, + "loss": 0.1023, + "step": 158700 + }, + { + "epoch": 467.06, + "learning_rate": 4.567861598063745e-06, + "loss": 0.1064, + "step": 158800 + }, + { + "epoch": 467.35, + "learning_rate": 4.562627996066427e-06, + "loss": 0.0988, + "step": 158900 + }, + { + "epoch": 467.65, + "learning_rate": 4.557394876914746e-06, + "loss": 0.0974, + "step": 159000 + }, + { + "epoch": 467.65, + "eval_cer": 0.07196722026066867, + "eval_loss": 0.5301560163497925, + "eval_runtime": 4.5122, + "eval_samples_per_second": 79.561, + "eval_steps_per_second": 2.659, + "eval_wer": 0.26793487022408513, + "step": 159000 + }, + { + "epoch": 467.94, + "learning_rate": 4.552162246385904e-06, + "loss": 0.0982, + "step": 159100 + }, + { + "epoch": 468.24, + "learning_rate": 4.546930110256574e-06, + "loss": 0.1025, + "step": 159200 + }, + { + "epoch": 468.53, + "learning_rate": 4.541698474302873e-06, + "loss": 0.1005, + "step": 159300 + }, + { + "epoch": 468.82, + "learning_rate": 4.5364673443003755e-06, + "loss": 0.1037, + "step": 159400 + }, + { + "epoch": 469.12, + "learning_rate": 4.531236726024092e-06, + "loss": 0.1026, + "step": 159500 + }, + { + "epoch": 469.41, + "learning_rate": 4.526006625248465e-06, + "loss": 0.1028, + "step": 159600 + }, + { + "epoch": 469.71, + "learning_rate": 4.520777047747376e-06, + "loss": 0.0948, + "step": 159700 + }, + { + "epoch": 470.0, + "learning_rate": 4.515547999294117e-06, + "loss": 0.0978, + "step": 159800 + }, + { + "epoch": 470.29, + "learning_rate": 4.510319485661405e-06, + "loss": 0.094, + "step": 159900 + }, + { + "epoch": 470.59, + "learning_rate": 4.5050915126213605e-06, + "loss": 0.1016, + "step": 160000 + }, + { + "epoch": 470.59, + "eval_cer": 0.07192363018177063, + "eval_loss": 0.5172093510627747, + "eval_runtime": 4.8089, + "eval_samples_per_second": 74.653, + "eval_steps_per_second": 2.495, + "eval_wer": 0.26906335644043206, + "step": 160000 + }, + { + "epoch": 470.88, + "learning_rate": 4.49986408594551e-06, + "loss": 0.0979, + "step": 160100 + }, + { + "epoch": 471.18, + "learning_rate": 4.494637211404779e-06, + "loss": 0.0997, + "step": 160200 + }, + { + "epoch": 471.47, + "learning_rate": 4.489410894769476e-06, + "loss": 0.0984, + "step": 160300 + }, + { + "epoch": 471.76, + "learning_rate": 4.484185141809304e-06, + "loss": 0.0979, + "step": 160400 + }, + { + "epoch": 472.06, + "learning_rate": 4.478959958293334e-06, + "loss": 0.096, + "step": 160500 + }, + { + "epoch": 472.35, + "learning_rate": 4.473735349990016e-06, + "loss": 0.095, + "step": 160600 + }, + { + "epoch": 472.65, + "learning_rate": 4.4685113226671594e-06, + "loss": 0.0991, + "step": 160700 + }, + { + "epoch": 472.94, + "learning_rate": 4.4632878820919336e-06, + "loss": 0.1013, + "step": 160800 + }, + { + "epoch": 473.24, + "learning_rate": 4.458065034030865e-06, + "loss": 0.0981, + "step": 160900 + }, + { + "epoch": 473.53, + "learning_rate": 4.452842784249817e-06, + "loss": 0.0947, + "step": 161000 + }, + { + "epoch": 473.53, + "eval_cer": 0.07266466152303735, + "eval_loss": 0.5281272530555725, + "eval_runtime": 5.2217, + "eval_samples_per_second": 68.751, + "eval_steps_per_second": 2.298, + "eval_wer": 0.27196517813960985, + "step": 161000 + }, + { + "epoch": 473.82, + "learning_rate": 4.447621138514001e-06, + "loss": 0.102, + "step": 161100 + }, + { + "epoch": 474.12, + "learning_rate": 4.4424001025879575e-06, + "loss": 0.1006, + "step": 161200 + }, + { + "epoch": 474.41, + "learning_rate": 4.437179682235552e-06, + "loss": 0.0982, + "step": 161300 + }, + { + "epoch": 474.71, + "learning_rate": 4.4319598832199765e-06, + "loss": 0.1011, + "step": 161400 + }, + { + "epoch": 475.0, + "learning_rate": 4.426740711303728e-06, + "loss": 0.0995, + "step": 161500 + }, + { + "epoch": 475.29, + "learning_rate": 4.4215221722486214e-06, + "loss": 0.0995, + "step": 161600 + }, + { + "epoch": 475.59, + "learning_rate": 4.416304271815767e-06, + "loss": 0.0993, + "step": 161700 + }, + { + "epoch": 475.88, + "learning_rate": 4.411087015765568e-06, + "loss": 0.0985, + "step": 161800 + }, + { + "epoch": 476.18, + "learning_rate": 4.4058704098577235e-06, + "loss": 0.0943, + "step": 161900 + }, + { + "epoch": 476.47, + "learning_rate": 4.400654459851207e-06, + "loss": 0.101, + "step": 162000 + }, + { + "epoch": 476.47, + "eval_cer": 0.07222876073405693, + "eval_loss": 0.5367242693901062, + "eval_runtime": 5.1506, + "eval_samples_per_second": 69.7, + "eval_steps_per_second": 2.33, + "eval_wer": 0.2709979042398839, + "step": 162000 + }, + { + "epoch": 476.76, + "learning_rate": 4.395439171504275e-06, + "loss": 0.0996, + "step": 162100 + }, + { + "epoch": 477.06, + "learning_rate": 4.390224550574449e-06, + "loss": 0.0986, + "step": 162200 + }, + { + "epoch": 477.35, + "learning_rate": 4.385010602818511e-06, + "loss": 0.0921, + "step": 162300 + }, + { + "epoch": 477.65, + "learning_rate": 4.37979733399251e-06, + "loss": 0.1047, + "step": 162400 + }, + { + "epoch": 477.94, + "learning_rate": 4.374584749851735e-06, + "loss": 0.1039, + "step": 162500 + }, + { + "epoch": 478.24, + "learning_rate": 4.369372856150725e-06, + "loss": 0.1004, + "step": 162600 + }, + { + "epoch": 478.53, + "learning_rate": 4.364161658643255e-06, + "loss": 0.0994, + "step": 162700 + }, + { + "epoch": 478.82, + "learning_rate": 4.358951163082328e-06, + "loss": 0.0951, + "step": 162800 + }, + { + "epoch": 479.12, + "learning_rate": 4.353741375220182e-06, + "loss": 0.0997, + "step": 162900 + }, + { + "epoch": 479.41, + "learning_rate": 4.348532300808261e-06, + "loss": 0.0984, + "step": 163000 + }, + { + "epoch": 479.41, + "eval_cer": 0.07227235081295497, + "eval_loss": 0.5390114784240723, + "eval_runtime": 5.3346, + "eval_samples_per_second": 67.297, + "eval_steps_per_second": 2.249, + "eval_wer": 0.2718039658229889, + "step": 163000 + }, + { + "epoch": 479.71, + "learning_rate": 4.343323945597232e-06, + "loss": 0.0976, + "step": 163100 + }, + { + "epoch": 480.0, + "learning_rate": 4.338116315336962e-06, + "loss": 0.0963, + "step": 163200 + }, + { + "epoch": 480.29, + "learning_rate": 4.332961481136282e-06, + "loss": 0.0989, + "step": 163300 + }, + { + "epoch": 480.59, + "learning_rate": 4.3277553106309965e-06, + "loss": 0.097, + "step": 163400 + }, + { + "epoch": 480.88, + "learning_rate": 4.322549882263777e-06, + "loss": 0.0983, + "step": 163500 + }, + { + "epoch": 481.18, + "learning_rate": 4.317345201781263e-06, + "loss": 0.0927, + "step": 163600 + }, + { + "epoch": 481.47, + "learning_rate": 4.312141274929265e-06, + "loss": 0.0952, + "step": 163700 + }, + { + "epoch": 481.76, + "learning_rate": 4.306938107452762e-06, + "loss": 0.0965, + "step": 163800 + }, + { + "epoch": 482.06, + "learning_rate": 4.3017357050958994e-06, + "loss": 0.1033, + "step": 163900 + }, + { + "epoch": 482.35, + "learning_rate": 4.296534073601972e-06, + "loss": 0.0995, + "step": 164000 + }, + { + "epoch": 482.35, + "eval_cer": 0.07100823852491173, + "eval_loss": 0.5308058261871338, + "eval_runtime": 4.9229, + "eval_samples_per_second": 72.925, + "eval_steps_per_second": 2.438, + "eval_wer": 0.2672900209576012, + "step": 164000 + }, + { + "epoch": 482.65, + "learning_rate": 4.291333218713423e-06, + "loss": 0.0936, + "step": 164100 + }, + { + "epoch": 482.94, + "learning_rate": 4.286133146171844e-06, + "loss": 0.0969, + "step": 164200 + }, + { + "epoch": 483.24, + "learning_rate": 4.2809338617179585e-06, + "loss": 0.0991, + "step": 164300 + }, + { + "epoch": 483.53, + "learning_rate": 4.275735371091624e-06, + "loss": 0.0983, + "step": 164400 + }, + { + "epoch": 483.82, + "learning_rate": 4.270537680031817e-06, + "loss": 0.0979, + "step": 164500 + }, + { + "epoch": 484.12, + "learning_rate": 4.26534079427663e-06, + "loss": 0.1016, + "step": 164600 + }, + { + "epoch": 484.41, + "learning_rate": 4.260144719563275e-06, + "loss": 0.099, + "step": 164700 + }, + { + "epoch": 484.71, + "learning_rate": 4.25494946162806e-06, + "loss": 0.1006, + "step": 164800 + }, + { + "epoch": 485.0, + "learning_rate": 4.249755026206398e-06, + "loss": 0.0931, + "step": 164900 + }, + { + "epoch": 485.29, + "learning_rate": 4.244561419032788e-06, + "loss": 0.0954, + "step": 165000 + }, + { + "epoch": 485.29, + "eval_cer": 0.07174926986617845, + "eval_loss": 0.5440545678138733, + "eval_runtime": 5.088, + "eval_samples_per_second": 70.558, + "eval_steps_per_second": 2.358, + "eval_wer": 0.2666451716911172, + "step": 165000 + }, + { + "epoch": 485.59, + "learning_rate": 4.239368645840816e-06, + "loss": 0.1025, + "step": 165100 + }, + { + "epoch": 485.88, + "learning_rate": 4.234176712363151e-06, + "loss": 0.1006, + "step": 165200 + }, + { + "epoch": 486.18, + "learning_rate": 4.228985624331532e-06, + "loss": 0.1006, + "step": 165300 + }, + { + "epoch": 486.47, + "learning_rate": 4.223795387476766e-06, + "loss": 0.1019, + "step": 165400 + }, + { + "epoch": 486.76, + "learning_rate": 4.218606007528718e-06, + "loss": 0.1005, + "step": 165500 + }, + { + "epoch": 487.06, + "learning_rate": 4.213417490216308e-06, + "loss": 0.0988, + "step": 165600 + }, + { + "epoch": 487.35, + "learning_rate": 4.208229841267508e-06, + "loss": 0.1007, + "step": 165700 + }, + { + "epoch": 487.65, + "learning_rate": 4.203043066409322e-06, + "loss": 0.0926, + "step": 165800 + }, + { + "epoch": 487.94, + "learning_rate": 4.197857171367799e-06, + "loss": 0.0971, + "step": 165900 + }, + { + "epoch": 488.24, + "learning_rate": 4.192672161868012e-06, + "loss": 0.0983, + "step": 166000 + }, + { + "epoch": 488.24, + "eval_cer": 0.07231594089185302, + "eval_loss": 0.5344653725624084, + "eval_runtime": 5.4383, + "eval_samples_per_second": 66.014, + "eval_steps_per_second": 2.207, + "eval_wer": 0.270514267290021, + "step": 166000 + }, + { + "epoch": 488.53, + "learning_rate": 4.187488043634053e-06, + "loss": 0.0942, + "step": 166100 + }, + { + "epoch": 488.82, + "learning_rate": 4.1823048223890385e-06, + "loss": 0.1031, + "step": 166200 + }, + { + "epoch": 489.12, + "learning_rate": 4.177122503855086e-06, + "loss": 0.0953, + "step": 166300 + }, + { + "epoch": 489.41, + "learning_rate": 4.171941093753323e-06, + "loss": 0.0953, + "step": 166400 + }, + { + "epoch": 489.71, + "learning_rate": 4.166760597803871e-06, + "loss": 0.0945, + "step": 166500 + }, + { + "epoch": 490.0, + "learning_rate": 4.161581021725842e-06, + "loss": 0.0958, + "step": 166600 + }, + { + "epoch": 490.29, + "learning_rate": 4.156402371237335e-06, + "loss": 0.0953, + "step": 166700 + }, + { + "epoch": 490.59, + "learning_rate": 4.1512246520554224e-06, + "loss": 0.0997, + "step": 166800 + }, + { + "epoch": 490.88, + "learning_rate": 4.146047869896156e-06, + "loss": 0.0972, + "step": 166900 + }, + { + "epoch": 491.18, + "learning_rate": 4.140872030474547e-06, + "loss": 0.103, + "step": 167000 + }, + { + "epoch": 491.18, + "eval_cer": 0.07231594089185302, + "eval_loss": 0.5379437208175659, + "eval_runtime": 4.8891, + "eval_samples_per_second": 73.428, + "eval_steps_per_second": 2.454, + "eval_wer": 0.2713203288731259, + "step": 167000 + }, + { + "epoch": 491.47, + "learning_rate": 4.135697139504564e-06, + "loss": 0.0962, + "step": 167100 + }, + { + "epoch": 491.76, + "learning_rate": 4.130523202699138e-06, + "loss": 0.0972, + "step": 167200 + }, + { + "epoch": 492.06, + "learning_rate": 4.1253502257701364e-06, + "loss": 0.1022, + "step": 167300 + }, + { + "epoch": 492.35, + "learning_rate": 4.120178214428373e-06, + "loss": 0.0895, + "step": 167400 + }, + { + "epoch": 492.65, + "learning_rate": 4.115058879957378e-06, + "loss": 0.0959, + "step": 167500 + }, + { + "epoch": 492.94, + "learning_rate": 4.109888807119945e-06, + "loss": 0.0977, + "step": 167600 + }, + { + "epoch": 493.24, + "learning_rate": 4.104719716938696e-06, + "loss": 0.0994, + "step": 167700 + }, + { + "epoch": 493.53, + "learning_rate": 4.099551615120152e-06, + "loss": 0.0979, + "step": 167800 + }, + { + "epoch": 493.82, + "learning_rate": 4.094384507369739e-06, + "loss": 0.0988, + "step": 167900 + }, + { + "epoch": 494.12, + "learning_rate": 4.089218399391795e-06, + "loss": 0.0948, + "step": 168000 + }, + { + "epoch": 494.12, + "eval_cer": 0.07131336907719803, + "eval_loss": 0.5431644320487976, + "eval_runtime": 4.7451, + "eval_samples_per_second": 75.657, + "eval_steps_per_second": 2.529, + "eval_wer": 0.2653554731581493, + "step": 168000 + }, + { + "epoch": 494.41, + "learning_rate": 4.084104942918741e-06, + "loss": 0.0947, + "step": 168100 + }, + { + "epoch": 494.71, + "learning_rate": 4.0789408414543055e-06, + "loss": 0.0927, + "step": 168200 + }, + { + "epoch": 495.0, + "learning_rate": 4.073777756811685e-06, + "loss": 0.0954, + "step": 168300 + }, + { + "epoch": 495.29, + "learning_rate": 4.068615694690766e-06, + "loss": 0.0966, + "step": 168400 + }, + { + "epoch": 495.59, + "learning_rate": 4.063454660790316e-06, + "loss": 0.0959, + "step": 168500 + }, + { + "epoch": 495.88, + "learning_rate": 4.05829466080796e-06, + "loss": 0.0946, + "step": 168600 + }, + { + "epoch": 496.18, + "learning_rate": 4.053135700440182e-06, + "loss": 0.0995, + "step": 168700 + }, + { + "epoch": 496.47, + "learning_rate": 4.047977785382323e-06, + "loss": 0.0941, + "step": 168800 + }, + { + "epoch": 496.76, + "learning_rate": 4.042820921328565e-06, + "loss": 0.0924, + "step": 168900 + }, + { + "epoch": 497.06, + "learning_rate": 4.037716666796161e-06, + "loss": 0.0916, + "step": 169000 + }, + { + "epoch": 497.06, + "eval_cer": 0.07183645002397454, + "eval_loss": 0.5349707007408142, + "eval_runtime": 5.3743, + "eval_samples_per_second": 66.799, + "eval_steps_per_second": 2.233, + "eval_wer": 0.269708205706916, + "step": 169000 + }, + { + "epoch": 497.35, + "learning_rate": 4.0325619111764545e-06, + "loss": 0.0976, + "step": 169100 + }, + { + "epoch": 497.65, + "learning_rate": 4.0274082235795125e-06, + "loss": 0.0961, + "step": 169200 + }, + { + "epoch": 497.94, + "learning_rate": 4.022255609694858e-06, + "loss": 0.0924, + "step": 169300 + }, + { + "epoch": 498.24, + "learning_rate": 4.017104075210819e-06, + "loss": 0.0984, + "step": 169400 + }, + { + "epoch": 498.53, + "learning_rate": 4.011953625814535e-06, + "loss": 0.0939, + "step": 169500 + }, + { + "epoch": 498.82, + "learning_rate": 4.006804267191951e-06, + "loss": 0.1, + "step": 169600 + }, + { + "epoch": 499.12, + "learning_rate": 4.001656005027803e-06, + "loss": 0.0974, + "step": 169700 + }, + { + "epoch": 499.41, + "learning_rate": 3.996508845005622e-06, + "loss": 0.0932, + "step": 169800 + }, + { + "epoch": 499.71, + "learning_rate": 3.991362792807717e-06, + "loss": 0.0986, + "step": 169900 + }, + { + "epoch": 500.0, + "learning_rate": 3.986217854115173e-06, + "loss": 0.0955, + "step": 170000 + }, + { + "epoch": 500.0, + "eval_cer": 0.07157490955058629, + "eval_loss": 0.5349684953689575, + "eval_runtime": 4.8795, + "eval_samples_per_second": 73.573, + "eval_steps_per_second": 2.459, + "eval_wer": 0.27083669192326293, + "step": 170000 + }, + { + "epoch": 500.29, + "learning_rate": 3.981074034607853e-06, + "loss": 0.0901, + "step": 170100 + }, + { + "epoch": 500.59, + "learning_rate": 3.97593133996438e-06, + "loss": 0.0926, + "step": 170200 + }, + { + "epoch": 500.88, + "learning_rate": 3.970789775862133e-06, + "loss": 0.1036, + "step": 170300 + }, + { + "epoch": 501.18, + "learning_rate": 3.9656493479772475e-06, + "loss": 0.0972, + "step": 170400 + }, + { + "epoch": 501.47, + "learning_rate": 3.960510061984599e-06, + "loss": 0.0938, + "step": 170500 + }, + { + "epoch": 501.76, + "learning_rate": 3.95537192355781e-06, + "loss": 0.0953, + "step": 170600 + }, + { + "epoch": 502.06, + "learning_rate": 3.950234938369229e-06, + "loss": 0.097, + "step": 170700 + }, + { + "epoch": 502.35, + "learning_rate": 3.9450991120899345e-06, + "loss": 0.0993, + "step": 170800 + }, + { + "epoch": 502.65, + "learning_rate": 3.939964450389728e-06, + "loss": 0.0974, + "step": 170900 + }, + { + "epoch": 502.94, + "learning_rate": 3.934830958937119e-06, + "loss": 0.1022, + "step": 171000 + }, + { + "epoch": 502.94, + "eval_cer": 0.07083387820931956, + "eval_loss": 0.5352509021759033, + "eval_runtime": 5.2076, + "eval_samples_per_second": 68.938, + "eval_steps_per_second": 2.304, + "eval_wer": 0.2653554731581493, + "step": 171000 + }, + { + "epoch": 503.24, + "learning_rate": 3.929698643399334e-06, + "loss": 0.0976, + "step": 171100 + }, + { + "epoch": 503.53, + "learning_rate": 3.924567509442289e-06, + "loss": 0.0972, + "step": 171200 + }, + { + "epoch": 503.82, + "learning_rate": 3.919437562730608e-06, + "loss": 0.0917, + "step": 171300 + }, + { + "epoch": 504.12, + "learning_rate": 3.914308808927598e-06, + "loss": 0.0919, + "step": 171400 + }, + { + "epoch": 504.41, + "learning_rate": 3.909181253695248e-06, + "loss": 0.0967, + "step": 171500 + }, + { + "epoch": 504.71, + "learning_rate": 3.9040549026942304e-06, + "loss": 0.0962, + "step": 171600 + }, + { + "epoch": 505.0, + "learning_rate": 3.8989297615838775e-06, + "loss": 0.1009, + "step": 171700 + }, + { + "epoch": 505.29, + "learning_rate": 3.893805836022198e-06, + "loss": 0.0947, + "step": 171800 + }, + { + "epoch": 505.59, + "learning_rate": 3.888683131665849e-06, + "loss": 0.0963, + "step": 171900 + }, + { + "epoch": 505.88, + "learning_rate": 3.883561654170144e-06, + "loss": 0.0928, + "step": 172000 + }, + { + "epoch": 505.88, + "eval_cer": 0.07166208970838238, + "eval_loss": 0.5374095439910889, + "eval_runtime": 4.9233, + "eval_samples_per_second": 72.919, + "eval_steps_per_second": 2.437, + "eval_wer": 0.2653554731581493, + "step": 172000 + }, + { + "epoch": 506.18, + "learning_rate": 3.878441409189042e-06, + "loss": 0.0975, + "step": 172100 + }, + { + "epoch": 506.47, + "learning_rate": 3.8733224023751394e-06, + "loss": 0.0945, + "step": 172200 + }, + { + "epoch": 506.76, + "learning_rate": 3.868204639379668e-06, + "loss": 0.096, + "step": 172300 + }, + { + "epoch": 507.06, + "learning_rate": 3.863088125852486e-06, + "loss": 0.0946, + "step": 172400 + }, + { + "epoch": 507.35, + "learning_rate": 3.857972867442068e-06, + "loss": 0.0915, + "step": 172500 + }, + { + "epoch": 507.65, + "learning_rate": 3.852858869795512e-06, + "loss": 0.0966, + "step": 172600 + }, + { + "epoch": 507.94, + "learning_rate": 3.847746138558514e-06, + "loss": 0.0907, + "step": 172700 + }, + { + "epoch": 508.24, + "learning_rate": 3.842634679375379e-06, + "loss": 0.0976, + "step": 172800 + }, + { + "epoch": 508.53, + "learning_rate": 3.837524497889005e-06, + "loss": 0.1, + "step": 172900 + }, + { + "epoch": 508.82, + "learning_rate": 3.832415599740879e-06, + "loss": 0.0965, + "step": 173000 + }, + { + "epoch": 508.82, + "eval_cer": 0.07144413931389215, + "eval_loss": 0.5368661880493164, + "eval_runtime": 5.3628, + "eval_samples_per_second": 66.942, + "eval_steps_per_second": 2.238, + "eval_wer": 0.2682572948573271, + "step": 173000 + }, + { + "epoch": 509.12, + "learning_rate": 3.827307990571073e-06, + "loss": 0.09, + "step": 173100 + }, + { + "epoch": 509.41, + "learning_rate": 3.822201676018233e-06, + "loss": 0.103, + "step": 173200 + }, + { + "epoch": 509.71, + "learning_rate": 3.817096661719582e-06, + "loss": 0.0981, + "step": 173300 + }, + { + "epoch": 510.0, + "learning_rate": 3.8119929533108995e-06, + "loss": 0.0987, + "step": 173400 + }, + { + "epoch": 510.29, + "learning_rate": 3.806890556426529e-06, + "loss": 0.0963, + "step": 173500 + }, + { + "epoch": 510.59, + "learning_rate": 3.801789476699365e-06, + "loss": 0.0938, + "step": 173600 + }, + { + "epoch": 510.88, + "learning_rate": 3.7966897197608445e-06, + "loss": 0.0927, + "step": 173700 + }, + { + "epoch": 511.18, + "learning_rate": 3.7915912912409496e-06, + "loss": 0.095, + "step": 173800 + }, + { + "epoch": 511.47, + "learning_rate": 3.7864941967681905e-06, + "loss": 0.0991, + "step": 173900 + }, + { + "epoch": 511.76, + "learning_rate": 3.7813984419696097e-06, + "loss": 0.0903, + "step": 174000 + }, + { + "epoch": 511.76, + "eval_cer": 0.07201081033956672, + "eval_loss": 0.5484318137168884, + "eval_runtime": 4.907, + "eval_samples_per_second": 73.161, + "eval_steps_per_second": 2.445, + "eval_wer": 0.270514267290021, + "step": 174000 + }, + { + "epoch": 512.06, + "learning_rate": 3.776304032470769e-06, + "loss": 0.0956, + "step": 174100 + }, + { + "epoch": 512.35, + "learning_rate": 3.771210973895741e-06, + "loss": 0.089, + "step": 174200 + }, + { + "epoch": 512.65, + "learning_rate": 3.7661701821540377e-06, + "loss": 0.0915, + "step": 174300 + }, + { + "epoch": 512.94, + "learning_rate": 3.7610798286434015e-06, + "loss": 0.0941, + "step": 174400 + }, + { + "epoch": 513.24, + "learning_rate": 3.755990842863646e-06, + "loss": 0.0977, + "step": 174500 + }, + { + "epoch": 513.53, + "learning_rate": 3.750903230432862e-06, + "loss": 0.0973, + "step": 174600 + }, + { + "epoch": 513.82, + "learning_rate": 3.7458169969676174e-06, + "loss": 0.0957, + "step": 174700 + }, + { + "epoch": 514.12, + "learning_rate": 3.740732148082967e-06, + "loss": 0.0926, + "step": 174800 + }, + { + "epoch": 514.41, + "learning_rate": 3.735648689392428e-06, + "loss": 0.095, + "step": 174900 + }, + { + "epoch": 514.71, + "learning_rate": 3.7305666265079883e-06, + "loss": 0.0947, + "step": 175000 + }, + { + "epoch": 514.71, + "eval_cer": 0.07153131947168824, + "eval_loss": 0.5374939441680908, + "eval_runtime": 5.2741, + "eval_samples_per_second": 68.069, + "eval_steps_per_second": 2.275, + "eval_wer": 0.26712880864098015, + "step": 175000 + }, + { + "epoch": 515.0, + "learning_rate": 3.7254859650400955e-06, + "loss": 0.0919, + "step": 175100 + }, + { + "epoch": 515.29, + "learning_rate": 3.720406710597645e-06, + "loss": 0.0903, + "step": 175200 + }, + { + "epoch": 515.59, + "learning_rate": 3.7153288687879858e-06, + "loss": 0.0929, + "step": 175300 + }, + { + "epoch": 515.88, + "learning_rate": 3.7102524452169e-06, + "loss": 0.0922, + "step": 175400 + }, + { + "epoch": 516.18, + "learning_rate": 3.705177445488609e-06, + "loss": 0.0971, + "step": 175500 + }, + { + "epoch": 516.47, + "learning_rate": 3.7001038752057626e-06, + "loss": 0.093, + "step": 175600 + }, + { + "epoch": 516.76, + "learning_rate": 3.695031739969428e-06, + "loss": 0.0887, + "step": 175700 + }, + { + "epoch": 517.06, + "learning_rate": 3.6899610453790945e-06, + "loss": 0.0924, + "step": 175800 + }, + { + "epoch": 517.35, + "learning_rate": 3.6848917970326547e-06, + "loss": 0.0946, + "step": 175900 + }, + { + "epoch": 517.65, + "learning_rate": 3.679824000526408e-06, + "loss": 0.1018, + "step": 176000 + }, + { + "epoch": 517.65, + "eval_cer": 0.07109541868270781, + "eval_loss": 0.5277024507522583, + "eval_runtime": 5.1447, + "eval_samples_per_second": 69.78, + "eval_steps_per_second": 2.332, + "eval_wer": 0.2672900209576012, + "step": 176000 + }, + { + "epoch": 517.94, + "learning_rate": 3.674757661455051e-06, + "loss": 0.0893, + "step": 176100 + }, + { + "epoch": 518.24, + "learning_rate": 3.66969278541167e-06, + "loss": 0.0914, + "step": 176200 + }, + { + "epoch": 518.53, + "learning_rate": 3.664629377987739e-06, + "loss": 0.0916, + "step": 176300 + }, + { + "epoch": 518.82, + "learning_rate": 3.659567444773108e-06, + "loss": 0.0939, + "step": 176400 + }, + { + "epoch": 519.12, + "learning_rate": 3.654506991355996e-06, + "loss": 0.0963, + "step": 176500 + }, + { + "epoch": 519.41, + "learning_rate": 3.6494480233229978e-06, + "loss": 0.0929, + "step": 176600 + }, + { + "epoch": 519.71, + "learning_rate": 3.64439054625906e-06, + "loss": 0.0916, + "step": 176700 + }, + { + "epoch": 520.0, + "learning_rate": 3.6393851181263416e-06, + "loss": 0.0896, + "step": 176800 + }, + { + "epoch": 520.29, + "learning_rate": 3.6343306246998226e-06, + "loss": 0.0928, + "step": 176900 + }, + { + "epoch": 520.59, + "learning_rate": 3.629277638931521e-06, + "loss": 0.0889, + "step": 177000 + }, + { + "epoch": 520.59, + "eval_cer": 0.07070310797262543, + "eval_loss": 0.5390043258666992, + "eval_runtime": 4.8192, + "eval_samples_per_second": 74.493, + "eval_steps_per_second": 2.49, + "eval_wer": 0.2653554731581493, + "step": 177000 + }, + { + "epoch": 520.88, + "learning_rate": 3.6242261663997854e-06, + "loss": 0.0883, + "step": 177100 + }, + { + "epoch": 521.18, + "learning_rate": 3.6191762126812878e-06, + "loss": 0.096, + "step": 177200 + }, + { + "epoch": 521.47, + "learning_rate": 3.6141277833510248e-06, + "loss": 0.0906, + "step": 177300 + }, + { + "epoch": 521.76, + "learning_rate": 3.609080883982315e-06, + "loss": 0.0884, + "step": 177400 + }, + { + "epoch": 522.06, + "learning_rate": 3.6040355201467834e-06, + "loss": 0.0902, + "step": 177500 + }, + { + "epoch": 522.35, + "learning_rate": 3.598991697414361e-06, + "loss": 0.092, + "step": 177600 + }, + { + "epoch": 522.65, + "learning_rate": 3.5939494213532784e-06, + "loss": 0.0931, + "step": 177700 + }, + { + "epoch": 522.94, + "learning_rate": 3.5889086975300547e-06, + "loss": 0.0945, + "step": 177800 + }, + { + "epoch": 523.24, + "learning_rate": 3.583869531509503e-06, + "loss": 0.0915, + "step": 177900 + }, + { + "epoch": 523.53, + "learning_rate": 3.578831928854708e-06, + "loss": 0.091, + "step": 178000 + }, + { + "epoch": 523.53, + "eval_cer": 0.0720979904973628, + "eval_loss": 0.5432314276695251, + "eval_runtime": 5.2897, + "eval_samples_per_second": 67.868, + "eval_steps_per_second": 2.269, + "eval_wer": 0.2685797194905691, + "step": 178000 + }, + { + "epoch": 523.82, + "learning_rate": 3.573795895127036e-06, + "loss": 0.0902, + "step": 178100 + }, + { + "epoch": 524.12, + "learning_rate": 3.568811772666565e-06, + "loss": 0.0872, + "step": 178200 + }, + { + "epoch": 524.41, + "learning_rate": 3.5637788776423364e-06, + "loss": 0.0873, + "step": 178300 + }, + { + "epoch": 524.71, + "learning_rate": 3.55874756816335e-06, + "loss": 0.0884, + "step": 178400 + }, + { + "epoch": 525.0, + "learning_rate": 3.5537178497840207e-06, + "loss": 0.0956, + "step": 178500 + }, + { + "epoch": 525.29, + "learning_rate": 3.5486897280570045e-06, + "loss": 0.0907, + "step": 178600 + }, + { + "epoch": 525.59, + "learning_rate": 3.5436632085332013e-06, + "loss": 0.0923, + "step": 178700 + }, + { + "epoch": 525.88, + "learning_rate": 3.538638296761735e-06, + "loss": 0.0912, + "step": 178800 + }, + { + "epoch": 526.18, + "learning_rate": 3.533614998289961e-06, + "loss": 0.0942, + "step": 178900 + }, + { + "epoch": 526.47, + "learning_rate": 3.5285933186634514e-06, + "loss": 0.095, + "step": 179000 + }, + { + "epoch": 526.47, + "eval_cer": 0.0705723377359313, + "eval_loss": 0.5412935018539429, + "eval_runtime": 4.9199, + "eval_samples_per_second": 72.97, + "eval_steps_per_second": 2.439, + "eval_wer": 0.26068031597614055, + "step": 179000 + }, + { + "epoch": 526.76, + "learning_rate": 3.5235732634259866e-06, + "loss": 0.0962, + "step": 179100 + }, + { + "epoch": 527.06, + "learning_rate": 3.518554838119562e-06, + "loss": 0.0937, + "step": 179200 + }, + { + "epoch": 527.35, + "learning_rate": 3.513538048284366e-06, + "loss": 0.0938, + "step": 179300 + }, + { + "epoch": 527.65, + "learning_rate": 3.5085228994587883e-06, + "loss": 0.0929, + "step": 179400 + }, + { + "epoch": 527.94, + "learning_rate": 3.5035093971794004e-06, + "loss": 0.092, + "step": 179500 + }, + { + "epoch": 528.24, + "learning_rate": 3.498497546980959e-06, + "loss": 0.0938, + "step": 179600 + }, + { + "epoch": 528.53, + "learning_rate": 3.493487354396401e-06, + "loss": 0.0941, + "step": 179700 + }, + { + "epoch": 528.82, + "learning_rate": 3.4884788249568245e-06, + "loss": 0.0949, + "step": 179800 + }, + { + "epoch": 529.12, + "learning_rate": 3.4834719641915003e-06, + "loss": 0.0889, + "step": 179900 + }, + { + "epoch": 529.41, + "learning_rate": 3.478466777627851e-06, + "loss": 0.0941, + "step": 180000 + }, + { + "epoch": 529.41, + "eval_cer": 0.07161849962948433, + "eval_loss": 0.5512475371360779, + "eval_runtime": 5.4027, + "eval_samples_per_second": 66.448, + "eval_steps_per_second": 2.221, + "eval_wer": 0.2682572948573271, + "step": 180000 + }, + { + "epoch": 529.71, + "learning_rate": 3.473463270791453e-06, + "loss": 0.0892, + "step": 180100 + }, + { + "epoch": 530.0, + "learning_rate": 3.4684614492060307e-06, + "loss": 0.0917, + "step": 180200 + }, + { + "epoch": 530.29, + "learning_rate": 3.463511311314118e-06, + "loss": 0.0914, + "step": 180300 + }, + { + "epoch": 530.59, + "learning_rate": 3.4585128598041152e-06, + "loss": 0.0944, + "step": 180400 + }, + { + "epoch": 530.88, + "learning_rate": 3.4535161100498956e-06, + "loss": 0.0882, + "step": 180500 + }, + { + "epoch": 531.18, + "learning_rate": 3.4485210675677183e-06, + "loss": 0.0977, + "step": 180600 + }, + { + "epoch": 531.47, + "learning_rate": 3.4435277378719652e-06, + "loss": 0.0932, + "step": 180700 + }, + { + "epoch": 531.76, + "learning_rate": 3.438536126475119e-06, + "loss": 0.093, + "step": 180800 + }, + { + "epoch": 532.06, + "learning_rate": 3.433546238887773e-06, + "loss": 0.0926, + "step": 180900 + }, + { + "epoch": 532.35, + "learning_rate": 3.4285580806186124e-06, + "loss": 0.0911, + "step": 181000 + }, + { + "epoch": 532.35, + "eval_cer": 0.07135695915609608, + "eval_loss": 0.5525036454200745, + "eval_runtime": 5.4419, + "eval_samples_per_second": 65.969, + "eval_steps_per_second": 2.205, + "eval_wer": 0.27035305497339995, + "step": 181000 + }, + { + "epoch": 532.65, + "learning_rate": 3.4235716571744144e-06, + "loss": 0.0887, + "step": 181100 + }, + { + "epoch": 532.94, + "learning_rate": 3.418586974060044e-06, + "loss": 0.0947, + "step": 181200 + }, + { + "epoch": 533.24, + "learning_rate": 3.413604036778442e-06, + "loss": 0.0918, + "step": 181300 + }, + { + "epoch": 533.53, + "learning_rate": 3.4086228508306187e-06, + "loss": 0.0907, + "step": 181400 + }, + { + "epoch": 533.82, + "learning_rate": 3.4036434217156587e-06, + "loss": 0.0874, + "step": 181500 + }, + { + "epoch": 534.12, + "learning_rate": 3.398665754930701e-06, + "loss": 0.0905, + "step": 181600 + }, + { + "epoch": 534.41, + "learning_rate": 3.393689855970944e-06, + "loss": 0.095, + "step": 181700 + }, + { + "epoch": 534.71, + "learning_rate": 3.388715730329629e-06, + "loss": 0.088, + "step": 181800 + }, + { + "epoch": 535.0, + "learning_rate": 3.3837433834980416e-06, + "loss": 0.0935, + "step": 181900 + }, + { + "epoch": 535.29, + "learning_rate": 3.3787728209655064e-06, + "loss": 0.0906, + "step": 182000 + }, + { + "epoch": 535.29, + "eval_cer": 0.07113900876160587, + "eval_loss": 0.5467122793197632, + "eval_runtime": 5.3361, + "eval_samples_per_second": 67.278, + "eval_steps_per_second": 2.249, + "eval_wer": 0.26632274705787523, + "step": 182000 + }, + { + "epoch": 535.59, + "learning_rate": 3.3738040482193736e-06, + "loss": 0.0893, + "step": 182100 + }, + { + "epoch": 535.88, + "learning_rate": 3.3688370707450233e-06, + "loss": 0.0942, + "step": 182200 + }, + { + "epoch": 536.18, + "learning_rate": 3.3638718940258498e-06, + "loss": 0.0911, + "step": 182300 + }, + { + "epoch": 536.47, + "learning_rate": 3.358908523543255e-06, + "loss": 0.0968, + "step": 182400 + }, + { + "epoch": 536.76, + "learning_rate": 3.3539469647766575e-06, + "loss": 0.0864, + "step": 182500 + }, + { + "epoch": 537.06, + "learning_rate": 3.3489872232034666e-06, + "loss": 0.0909, + "step": 182600 + }, + { + "epoch": 537.35, + "learning_rate": 3.3440293042990925e-06, + "loss": 0.0878, + "step": 182700 + }, + { + "epoch": 537.65, + "learning_rate": 3.339073213536926e-06, + "loss": 0.0873, + "step": 182800 + }, + { + "epoch": 537.94, + "learning_rate": 3.334118956388345e-06, + "loss": 0.0927, + "step": 182900 + }, + { + "epoch": 538.24, + "learning_rate": 3.3291665383227007e-06, + "loss": 0.092, + "step": 183000 + }, + { + "epoch": 538.24, + "eval_cer": 0.0717928599450765, + "eval_loss": 0.5496759414672852, + "eval_runtime": 4.3873, + "eval_samples_per_second": 81.827, + "eval_steps_per_second": 2.735, + "eval_wer": 0.2684185071739481, + "step": 183000 + }, + { + "epoch": 538.53, + "learning_rate": 3.3242159648073158e-06, + "loss": 0.0873, + "step": 183100 + }, + { + "epoch": 538.82, + "learning_rate": 3.3192672413074744e-06, + "loss": 0.0883, + "step": 183200 + }, + { + "epoch": 539.12, + "learning_rate": 3.3143203732864228e-06, + "loss": 0.0908, + "step": 183300 + }, + { + "epoch": 539.41, + "learning_rate": 3.3093753662053494e-06, + "loss": 0.0873, + "step": 183400 + }, + { + "epoch": 539.71, + "learning_rate": 3.304432225523402e-06, + "loss": 0.0892, + "step": 183500 + }, + { + "epoch": 540.0, + "learning_rate": 3.299490956697653e-06, + "loss": 0.0878, + "step": 183600 + }, + { + "epoch": 540.29, + "learning_rate": 3.29455156518312e-06, + "loss": 0.09, + "step": 183700 + }, + { + "epoch": 540.59, + "learning_rate": 3.2896140564327445e-06, + "loss": 0.0868, + "step": 183800 + }, + { + "epoch": 540.88, + "learning_rate": 3.2846784358973847e-06, + "loss": 0.0949, + "step": 183900 + }, + { + "epoch": 541.18, + "learning_rate": 3.2797447090258226e-06, + "loss": 0.0885, + "step": 184000 + }, + { + "epoch": 541.18, + "eval_cer": 0.07074669805152348, + "eval_loss": 0.5454766154289246, + "eval_runtime": 5.0489, + "eval_samples_per_second": 71.104, + "eval_steps_per_second": 2.377, + "eval_wer": 0.26229243914235045, + "step": 184000 + }, + { + "epoch": 541.47, + "learning_rate": 3.274812881264742e-06, + "loss": 0.0859, + "step": 184100 + }, + { + "epoch": 541.76, + "learning_rate": 3.2698829580587354e-06, + "loss": 0.0914, + "step": 184200 + }, + { + "epoch": 542.06, + "learning_rate": 3.264954944850292e-06, + "loss": 0.0912, + "step": 184300 + }, + { + "epoch": 542.35, + "learning_rate": 3.260028847079787e-06, + "loss": 0.0925, + "step": 184400 + }, + { + "epoch": 542.65, + "learning_rate": 3.2551046701854907e-06, + "loss": 0.0923, + "step": 184500 + }, + { + "epoch": 542.94, + "learning_rate": 3.250231632556272e-06, + "loss": 0.0877, + "step": 184600 + }, + { + "epoch": 543.24, + "learning_rate": 3.2453112943763365e-06, + "loss": 0.0889, + "step": 184700 + }, + { + "epoch": 543.53, + "learning_rate": 3.2403928933203477e-06, + "loss": 0.0902, + "step": 184800 + }, + { + "epoch": 543.82, + "learning_rate": 3.2354764348180695e-06, + "loss": 0.0907, + "step": 184900 + }, + { + "epoch": 544.12, + "learning_rate": 3.2305619242971294e-06, + "loss": 0.0849, + "step": 185000 + }, + { + "epoch": 544.12, + "eval_cer": 0.07153131947168824, + "eval_loss": 0.550433337688446, + "eval_runtime": 5.0702, + "eval_samples_per_second": 70.805, + "eval_steps_per_second": 2.367, + "eval_wer": 0.2664839593744962, + "step": 185000 + }, + { + "epoch": 544.41, + "learning_rate": 3.225649367182997e-06, + "loss": 0.095, + "step": 185100 + }, + { + "epoch": 544.71, + "learning_rate": 3.2207387688989895e-06, + "loss": 0.0894, + "step": 185200 + }, + { + "epoch": 545.0, + "learning_rate": 3.2158301348662623e-06, + "loss": 0.0883, + "step": 185300 + }, + { + "epoch": 545.29, + "learning_rate": 3.210923470503799e-06, + "loss": 0.0947, + "step": 185400 + }, + { + "epoch": 545.59, + "learning_rate": 3.2060187812284127e-06, + "loss": 0.088, + "step": 185500 + }, + { + "epoch": 545.88, + "learning_rate": 3.2011160724547318e-06, + "loss": 0.0869, + "step": 185600 + }, + { + "epoch": 546.18, + "learning_rate": 3.1962153495951995e-06, + "loss": 0.0904, + "step": 185700 + }, + { + "epoch": 546.47, + "learning_rate": 3.1913166180600718e-06, + "loss": 0.0917, + "step": 185800 + }, + { + "epoch": 546.76, + "learning_rate": 3.186419883257398e-06, + "loss": 0.0874, + "step": 185900 + }, + { + "epoch": 547.06, + "learning_rate": 3.18152515059303e-06, + "loss": 0.0912, + "step": 186000 + }, + { + "epoch": 547.06, + "eval_cer": 0.07100823852491173, + "eval_loss": 0.5470239520072937, + "eval_runtime": 5.3768, + "eval_samples_per_second": 66.768, + "eval_steps_per_second": 2.232, + "eval_wer": 0.2653554731581493, + "step": 186000 + }, + { + "epoch": 547.35, + "learning_rate": 3.176632425470604e-06, + "loss": 0.0929, + "step": 186100 + }, + { + "epoch": 547.65, + "learning_rate": 3.1717417132915425e-06, + "loss": 0.0891, + "step": 186200 + }, + { + "epoch": 547.94, + "learning_rate": 3.166853019455049e-06, + "loss": 0.0859, + "step": 186300 + }, + { + "epoch": 548.24, + "learning_rate": 3.1619663493580914e-06, + "loss": 0.0941, + "step": 186400 + }, + { + "epoch": 548.53, + "learning_rate": 3.157081708395412e-06, + "loss": 0.0942, + "step": 186500 + }, + { + "epoch": 548.82, + "learning_rate": 3.1521991019595033e-06, + "loss": 0.0865, + "step": 186600 + }, + { + "epoch": 549.12, + "learning_rate": 3.1473185354406226e-06, + "loss": 0.0926, + "step": 186700 + }, + { + "epoch": 549.41, + "learning_rate": 3.142440014226766e-06, + "loss": 0.0888, + "step": 186800 + }, + { + "epoch": 549.71, + "learning_rate": 3.1375635437036746e-06, + "loss": 0.0925, + "step": 186900 + }, + { + "epoch": 550.0, + "learning_rate": 3.1326891292548302e-06, + "loss": 0.0928, + "step": 187000 + }, + { + "epoch": 550.0, + "eval_cer": 0.07061592781482935, + "eval_loss": 0.5491250157356262, + "eval_runtime": 5.2902, + "eval_samples_per_second": 67.862, + "eval_steps_per_second": 2.268, + "eval_wer": 0.26438819925842333, + "step": 187000 + }, + { + "epoch": 550.29, + "learning_rate": 3.1278167762614365e-06, + "loss": 0.0886, + "step": 187100 + }, + { + "epoch": 550.59, + "learning_rate": 3.1229464901024297e-06, + "loss": 0.0886, + "step": 187200 + }, + { + "epoch": 550.88, + "learning_rate": 3.1180782761544575e-06, + "loss": 0.093, + "step": 187300 + }, + { + "epoch": 551.18, + "learning_rate": 3.1132121397918824e-06, + "loss": 0.0903, + "step": 187400 + }, + { + "epoch": 551.47, + "learning_rate": 3.108348086386777e-06, + "loss": 0.0916, + "step": 187500 + }, + { + "epoch": 551.76, + "learning_rate": 3.103486121308907e-06, + "loss": 0.0902, + "step": 187600 + }, + { + "epoch": 552.06, + "learning_rate": 3.09862624992574e-06, + "loss": 0.0911, + "step": 187700 + }, + { + "epoch": 552.35, + "learning_rate": 3.0937684776024274e-06, + "loss": 0.0921, + "step": 187800 + }, + { + "epoch": 552.65, + "learning_rate": 3.0889128097018036e-06, + "loss": 0.0908, + "step": 187900 + }, + { + "epoch": 552.94, + "learning_rate": 3.084059251584384e-06, + "loss": 0.0904, + "step": 188000 + }, + { + "epoch": 552.94, + "eval_cer": 0.0714877293927902, + "eval_loss": 0.5426270365715027, + "eval_runtime": 4.6484, + "eval_samples_per_second": 77.231, + "eval_steps_per_second": 2.582, + "eval_wer": 0.2651942608415283, + "step": 188000 + }, + { + "epoch": 553.24, + "learning_rate": 3.0792563125505725e-06, + "loss": 0.0897, + "step": 188100 + }, + { + "epoch": 553.53, + "learning_rate": 3.0744069688402957e-06, + "loss": 0.0876, + "step": 188200 + }, + { + "epoch": 553.82, + "learning_rate": 3.069559750927237e-06, + "loss": 0.0913, + "step": 188300 + }, + { + "epoch": 554.12, + "learning_rate": 3.0647146641625786e-06, + "loss": 0.0878, + "step": 188400 + }, + { + "epoch": 554.41, + "learning_rate": 3.059871713895155e-06, + "loss": 0.0893, + "step": 188500 + }, + { + "epoch": 554.71, + "learning_rate": 3.0550309054714367e-06, + "loss": 0.0894, + "step": 188600 + }, + { + "epoch": 555.0, + "learning_rate": 3.0501922442355305e-06, + "loss": 0.0933, + "step": 188700 + }, + { + "epoch": 555.29, + "learning_rate": 3.045355735529175e-06, + "loss": 0.0917, + "step": 188800 + }, + { + "epoch": 555.59, + "learning_rate": 3.0405213846917307e-06, + "loss": 0.0883, + "step": 188900 + }, + { + "epoch": 555.88, + "learning_rate": 3.0356891970601797e-06, + "loss": 0.0876, + "step": 189000 + }, + { + "epoch": 555.88, + "eval_cer": 0.07105182860380978, + "eval_loss": 0.5487252473831177, + "eval_runtime": 5.1579, + "eval_samples_per_second": 69.602, + "eval_steps_per_second": 2.327, + "eval_wer": 0.26422698694180236, + "step": 189000 + }, + { + "epoch": 556.18, + "learning_rate": 3.030859177969111e-06, + "loss": 0.0936, + "step": 189100 + }, + { + "epoch": 556.47, + "learning_rate": 3.0260313327507186e-06, + "loss": 0.0902, + "step": 189200 + }, + { + "epoch": 556.76, + "learning_rate": 3.0212056667348028e-06, + "loss": 0.0921, + "step": 189300 + }, + { + "epoch": 557.06, + "learning_rate": 3.016382185248753e-06, + "loss": 0.0905, + "step": 189400 + }, + { + "epoch": 557.35, + "learning_rate": 3.0115608936175523e-06, + "loss": 0.0867, + "step": 189500 + }, + { + "epoch": 557.65, + "learning_rate": 3.0067417971637597e-06, + "loss": 0.0923, + "step": 189600 + }, + { + "epoch": 557.94, + "learning_rate": 3.0019249012075125e-06, + "loss": 0.0951, + "step": 189700 + }, + { + "epoch": 558.24, + "learning_rate": 2.9971102110665225e-06, + "loss": 0.0875, + "step": 189800 + }, + { + "epoch": 558.53, + "learning_rate": 2.992297732056062e-06, + "loss": 0.09, + "step": 189900 + }, + { + "epoch": 558.82, + "learning_rate": 2.987487469488968e-06, + "loss": 0.0913, + "step": 190000 + }, + { + "epoch": 558.82, + "eval_cer": 0.07113900876160587, + "eval_loss": 0.5487645268440247, + "eval_runtime": 4.7526, + "eval_samples_per_second": 75.537, + "eval_steps_per_second": 2.525, + "eval_wer": 0.2637433499919394, + "step": 190000 + }, + { + "epoch": 559.12, + "learning_rate": 2.982727498068645e-06, + "loss": 0.0897, + "step": 190100 + }, + { + "epoch": 559.41, + "learning_rate": 2.977921662020099e-06, + "loss": 0.0906, + "step": 190200 + }, + { + "epoch": 559.71, + "learning_rate": 2.9731180582856704e-06, + "loss": 0.0901, + "step": 190300 + }, + { + "epoch": 560.0, + "learning_rate": 2.9683166921683935e-06, + "loss": 0.087, + "step": 190400 + }, + { + "epoch": 560.29, + "learning_rate": 2.963517568968831e-06, + "loss": 0.0888, + "step": 190500 + }, + { + "epoch": 560.59, + "learning_rate": 2.9587206939850745e-06, + "loss": 0.0902, + "step": 190600 + }, + { + "epoch": 560.88, + "learning_rate": 2.9539260725127276e-06, + "loss": 0.0884, + "step": 190700 + }, + { + "epoch": 561.18, + "learning_rate": 2.9491337098449125e-06, + "loss": 0.0893, + "step": 190800 + }, + { + "epoch": 561.47, + "learning_rate": 2.9443436112722536e-06, + "loss": 0.0901, + "step": 190900 + }, + { + "epoch": 561.76, + "learning_rate": 2.9395557820828742e-06, + "loss": 0.0926, + "step": 191000 + }, + { + "epoch": 561.76, + "eval_cer": 0.07144413931389215, + "eval_loss": 0.5500932335853577, + "eval_runtime": 5.4728, + "eval_samples_per_second": 65.597, + "eval_steps_per_second": 2.193, + "eval_wer": 0.26632274705787523, + "step": 191000 + }, + { + "epoch": 562.06, + "learning_rate": 2.934770227562399e-06, + "loss": 0.0911, + "step": 191100 + }, + { + "epoch": 562.35, + "learning_rate": 2.929986952993933e-06, + "loss": 0.0954, + "step": 191200 + }, + { + "epoch": 562.65, + "learning_rate": 2.925205963658071e-06, + "loss": 0.0898, + "step": 191300 + }, + { + "epoch": 562.94, + "learning_rate": 2.9204272648328835e-06, + "loss": 0.0911, + "step": 191400 + }, + { + "epoch": 563.24, + "learning_rate": 2.915650861793908e-06, + "loss": 0.0887, + "step": 191500 + }, + { + "epoch": 563.53, + "learning_rate": 2.910876759814154e-06, + "loss": 0.089, + "step": 191600 + }, + { + "epoch": 563.82, + "learning_rate": 2.9061049641640858e-06, + "loss": 0.0856, + "step": 191700 + }, + { + "epoch": 564.12, + "learning_rate": 2.9013354801116246e-06, + "loss": 0.0859, + "step": 191800 + }, + { + "epoch": 564.41, + "learning_rate": 2.8965683129221395e-06, + "loss": 0.0957, + "step": 191900 + }, + { + "epoch": 564.71, + "learning_rate": 2.891803467858435e-06, + "loss": 0.0842, + "step": 192000 + }, + { + "epoch": 564.71, + "eval_cer": 0.07157490955058629, + "eval_loss": 0.5528156757354736, + "eval_runtime": 4.4134, + "eval_samples_per_second": 81.344, + "eval_steps_per_second": 2.719, + "eval_wer": 0.2666451716911172, + "step": 192000 + }, + { + "epoch": 565.0, + "learning_rate": 2.8870409501807633e-06, + "loss": 0.0866, + "step": 192100 + }, + { + "epoch": 565.29, + "learning_rate": 2.8822807651468005e-06, + "loss": 0.0891, + "step": 192200 + }, + { + "epoch": 565.59, + "learning_rate": 2.8775229180116483e-06, + "loss": 0.0882, + "step": 192300 + }, + { + "epoch": 565.88, + "learning_rate": 2.8727674140278293e-06, + "loss": 0.0932, + "step": 192400 + }, + { + "epoch": 566.18, + "learning_rate": 2.868014258445274e-06, + "loss": 0.0873, + "step": 192500 + }, + { + "epoch": 566.47, + "learning_rate": 2.863263456511328e-06, + "loss": 0.0933, + "step": 192600 + }, + { + "epoch": 566.76, + "learning_rate": 2.858515013470734e-06, + "loss": 0.0903, + "step": 192700 + }, + { + "epoch": 567.06, + "learning_rate": 2.8537689345656307e-06, + "loss": 0.091, + "step": 192800 + }, + { + "epoch": 567.35, + "learning_rate": 2.8490252250355505e-06, + "loss": 0.0909, + "step": 192900 + }, + { + "epoch": 567.65, + "learning_rate": 2.8442838901174e-06, + "loss": 0.0863, + "step": 193000 + }, + { + "epoch": 567.65, + "eval_cer": 0.07126977899829999, + "eval_loss": 0.5538076162338257, + "eval_runtime": 4.856, + "eval_samples_per_second": 73.929, + "eval_steps_per_second": 2.471, + "eval_wer": 0.26616153474125426, + "step": 193000 + }, + { + "epoch": 567.94, + "learning_rate": 2.839592312798779e-06, + "loss": 0.0894, + "step": 193100 + }, + { + "epoch": 568.24, + "learning_rate": 2.834855718928081e-06, + "loss": 0.0901, + "step": 193200 + }, + { + "epoch": 568.53, + "learning_rate": 2.830121515312029e-06, + "loss": 0.0875, + "step": 193300 + }, + { + "epoch": 568.82, + "learning_rate": 2.8253897071770427e-06, + "loss": 0.0842, + "step": 193400 + }, + { + "epoch": 569.12, + "learning_rate": 2.8206602997468963e-06, + "loss": 0.0935, + "step": 193500 + }, + { + "epoch": 569.41, + "learning_rate": 2.8159332982427146e-06, + "loss": 0.0919, + "step": 193600 + }, + { + "epoch": 569.71, + "learning_rate": 2.8112087078829664e-06, + "loss": 0.0862, + "step": 193700 + }, + { + "epoch": 570.0, + "learning_rate": 2.8064865338834586e-06, + "loss": 0.0903, + "step": 193800 + }, + { + "epoch": 570.29, + "learning_rate": 2.8017667814573297e-06, + "loss": 0.0929, + "step": 193900 + }, + { + "epoch": 570.59, + "learning_rate": 2.7970494558150456e-06, + "loss": 0.0885, + "step": 194000 + }, + { + "epoch": 570.59, + "eval_cer": 0.0708774682882176, + "eval_loss": 0.543542742729187, + "eval_runtime": 4.864, + "eval_samples_per_second": 73.807, + "eval_steps_per_second": 2.467, + "eval_wer": 0.2653554731581493, + "step": 194000 + }, + { + "epoch": 570.88, + "learning_rate": 2.792334562164394e-06, + "loss": 0.0874, + "step": 194100 + }, + { + "epoch": 571.18, + "learning_rate": 2.7876221057104745e-06, + "loss": 0.0906, + "step": 194200 + }, + { + "epoch": 571.47, + "learning_rate": 2.7829120916557005e-06, + "loss": 0.0891, + "step": 194300 + }, + { + "epoch": 571.76, + "learning_rate": 2.778204525199786e-06, + "loss": 0.0887, + "step": 194400 + }, + { + "epoch": 572.06, + "learning_rate": 2.773499411539744e-06, + "loss": 0.0853, + "step": 194500 + }, + { + "epoch": 572.35, + "learning_rate": 2.768796755869879e-06, + "loss": 0.0846, + "step": 194600 + }, + { + "epoch": 572.65, + "learning_rate": 2.764096563381784e-06, + "loss": 0.0835, + "step": 194700 + }, + { + "epoch": 572.94, + "learning_rate": 2.759398839264329e-06, + "loss": 0.0919, + "step": 194800 + }, + { + "epoch": 573.24, + "learning_rate": 2.754703588703663e-06, + "loss": 0.0872, + "step": 194900 + }, + { + "epoch": 573.53, + "learning_rate": 2.7500108168832006e-06, + "loss": 0.0875, + "step": 195000 + }, + { + "epoch": 573.53, + "eval_cer": 0.07065951789372739, + "eval_loss": 0.5488081574440002, + "eval_runtime": 5.0704, + "eval_samples_per_second": 70.803, + "eval_steps_per_second": 2.367, + "eval_wer": 0.26261486377559246, + "step": 195000 + }, + { + "epoch": 573.82, + "learning_rate": 2.745320528983624e-06, + "loss": 0.0898, + "step": 195100 + }, + { + "epoch": 574.12, + "learning_rate": 2.7406327301828693e-06, + "loss": 0.0853, + "step": 195200 + }, + { + "epoch": 574.41, + "learning_rate": 2.7359474256561273e-06, + "loss": 0.0854, + "step": 195300 + }, + { + "epoch": 574.71, + "learning_rate": 2.731264620575834e-06, + "loss": 0.093, + "step": 195400 + }, + { + "epoch": 575.0, + "learning_rate": 2.7265843201116658e-06, + "loss": 0.087, + "step": 195500 + }, + { + "epoch": 575.29, + "learning_rate": 2.7219065294305363e-06, + "loss": 0.0918, + "step": 195600 + }, + { + "epoch": 575.59, + "learning_rate": 2.7172312536965857e-06, + "loss": 0.09, + "step": 195700 + }, + { + "epoch": 575.88, + "learning_rate": 2.7125584980711784e-06, + "loss": 0.0884, + "step": 195800 + }, + { + "epoch": 576.18, + "learning_rate": 2.7078882677128983e-06, + "loss": 0.0837, + "step": 195900 + }, + { + "epoch": 576.47, + "learning_rate": 2.7032205677775385e-06, + "loss": 0.0924, + "step": 196000 + }, + { + "epoch": 576.47, + "eval_cer": 0.07079028813042151, + "eval_loss": 0.5483184456825256, + "eval_runtime": 4.8631, + "eval_samples_per_second": 73.821, + "eval_steps_per_second": 2.468, + "eval_wer": 0.26454941157504436, + "step": 196000 + }, + { + "epoch": 576.76, + "learning_rate": 2.6985554034181022e-06, + "loss": 0.0909, + "step": 196100 + }, + { + "epoch": 577.06, + "learning_rate": 2.6939393934276265e-06, + "loss": 0.0874, + "step": 196200 + }, + { + "epoch": 577.35, + "learning_rate": 2.6893258785973584e-06, + "loss": 0.0861, + "step": 196300 + }, + { + "epoch": 577.65, + "learning_rate": 2.684668300784915e-06, + "loss": 0.0831, + "step": 196400 + }, + { + "epoch": 577.94, + "learning_rate": 2.680013279029546e-06, + "loss": 0.0918, + "step": 196500 + }, + { + "epoch": 578.24, + "learning_rate": 2.675360818470253e-06, + "loss": 0.0898, + "step": 196600 + }, + { + "epoch": 578.53, + "learning_rate": 2.670710924243214e-06, + "loss": 0.0918, + "step": 196700 + }, + { + "epoch": 578.82, + "learning_rate": 2.6660636014817764e-06, + "loss": 0.0897, + "step": 196800 + }, + { + "epoch": 579.12, + "learning_rate": 2.6614188553164387e-06, + "loss": 0.0912, + "step": 196900 + }, + { + "epoch": 579.41, + "learning_rate": 2.656776690874868e-06, + "loss": 0.0884, + "step": 197000 + }, + { + "epoch": 579.41, + "eval_cer": 0.07092105836711564, + "eval_loss": 0.5512089133262634, + "eval_runtime": 4.8465, + "eval_samples_per_second": 74.074, + "eval_steps_per_second": 2.476, + "eval_wer": 0.26551668547477025, + "step": 197000 + }, + { + "epoch": 579.71, + "learning_rate": 2.652137113281874e-06, + "loss": 0.0817, + "step": 197100 + }, + { + "epoch": 580.0, + "learning_rate": 2.6475001276594115e-06, + "loss": 0.0875, + "step": 197200 + }, + { + "epoch": 580.29, + "learning_rate": 2.6428657391265756e-06, + "loss": 0.085, + "step": 197300 + }, + { + "epoch": 580.59, + "learning_rate": 2.638233952799588e-06, + "loss": 0.0851, + "step": 197400 + }, + { + "epoch": 580.88, + "learning_rate": 2.633604773791808e-06, + "loss": 0.089, + "step": 197500 + }, + { + "epoch": 581.18, + "learning_rate": 2.628978207213708e-06, + "loss": 0.0921, + "step": 197600 + }, + { + "epoch": 581.47, + "learning_rate": 2.624354258172881e-06, + "loss": 0.0889, + "step": 197700 + }, + { + "epoch": 581.76, + "learning_rate": 2.6197329317740304e-06, + "loss": 0.0874, + "step": 197800 + }, + { + "epoch": 582.06, + "learning_rate": 2.6151142331189556e-06, + "loss": 0.0807, + "step": 197900 + }, + { + "epoch": 582.35, + "learning_rate": 2.610498167306569e-06, + "loss": 0.0904, + "step": 198000 + }, + { + "epoch": 582.35, + "eval_cer": 0.07079028813042151, + "eval_loss": 0.5547834038734436, + "eval_runtime": 4.9397, + "eval_samples_per_second": 72.676, + "eval_steps_per_second": 2.429, + "eval_wer": 0.26600032242463323, + "step": 198000 + }, + { + "epoch": 582.65, + "learning_rate": 2.605884739432867e-06, + "loss": 0.0887, + "step": 198100 + }, + { + "epoch": 582.94, + "learning_rate": 2.601273954590936e-06, + "loss": 0.0895, + "step": 198200 + }, + { + "epoch": 583.24, + "learning_rate": 2.596665817870947e-06, + "loss": 0.085, + "step": 198300 + }, + { + "epoch": 583.53, + "learning_rate": 2.59206033436014e-06, + "loss": 0.084, + "step": 198400 + }, + { + "epoch": 583.82, + "learning_rate": 2.5874575091428383e-06, + "loss": 0.0945, + "step": 198500 + }, + { + "epoch": 584.12, + "learning_rate": 2.5828573473004157e-06, + "loss": 0.0809, + "step": 198600 + }, + { + "epoch": 584.41, + "learning_rate": 2.5782598539113205e-06, + "loss": 0.0859, + "step": 198700 + }, + { + "epoch": 584.71, + "learning_rate": 2.5737109689990237e-06, + "loss": 0.0896, + "step": 198800 + }, + { + "epoch": 585.0, + "learning_rate": 2.569118800928999e-06, + "loss": 0.087, + "step": 198900 + }, + { + "epoch": 585.29, + "learning_rate": 2.564529316479245e-06, + "loss": 0.0882, + "step": 199000 + }, + { + "epoch": 585.29, + "eval_cer": 0.07092105836711564, + "eval_loss": 0.5537840723991394, + "eval_runtime": 4.9542, + "eval_samples_per_second": 72.464, + "eval_steps_per_second": 2.422, + "eval_wer": 0.2656778977913913, + "step": 199000 + }, + { + "epoch": 585.59, + "learning_rate": 2.559942520716414e-06, + "loss": 0.0905, + "step": 199100 + }, + { + "epoch": 585.88, + "learning_rate": 2.5553584187041926e-06, + "loss": 0.0917, + "step": 199200 + }, + { + "epoch": 586.18, + "learning_rate": 2.5507770155032917e-06, + "loss": 0.085, + "step": 199300 + }, + { + "epoch": 586.47, + "learning_rate": 2.5461983161714442e-06, + "loss": 0.0868, + "step": 199400 + }, + { + "epoch": 586.76, + "learning_rate": 2.5416223257633977e-06, + "loss": 0.0875, + "step": 199500 + }, + { + "epoch": 587.06, + "learning_rate": 2.5370490493309086e-06, + "loss": 0.0869, + "step": 199600 + }, + { + "epoch": 587.35, + "learning_rate": 2.5324784919227373e-06, + "loss": 0.0861, + "step": 199700 + }, + { + "epoch": 587.65, + "learning_rate": 2.527910658584643e-06, + "loss": 0.0874, + "step": 199800 + }, + { + "epoch": 587.94, + "learning_rate": 2.5233455543593778e-06, + "loss": 0.0922, + "step": 199900 + }, + { + "epoch": 588.24, + "learning_rate": 2.5187831842866795e-06, + "loss": 0.0917, + "step": 200000 + }, + { + "epoch": 588.24, + "eval_cer": 0.07031079726254305, + "eval_loss": 0.5549612045288086, + "eval_runtime": 4.6478, + "eval_samples_per_second": 77.24, + "eval_steps_per_second": 2.582, + "eval_wer": 0.2650330485249073, + "step": 200000 + }, + { + "epoch": 588.53, + "learning_rate": 2.5142235534032688e-06, + "loss": 0.0845, + "step": 200100 + }, + { + "epoch": 588.82, + "learning_rate": 2.5096666667428427e-06, + "loss": 0.0859, + "step": 200200 + }, + { + "epoch": 589.12, + "learning_rate": 2.5051125293360667e-06, + "loss": 0.0898, + "step": 200300 + }, + { + "epoch": 589.41, + "learning_rate": 2.5005611462105746e-06, + "loss": 0.0914, + "step": 200400 + }, + { + "epoch": 589.71, + "learning_rate": 2.4960125223909555e-06, + "loss": 0.0874, + "step": 200500 + }, + { + "epoch": 590.0, + "learning_rate": 2.4914666628987555e-06, + "loss": 0.0931, + "step": 200600 + }, + { + "epoch": 590.29, + "learning_rate": 2.486923572752467e-06, + "loss": 0.0875, + "step": 200700 + }, + { + "epoch": 590.59, + "learning_rate": 2.4823832569675267e-06, + "loss": 0.0855, + "step": 200800 + }, + { + "epoch": 590.88, + "learning_rate": 2.4778457205563067e-06, + "loss": 0.0874, + "step": 200900 + }, + { + "epoch": 591.18, + "learning_rate": 2.4733109685281124e-06, + "loss": 0.086, + "step": 201000 + }, + { + "epoch": 591.18, + "eval_cer": 0.07048515757813521, + "eval_loss": 0.5632910132408142, + "eval_runtime": 5.3132, + "eval_samples_per_second": 67.568, + "eval_steps_per_second": 2.259, + "eval_wer": 0.2648718362082863, + "step": 201000 + }, + { + "epoch": 591.47, + "learning_rate": 2.468779005889174e-06, + "loss": 0.0856, + "step": 201100 + }, + { + "epoch": 591.76, + "learning_rate": 2.4642498376426442e-06, + "loss": 0.0864, + "step": 201200 + }, + { + "epoch": 592.06, + "learning_rate": 2.4597234687885885e-06, + "loss": 0.0915, + "step": 201300 + }, + { + "epoch": 592.35, + "learning_rate": 2.455199904323983e-06, + "loss": 0.0937, + "step": 201400 + }, + { + "epoch": 592.65, + "learning_rate": 2.4506791492427086e-06, + "loss": 0.0884, + "step": 201500 + }, + { + "epoch": 592.94, + "learning_rate": 2.446161208535543e-06, + "loss": 0.0841, + "step": 201600 + }, + { + "epoch": 593.24, + "learning_rate": 2.4416460871901585e-06, + "loss": 0.0819, + "step": 201700 + }, + { + "epoch": 593.53, + "learning_rate": 2.4371337901911142e-06, + "loss": 0.0884, + "step": 201800 + }, + { + "epoch": 593.82, + "learning_rate": 2.4326243225198505e-06, + "loss": 0.088, + "step": 201900 + }, + { + "epoch": 594.12, + "learning_rate": 2.4281176891546858e-06, + "loss": 0.0851, + "step": 202000 + }, + { + "epoch": 594.12, + "eval_cer": 0.07061592781482935, + "eval_loss": 0.5610267519950867, + "eval_runtime": 5.3517, + "eval_samples_per_second": 67.082, + "eval_steps_per_second": 2.242, + "eval_wer": 0.2651942608415283, + "step": 202000 + }, + { + "epoch": 594.41, + "learning_rate": 2.4236138950708086e-06, + "loss": 0.0849, + "step": 202100 + }, + { + "epoch": 594.71, + "learning_rate": 2.419112945240274e-06, + "loss": 0.0862, + "step": 202200 + }, + { + "epoch": 595.0, + "learning_rate": 2.4146148446319944e-06, + "loss": 0.0856, + "step": 202300 + }, + { + "epoch": 595.29, + "learning_rate": 2.41011959821174e-06, + "loss": 0.0894, + "step": 202400 + }, + { + "epoch": 595.59, + "learning_rate": 2.4056272109421286e-06, + "loss": 0.087, + "step": 202500 + }, + { + "epoch": 595.88, + "learning_rate": 2.401137687782621e-06, + "loss": 0.0889, + "step": 202600 + }, + { + "epoch": 596.18, + "learning_rate": 2.3966510336895166e-06, + "loss": 0.0854, + "step": 202700 + }, + { + "epoch": 596.47, + "learning_rate": 2.3921672536159486e-06, + "loss": 0.0866, + "step": 202800 + }, + { + "epoch": 596.76, + "learning_rate": 2.387686352511875e-06, + "loss": 0.0875, + "step": 202900 + }, + { + "epoch": 597.06, + "learning_rate": 2.383208335324078e-06, + "loss": 0.0852, + "step": 203000 + }, + { + "epoch": 597.06, + "eval_cer": 0.07035438734144109, + "eval_loss": 0.5522825717926025, + "eval_runtime": 4.7713, + "eval_samples_per_second": 75.241, + "eval_steps_per_second": 2.515, + "eval_wer": 0.2624536514589715, + "step": 203000 + }, + { + "epoch": 597.35, + "learning_rate": 2.3787332069961545e-06, + "loss": 0.0834, + "step": 203100 + }, + { + "epoch": 597.65, + "learning_rate": 2.3742609724685123e-06, + "loss": 0.0891, + "step": 203200 + }, + { + "epoch": 597.94, + "learning_rate": 2.3697916366783653e-06, + "loss": 0.0892, + "step": 203300 + }, + { + "epoch": 598.24, + "learning_rate": 2.3653252045597257e-06, + "loss": 0.0858, + "step": 203400 + }, + { + "epoch": 598.53, + "learning_rate": 2.3608616810434028e-06, + "loss": 0.0838, + "step": 203500 + }, + { + "epoch": 598.82, + "learning_rate": 2.3564010710569924e-06, + "loss": 0.0852, + "step": 203600 + }, + { + "epoch": 599.12, + "learning_rate": 2.3519433795248748e-06, + "loss": 0.0938, + "step": 203700 + }, + { + "epoch": 599.41, + "learning_rate": 2.3474886113682097e-06, + "loss": 0.0864, + "step": 203800 + }, + { + "epoch": 599.71, + "learning_rate": 2.3430367715049235e-06, + "loss": 0.0871, + "step": 203900 + }, + { + "epoch": 600.0, + "learning_rate": 2.33858786484972e-06, + "loss": 0.0871, + "step": 204000 + }, + { + "epoch": 600.0, + "eval_cer": 0.0711825988405039, + "eval_loss": 0.5549289584159851, + "eval_runtime": 4.6864, + "eval_samples_per_second": 76.604, + "eval_steps_per_second": 2.561, + "eval_wer": 0.2680960825407061, + "step": 204000 + }, + { + "epoch": 600.29, + "learning_rate": 2.334141896314057e-06, + "loss": 0.0874, + "step": 204100 + }, + { + "epoch": 600.59, + "learning_rate": 2.329698870806151e-06, + "loss": 0.0827, + "step": 204200 + }, + { + "epoch": 600.88, + "learning_rate": 2.325258793230972e-06, + "loss": 0.0825, + "step": 204300 + }, + { + "epoch": 601.18, + "learning_rate": 2.320821668490227e-06, + "loss": 0.0812, + "step": 204400 + }, + { + "epoch": 601.47, + "learning_rate": 2.3163875014823745e-06, + "loss": 0.082, + "step": 204500 + }, + { + "epoch": 601.76, + "learning_rate": 2.3119562971026018e-06, + "loss": 0.086, + "step": 204600 + }, + { + "epoch": 602.06, + "learning_rate": 2.3075280602428245e-06, + "loss": 0.0839, + "step": 204700 + }, + { + "epoch": 602.35, + "learning_rate": 2.3031027957916875e-06, + "loss": 0.0848, + "step": 204800 + }, + { + "epoch": 602.65, + "learning_rate": 2.298680508634544e-06, + "loss": 0.0843, + "step": 204900 + }, + { + "epoch": 602.94, + "learning_rate": 2.294261203653473e-06, + "loss": 0.0852, + "step": 205000 + }, + { + "epoch": 602.94, + "eval_cer": 0.07096464844601369, + "eval_loss": 0.5612467527389526, + "eval_runtime": 4.9666, + "eval_samples_per_second": 72.282, + "eval_steps_per_second": 2.416, + "eval_wer": 0.2666451716911172, + "step": 205000 + }, + { + "epoch": 603.24, + "learning_rate": 2.2898890341045833e-06, + "loss": 0.087, + "step": 205100 + }, + { + "epoch": 603.53, + "learning_rate": 2.2854756781652714e-06, + "loss": 0.0855, + "step": 205200 + }, + { + "epoch": 603.82, + "learning_rate": 2.281065318979769e-06, + "loss": 0.0866, + "step": 205300 + }, + { + "epoch": 604.12, + "learning_rate": 2.276657961416981e-06, + "loss": 0.0895, + "step": 205400 + }, + { + "epoch": 604.41, + "learning_rate": 2.2722536103424977e-06, + "loss": 0.0823, + "step": 205500 + }, + { + "epoch": 604.71, + "learning_rate": 2.2678522706185918e-06, + "loss": 0.083, + "step": 205600 + }, + { + "epoch": 605.0, + "learning_rate": 2.2634539471042104e-06, + "loss": 0.0893, + "step": 205700 + }, + { + "epoch": 605.29, + "learning_rate": 2.2590586446549725e-06, + "loss": 0.0835, + "step": 205800 + }, + { + "epoch": 605.59, + "learning_rate": 2.2546663681231596e-06, + "loss": 0.0869, + "step": 205900 + }, + { + "epoch": 605.88, + "learning_rate": 2.250277122357714e-06, + "loss": 0.083, + "step": 206000 + }, + { + "epoch": 605.88, + "eval_cer": 0.07092105836711564, + "eval_loss": 0.562522292137146, + "eval_runtime": 4.7678, + "eval_samples_per_second": 75.296, + "eval_steps_per_second": 2.517, + "eval_wer": 0.2648718362082863, + "step": 206000 + }, + { + "epoch": 606.18, + "learning_rate": 2.245890912204233e-06, + "loss": 0.0843, + "step": 206100 + }, + { + "epoch": 606.47, + "learning_rate": 2.2415077425049604e-06, + "loss": 0.085, + "step": 206200 + }, + { + "epoch": 606.76, + "learning_rate": 2.2371714042527648e-06, + "loss": 0.0867, + "step": 206300 + }, + { + "epoch": 607.06, + "learning_rate": 2.2327942994500047e-06, + "loss": 0.0816, + "step": 206400 + }, + { + "epoch": 607.35, + "learning_rate": 2.228420249559719e-06, + "loss": 0.0853, + "step": 206500 + }, + { + "epoch": 607.65, + "learning_rate": 2.224049259410736e-06, + "loss": 0.087, + "step": 206600 + }, + { + "epoch": 607.94, + "learning_rate": 2.2196813338284906e-06, + "loss": 0.0845, + "step": 206700 + }, + { + "epoch": 608.24, + "learning_rate": 2.2153164776350483e-06, + "loss": 0.0828, + "step": 206800 + }, + { + "epoch": 608.53, + "learning_rate": 2.2109546956490803e-06, + "loss": 0.0845, + "step": 206900 + }, + { + "epoch": 608.82, + "learning_rate": 2.2065959926858566e-06, + "loss": 0.0859, + "step": 207000 + }, + { + "epoch": 608.82, + "eval_cer": 0.0708774682882176, + "eval_loss": 0.5508594512939453, + "eval_runtime": 5.2083, + "eval_samples_per_second": 68.928, + "eval_steps_per_second": 2.304, + "eval_wer": 0.26390456230856035, + "step": 207000 + }, + { + "epoch": 609.12, + "learning_rate": 2.202240373557264e-06, + "loss": 0.0869, + "step": 207100 + }, + { + "epoch": 609.41, + "learning_rate": 2.197887843071768e-06, + "loss": 0.089, + "step": 207200 + }, + { + "epoch": 609.71, + "learning_rate": 2.19353840603444e-06, + "loss": 0.0842, + "step": 207300 + }, + { + "epoch": 610.0, + "learning_rate": 2.189192067246923e-06, + "loss": 0.0879, + "step": 207400 + }, + { + "epoch": 610.29, + "learning_rate": 2.184848831507445e-06, + "loss": 0.0901, + "step": 207500 + }, + { + "epoch": 610.59, + "learning_rate": 2.180508703610814e-06, + "loss": 0.0862, + "step": 207600 + }, + { + "epoch": 610.88, + "learning_rate": 2.176171688348395e-06, + "loss": 0.0821, + "step": 207700 + }, + { + "epoch": 611.18, + "learning_rate": 2.1718377905081306e-06, + "loss": 0.082, + "step": 207800 + }, + { + "epoch": 611.47, + "learning_rate": 2.167507014874508e-06, + "loss": 0.0832, + "step": 207900 + }, + { + "epoch": 611.76, + "learning_rate": 2.1631793662285754e-06, + "loss": 0.0842, + "step": 208000 + }, + { + "epoch": 611.76, + "eval_cer": 0.07013643694695088, + "eval_loss": 0.5625478625297546, + "eval_runtime": 4.8229, + "eval_samples_per_second": 74.437, + "eval_steps_per_second": 2.488, + "eval_wer": 0.2648718362082863, + "step": 208000 + }, + { + "epoch": 612.06, + "learning_rate": 2.158854849347933e-06, + "loss": 0.087, + "step": 208100 + }, + { + "epoch": 612.35, + "learning_rate": 2.1545334690067107e-06, + "loss": 0.0852, + "step": 208200 + }, + { + "epoch": 612.65, + "learning_rate": 2.1502152299755904e-06, + "loss": 0.0899, + "step": 208300 + }, + { + "epoch": 612.94, + "learning_rate": 2.1459001370217743e-06, + "loss": 0.0866, + "step": 208400 + }, + { + "epoch": 613.24, + "learning_rate": 2.1415881949089956e-06, + "loss": 0.0895, + "step": 208500 + }, + { + "epoch": 613.53, + "learning_rate": 2.1372794083975156e-06, + "loss": 0.0863, + "step": 208600 + }, + { + "epoch": 613.82, + "learning_rate": 2.133016822846251e-06, + "loss": 0.0887, + "step": 208700 + }, + { + "epoch": 614.12, + "learning_rate": 2.1287143301295543e-06, + "loss": 0.0871, + "step": 208800 + }, + { + "epoch": 614.41, + "learning_rate": 2.124415007226515e-06, + "loss": 0.0883, + "step": 208900 + }, + { + "epoch": 614.71, + "learning_rate": 2.120118858883457e-06, + "loss": 0.084, + "step": 209000 + }, + { + "epoch": 614.71, + "eval_cer": 0.0705723377359313, + "eval_loss": 0.5603653192520142, + "eval_runtime": 4.9708, + "eval_samples_per_second": 72.222, + "eval_steps_per_second": 2.414, + "eval_wer": 0.26422698694180236, + "step": 209000 + }, + { + "epoch": 615.0, + "learning_rate": 2.115825889843199e-06, + "loss": 0.0854, + "step": 209100 + }, + { + "epoch": 615.29, + "learning_rate": 2.111536104845055e-06, + "loss": 0.0825, + "step": 209200 + }, + { + "epoch": 615.59, + "learning_rate": 2.1072495086248112e-06, + "loss": 0.0868, + "step": 209300 + }, + { + "epoch": 615.88, + "learning_rate": 2.1029661059147488e-06, + "loss": 0.0801, + "step": 209400 + }, + { + "epoch": 616.18, + "learning_rate": 2.098685901443615e-06, + "loss": 0.084, + "step": 209500 + }, + { + "epoch": 616.47, + "learning_rate": 2.094408899936627e-06, + "loss": 0.0847, + "step": 209600 + }, + { + "epoch": 616.76, + "learning_rate": 2.0901351061154686e-06, + "loss": 0.0809, + "step": 209700 + }, + { + "epoch": 617.06, + "learning_rate": 2.085864524698275e-06, + "loss": 0.0863, + "step": 209800 + }, + { + "epoch": 617.35, + "learning_rate": 2.0815971603996466e-06, + "loss": 0.0842, + "step": 209900 + }, + { + "epoch": 617.65, + "learning_rate": 2.0773330179306243e-06, + "loss": 0.0891, + "step": 210000 + }, + { + "epoch": 617.65, + "eval_cer": 0.0699620766313587, + "eval_loss": 0.5616000890731812, + "eval_runtime": 5.1126, + "eval_samples_per_second": 70.219, + "eval_steps_per_second": 2.347, + "eval_wer": 0.2632597130420764, + "step": 210000 + }, + { + "epoch": 617.94, + "learning_rate": 2.073072101998694e-06, + "loss": 0.0861, + "step": 210100 + }, + { + "epoch": 618.24, + "learning_rate": 2.0688144173077814e-06, + "loss": 0.0872, + "step": 210200 + }, + { + "epoch": 618.53, + "learning_rate": 2.0645599685582372e-06, + "loss": 0.0846, + "step": 210300 + }, + { + "epoch": 618.82, + "learning_rate": 2.0603087604468527e-06, + "loss": 0.0832, + "step": 210400 + }, + { + "epoch": 619.12, + "learning_rate": 2.056060797666832e-06, + "loss": 0.0834, + "step": 210500 + }, + { + "epoch": 619.41, + "learning_rate": 2.051816084907799e-06, + "loss": 0.085, + "step": 210600 + }, + { + "epoch": 619.71, + "learning_rate": 2.0476170253101334e-06, + "loss": 0.0829, + "step": 210700 + }, + { + "epoch": 620.0, + "learning_rate": 2.0434211601942156e-06, + "loss": 0.087, + "step": 210800 + }, + { + "epoch": 620.29, + "learning_rate": 2.0391861602727887e-06, + "loss": 0.0848, + "step": 210900 + }, + { + "epoch": 620.59, + "learning_rate": 2.0349544290014495e-06, + "loss": 0.0839, + "step": 211000 + }, + { + "epoch": 620.59, + "eval_cer": 0.07061592781482935, + "eval_loss": 0.564612865447998, + "eval_runtime": 4.8577, + "eval_samples_per_second": 73.903, + "eval_steps_per_second": 2.47, + "eval_wer": 0.2648718362082863, + "step": 211000 + }, + { + "epoch": 620.88, + "learning_rate": 2.030725971051895e-06, + "loss": 0.0888, + "step": 211100 + }, + { + "epoch": 621.18, + "learning_rate": 2.026500791092223e-06, + "loss": 0.0862, + "step": 211200 + }, + { + "epoch": 621.47, + "learning_rate": 2.022278893786906e-06, + "loss": 0.0774, + "step": 211300 + }, + { + "epoch": 621.76, + "learning_rate": 2.018060283796786e-06, + "loss": 0.0832, + "step": 211400 + }, + { + "epoch": 622.06, + "learning_rate": 2.0138449657790904e-06, + "loss": 0.0831, + "step": 211500 + }, + { + "epoch": 622.35, + "learning_rate": 2.0096329443873976e-06, + "loss": 0.0905, + "step": 211600 + }, + { + "epoch": 622.65, + "learning_rate": 2.005424224271658e-06, + "loss": 0.088, + "step": 211700 + }, + { + "epoch": 622.94, + "learning_rate": 2.0012188100781738e-06, + "loss": 0.0845, + "step": 211800 + }, + { + "epoch": 623.24, + "learning_rate": 1.997016706449591e-06, + "loss": 0.0834, + "step": 211900 + }, + { + "epoch": 623.53, + "learning_rate": 1.992817918024914e-06, + "loss": 0.085, + "step": 212000 + }, + { + "epoch": 623.53, + "eval_cer": 0.07083387820931956, + "eval_loss": 0.5574280023574829, + "eval_runtime": 5.1804, + "eval_samples_per_second": 69.3, + "eval_steps_per_second": 2.316, + "eval_wer": 0.2648718362082863, + "step": 212000 + }, + { + "epoch": 623.82, + "learning_rate": 1.9886224494394724e-06, + "loss": 0.0873, + "step": 212100 + }, + { + "epoch": 624.12, + "learning_rate": 1.9844303053249453e-06, + "loss": 0.0859, + "step": 212200 + }, + { + "epoch": 624.41, + "learning_rate": 1.9802414903093293e-06, + "loss": 0.0868, + "step": 212300 + }, + { + "epoch": 624.71, + "learning_rate": 1.9760560090169512e-06, + "loss": 0.0842, + "step": 212400 + }, + { + "epoch": 625.0, + "learning_rate": 1.9718738660684627e-06, + "loss": 0.0849, + "step": 212500 + }, + { + "epoch": 625.29, + "learning_rate": 1.967695066080818e-06, + "loss": 0.0862, + "step": 212600 + }, + { + "epoch": 625.59, + "learning_rate": 1.9635196136672945e-06, + "loss": 0.0838, + "step": 212700 + }, + { + "epoch": 625.88, + "learning_rate": 1.959347513437461e-06, + "loss": 0.082, + "step": 212800 + }, + { + "epoch": 626.18, + "learning_rate": 1.955178769997193e-06, + "loss": 0.0844, + "step": 212900 + }, + { + "epoch": 626.47, + "learning_rate": 1.9510133879486625e-06, + "loss": 0.0832, + "step": 213000 + }, + { + "epoch": 626.47, + "eval_cer": 0.07044156749923718, + "eval_loss": 0.5674094557762146, + "eval_runtime": 4.8288, + "eval_samples_per_second": 74.345, + "eval_steps_per_second": 2.485, + "eval_wer": 0.2650330485249073, + "step": 213000 + }, + { + "epoch": 626.76, + "learning_rate": 1.946851371890321e-06, + "loss": 0.0817, + "step": 213100 + }, + { + "epoch": 627.06, + "learning_rate": 1.9426927264169165e-06, + "loss": 0.0869, + "step": 213200 + }, + { + "epoch": 627.35, + "learning_rate": 1.9385374561194643e-06, + "loss": 0.0877, + "step": 213300 + }, + { + "epoch": 627.65, + "learning_rate": 1.934385565585259e-06, + "loss": 0.0783, + "step": 213400 + }, + { + "epoch": 627.94, + "learning_rate": 1.930237059397868e-06, + "loss": 0.0846, + "step": 213500 + }, + { + "epoch": 628.24, + "learning_rate": 1.926091942137113e-06, + "loss": 0.0881, + "step": 213600 + }, + { + "epoch": 628.53, + "learning_rate": 1.9219502183790854e-06, + "loss": 0.0902, + "step": 213700 + }, + { + "epoch": 628.82, + "learning_rate": 1.9178118926961197e-06, + "loss": 0.0904, + "step": 213800 + }, + { + "epoch": 629.12, + "learning_rate": 1.9136769696568056e-06, + "loss": 0.0844, + "step": 213900 + }, + { + "epoch": 629.41, + "learning_rate": 1.909545453825975e-06, + "loss": 0.0899, + "step": 214000 + }, + { + "epoch": 629.41, + "eval_cer": 0.06991848655246066, + "eval_loss": 0.5597048997879028, + "eval_runtime": 5.3718, + "eval_samples_per_second": 66.831, + "eval_steps_per_second": 2.234, + "eval_wer": 0.2624536514589715, + "step": 214000 + }, + { + "epoch": 629.71, + "learning_rate": 1.905417349764696e-06, + "loss": 0.0848, + "step": 214100 + }, + { + "epoch": 630.0, + "learning_rate": 1.9012926620302774e-06, + "loss": 0.0819, + "step": 214200 + }, + { + "epoch": 630.29, + "learning_rate": 1.8971713951762444e-06, + "loss": 0.0818, + "step": 214300 + }, + { + "epoch": 630.59, + "learning_rate": 1.8930535537523598e-06, + "loss": 0.0882, + "step": 214400 + }, + { + "epoch": 630.88, + "learning_rate": 1.8889391423045917e-06, + "loss": 0.0839, + "step": 214500 + }, + { + "epoch": 631.18, + "learning_rate": 1.8848281653751282e-06, + "loss": 0.0823, + "step": 214600 + }, + { + "epoch": 631.47, + "learning_rate": 1.8807206275023704e-06, + "loss": 0.0843, + "step": 214700 + }, + { + "epoch": 631.76, + "learning_rate": 1.8766165332209101e-06, + "loss": 0.0872, + "step": 214800 + }, + { + "epoch": 632.06, + "learning_rate": 1.8725568764400725e-06, + "loss": 0.0766, + "step": 214900 + }, + { + "epoch": 632.35, + "learning_rate": 1.8684596483809147e-06, + "loss": 0.0821, + "step": 215000 + }, + { + "epoch": 632.35, + "eval_cer": 0.07052874765703326, + "eval_loss": 0.5650409460067749, + "eval_runtime": 4.9953, + "eval_samples_per_second": 71.867, + "eval_steps_per_second": 2.402, + "eval_wer": 0.26632274705787523, + "step": 215000 + }, + { + "epoch": 632.65, + "learning_rate": 1.8643658774488132e-06, + "loss": 0.0836, + "step": 215100 + }, + { + "epoch": 632.94, + "learning_rate": 1.860275568163169e-06, + "loss": 0.0859, + "step": 215200 + }, + { + "epoch": 633.24, + "learning_rate": 1.8561887250395604e-06, + "loss": 0.0894, + "step": 215300 + }, + { + "epoch": 633.53, + "learning_rate": 1.852105352589741e-06, + "loss": 0.0862, + "step": 215400 + }, + { + "epoch": 633.82, + "learning_rate": 1.848025455321632e-06, + "loss": 0.0842, + "step": 215500 + }, + { + "epoch": 634.12, + "learning_rate": 1.8439490377393176e-06, + "loss": 0.0837, + "step": 215600 + }, + { + "epoch": 634.41, + "learning_rate": 1.8398761043430419e-06, + "loss": 0.0825, + "step": 215700 + }, + { + "epoch": 634.71, + "learning_rate": 1.8358066596292034e-06, + "loss": 0.0854, + "step": 215800 + }, + { + "epoch": 635.0, + "learning_rate": 1.8317407080903416e-06, + "loss": 0.0829, + "step": 215900 + }, + { + "epoch": 635.29, + "learning_rate": 1.8276782542151516e-06, + "loss": 0.0905, + "step": 216000 + }, + { + "epoch": 635.29, + "eval_cer": 0.06930822544788806, + "eval_loss": 0.5545493960380554, + "eval_runtime": 5.1065, + "eval_samples_per_second": 70.303, + "eval_steps_per_second": 2.35, + "eval_wer": 0.2616475898758665, + "step": 216000 + }, + { + "epoch": 635.59, + "learning_rate": 1.823619302488459e-06, + "loss": 0.0823, + "step": 216100 + }, + { + "epoch": 635.88, + "learning_rate": 1.819563857391226e-06, + "loss": 0.0843, + "step": 216200 + }, + { + "epoch": 636.18, + "learning_rate": 1.815511923400544e-06, + "loss": 0.0856, + "step": 216300 + }, + { + "epoch": 636.47, + "learning_rate": 1.8114635049896224e-06, + "loss": 0.0879, + "step": 216400 + }, + { + "epoch": 636.76, + "learning_rate": 1.8074186066277988e-06, + "loss": 0.0804, + "step": 216500 + }, + { + "epoch": 637.06, + "learning_rate": 1.8033772327805188e-06, + "loss": 0.0853, + "step": 216600 + }, + { + "epoch": 637.35, + "learning_rate": 1.7993393879093385e-06, + "loss": 0.0826, + "step": 216700 + }, + { + "epoch": 637.65, + "learning_rate": 1.7953050764719204e-06, + "loss": 0.087, + "step": 216800 + }, + { + "epoch": 637.94, + "learning_rate": 1.7913145931303599e-06, + "loss": 0.0849, + "step": 216900 + }, + { + "epoch": 638.24, + "learning_rate": 1.7872873264724445e-06, + "loss": 0.0815, + "step": 217000 + }, + { + "epoch": 638.24, + "eval_cer": 0.07004925678915479, + "eval_loss": 0.5678441524505615, + "eval_runtime": 5.429, + "eval_samples_per_second": 66.127, + "eval_steps_per_second": 2.21, + "eval_wer": 0.2634209253586974, + "step": 217000 + }, + { + "epoch": 638.53, + "learning_rate": 1.7832636065534054e-06, + "loss": 0.0839, + "step": 217100 + }, + { + "epoch": 638.82, + "learning_rate": 1.7792434378153084e-06, + "loss": 0.0829, + "step": 217200 + }, + { + "epoch": 639.12, + "learning_rate": 1.7752268246963001e-06, + "loss": 0.087, + "step": 217300 + }, + { + "epoch": 639.41, + "learning_rate": 1.7712137716306022e-06, + "loss": 0.0829, + "step": 217400 + }, + { + "epoch": 639.71, + "learning_rate": 1.7672042830485047e-06, + "loss": 0.0878, + "step": 217500 + }, + { + "epoch": 640.0, + "learning_rate": 1.7631983633763632e-06, + "loss": 0.0808, + "step": 217600 + }, + { + "epoch": 640.29, + "learning_rate": 1.7591960170365947e-06, + "loss": 0.0838, + "step": 217700 + }, + { + "epoch": 640.59, + "learning_rate": 1.755197248447668e-06, + "loss": 0.0769, + "step": 217800 + }, + { + "epoch": 640.88, + "learning_rate": 1.751202062024106e-06, + "loss": 0.085, + "step": 217900 + }, + { + "epoch": 641.18, + "learning_rate": 1.7472104621764747e-06, + "loss": 0.0853, + "step": 218000 + }, + { + "epoch": 641.18, + "eval_cer": 0.07004925678915479, + "eval_loss": 0.5571328401565552, + "eval_runtime": 4.4749, + "eval_samples_per_second": 80.226, + "eval_steps_per_second": 2.682, + "eval_wer": 0.2640657746251814, + "step": 218000 + }, + { + "epoch": 641.47, + "learning_rate": 1.7432224533113807e-06, + "loss": 0.0826, + "step": 218100 + }, + { + "epoch": 641.76, + "learning_rate": 1.7392380398314668e-06, + "loss": 0.0874, + "step": 218200 + }, + { + "epoch": 642.06, + "learning_rate": 1.7352572261354073e-06, + "loss": 0.0895, + "step": 218300 + }, + { + "epoch": 642.35, + "learning_rate": 1.7312800166179012e-06, + "loss": 0.0878, + "step": 218400 + }, + { + "epoch": 642.65, + "learning_rate": 1.727306415669669e-06, + "loss": 0.0837, + "step": 218500 + }, + { + "epoch": 642.94, + "learning_rate": 1.7233364276774472e-06, + "loss": 0.0833, + "step": 218600 + }, + { + "epoch": 643.24, + "learning_rate": 1.7193700570239847e-06, + "loss": 0.0801, + "step": 218700 + }, + { + "epoch": 643.53, + "learning_rate": 1.7154073080880357e-06, + "loss": 0.0774, + "step": 218800 + }, + { + "epoch": 643.82, + "learning_rate": 1.7114481852443576e-06, + "loss": 0.0864, + "step": 218900 + }, + { + "epoch": 644.12, + "learning_rate": 1.7074926928637025e-06, + "loss": 0.0853, + "step": 219000 + }, + { + "epoch": 644.12, + "eval_cer": 0.06961335600017436, + "eval_loss": 0.5619438290596008, + "eval_runtime": 5.7032, + "eval_samples_per_second": 62.947, + "eval_steps_per_second": 2.104, + "eval_wer": 0.26390456230856035, + "step": 219000 + }, + { + "epoch": 644.41, + "learning_rate": 1.703540835312817e-06, + "loss": 0.0853, + "step": 219100 + }, + { + "epoch": 644.71, + "learning_rate": 1.6995926169544337e-06, + "loss": 0.0814, + "step": 219200 + }, + { + "epoch": 645.0, + "learning_rate": 1.6956480421472665e-06, + "loss": 0.0854, + "step": 219300 + }, + { + "epoch": 645.29, + "learning_rate": 1.6917071152460103e-06, + "loss": 0.0863, + "step": 219400 + }, + { + "epoch": 645.59, + "learning_rate": 1.6877698406013293e-06, + "loss": 0.0819, + "step": 219500 + }, + { + "epoch": 645.88, + "learning_rate": 1.6838362225598576e-06, + "loss": 0.0848, + "step": 219600 + }, + { + "epoch": 646.18, + "learning_rate": 1.6799062654641918e-06, + "loss": 0.082, + "step": 219700 + }, + { + "epoch": 646.47, + "learning_rate": 1.6759799736528881e-06, + "loss": 0.0814, + "step": 219800 + }, + { + "epoch": 646.76, + "learning_rate": 1.6720573514604543e-06, + "loss": 0.0838, + "step": 219900 + }, + { + "epoch": 647.06, + "learning_rate": 1.6681384032173487e-06, + "loss": 0.0816, + "step": 220000 + }, + { + "epoch": 647.06, + "eval_cer": 0.07044156749923718, + "eval_loss": 0.5699228048324585, + "eval_runtime": 4.8268, + "eval_samples_per_second": 74.376, + "eval_steps_per_second": 2.486, + "eval_wer": 0.26551668547477025, + "step": 220000 + }, + { + "epoch": 647.35, + "learning_rate": 1.6642622677279875e-06, + "loss": 0.0861, + "step": 220100 + }, + { + "epoch": 647.65, + "learning_rate": 1.6603506435113182e-06, + "loss": 0.0821, + "step": 220200 + }, + { + "epoch": 647.94, + "learning_rate": 1.6564427061678367e-06, + "loss": 0.0828, + "step": 220300 + }, + { + "epoch": 648.24, + "learning_rate": 1.6525384600117844e-06, + "loss": 0.0842, + "step": 220400 + }, + { + "epoch": 648.53, + "learning_rate": 1.6486379093533317e-06, + "loss": 0.0847, + "step": 220500 + }, + { + "epoch": 648.82, + "learning_rate": 1.6447410584985756e-06, + "loss": 0.0896, + "step": 220600 + }, + { + "epoch": 649.12, + "learning_rate": 1.6408479117495162e-06, + "loss": 0.0837, + "step": 220700 + }, + { + "epoch": 649.41, + "learning_rate": 1.6369584734040777e-06, + "loss": 0.0854, + "step": 220800 + }, + { + "epoch": 649.71, + "learning_rate": 1.6330727477560798e-06, + "loss": 0.0869, + "step": 220900 + }, + { + "epoch": 650.0, + "learning_rate": 1.6291907390952482e-06, + "loss": 0.0856, + "step": 221000 + }, + { + "epoch": 650.0, + "eval_cer": 0.07018002702584891, + "eval_loss": 0.5630475878715515, + "eval_runtime": 4.4033, + "eval_samples_per_second": 81.53, + "eval_steps_per_second": 2.725, + "eval_wer": 0.26390456230856035, + "step": 221000 + }, + { + "epoch": 650.29, + "learning_rate": 1.6253124517072055e-06, + "loss": 0.0829, + "step": 221100 + }, + { + "epoch": 650.59, + "learning_rate": 1.6214378898734629e-06, + "loss": 0.0792, + "step": 221200 + }, + { + "epoch": 650.88, + "learning_rate": 1.6175670578714258e-06, + "loss": 0.0769, + "step": 221300 + }, + { + "epoch": 651.18, + "learning_rate": 1.6136999599743726e-06, + "loss": 0.0795, + "step": 221400 + }, + { + "epoch": 651.47, + "learning_rate": 1.609836600451466e-06, + "loss": 0.0857, + "step": 221500 + }, + { + "epoch": 651.76, + "learning_rate": 1.6059769835677387e-06, + "loss": 0.0903, + "step": 221600 + }, + { + "epoch": 652.06, + "learning_rate": 1.6021211135840914e-06, + "loss": 0.0827, + "step": 221700 + }, + { + "epoch": 652.35, + "learning_rate": 1.5982689947572938e-06, + "loss": 0.0875, + "step": 221800 + }, + { + "epoch": 652.65, + "learning_rate": 1.5944206313399663e-06, + "loss": 0.0855, + "step": 221900 + }, + { + "epoch": 652.94, + "learning_rate": 1.5905760275805875e-06, + "loss": 0.0801, + "step": 222000 + }, + { + "epoch": 652.94, + "eval_cer": 0.06956976592127631, + "eval_loss": 0.5596914291381836, + "eval_runtime": 5.2656, + "eval_samples_per_second": 68.178, + "eval_steps_per_second": 2.279, + "eval_wer": 0.26309850072545543, + "step": 222000 + }, + { + "epoch": 653.24, + "learning_rate": 1.5867351877234865e-06, + "loss": 0.0821, + "step": 222100 + }, + { + "epoch": 653.53, + "learning_rate": 1.582898116008833e-06, + "loss": 0.0774, + "step": 222200 + }, + { + "epoch": 653.82, + "learning_rate": 1.5790648166726453e-06, + "loss": 0.0818, + "step": 222300 + }, + { + "epoch": 654.12, + "learning_rate": 1.5752352939467664e-06, + "loss": 0.0795, + "step": 222400 + }, + { + "epoch": 654.41, + "learning_rate": 1.5714095520588762e-06, + "loss": 0.0936, + "step": 222500 + }, + { + "epoch": 654.71, + "learning_rate": 1.5675875952324799e-06, + "loss": 0.0829, + "step": 222600 + }, + { + "epoch": 655.0, + "learning_rate": 1.5637694276869036e-06, + "loss": 0.0824, + "step": 222700 + }, + { + "epoch": 655.29, + "learning_rate": 1.5599550536372909e-06, + "loss": 0.0811, + "step": 222800 + }, + { + "epoch": 655.59, + "learning_rate": 1.556144477294596e-06, + "loss": 0.0795, + "step": 222900 + }, + { + "epoch": 655.88, + "learning_rate": 1.5523377028655818e-06, + "loss": 0.0855, + "step": 223000 + }, + { + "epoch": 655.88, + "eval_cer": 0.07061592781482935, + "eval_loss": 0.5634012818336487, + "eval_runtime": 4.6021, + "eval_samples_per_second": 78.007, + "eval_steps_per_second": 2.607, + "eval_wer": 0.2651942608415283, + "step": 223000 + }, + { + "epoch": 656.18, + "learning_rate": 1.548534734552814e-06, + "loss": 0.0817, + "step": 223100 + }, + { + "epoch": 656.47, + "learning_rate": 1.544735576554655e-06, + "loss": 0.0865, + "step": 223200 + }, + { + "epoch": 656.76, + "learning_rate": 1.540940233065263e-06, + "loss": 0.0865, + "step": 223300 + }, + { + "epoch": 657.06, + "learning_rate": 1.5371487082745828e-06, + "loss": 0.0852, + "step": 223400 + }, + { + "epoch": 657.35, + "learning_rate": 1.5333610063683456e-06, + "loss": 0.0814, + "step": 223500 + }, + { + "epoch": 657.65, + "learning_rate": 1.5295771315280612e-06, + "loss": 0.0832, + "step": 223600 + }, + { + "epoch": 657.94, + "learning_rate": 1.5257970879310135e-06, + "loss": 0.0845, + "step": 223700 + }, + { + "epoch": 658.24, + "learning_rate": 1.5220208797502584e-06, + "loss": 0.0876, + "step": 223800 + }, + { + "epoch": 658.53, + "learning_rate": 1.518248511154617e-06, + "loss": 0.0747, + "step": 223900 + }, + { + "epoch": 658.82, + "learning_rate": 1.5145176525169048e-06, + "loss": 0.0826, + "step": 224000 + }, + { + "epoch": 658.82, + "eval_cer": 0.06961335600017436, + "eval_loss": 0.5628807544708252, + "eval_runtime": 4.6717, + "eval_samples_per_second": 76.846, + "eval_steps_per_second": 2.569, + "eval_wer": 0.2619700145091085, + "step": 224000 + }, + { + "epoch": 659.12, + "learning_rate": 1.510752937081314e-06, + "loss": 0.0802, + "step": 224100 + }, + { + "epoch": 659.41, + "learning_rate": 1.5069920736703108e-06, + "loss": 0.086, + "step": 224200 + }, + { + "epoch": 659.71, + "learning_rate": 1.503235066435771e-06, + "loss": 0.0843, + "step": 224300 + }, + { + "epoch": 660.0, + "learning_rate": 1.4994819195253251e-06, + "loss": 0.0874, + "step": 224400 + }, + { + "epoch": 660.29, + "learning_rate": 1.4957326370823293e-06, + "loss": 0.0853, + "step": 224500 + }, + { + "epoch": 660.59, + "learning_rate": 1.4919872232458848e-06, + "loss": 0.0862, + "step": 224600 + }, + { + "epoch": 660.88, + "learning_rate": 1.4882456821508124e-06, + "loss": 0.0812, + "step": 224700 + }, + { + "epoch": 661.18, + "learning_rate": 1.4845080179276621e-06, + "loss": 0.0777, + "step": 224800 + }, + { + "epoch": 661.47, + "learning_rate": 1.4807742347027083e-06, + "loss": 0.0897, + "step": 224900 + }, + { + "epoch": 661.76, + "learning_rate": 1.4770443365979291e-06, + "loss": 0.0885, + "step": 225000 + }, + { + "epoch": 661.76, + "eval_cer": 0.0699620766313587, + "eval_loss": 0.561669111251831, + "eval_runtime": 4.6722, + "eval_samples_per_second": 76.838, + "eval_steps_per_second": 2.568, + "eval_wer": 0.2634209253586974, + "step": 225000 + }, + { + "epoch": 662.06, + "learning_rate": 1.4733183277310282e-06, + "loss": 0.0888, + "step": 225100 + }, + { + "epoch": 662.35, + "learning_rate": 1.4695962122154023e-06, + "loss": 0.0855, + "step": 225200 + }, + { + "epoch": 662.65, + "learning_rate": 1.465877994160156e-06, + "loss": 0.0834, + "step": 225300 + }, + { + "epoch": 662.94, + "learning_rate": 1.4621636776700965e-06, + "loss": 0.0795, + "step": 225400 + }, + { + "epoch": 663.24, + "learning_rate": 1.4584532668457113e-06, + "loss": 0.0819, + "step": 225500 + }, + { + "epoch": 663.53, + "learning_rate": 1.4547467657831893e-06, + "loss": 0.0779, + "step": 225600 + }, + { + "epoch": 663.82, + "learning_rate": 1.4510441785743935e-06, + "loss": 0.0816, + "step": 225700 + }, + { + "epoch": 664.12, + "learning_rate": 1.4473455093068683e-06, + "loss": 0.0854, + "step": 225800 + }, + { + "epoch": 664.41, + "learning_rate": 1.4436507620638395e-06, + "loss": 0.0863, + "step": 225900 + }, + { + "epoch": 664.71, + "learning_rate": 1.4399968296879947e-06, + "loss": 0.0817, + "step": 226000 + }, + { + "epoch": 664.71, + "eval_cer": 0.07009284686805282, + "eval_loss": 0.5662137269973755, + "eval_runtime": 5.0718, + "eval_samples_per_second": 70.784, + "eval_steps_per_second": 2.366, + "eval_wer": 0.2624536514589715, + "step": 226000 + }, + { + "epoch": 665.0, + "learning_rate": 1.436309899404354e-06, + "loss": 0.0853, + "step": 226100 + }, + { + "epoch": 665.29, + "learning_rate": 1.4326269033281902e-06, + "loss": 0.0885, + "step": 226200 + }, + { + "epoch": 665.59, + "learning_rate": 1.4289478455254213e-06, + "loss": 0.0802, + "step": 226300 + }, + { + "epoch": 665.88, + "learning_rate": 1.425272730057617e-06, + "loss": 0.0875, + "step": 226400 + }, + { + "epoch": 666.18, + "learning_rate": 1.4216015609819967e-06, + "loss": 0.0812, + "step": 226500 + }, + { + "epoch": 666.47, + "learning_rate": 1.4179343423514169e-06, + "loss": 0.0812, + "step": 226600 + }, + { + "epoch": 666.76, + "learning_rate": 1.414271078214382e-06, + "loss": 0.0834, + "step": 226700 + }, + { + "epoch": 667.06, + "learning_rate": 1.4106117726150247e-06, + "loss": 0.0836, + "step": 226800 + }, + { + "epoch": 667.35, + "learning_rate": 1.4069564295931093e-06, + "loss": 0.0791, + "step": 226900 + }, + { + "epoch": 667.65, + "learning_rate": 1.403305053184027e-06, + "loss": 0.0823, + "step": 227000 + }, + { + "epoch": 667.65, + "eval_cer": 0.0699620766313587, + "eval_loss": 0.5672768950462341, + "eval_runtime": 4.6733, + "eval_samples_per_second": 76.819, + "eval_steps_per_second": 2.568, + "eval_wer": 0.26261486377559246, + "step": 227000 + }, + { + "epoch": 667.94, + "learning_rate": 1.399657647418783e-06, + "loss": 0.0858, + "step": 227100 + }, + { + "epoch": 668.24, + "learning_rate": 1.3960142163240098e-06, + "loss": 0.0833, + "step": 227200 + }, + { + "epoch": 668.53, + "learning_rate": 1.3923747639219442e-06, + "loss": 0.0878, + "step": 227300 + }, + { + "epoch": 668.82, + "learning_rate": 1.388739294230434e-06, + "loss": 0.0796, + "step": 227400 + }, + { + "epoch": 669.12, + "learning_rate": 1.3851078112629302e-06, + "loss": 0.0843, + "step": 227500 + }, + { + "epoch": 669.41, + "learning_rate": 1.381480319028477e-06, + "loss": 0.0833, + "step": 227600 + }, + { + "epoch": 669.71, + "learning_rate": 1.3778568215317223e-06, + "loss": 0.0881, + "step": 227700 + }, + { + "epoch": 670.0, + "learning_rate": 1.3742373227728972e-06, + "loss": 0.0839, + "step": 227800 + }, + { + "epoch": 670.29, + "learning_rate": 1.3706218267478204e-06, + "loss": 0.0814, + "step": 227900 + }, + { + "epoch": 670.59, + "learning_rate": 1.3670103374478917e-06, + "loss": 0.0805, + "step": 228000 + }, + { + "epoch": 670.59, + "eval_cer": 0.0705723377359313, + "eval_loss": 0.565666675567627, + "eval_runtime": 4.6037, + "eval_samples_per_second": 77.98, + "eval_steps_per_second": 2.607, + "eval_wer": 0.2648718362082863, + "step": 228000 + }, + { + "epoch": 670.88, + "learning_rate": 1.3634028588600878e-06, + "loss": 0.0811, + "step": 228100 + }, + { + "epoch": 671.18, + "learning_rate": 1.359799394966957e-06, + "loss": 0.0803, + "step": 228200 + }, + { + "epoch": 671.47, + "learning_rate": 1.3561999497466155e-06, + "loss": 0.0832, + "step": 228300 + }, + { + "epoch": 671.76, + "learning_rate": 1.3526045271727439e-06, + "loss": 0.0841, + "step": 228400 + }, + { + "epoch": 672.06, + "learning_rate": 1.3490131312145816e-06, + "loss": 0.0799, + "step": 228500 + }, + { + "epoch": 672.35, + "learning_rate": 1.345425765836922e-06, + "loss": 0.0794, + "step": 228600 + }, + { + "epoch": 672.65, + "learning_rate": 1.3418424350001109e-06, + "loss": 0.0792, + "step": 228700 + }, + { + "epoch": 672.94, + "learning_rate": 1.338263142660034e-06, + "loss": 0.0896, + "step": 228800 + }, + { + "epoch": 673.24, + "learning_rate": 1.3346878927681278e-06, + "loss": 0.0869, + "step": 228900 + }, + { + "epoch": 673.53, + "learning_rate": 1.33111668927136e-06, + "loss": 0.0899, + "step": 229000 + }, + { + "epoch": 673.53, + "eval_cer": 0.07000566671025675, + "eval_loss": 0.5663681626319885, + "eval_runtime": 4.6501, + "eval_samples_per_second": 77.202, + "eval_steps_per_second": 2.581, + "eval_wer": 0.26229243914235045, + "step": 229000 + }, + { + "epoch": 673.82, + "learning_rate": 1.327549536112233e-06, + "loss": 0.0784, + "step": 229100 + }, + { + "epoch": 674.12, + "learning_rate": 1.3240220481360283e-06, + "loss": 0.0815, + "step": 229200 + }, + { + "epoch": 674.41, + "learning_rate": 1.3204629668602482e-06, + "loss": 0.0821, + "step": 229300 + }, + { + "epoch": 674.71, + "learning_rate": 1.3169079476835022e-06, + "loss": 0.0837, + "step": 229400 + }, + { + "epoch": 675.0, + "learning_rate": 1.3133569945304225e-06, + "loss": 0.0862, + "step": 229500 + }, + { + "epoch": 675.29, + "learning_rate": 1.3098101113211554e-06, + "loss": 0.081, + "step": 229600 + }, + { + "epoch": 675.59, + "learning_rate": 1.3062673019713551e-06, + "loss": 0.0801, + "step": 229700 + }, + { + "epoch": 675.88, + "learning_rate": 1.3027285703921772e-06, + "loss": 0.0796, + "step": 229800 + }, + { + "epoch": 676.18, + "learning_rate": 1.299193920490275e-06, + "loss": 0.0807, + "step": 229900 + }, + { + "epoch": 676.47, + "learning_rate": 1.2956633561677968e-06, + "loss": 0.0793, + "step": 230000 + }, + { + "epoch": 676.47, + "eval_cer": 0.06974412623686849, + "eval_loss": 0.5635000467300415, + "eval_runtime": 4.8465, + "eval_samples_per_second": 74.073, + "eval_steps_per_second": 2.476, + "eval_wer": 0.26148637755924553, + "step": 230000 + }, + { + "epoch": 676.76, + "learning_rate": 1.2921368813223807e-06, + "loss": 0.0826, + "step": 230100 + }, + { + "epoch": 677.06, + "learning_rate": 1.288614499847149e-06, + "loss": 0.0847, + "step": 230200 + }, + { + "epoch": 677.35, + "learning_rate": 1.2850962156307062e-06, + "loss": 0.0801, + "step": 230300 + }, + { + "epoch": 677.65, + "learning_rate": 1.2815820325571327e-06, + "loss": 0.0805, + "step": 230400 + }, + { + "epoch": 677.94, + "learning_rate": 1.2780719545059821e-06, + "loss": 0.0779, + "step": 230500 + }, + { + "epoch": 678.24, + "learning_rate": 1.274565985352275e-06, + "loss": 0.0856, + "step": 230600 + }, + { + "epoch": 678.53, + "learning_rate": 1.2710641289664977e-06, + "loss": 0.0848, + "step": 230700 + }, + { + "epoch": 678.82, + "learning_rate": 1.267566389214594e-06, + "loss": 0.0854, + "step": 230800 + }, + { + "epoch": 679.12, + "learning_rate": 1.2640727699579651e-06, + "loss": 0.0838, + "step": 230900 + }, + { + "epoch": 679.41, + "learning_rate": 1.2605832750534618e-06, + "loss": 0.0818, + "step": 231000 + }, + { + "epoch": 679.41, + "eval_cer": 0.06983130639466457, + "eval_loss": 0.5645167827606201, + "eval_runtime": 4.407, + "eval_samples_per_second": 81.461, + "eval_steps_per_second": 2.723, + "eval_wer": 0.26438819925842333, + "step": 231000 + }, + { + "epoch": 679.71, + "learning_rate": 1.2570979083533824e-06, + "loss": 0.0812, + "step": 231100 + }, + { + "epoch": 680.0, + "learning_rate": 1.2536166737054679e-06, + "loss": 0.082, + "step": 231200 + }, + { + "epoch": 680.29, + "learning_rate": 1.2501395749528971e-06, + "loss": 0.0848, + "step": 231300 + }, + { + "epoch": 680.59, + "learning_rate": 1.2466666159342839e-06, + "loss": 0.0824, + "step": 231400 + }, + { + "epoch": 680.88, + "learning_rate": 1.2431978004836703e-06, + "loss": 0.0798, + "step": 231500 + }, + { + "epoch": 681.18, + "learning_rate": 1.2397331324305255e-06, + "loss": 0.087, + "step": 231600 + }, + { + "epoch": 681.47, + "learning_rate": 1.2362726155997402e-06, + "loss": 0.0814, + "step": 231700 + }, + { + "epoch": 681.76, + "learning_rate": 1.2328162538116207e-06, + "loss": 0.0796, + "step": 231800 + }, + { + "epoch": 682.06, + "learning_rate": 1.2293640508818878e-06, + "loss": 0.0869, + "step": 231900 + }, + { + "epoch": 682.35, + "learning_rate": 1.22591601062167e-06, + "loss": 0.0784, + "step": 232000 + }, + { + "epoch": 682.35, + "eval_cer": 0.06948258576348024, + "eval_loss": 0.5605387091636658, + "eval_runtime": 4.8376, + "eval_samples_per_second": 74.211, + "eval_steps_per_second": 2.481, + "eval_wer": 0.26293728840883446, + "step": 232000 + }, + { + "epoch": 682.65, + "learning_rate": 1.2224721368375014e-06, + "loss": 0.0781, + "step": 232100 + }, + { + "epoch": 682.94, + "learning_rate": 1.2190324333313154e-06, + "loss": 0.0837, + "step": 232200 + }, + { + "epoch": 683.24, + "learning_rate": 1.2155969039004423e-06, + "loss": 0.078, + "step": 232300 + }, + { + "epoch": 683.53, + "learning_rate": 1.2121655523376036e-06, + "loss": 0.0851, + "step": 232400 + }, + { + "epoch": 683.82, + "learning_rate": 1.208738382430909e-06, + "loss": 0.0844, + "step": 232500 + }, + { + "epoch": 684.12, + "learning_rate": 1.2053153979638527e-06, + "loss": 0.0816, + "step": 232600 + }, + { + "epoch": 684.41, + "learning_rate": 1.2018966027153062e-06, + "loss": 0.0808, + "step": 232700 + }, + { + "epoch": 684.71, + "learning_rate": 1.1984820004595183e-06, + "loss": 0.0838, + "step": 232800 + }, + { + "epoch": 685.0, + "learning_rate": 1.1950715949661068e-06, + "loss": 0.0871, + "step": 232900 + }, + { + "epoch": 685.29, + "learning_rate": 1.1916653900000586e-06, + "loss": 0.0809, + "step": 233000 + }, + { + "epoch": 685.29, + "eval_cer": 0.06948258576348024, + "eval_loss": 0.5701205730438232, + "eval_runtime": 4.8603, + "eval_samples_per_second": 73.863, + "eval_steps_per_second": 2.469, + "eval_wer": 0.26116395292600353, + "step": 233000 + }, + { + "epoch": 685.59, + "learning_rate": 1.1882633893217222e-06, + "loss": 0.077, + "step": 233100 + }, + { + "epoch": 685.88, + "learning_rate": 1.184865596686804e-06, + "loss": 0.0858, + "step": 233200 + }, + { + "epoch": 686.18, + "learning_rate": 1.181472015846366e-06, + "loss": 0.0798, + "step": 233300 + }, + { + "epoch": 686.47, + "learning_rate": 1.1780826505468207e-06, + "loss": 0.0833, + "step": 233400 + }, + { + "epoch": 686.76, + "learning_rate": 1.1746975045299258e-06, + "loss": 0.0831, + "step": 233500 + }, + { + "epoch": 687.06, + "learning_rate": 1.171350369846545e-06, + "loss": 0.0842, + "step": 233600 + }, + { + "epoch": 687.35, + "learning_rate": 1.1680073777664342e-06, + "loss": 0.0804, + "step": 233700 + }, + { + "epoch": 687.65, + "learning_rate": 1.1646348273553372e-06, + "loss": 0.0826, + "step": 233800 + }, + { + "epoch": 687.94, + "learning_rate": 1.161266511072886e-06, + "loss": 0.0797, + "step": 233900 + }, + { + "epoch": 688.24, + "learning_rate": 1.1579024326376014e-06, + "loss": 0.0851, + "step": 234000 + }, + { + "epoch": 688.24, + "eval_cer": 0.0696569460790724, + "eval_loss": 0.5669453740119934, + "eval_runtime": 5.0116, + "eval_samples_per_second": 71.633, + "eval_steps_per_second": 2.394, + "eval_wer": 0.26132516524262456, + "step": 234000 + }, + { + "epoch": 688.53, + "learning_rate": 1.1545425957633266e-06, + "loss": 0.082, + "step": 234100 + }, + { + "epoch": 688.82, + "learning_rate": 1.1511870041592172e-06, + "loss": 0.086, + "step": 234200 + }, + { + "epoch": 689.12, + "learning_rate": 1.1478356615297498e-06, + "loss": 0.0777, + "step": 234300 + }, + { + "epoch": 689.41, + "learning_rate": 1.1444885715747057e-06, + "loss": 0.0808, + "step": 234400 + }, + { + "epoch": 689.71, + "learning_rate": 1.1411457379891722e-06, + "loss": 0.0776, + "step": 234500 + }, + { + "epoch": 690.0, + "learning_rate": 1.1378071644635397e-06, + "loss": 0.0825, + "step": 234600 + }, + { + "epoch": 690.29, + "learning_rate": 1.1344728546834881e-06, + "loss": 0.0817, + "step": 234700 + }, + { + "epoch": 690.59, + "learning_rate": 1.1311428123300016e-06, + "loss": 0.0819, + "step": 234800 + }, + { + "epoch": 690.88, + "learning_rate": 1.1278170410793455e-06, + "loss": 0.0787, + "step": 234900 + }, + { + "epoch": 691.18, + "learning_rate": 1.1244955446030715e-06, + "loss": 0.0883, + "step": 235000 + }, + { + "epoch": 691.18, + "eval_cer": 0.0696569460790724, + "eval_loss": 0.5649272799491882, + "eval_runtime": 5.4507, + "eval_samples_per_second": 65.863, + "eval_steps_per_second": 2.202, + "eval_wer": 0.26309850072545543, + "step": 235000 + }, + { + "epoch": 691.47, + "learning_rate": 1.1211783265680143e-06, + "loss": 0.0801, + "step": 235100 + }, + { + "epoch": 691.76, + "learning_rate": 1.1178653906362797e-06, + "loss": 0.0814, + "step": 235200 + }, + { + "epoch": 692.06, + "learning_rate": 1.1145567404652558e-06, + "loss": 0.0868, + "step": 235300 + }, + { + "epoch": 692.35, + "learning_rate": 1.111252379707587e-06, + "loss": 0.0826, + "step": 235400 + }, + { + "epoch": 692.65, + "learning_rate": 1.107952312011194e-06, + "loss": 0.0756, + "step": 235500 + }, + { + "epoch": 692.94, + "learning_rate": 1.1046565410192528e-06, + "loss": 0.0822, + "step": 235600 + }, + { + "epoch": 693.24, + "learning_rate": 1.1013650703701922e-06, + "loss": 0.0824, + "step": 235700 + }, + { + "epoch": 693.53, + "learning_rate": 1.0980779036977024e-06, + "loss": 0.0784, + "step": 235800 + }, + { + "epoch": 693.82, + "learning_rate": 1.0947950446307127e-06, + "loss": 0.0798, + "step": 235900 + }, + { + "epoch": 694.12, + "learning_rate": 1.0915164967934045e-06, + "loss": 0.0803, + "step": 236000 + }, + { + "epoch": 694.12, + "eval_cer": 0.06930822544788806, + "eval_loss": 0.5643986463546753, + "eval_runtime": 4.3472, + "eval_samples_per_second": 82.582, + "eval_steps_per_second": 2.76, + "eval_wer": 0.2600354667096566, + "step": 236000 + }, + { + "epoch": 694.41, + "learning_rate": 1.0882422638051977e-06, + "loss": 0.0819, + "step": 236100 + }, + { + "epoch": 694.71, + "learning_rate": 1.0849723492807435e-06, + "loss": 0.0846, + "step": 236200 + }, + { + "epoch": 695.0, + "learning_rate": 1.0817067568299344e-06, + "loss": 0.0819, + "step": 236300 + }, + { + "epoch": 695.29, + "learning_rate": 1.0784454900578834e-06, + "loss": 0.0846, + "step": 236400 + }, + { + "epoch": 695.59, + "learning_rate": 1.0751885525649336e-06, + "loss": 0.0828, + "step": 236500 + }, + { + "epoch": 695.88, + "learning_rate": 1.0719359479466484e-06, + "loss": 0.0906, + "step": 236600 + }, + { + "epoch": 696.18, + "learning_rate": 1.068687679793801e-06, + "loss": 0.083, + "step": 236700 + }, + { + "epoch": 696.47, + "learning_rate": 1.0654437516923893e-06, + "loss": 0.0828, + "step": 236800 + }, + { + "epoch": 696.76, + "learning_rate": 1.062204167223606e-06, + "loss": 0.0849, + "step": 236900 + }, + { + "epoch": 697.06, + "learning_rate": 1.0589689299638606e-06, + "loss": 0.0859, + "step": 237000 + }, + { + "epoch": 697.06, + "eval_cer": 0.06948258576348024, + "eval_loss": 0.5633894205093384, + "eval_runtime": 5.486, + "eval_samples_per_second": 65.44, + "eval_steps_per_second": 2.187, + "eval_wer": 0.26019667902627763, + "step": 237000 + }, + { + "epoch": 697.35, + "learning_rate": 1.0557703308014694e-06, + "loss": 0.0832, + "step": 237100 + }, + { + "epoch": 697.65, + "learning_rate": 1.0525437551086954e-06, + "loss": 0.077, + "step": 237200 + }, + { + "epoch": 697.94, + "learning_rate": 1.0493215372897642e-06, + "loss": 0.0806, + "step": 237300 + }, + { + "epoch": 698.24, + "learning_rate": 1.0461036809019087e-06, + "loss": 0.0826, + "step": 237400 + }, + { + "epoch": 698.53, + "learning_rate": 1.0428901894975458e-06, + "loss": 0.0852, + "step": 237500 + }, + { + "epoch": 698.82, + "learning_rate": 1.0396810666242736e-06, + "loss": 0.0844, + "step": 237600 + }, + { + "epoch": 699.12, + "learning_rate": 1.0364763158248685e-06, + "loss": 0.0766, + "step": 237700 + }, + { + "epoch": 699.41, + "learning_rate": 1.03327594063728e-06, + "loss": 0.083, + "step": 237800 + }, + { + "epoch": 699.71, + "learning_rate": 1.0300799445946264e-06, + "loss": 0.0818, + "step": 237900 + }, + { + "epoch": 700.0, + "learning_rate": 1.0268883312251915e-06, + "loss": 0.0796, + "step": 238000 + }, + { + "epoch": 700.0, + "eval_cer": 0.0696569460790724, + "eval_loss": 0.558987021446228, + "eval_runtime": 4.7414, + "eval_samples_per_second": 75.716, + "eval_steps_per_second": 2.531, + "eval_wer": 0.26277607609221343, + "step": 238000 + }, + { + "epoch": 700.29, + "learning_rate": 1.023701104052422e-06, + "loss": 0.0837, + "step": 238100 + }, + { + "epoch": 700.59, + "learning_rate": 1.020518266594921e-06, + "loss": 0.0844, + "step": 238200 + }, + { + "epoch": 700.88, + "learning_rate": 1.017339822366446e-06, + "loss": 0.08, + "step": 238300 + }, + { + "epoch": 701.18, + "learning_rate": 1.0141657748759048e-06, + "loss": 0.0823, + "step": 238400 + }, + { + "epoch": 701.47, + "learning_rate": 1.0109961276273511e-06, + "loss": 0.0794, + "step": 238500 + }, + { + "epoch": 701.76, + "learning_rate": 1.0078308841199807e-06, + "loss": 0.0854, + "step": 238600 + }, + { + "epoch": 702.06, + "learning_rate": 1.0046700478481281e-06, + "loss": 0.0846, + "step": 238700 + }, + { + "epoch": 702.35, + "learning_rate": 1.0015451647121965e-06, + "loss": 0.0823, + "step": 238800 + }, + { + "epoch": 702.65, + "learning_rate": 9.983931092155874e-07, + "loss": 0.0795, + "step": 238900 + }, + { + "epoch": 702.94, + "learning_rate": 9.952454713735167e-07, + "loss": 0.0806, + "step": 239000 + }, + { + "epoch": 702.94, + "eval_cer": 0.06974412623686849, + "eval_loss": 0.5627612471580505, + "eval_runtime": 4.8839, + "eval_samples_per_second": 73.507, + "eval_steps_per_second": 2.457, + "eval_wer": 0.2616475898758665, + "step": 239000 + }, + { + "epoch": 703.24, + "learning_rate": 9.921022546608861e-07, + "loss": 0.0766, + "step": 239100 + }, + { + "epoch": 703.53, + "learning_rate": 9.88963462547709e-07, + "loss": 0.0834, + "step": 239200 + }, + { + "epoch": 703.82, + "learning_rate": 9.858290984991197e-07, + "loss": 0.0842, + "step": 239300 + }, + { + "epoch": 704.12, + "learning_rate": 9.826991659753626e-07, + "loss": 0.0799, + "step": 239400 + }, + { + "epoch": 704.41, + "learning_rate": 9.79573668431788e-07, + "loss": 0.079, + "step": 239500 + }, + { + "epoch": 704.71, + "learning_rate": 9.764526093188565e-07, + "loss": 0.0821, + "step": 239600 + }, + { + "epoch": 705.0, + "learning_rate": 9.7333599208212e-07, + "loss": 0.0829, + "step": 239700 + }, + { + "epoch": 705.29, + "learning_rate": 9.70223820162232e-07, + "loss": 0.0829, + "step": 239800 + }, + { + "epoch": 705.59, + "learning_rate": 9.671160969949371e-07, + "loss": 0.085, + "step": 239900 + }, + { + "epoch": 705.88, + "learning_rate": 9.640128260110688e-07, + "loss": 0.0846, + "step": 240000 + }, + { + "epoch": 705.88, + "eval_cer": 0.0696569460790724, + "eval_loss": 0.5651042461395264, + "eval_runtime": 4.7198, + "eval_samples_per_second": 76.063, + "eval_steps_per_second": 2.543, + "eval_wer": 0.26100274060938256, + "step": 240000 + }, + { + "epoch": 706.18, + "learning_rate": 9.609140106365478e-07, + "loss": 0.0811, + "step": 240100 + }, + { + "epoch": 706.47, + "learning_rate": 9.578196542923713e-07, + "loss": 0.08, + "step": 240200 + }, + { + "epoch": 706.76, + "learning_rate": 9.54729760394617e-07, + "loss": 0.0796, + "step": 240300 + }, + { + "epoch": 707.06, + "learning_rate": 9.516443323544355e-07, + "loss": 0.0857, + "step": 240400 + }, + { + "epoch": 707.35, + "learning_rate": 9.485633735780475e-07, + "loss": 0.0778, + "step": 240500 + }, + { + "epoch": 707.65, + "learning_rate": 9.454868874667389e-07, + "loss": 0.085, + "step": 240600 + }, + { + "epoch": 707.94, + "learning_rate": 9.424148774168596e-07, + "loss": 0.0845, + "step": 240700 + }, + { + "epoch": 708.24, + "learning_rate": 9.393473468198155e-07, + "loss": 0.0812, + "step": 240800 + }, + { + "epoch": 708.53, + "learning_rate": 9.362842990620702e-07, + "loss": 0.0816, + "step": 240900 + }, + { + "epoch": 708.82, + "learning_rate": 9.332257375251364e-07, + "loss": 0.079, + "step": 241000 + }, + { + "epoch": 708.82, + "eval_cer": 0.06961335600017436, + "eval_loss": 0.5604375600814819, + "eval_runtime": 5.0667, + "eval_samples_per_second": 70.855, + "eval_steps_per_second": 2.368, + "eval_wer": 0.2616475898758665, + "step": 241000 + }, + { + "epoch": 709.12, + "learning_rate": 9.301716655855747e-07, + "loss": 0.0836, + "step": 241100 + }, + { + "epoch": 709.41, + "learning_rate": 9.271220866149882e-07, + "loss": 0.081, + "step": 241200 + }, + { + "epoch": 709.71, + "learning_rate": 9.241074325384697e-07, + "loss": 0.0794, + "step": 241300 + }, + { + "epoch": 710.0, + "learning_rate": 9.21066804587209e-07, + "loss": 0.0787, + "step": 241400 + }, + { + "epoch": 710.29, + "learning_rate": 9.180306796564203e-07, + "loss": 0.0823, + "step": 241500 + }, + { + "epoch": 710.59, + "learning_rate": 9.149990610978915e-07, + "loss": 0.0829, + "step": 241600 + }, + { + "epoch": 710.88, + "learning_rate": 9.119719522584436e-07, + "loss": 0.0829, + "step": 241700 + }, + { + "epoch": 711.18, + "learning_rate": 9.089493564799101e-07, + "loss": 0.0786, + "step": 241800 + }, + { + "epoch": 711.47, + "learning_rate": 9.059312770991496e-07, + "loss": 0.0806, + "step": 241900 + }, + { + "epoch": 711.76, + "learning_rate": 9.029177174480314e-07, + "loss": 0.0793, + "step": 242000 + }, + { + "epoch": 711.76, + "eval_cer": 0.06939540560568415, + "eval_loss": 0.5705261826515198, + "eval_runtime": 4.6246, + "eval_samples_per_second": 77.628, + "eval_steps_per_second": 2.595, + "eval_wer": 0.26100274060938256, + "step": 242000 + }, + { + "epoch": 712.06, + "learning_rate": 8.999086808534341e-07, + "loss": 0.0795, + "step": 242100 + }, + { + "epoch": 712.35, + "learning_rate": 8.969041706372461e-07, + "loss": 0.0824, + "step": 242200 + }, + { + "epoch": 712.65, + "learning_rate": 8.939041901163531e-07, + "loss": 0.0808, + "step": 242300 + }, + { + "epoch": 712.94, + "learning_rate": 8.909087426026492e-07, + "loss": 0.0813, + "step": 242400 + }, + { + "epoch": 713.24, + "learning_rate": 8.87917831403014e-07, + "loss": 0.0786, + "step": 242500 + }, + { + "epoch": 713.53, + "learning_rate": 8.849314598193282e-07, + "loss": 0.0838, + "step": 242600 + }, + { + "epoch": 713.82, + "learning_rate": 8.81949631148456e-07, + "loss": 0.0787, + "step": 242700 + }, + { + "epoch": 714.12, + "learning_rate": 8.789723486822443e-07, + "loss": 0.0791, + "step": 242800 + }, + { + "epoch": 714.41, + "learning_rate": 8.759996157075285e-07, + "loss": 0.0844, + "step": 242900 + }, + { + "epoch": 714.71, + "learning_rate": 8.730314355061126e-07, + "loss": 0.0813, + "step": 243000 + }, + { + "epoch": 714.71, + "eval_cer": 0.06926463536899002, + "eval_loss": 0.5673476457595825, + "eval_runtime": 5.3489, + "eval_samples_per_second": 67.117, + "eval_steps_per_second": 2.243, + "eval_wer": 0.25906819280993065, + "step": 243000 + }, + { + "epoch": 715.0, + "learning_rate": 8.700678113547822e-07, + "loss": 0.0833, + "step": 243100 + }, + { + "epoch": 715.29, + "learning_rate": 8.671087465252903e-07, + "loss": 0.0805, + "step": 243200 + }, + { + "epoch": 715.59, + "learning_rate": 8.641542442843526e-07, + "loss": 0.0848, + "step": 243300 + }, + { + "epoch": 715.88, + "learning_rate": 8.612043078936555e-07, + "loss": 0.0796, + "step": 243400 + }, + { + "epoch": 716.18, + "learning_rate": 8.582589406098357e-07, + "loss": 0.0803, + "step": 243500 + }, + { + "epoch": 716.47, + "learning_rate": 8.553181456844955e-07, + "loss": 0.0822, + "step": 243600 + }, + { + "epoch": 716.76, + "learning_rate": 8.523819263641841e-07, + "loss": 0.0863, + "step": 243700 + }, + { + "epoch": 717.06, + "learning_rate": 8.494795796192135e-07, + "loss": 0.0813, + "step": 243800 + }, + { + "epoch": 717.35, + "learning_rate": 8.465524753915627e-07, + "loss": 0.0867, + "step": 243900 + }, + { + "epoch": 717.65, + "learning_rate": 8.436299564459782e-07, + "loss": 0.0803, + "step": 244000 + }, + { + "epoch": 717.65, + "eval_cer": 0.06978771631576654, + "eval_loss": 0.5662087202072144, + "eval_runtime": 4.8974, + "eval_samples_per_second": 73.304, + "eval_steps_per_second": 2.45, + "eval_wer": 0.2616475898758665, + "step": 244000 + }, + { + "epoch": 717.94, + "learning_rate": 8.40712026008833e-07, + "loss": 0.081, + "step": 244100 + }, + { + "epoch": 718.24, + "learning_rate": 8.377986873014355e-07, + "loss": 0.0802, + "step": 244200 + }, + { + "epoch": 718.53, + "learning_rate": 8.348899435400249e-07, + "loss": 0.0806, + "step": 244300 + }, + { + "epoch": 718.82, + "learning_rate": 8.319857979357665e-07, + "loss": 0.0783, + "step": 244400 + }, + { + "epoch": 719.12, + "learning_rate": 8.290862536947514e-07, + "loss": 0.0785, + "step": 244500 + }, + { + "epoch": 719.41, + "learning_rate": 8.2619131401799e-07, + "loss": 0.083, + "step": 244600 + }, + { + "epoch": 719.71, + "learning_rate": 8.233009821014081e-07, + "loss": 0.0873, + "step": 244700 + }, + { + "epoch": 720.0, + "learning_rate": 8.204152611358468e-07, + "loss": 0.0818, + "step": 244800 + }, + { + "epoch": 720.29, + "learning_rate": 8.175341543070553e-07, + "loss": 0.0802, + "step": 244900 + }, + { + "epoch": 720.59, + "learning_rate": 8.146576647956905e-07, + "loss": 0.079, + "step": 245000 + }, + { + "epoch": 720.59, + "eval_cer": 0.06970053615797045, + "eval_loss": 0.5707852840423584, + "eval_runtime": 4.806, + "eval_samples_per_second": 74.699, + "eval_steps_per_second": 2.497, + "eval_wer": 0.2603578913428986, + "step": 245000 + }, + { + "epoch": 720.88, + "learning_rate": 8.117857957773096e-07, + "loss": 0.0786, + "step": 245100 + }, + { + "epoch": 721.18, + "learning_rate": 8.089185504223712e-07, + "loss": 0.0819, + "step": 245200 + }, + { + "epoch": 721.47, + "learning_rate": 8.060559318962285e-07, + "loss": 0.0851, + "step": 245300 + }, + { + "epoch": 721.76, + "learning_rate": 8.031979433591263e-07, + "loss": 0.0834, + "step": 245400 + }, + { + "epoch": 722.06, + "learning_rate": 8.003445879661992e-07, + "loss": 0.0787, + "step": 245500 + }, + { + "epoch": 722.35, + "learning_rate": 7.974958688674661e-07, + "loss": 0.0825, + "step": 245600 + }, + { + "epoch": 722.65, + "learning_rate": 7.946517892078281e-07, + "loss": 0.0861, + "step": 245700 + }, + { + "epoch": 722.94, + "learning_rate": 7.918123521270637e-07, + "loss": 0.0819, + "step": 245800 + }, + { + "epoch": 723.24, + "learning_rate": 7.889775607598276e-07, + "loss": 0.0841, + "step": 245900 + }, + { + "epoch": 723.53, + "learning_rate": 7.861474182356449e-07, + "loss": 0.0792, + "step": 246000 + }, + { + "epoch": 723.53, + "eval_cer": 0.06961335600017436, + "eval_loss": 0.568951427936554, + "eval_runtime": 4.8277, + "eval_samples_per_second": 74.362, + "eval_steps_per_second": 2.486, + "eval_wer": 0.2600354667096566, + "step": 246000 + }, + { + "epoch": 723.82, + "learning_rate": 7.833501595469872e-07, + "loss": 0.0801, + "step": 246100 + }, + { + "epoch": 724.12, + "learning_rate": 7.805292775106627e-07, + "loss": 0.0805, + "step": 246200 + }, + { + "epoch": 724.41, + "learning_rate": 7.777130536440419e-07, + "loss": 0.0792, + "step": 246300 + }, + { + "epoch": 724.71, + "learning_rate": 7.749014910561536e-07, + "loss": 0.083, + "step": 246400 + }, + { + "epoch": 725.0, + "learning_rate": 7.720945928508789e-07, + "loss": 0.082, + "step": 246500 + }, + { + "epoch": 725.29, + "learning_rate": 7.692923621269482e-07, + "loss": 0.0778, + "step": 246600 + }, + { + "epoch": 725.59, + "learning_rate": 7.664948019779444e-07, + "loss": 0.0814, + "step": 246700 + }, + { + "epoch": 725.88, + "learning_rate": 7.637019154922865e-07, + "loss": 0.0849, + "step": 246800 + }, + { + "epoch": 726.18, + "learning_rate": 7.60913705753239e-07, + "loss": 0.0785, + "step": 246900 + }, + { + "epoch": 726.47, + "learning_rate": 7.581301758389026e-07, + "loss": 0.0731, + "step": 247000 + }, + { + "epoch": 726.47, + "eval_cer": 0.06956976592127631, + "eval_loss": 0.5695874691009521, + "eval_runtime": 5.5665, + "eval_samples_per_second": 64.492, + "eval_steps_per_second": 2.156, + "eval_wer": 0.2600354667096566, + "step": 247000 + }, + { + "epoch": 726.76, + "learning_rate": 7.553513288222108e-07, + "loss": 0.0777, + "step": 247100 + }, + { + "epoch": 727.06, + "learning_rate": 7.525771677709276e-07, + "loss": 0.0844, + "step": 247200 + }, + { + "epoch": 727.35, + "learning_rate": 7.498076957476447e-07, + "loss": 0.0797, + "step": 247300 + }, + { + "epoch": 727.65, + "learning_rate": 7.470429158097758e-07, + "loss": 0.084, + "step": 247400 + }, + { + "epoch": 727.94, + "learning_rate": 7.442828310095562e-07, + "loss": 0.0799, + "step": 247500 + }, + { + "epoch": 728.24, + "learning_rate": 7.415274443940363e-07, + "loss": 0.0826, + "step": 247600 + }, + { + "epoch": 728.53, + "learning_rate": 7.387767590050809e-07, + "loss": 0.0842, + "step": 247700 + }, + { + "epoch": 728.82, + "learning_rate": 7.360307778793646e-07, + "loss": 0.0789, + "step": 247800 + }, + { + "epoch": 729.12, + "learning_rate": 7.332895040483689e-07, + "loss": 0.078, + "step": 247900 + }, + { + "epoch": 729.41, + "learning_rate": 7.305529405383776e-07, + "loss": 0.0822, + "step": 248000 + }, + { + "epoch": 729.41, + "eval_cer": 0.06987489647356261, + "eval_loss": 0.5686177015304565, + "eval_runtime": 4.9297, + "eval_samples_per_second": 72.824, + "eval_steps_per_second": 2.434, + "eval_wer": 0.26293728840883446, + "step": 248000 + }, + { + "epoch": 729.71, + "learning_rate": 7.278210903704763e-07, + "loss": 0.0813, + "step": 248100 + }, + { + "epoch": 730.0, + "learning_rate": 7.250939565605447e-07, + "loss": 0.0878, + "step": 248200 + }, + { + "epoch": 730.29, + "learning_rate": 7.223715421192573e-07, + "loss": 0.0789, + "step": 248300 + }, + { + "epoch": 730.59, + "learning_rate": 7.196538500520789e-07, + "loss": 0.0767, + "step": 248400 + }, + { + "epoch": 730.88, + "learning_rate": 7.169408833592606e-07, + "loss": 0.0817, + "step": 248500 + }, + { + "epoch": 731.18, + "learning_rate": 7.142326450358361e-07, + "loss": 0.0814, + "step": 248600 + }, + { + "epoch": 731.47, + "learning_rate": 7.115291380716194e-07, + "loss": 0.0797, + "step": 248700 + }, + { + "epoch": 731.76, + "learning_rate": 7.088303654512024e-07, + "loss": 0.0835, + "step": 248800 + }, + { + "epoch": 732.06, + "learning_rate": 7.061363301539486e-07, + "loss": 0.0806, + "step": 248900 + }, + { + "epoch": 732.35, + "learning_rate": 7.03447035153993e-07, + "loss": 0.08, + "step": 249000 + }, + { + "epoch": 732.35, + "eval_cer": 0.06952617584237827, + "eval_loss": 0.5695518851280212, + "eval_runtime": 4.6502, + "eval_samples_per_second": 77.2, + "eval_steps_per_second": 2.581, + "eval_wer": 0.2621312268257295, + "step": 249000 + }, + { + "epoch": 732.65, + "learning_rate": 7.00762483420237e-07, + "loss": 0.0801, + "step": 249100 + }, + { + "epoch": 732.94, + "learning_rate": 6.980826779163457e-07, + "loss": 0.086, + "step": 249200 + }, + { + "epoch": 733.24, + "learning_rate": 6.954076216007438e-07, + "loss": 0.0809, + "step": 249300 + }, + { + "epoch": 733.53, + "learning_rate": 6.927373174266139e-07, + "loss": 0.0798, + "step": 249400 + }, + { + "epoch": 733.82, + "learning_rate": 6.900717683418923e-07, + "loss": 0.0821, + "step": 249500 + }, + { + "epoch": 734.12, + "learning_rate": 6.874109772892651e-07, + "loss": 0.0794, + "step": 249600 + }, + { + "epoch": 734.41, + "learning_rate": 6.847549472061671e-07, + "loss": 0.0817, + "step": 249700 + }, + { + "epoch": 734.71, + "learning_rate": 6.821036810247755e-07, + "loss": 0.0783, + "step": 249800 + }, + { + "epoch": 735.0, + "learning_rate": 6.794571816720085e-07, + "loss": 0.0798, + "step": 249900 + }, + { + "epoch": 735.29, + "learning_rate": 6.768154520695241e-07, + "loss": 0.082, + "step": 250000 + }, + { + "epoch": 735.29, + "eval_cer": 0.06987489647356261, + "eval_loss": 0.5729803442955017, + "eval_runtime": 4.2644, + "eval_samples_per_second": 84.185, + "eval_steps_per_second": 2.814, + "eval_wer": 0.2621312268257295, + "step": 250000 + }, + { + "epoch": 735.59, + "learning_rate": 6.74178495133711e-07, + "loss": 0.0774, + "step": 250100 + }, + { + "epoch": 735.88, + "learning_rate": 6.715463137756923e-07, + "loss": 0.0809, + "step": 250200 + }, + { + "epoch": 736.18, + "learning_rate": 6.689189109013167e-07, + "loss": 0.083, + "step": 250300 + }, + { + "epoch": 736.47, + "learning_rate": 6.662962894111591e-07, + "loss": 0.0831, + "step": 250400 + }, + { + "epoch": 736.76, + "learning_rate": 6.636784522005152e-07, + "loss": 0.088, + "step": 250500 + }, + { + "epoch": 737.06, + "learning_rate": 6.610654021593993e-07, + "loss": 0.0841, + "step": 250600 + }, + { + "epoch": 737.35, + "learning_rate": 6.5845714217254e-07, + "loss": 0.0807, + "step": 250700 + }, + { + "epoch": 737.65, + "learning_rate": 6.55853675119379e-07, + "loss": 0.0819, + "step": 250800 + }, + { + "epoch": 737.94, + "learning_rate": 6.532550038740665e-07, + "loss": 0.0881, + "step": 250900 + }, + { + "epoch": 738.24, + "learning_rate": 6.506611313054567e-07, + "loss": 0.0821, + "step": 251000 + }, + { + "epoch": 738.24, + "eval_cer": 0.0696569460790724, + "eval_loss": 0.5708038806915283, + "eval_runtime": 5.0046, + "eval_samples_per_second": 71.734, + "eval_steps_per_second": 2.398, + "eval_wer": 0.26180880219248753, + "step": 251000 + }, + { + "epoch": 738.53, + "learning_rate": 6.48072060277109e-07, + "loss": 0.0755, + "step": 251100 + }, + { + "epoch": 738.82, + "learning_rate": 6.454877936472798e-07, + "loss": 0.0852, + "step": 251200 + }, + { + "epoch": 739.12, + "learning_rate": 6.429083342689224e-07, + "loss": 0.0845, + "step": 251300 + }, + { + "epoch": 739.41, + "learning_rate": 6.403336849896824e-07, + "loss": 0.087, + "step": 251400 + }, + { + "epoch": 739.71, + "learning_rate": 6.377638486518967e-07, + "loss": 0.0781, + "step": 251500 + }, + { + "epoch": 740.0, + "learning_rate": 6.351988280925874e-07, + "loss": 0.0796, + "step": 251600 + }, + { + "epoch": 740.29, + "learning_rate": 6.326386261434603e-07, + "loss": 0.0832, + "step": 251700 + }, + { + "epoch": 740.59, + "learning_rate": 6.300832456309036e-07, + "loss": 0.0829, + "step": 251800 + }, + { + "epoch": 740.88, + "learning_rate": 6.275326893759775e-07, + "loss": 0.0798, + "step": 251900 + }, + { + "epoch": 741.18, + "learning_rate": 6.249869601944236e-07, + "loss": 0.079, + "step": 252000 + }, + { + "epoch": 741.18, + "eval_cer": 0.06948258576348024, + "eval_loss": 0.5701922178268433, + "eval_runtime": 5.0097, + "eval_samples_per_second": 71.661, + "eval_steps_per_second": 2.395, + "eval_wer": 0.26148637755924553, + "step": 252000 + }, + { + "epoch": 741.47, + "learning_rate": 6.224460608966492e-07, + "loss": 0.0847, + "step": 252100 + }, + { + "epoch": 741.76, + "learning_rate": 6.199099942877318e-07, + "loss": 0.0833, + "step": 252200 + }, + { + "epoch": 742.06, + "learning_rate": 6.174040515337682e-07, + "loss": 0.0784, + "step": 252300 + }, + { + "epoch": 742.35, + "learning_rate": 6.148776102998055e-07, + "loss": 0.0839, + "step": 252400 + }, + { + "epoch": 742.65, + "learning_rate": 6.123560101100456e-07, + "loss": 0.0819, + "step": 252500 + }, + { + "epoch": 742.94, + "learning_rate": 6.098392537482562e-07, + "loss": 0.084, + "step": 252600 + }, + { + "epoch": 743.24, + "learning_rate": 6.073273439928623e-07, + "loss": 0.0823, + "step": 252700 + }, + { + "epoch": 743.53, + "learning_rate": 6.04820283616937e-07, + "loss": 0.0781, + "step": 252800 + }, + { + "epoch": 743.82, + "learning_rate": 6.023180753882008e-07, + "loss": 0.0802, + "step": 252900 + }, + { + "epoch": 744.12, + "learning_rate": 5.998207220690161e-07, + "loss": 0.0867, + "step": 253000 + }, + { + "epoch": 744.12, + "eval_cer": 0.0696569460790724, + "eval_loss": 0.5710974335670471, + "eval_runtime": 4.3252, + "eval_samples_per_second": 83.003, + "eval_steps_per_second": 2.774, + "eval_wer": 0.26132516524262456, + "step": 253000 + }, + { + "epoch": 744.41, + "learning_rate": 5.973282264163866e-07, + "loss": 0.0813, + "step": 253100 + }, + { + "epoch": 744.71, + "learning_rate": 5.948405911819538e-07, + "loss": 0.0816, + "step": 253200 + }, + { + "epoch": 745.0, + "learning_rate": 5.923578191119922e-07, + "loss": 0.0733, + "step": 253300 + }, + { + "epoch": 745.29, + "learning_rate": 5.898799129474076e-07, + "loss": 0.0871, + "step": 253400 + }, + { + "epoch": 745.59, + "learning_rate": 5.874068754237349e-07, + "loss": 0.0823, + "step": 253500 + }, + { + "epoch": 745.88, + "learning_rate": 5.849387092711339e-07, + "loss": 0.0796, + "step": 253600 + }, + { + "epoch": 746.18, + "learning_rate": 5.824754172143865e-07, + "loss": 0.0801, + "step": 253700 + }, + { + "epoch": 746.47, + "learning_rate": 5.800170019728929e-07, + "loss": 0.0778, + "step": 253800 + }, + { + "epoch": 746.76, + "learning_rate": 5.7756346626067e-07, + "loss": 0.084, + "step": 253900 + }, + { + "epoch": 747.06, + "learning_rate": 5.751148127863487e-07, + "loss": 0.0825, + "step": 254000 + }, + { + "epoch": 747.06, + "eval_cer": 0.0696569460790724, + "eval_loss": 0.5694045424461365, + "eval_runtime": 5.1895, + "eval_samples_per_second": 69.178, + "eval_steps_per_second": 2.312, + "eval_wer": 0.2619700145091085, + "step": 254000 + }, + { + "epoch": 747.35, + "learning_rate": 5.72671044253168e-07, + "loss": 0.083, + "step": 254100 + }, + { + "epoch": 747.65, + "learning_rate": 5.702321633589785e-07, + "loss": 0.0792, + "step": 254200 + }, + { + "epoch": 747.94, + "learning_rate": 5.67822488485888e-07, + "loss": 0.0769, + "step": 254300 + }, + { + "epoch": 748.24, + "learning_rate": 5.65393341998165e-07, + "loss": 0.0792, + "step": 254400 + }, + { + "epoch": 748.53, + "learning_rate": 5.629690911837949e-07, + "loss": 0.083, + "step": 254500 + }, + { + "epoch": 748.82, + "learning_rate": 5.605497387190828e-07, + "loss": 0.0827, + "step": 254600 + }, + { + "epoch": 749.12, + "learning_rate": 5.581352872749168e-07, + "loss": 0.08, + "step": 254700 + }, + { + "epoch": 749.41, + "learning_rate": 5.557257395167842e-07, + "loss": 0.0814, + "step": 254800 + }, + { + "epoch": 749.71, + "learning_rate": 5.533451202237355e-07, + "loss": 0.0788, + "step": 254900 + }, + { + "epoch": 750.0, + "learning_rate": 5.509453387093233e-07, + "loss": 0.0834, + "step": 255000 + }, + { + "epoch": 750.0, + "eval_cer": 0.0696569460790724, + "eval_loss": 0.5699195265769958, + "eval_runtime": 4.7379, + "eval_samples_per_second": 75.771, + "eval_steps_per_second": 2.533, + "eval_wer": 0.26100274060938256, + "step": 255000 + }, + { + "epoch": 750.29, + "learning_rate": 5.485743931961168e-07, + "loss": 0.0805, + "step": 255100 + }, + { + "epoch": 750.59, + "learning_rate": 5.461843884168661e-07, + "loss": 0.0782, + "step": 255200 + }, + { + "epoch": 750.88, + "learning_rate": 5.437993005170794e-07, + "loss": 0.0808, + "step": 255300 + }, + { + "epoch": 751.18, + "learning_rate": 5.414191321298273e-07, + "loss": 0.081, + "step": 255400 + }, + { + "epoch": 751.47, + "learning_rate": 5.390438858827412e-07, + "loss": 0.0777, + "step": 255500 + }, + { + "epoch": 751.76, + "learning_rate": 5.366735643980225e-07, + "loss": 0.0813, + "step": 255600 + }, + { + "epoch": 752.06, + "learning_rate": 5.343081702924374e-07, + "loss": 0.0839, + "step": 255700 + }, + { + "epoch": 752.35, + "learning_rate": 5.319477061773076e-07, + "loss": 0.0833, + "step": 255800 + }, + { + "epoch": 752.65, + "learning_rate": 5.296157055488105e-07, + "loss": 0.0832, + "step": 255900 + }, + { + "epoch": 752.94, + "learning_rate": 5.272650598619727e-07, + "loss": 0.0832, + "step": 256000 + }, + { + "epoch": 752.94, + "eval_cer": 0.06948258576348024, + "eval_loss": 0.5696724057197571, + "eval_runtime": 4.9457, + "eval_samples_per_second": 72.589, + "eval_steps_per_second": 2.426, + "eval_wer": 0.2608415282927616, + "step": 256000 + }, + { + "epoch": 753.24, + "learning_rate": 5.249193519409756e-07, + "loss": 0.085, + "step": 256100 + }, + { + "epoch": 753.53, + "learning_rate": 5.2257858437541e-07, + "loss": 0.0806, + "step": 256200 + }, + { + "epoch": 753.82, + "learning_rate": 5.202427597494153e-07, + "loss": 0.0789, + "step": 256300 + }, + { + "epoch": 754.12, + "learning_rate": 5.179118806416677e-07, + "loss": 0.077, + "step": 256400 + }, + { + "epoch": 754.41, + "learning_rate": 5.155859496253928e-07, + "loss": 0.0791, + "step": 256500 + }, + { + "epoch": 754.71, + "learning_rate": 5.132649692683472e-07, + "loss": 0.083, + "step": 256600 + }, + { + "epoch": 755.0, + "learning_rate": 5.109489421328234e-07, + "loss": 0.0836, + "step": 256700 + }, + { + "epoch": 755.29, + "learning_rate": 5.086378707756473e-07, + "loss": 0.0783, + "step": 256800 + }, + { + "epoch": 755.59, + "learning_rate": 5.063317577481718e-07, + "loss": 0.0771, + "step": 256900 + }, + { + "epoch": 755.88, + "learning_rate": 5.040306055962773e-07, + "loss": 0.0818, + "step": 257000 + }, + { + "epoch": 755.88, + "eval_cer": 0.07009284686805282, + "eval_loss": 0.5731448531150818, + "eval_runtime": 5.0204, + "eval_samples_per_second": 71.508, + "eval_steps_per_second": 2.39, + "eval_wer": 0.26293728840883446, + "step": 257000 + }, + { + "epoch": 756.18, + "learning_rate": 5.017344168603672e-07, + "loss": 0.0777, + "step": 257100 + }, + { + "epoch": 756.47, + "learning_rate": 4.994431940753647e-07, + "loss": 0.0805, + "step": 257200 + }, + { + "epoch": 756.76, + "learning_rate": 4.971569397707115e-07, + "loss": 0.084, + "step": 257300 + }, + { + "epoch": 757.06, + "learning_rate": 4.948756564703649e-07, + "loss": 0.0813, + "step": 257400 + }, + { + "epoch": 757.35, + "learning_rate": 4.925993466927925e-07, + "loss": 0.0771, + "step": 257500 + }, + { + "epoch": 757.65, + "learning_rate": 4.90328012950973e-07, + "loss": 0.0761, + "step": 257600 + }, + { + "epoch": 757.94, + "learning_rate": 4.880616577523911e-07, + "loss": 0.0808, + "step": 257700 + }, + { + "epoch": 758.24, + "learning_rate": 4.85800283599035e-07, + "loss": 0.0815, + "step": 257800 + }, + { + "epoch": 758.53, + "learning_rate": 4.835438929873937e-07, + "loss": 0.076, + "step": 257900 + }, + { + "epoch": 758.82, + "learning_rate": 4.812924884084569e-07, + "loss": 0.0814, + "step": 258000 + }, + { + "epoch": 758.82, + "eval_cer": 0.0696569460790724, + "eval_loss": 0.5717082619667053, + "eval_runtime": 5.3882, + "eval_samples_per_second": 66.627, + "eval_steps_per_second": 2.227, + "eval_wer": 0.26229243914235045, + "step": 258000 + }, + { + "epoch": 759.12, + "learning_rate": 4.790460723477053e-07, + "loss": 0.0782, + "step": 258100 + }, + { + "epoch": 759.41, + "learning_rate": 4.768046472851168e-07, + "loss": 0.0824, + "step": 258200 + }, + { + "epoch": 759.71, + "learning_rate": 4.745682156951581e-07, + "loss": 0.0792, + "step": 258300 + }, + { + "epoch": 760.0, + "learning_rate": 4.723367800467826e-07, + "loss": 0.0804, + "step": 258400 + }, + { + "epoch": 760.29, + "learning_rate": 4.701103428034287e-07, + "loss": 0.0797, + "step": 258500 + }, + { + "epoch": 760.59, + "learning_rate": 4.6788890642301523e-07, + "loss": 0.0806, + "step": 258600 + }, + { + "epoch": 760.88, + "learning_rate": 4.656724733579432e-07, + "loss": 0.0782, + "step": 258700 + }, + { + "epoch": 761.18, + "learning_rate": 4.6348313554157366e-07, + "loss": 0.0771, + "step": 258800 + }, + { + "epoch": 761.47, + "learning_rate": 4.6127666634818326e-07, + "loss": 0.078, + "step": 258900 + }, + { + "epoch": 761.76, + "learning_rate": 4.590752077698496e-07, + "loss": 0.0803, + "step": 259000 + }, + { + "epoch": 761.76, + "eval_cer": 0.0699620766313587, + "eval_loss": 0.5720624327659607, + "eval_runtime": 4.7445, + "eval_samples_per_second": 75.667, + "eval_steps_per_second": 2.529, + "eval_wer": 0.2624536514589715, + "step": 259000 + }, + { + "epoch": 762.06, + "learning_rate": 4.56878762236917e-07, + "loss": 0.0821, + "step": 259100 + }, + { + "epoch": 762.35, + "learning_rate": 4.5468733217419626e-07, + "loss": 0.0828, + "step": 259200 + }, + { + "epoch": 762.65, + "learning_rate": 4.5250092000096e-07, + "loss": 0.0827, + "step": 259300 + }, + { + "epoch": 762.94, + "learning_rate": 4.5031952813094246e-07, + "loss": 0.078, + "step": 259400 + }, + { + "epoch": 763.24, + "learning_rate": 4.4814315897233507e-07, + "loss": 0.081, + "step": 259500 + }, + { + "epoch": 763.53, + "learning_rate": 4.459718149277842e-07, + "loss": 0.0785, + "step": 259600 + }, + { + "epoch": 763.82, + "learning_rate": 4.438054983943896e-07, + "loss": 0.0798, + "step": 259700 + }, + { + "epoch": 764.12, + "learning_rate": 4.416442117636988e-07, + "loss": 0.0811, + "step": 259800 + }, + { + "epoch": 764.41, + "learning_rate": 4.3948795742170867e-07, + "loss": 0.0797, + "step": 259900 + }, + { + "epoch": 764.71, + "learning_rate": 4.3733673774885965e-07, + "loss": 0.0825, + "step": 260000 + }, + { + "epoch": 764.71, + "eval_cer": 0.06974412623686849, + "eval_loss": 0.573108971118927, + "eval_runtime": 4.5318, + "eval_samples_per_second": 79.217, + "eval_steps_per_second": 2.648, + "eval_wer": 0.2603578913428986, + "step": 260000 + }, + { + "epoch": 765.0, + "learning_rate": 4.3519055512003306e-07, + "loss": 0.0815, + "step": 260100 + }, + { + "epoch": 765.29, + "learning_rate": 4.3304941190455195e-07, + "loss": 0.0779, + "step": 260200 + }, + { + "epoch": 765.59, + "learning_rate": 4.309133104661728e-07, + "loss": 0.0785, + "step": 260300 + }, + { + "epoch": 765.88, + "learning_rate": 4.287822531630892e-07, + "loss": 0.0813, + "step": 260400 + }, + { + "epoch": 766.18, + "learning_rate": 4.2665624234792425e-07, + "loss": 0.0765, + "step": 260500 + }, + { + "epoch": 766.47, + "learning_rate": 4.245352803677305e-07, + "loss": 0.0816, + "step": 260600 + }, + { + "epoch": 766.76, + "learning_rate": 4.2241936956398665e-07, + "loss": 0.082, + "step": 260700 + }, + { + "epoch": 767.06, + "learning_rate": 4.203085122725953e-07, + "loss": 0.0868, + "step": 260800 + }, + { + "epoch": 767.35, + "learning_rate": 4.18202710823879e-07, + "loss": 0.0798, + "step": 260900 + }, + { + "epoch": 767.65, + "learning_rate": 4.1610196754258095e-07, + "loss": 0.0776, + "step": 261000 + }, + { + "epoch": 767.65, + "eval_cer": 0.06978771631576654, + "eval_loss": 0.5764541029930115, + "eval_runtime": 5.2048, + "eval_samples_per_second": 68.974, + "eval_steps_per_second": 2.306, + "eval_wer": 0.26148637755924553, + "step": 261000 + }, + { + "epoch": 767.94, + "learning_rate": 4.140062847478576e-07, + "loss": 0.0765, + "step": 261100 + }, + { + "epoch": 768.24, + "learning_rate": 4.119156647532818e-07, + "loss": 0.0849, + "step": 261200 + }, + { + "epoch": 768.53, + "learning_rate": 4.098301098668339e-07, + "loss": 0.0767, + "step": 261300 + }, + { + "epoch": 768.82, + "learning_rate": 4.0774962239090553e-07, + "loss": 0.0869, + "step": 261400 + }, + { + "epoch": 769.12, + "learning_rate": 4.0567420462229225e-07, + "loss": 0.0747, + "step": 261500 + }, + { + "epoch": 769.41, + "learning_rate": 4.0360385885219345e-07, + "loss": 0.0817, + "step": 261600 + }, + { + "epoch": 769.71, + "learning_rate": 4.0153858736620865e-07, + "loss": 0.0824, + "step": 261700 + }, + { + "epoch": 770.0, + "learning_rate": 3.994783924443368e-07, + "loss": 0.0799, + "step": 261800 + }, + { + "epoch": 770.29, + "learning_rate": 3.9742327636097034e-07, + "loss": 0.0778, + "step": 261900 + }, + { + "epoch": 770.59, + "learning_rate": 3.953732413848971e-07, + "loss": 0.0805, + "step": 262000 + }, + { + "epoch": 770.59, + "eval_cer": 0.0696569460790724, + "eval_loss": 0.5757123827934265, + "eval_runtime": 5.0402, + "eval_samples_per_second": 71.227, + "eval_steps_per_second": 2.381, + "eval_wer": 0.26116395292600353, + "step": 262000 + }, + { + "epoch": 770.88, + "learning_rate": 3.9332828977929395e-07, + "loss": 0.0764, + "step": 262100 + }, + { + "epoch": 771.18, + "learning_rate": 3.912884238017267e-07, + "loss": 0.0782, + "step": 262200 + }, + { + "epoch": 771.47, + "learning_rate": 3.892536457041468e-07, + "loss": 0.078, + "step": 262300 + }, + { + "epoch": 771.76, + "learning_rate": 3.872239577328879e-07, + "loss": 0.0835, + "step": 262400 + }, + { + "epoch": 772.06, + "learning_rate": 3.8519936212866483e-07, + "loss": 0.0789, + "step": 262500 + }, + { + "epoch": 772.35, + "learning_rate": 3.831798611265708e-07, + "loss": 0.0807, + "step": 262600 + }, + { + "epoch": 772.65, + "learning_rate": 3.811654569560752e-07, + "loss": 0.0804, + "step": 262700 + }, + { + "epoch": 772.94, + "learning_rate": 3.7915615184101973e-07, + "loss": 0.0755, + "step": 262800 + }, + { + "epoch": 773.24, + "learning_rate": 3.771519479996172e-07, + "loss": 0.0802, + "step": 262900 + }, + { + "epoch": 773.53, + "learning_rate": 3.751528476444488e-07, + "loss": 0.0794, + "step": 263000 + }, + { + "epoch": 773.53, + "eval_cer": 0.0699620766313587, + "eval_loss": 0.5735283493995667, + "eval_runtime": 4.7277, + "eval_samples_per_second": 75.936, + "eval_steps_per_second": 2.538, + "eval_wer": 0.2619700145091085, + "step": 263000 + }, + { + "epoch": 773.82, + "learning_rate": 3.7315885298246145e-07, + "loss": 0.0781, + "step": 263100 + }, + { + "epoch": 774.12, + "learning_rate": 3.7116996621496647e-07, + "loss": 0.0834, + "step": 263200 + }, + { + "epoch": 774.41, + "learning_rate": 3.6918618953763477e-07, + "loss": 0.085, + "step": 263300 + }, + { + "epoch": 774.71, + "learning_rate": 3.672075251404966e-07, + "loss": 0.0768, + "step": 263400 + }, + { + "epoch": 775.0, + "learning_rate": 3.6523397520793866e-07, + "loss": 0.0799, + "step": 263500 + }, + { + "epoch": 775.29, + "learning_rate": 3.632655419187009e-07, + "loss": 0.0777, + "step": 263600 + }, + { + "epoch": 775.59, + "learning_rate": 3.6130222744587493e-07, + "loss": 0.078, + "step": 263700 + }, + { + "epoch": 775.88, + "learning_rate": 3.5934403395690266e-07, + "loss": 0.0777, + "step": 263800 + }, + { + "epoch": 776.18, + "learning_rate": 3.5739096361356806e-07, + "loss": 0.0825, + "step": 263900 + }, + { + "epoch": 776.47, + "learning_rate": 3.554430185720054e-07, + "loss": 0.0803, + "step": 264000 + }, + { + "epoch": 776.47, + "eval_cer": 0.06961335600017436, + "eval_loss": 0.5729749798774719, + "eval_runtime": 4.7677, + "eval_samples_per_second": 75.299, + "eval_steps_per_second": 2.517, + "eval_wer": 0.2605191036595196, + "step": 264000 + }, + { + "epoch": 776.76, + "learning_rate": 3.535002009826871e-07, + "loss": 0.0819, + "step": 264100 + }, + { + "epoch": 777.06, + "learning_rate": 3.515625129904249e-07, + "loss": 0.082, + "step": 264200 + }, + { + "epoch": 777.35, + "learning_rate": 3.4962995673437083e-07, + "loss": 0.081, + "step": 264300 + }, + { + "epoch": 777.65, + "learning_rate": 3.47702534348005e-07, + "loss": 0.0817, + "step": 264400 + }, + { + "epoch": 777.94, + "learning_rate": 3.457802479591482e-07, + "loss": 0.0803, + "step": 264500 + }, + { + "epoch": 778.24, + "learning_rate": 3.438630996899461e-07, + "loss": 0.0789, + "step": 264600 + }, + { + "epoch": 778.53, + "learning_rate": 3.4195109165687246e-07, + "loss": 0.0813, + "step": 264700 + }, + { + "epoch": 778.82, + "learning_rate": 3.400442259707282e-07, + "loss": 0.0788, + "step": 264800 + }, + { + "epoch": 779.12, + "learning_rate": 3.3814250473663434e-07, + "loss": 0.0763, + "step": 264900 + }, + { + "epoch": 779.41, + "learning_rate": 3.362459300540355e-07, + "loss": 0.0792, + "step": 265000 + }, + { + "epoch": 779.41, + "eval_cer": 0.0699620766313587, + "eval_loss": 0.5743491649627686, + "eval_runtime": 4.8049, + "eval_samples_per_second": 74.715, + "eval_steps_per_second": 2.497, + "eval_wer": 0.26180880219248753, + "step": 265000 + }, + { + "epoch": 779.71, + "learning_rate": 3.34354504016694e-07, + "loss": 0.0802, + "step": 265100 + }, + { + "epoch": 780.0, + "learning_rate": 3.324682287126868e-07, + "loss": 0.0815, + "step": 265200 + }, + { + "epoch": 780.29, + "learning_rate": 3.305871062244065e-07, + "loss": 0.0819, + "step": 265300 + }, + { + "epoch": 780.59, + "learning_rate": 3.2871113862855407e-07, + "loss": 0.0791, + "step": 265400 + }, + { + "epoch": 780.88, + "learning_rate": 3.2684032799614463e-07, + "loss": 0.0783, + "step": 265500 + }, + { + "epoch": 781.18, + "learning_rate": 3.2497467639249437e-07, + "loss": 0.081, + "step": 265600 + }, + { + "epoch": 781.47, + "learning_rate": 3.231141858772291e-07, + "loss": 0.0853, + "step": 265700 + }, + { + "epoch": 781.76, + "learning_rate": 3.2125885850427476e-07, + "loss": 0.0836, + "step": 265800 + }, + { + "epoch": 782.06, + "learning_rate": 3.194086963218551e-07, + "loss": 0.0812, + "step": 265900 + }, + { + "epoch": 782.35, + "learning_rate": 3.175637013724975e-07, + "loss": 0.0816, + "step": 266000 + }, + { + "epoch": 782.35, + "eval_cer": 0.06961335600017436, + "eval_loss": 0.5711695551872253, + "eval_runtime": 4.7303, + "eval_samples_per_second": 75.894, + "eval_steps_per_second": 2.537, + "eval_wer": 0.2605191036595196, + "step": 266000 + }, + { + "epoch": 782.65, + "learning_rate": 3.1572387569301753e-07, + "loss": 0.0772, + "step": 266100 + }, + { + "epoch": 782.94, + "learning_rate": 3.1388922131453006e-07, + "loss": 0.0852, + "step": 266200 + }, + { + "epoch": 783.24, + "learning_rate": 3.120597402624398e-07, + "loss": 0.0799, + "step": 266300 + }, + { + "epoch": 783.53, + "learning_rate": 3.102354345564357e-07, + "loss": 0.0778, + "step": 266400 + }, + { + "epoch": 783.82, + "learning_rate": 3.0841630621050055e-07, + "loss": 0.082, + "step": 266500 + }, + { + "epoch": 784.12, + "learning_rate": 3.066023572328941e-07, + "loss": 0.0835, + "step": 266600 + }, + { + "epoch": 784.41, + "learning_rate": 3.04793589626165e-07, + "loss": 0.0808, + "step": 266700 + }, + { + "epoch": 784.71, + "learning_rate": 3.0299000538713816e-07, + "loss": 0.0792, + "step": 266800 + }, + { + "epoch": 785.0, + "learning_rate": 3.0119160650691424e-07, + "loss": 0.0736, + "step": 266900 + }, + { + "epoch": 785.29, + "learning_rate": 2.993983949708756e-07, + "loss": 0.0773, + "step": 267000 + }, + { + "epoch": 785.29, + "eval_cer": 0.06970053615797045, + "eval_loss": 0.5727453827857971, + "eval_runtime": 5.3818, + "eval_samples_per_second": 66.707, + "eval_steps_per_second": 2.23, + "eval_wer": 0.26068031597614055, + "step": 267000 + }, + { + "epoch": 785.59, + "learning_rate": 2.976282272871539e-07, + "loss": 0.083, + "step": 267100 + }, + { + "epoch": 785.88, + "learning_rate": 2.958453444499787e-07, + "loss": 0.0826, + "step": 267200 + }, + { + "epoch": 786.18, + "learning_rate": 2.9406765485910036e-07, + "loss": 0.0746, + "step": 267300 + }, + { + "epoch": 786.47, + "learning_rate": 2.922951604770352e-07, + "loss": 0.0792, + "step": 267400 + }, + { + "epoch": 786.76, + "learning_rate": 2.9052786326056457e-07, + "loss": 0.0823, + "step": 267500 + }, + { + "epoch": 787.06, + "learning_rate": 2.8876576516073117e-07, + "loss": 0.077, + "step": 267600 + }, + { + "epoch": 787.35, + "learning_rate": 2.870088681228389e-07, + "loss": 0.0817, + "step": 267700 + }, + { + "epoch": 787.65, + "learning_rate": 2.852746652656024e-07, + "loss": 0.0784, + "step": 267800 + }, + { + "epoch": 787.94, + "learning_rate": 2.8352812410562815e-07, + "loss": 0.0807, + "step": 267900 + }, + { + "epoch": 788.24, + "learning_rate": 2.8178678978979357e-07, + "loss": 0.0803, + "step": 268000 + }, + { + "epoch": 788.24, + "eval_cer": 0.06943899568458219, + "eval_loss": 0.5726141333580017, + "eval_runtime": 4.5444, + "eval_samples_per_second": 78.998, + "eval_steps_per_second": 2.641, + "eval_wer": 0.2608415282927616, + "step": 268000 + }, + { + "epoch": 788.53, + "learning_rate": 2.800506642404821e-07, + "loss": 0.0822, + "step": 268100 + }, + { + "epoch": 788.82, + "learning_rate": 2.783197493743217e-07, + "loss": 0.0829, + "step": 268200 + }, + { + "epoch": 789.12, + "learning_rate": 2.765940471021933e-07, + "loss": 0.0817, + "step": 268300 + }, + { + "epoch": 789.41, + "learning_rate": 2.74873559329219e-07, + "loss": 0.0793, + "step": 268400 + }, + { + "epoch": 789.71, + "learning_rate": 2.731582879547667e-07, + "loss": 0.082, + "step": 268500 + }, + { + "epoch": 790.0, + "learning_rate": 2.71448234872444e-07, + "loss": 0.0829, + "step": 268600 + }, + { + "epoch": 790.29, + "learning_rate": 2.69743401970099e-07, + "loss": 0.0781, + "step": 268700 + }, + { + "epoch": 790.59, + "learning_rate": 2.680437911298167e-07, + "loss": 0.0856, + "step": 268800 + }, + { + "epoch": 790.88, + "learning_rate": 2.6634940422791577e-07, + "loss": 0.0824, + "step": 268900 + }, + { + "epoch": 791.18, + "learning_rate": 2.646602431349504e-07, + "loss": 0.0814, + "step": 269000 + }, + { + "epoch": 791.18, + "eval_cer": 0.0696569460790724, + "eval_loss": 0.5711923241615295, + "eval_runtime": 4.6959, + "eval_samples_per_second": 76.449, + "eval_steps_per_second": 2.555, + "eval_wer": 0.26116395292600353, + "step": 269000 + }, + { + "epoch": 791.47, + "learning_rate": 2.6297630971570234e-07, + "loss": 0.0795, + "step": 269100 + }, + { + "epoch": 791.76, + "learning_rate": 2.6129760582918383e-07, + "loss": 0.0809, + "step": 269200 + }, + { + "epoch": 792.06, + "learning_rate": 2.5962413332863534e-07, + "loss": 0.0837, + "step": 269300 + }, + { + "epoch": 792.35, + "learning_rate": 2.5795589406151846e-07, + "loss": 0.0817, + "step": 269400 + }, + { + "epoch": 792.65, + "learning_rate": 2.5629288986952217e-07, + "loss": 0.0823, + "step": 269500 + }, + { + "epoch": 792.94, + "learning_rate": 2.5463512258855126e-07, + "loss": 0.0754, + "step": 269600 + }, + { + "epoch": 793.24, + "learning_rate": 2.5298259404873125e-07, + "loss": 0.0828, + "step": 269700 + }, + { + "epoch": 793.53, + "learning_rate": 2.513353060744067e-07, + "loss": 0.0811, + "step": 269800 + }, + { + "epoch": 793.82, + "learning_rate": 2.4969326048413124e-07, + "loss": 0.0767, + "step": 269900 + }, + { + "epoch": 794.12, + "learning_rate": 2.4805645909067697e-07, + "loss": 0.0896, + "step": 270000 + }, + { + "epoch": 794.12, + "eval_cer": 0.0696569460790724, + "eval_loss": 0.5720658898353577, + "eval_runtime": 4.9834, + "eval_samples_per_second": 72.039, + "eval_steps_per_second": 2.408, + "eval_wer": 0.26180880219248753, + "step": 270000 + }, + { + "epoch": 794.41, + "learning_rate": 2.4642490370102247e-07, + "loss": 0.0785, + "step": 270100 + }, + { + "epoch": 794.71, + "learning_rate": 2.447985961163546e-07, + "loss": 0.0761, + "step": 270200 + }, + { + "epoch": 795.0, + "learning_rate": 2.4317753813207165e-07, + "loss": 0.0814, + "step": 270300 + }, + { + "epoch": 795.29, + "learning_rate": 2.415617315377705e-07, + "loss": 0.0803, + "step": 270400 + }, + { + "epoch": 795.59, + "learning_rate": 2.399511781172553e-07, + "loss": 0.0776, + "step": 270500 + }, + { + "epoch": 795.88, + "learning_rate": 2.3834587964852773e-07, + "loss": 0.0789, + "step": 270600 + }, + { + "epoch": 796.18, + "learning_rate": 2.3674583790378957e-07, + "loss": 0.0781, + "step": 270700 + }, + { + "epoch": 796.47, + "learning_rate": 2.3515105464943956e-07, + "loss": 0.0801, + "step": 270800 + }, + { + "epoch": 796.76, + "learning_rate": 2.3356153164606933e-07, + "loss": 0.0792, + "step": 270900 + }, + { + "epoch": 797.06, + "learning_rate": 2.3197727064846798e-07, + "loss": 0.0819, + "step": 271000 + }, + { + "epoch": 797.06, + "eval_cer": 0.0699620766313587, + "eval_loss": 0.5707818865776062, + "eval_runtime": 4.6691, + "eval_samples_per_second": 76.889, + "eval_steps_per_second": 2.57, + "eval_wer": 0.2619700145091085, + "step": 271000 + }, + { + "epoch": 797.35, + "learning_rate": 2.3039827340560928e-07, + "loss": 0.0757, + "step": 271100 + }, + { + "epoch": 797.65, + "learning_rate": 2.288245416606605e-07, + "loss": 0.0793, + "step": 271200 + }, + { + "epoch": 797.94, + "learning_rate": 2.272560771509741e-07, + "loss": 0.0822, + "step": 271300 + }, + { + "epoch": 798.24, + "learning_rate": 2.2569288160808778e-07, + "loss": 0.0775, + "step": 271400 + }, + { + "epoch": 798.53, + "learning_rate": 2.241349567577239e-07, + "loss": 0.0837, + "step": 271500 + }, + { + "epoch": 798.82, + "learning_rate": 2.225823043197839e-07, + "loss": 0.0814, + "step": 271600 + }, + { + "epoch": 799.12, + "learning_rate": 2.210349260083494e-07, + "loss": 0.0812, + "step": 271700 + }, + { + "epoch": 799.41, + "learning_rate": 2.1949282353168122e-07, + "loss": 0.0828, + "step": 271800 + }, + { + "epoch": 799.71, + "learning_rate": 2.179559985922125e-07, + "loss": 0.0833, + "step": 271900 + }, + { + "epoch": 800.0, + "learning_rate": 2.16424452886555e-07, + "loss": 0.0765, + "step": 272000 + }, + { + "epoch": 800.0, + "eval_cer": 0.06983130639466457, + "eval_loss": 0.5701684355735779, + "eval_runtime": 4.6145, + "eval_samples_per_second": 77.799, + "eval_steps_per_second": 2.601, + "eval_wer": 0.2616475898758665, + "step": 272000 + }, + { + "epoch": 800.29, + "learning_rate": 2.1489818810548736e-07, + "loss": 0.077, + "step": 272100 + }, + { + "epoch": 800.59, + "learning_rate": 2.1337720593396004e-07, + "loss": 0.0785, + "step": 272200 + }, + { + "epoch": 800.88, + "learning_rate": 2.118615080510933e-07, + "loss": 0.084, + "step": 272300 + }, + { + "epoch": 801.18, + "learning_rate": 2.1035109613017134e-07, + "loss": 0.0812, + "step": 272400 + }, + { + "epoch": 801.47, + "learning_rate": 2.0884597183864374e-07, + "loss": 0.0806, + "step": 272500 + }, + { + "epoch": 801.76, + "learning_rate": 2.073461368381241e-07, + "loss": 0.0802, + "step": 272600 + }, + { + "epoch": 802.06, + "learning_rate": 2.0586651202931184e-07, + "loss": 0.0814, + "step": 272700 + }, + { + "epoch": 802.35, + "learning_rate": 2.0437720763816893e-07, + "loss": 0.0786, + "step": 272800 + }, + { + "epoch": 802.65, + "learning_rate": 2.02893197471416e-07, + "loss": 0.0823, + "step": 272900 + }, + { + "epoch": 802.94, + "learning_rate": 2.0141448316735424e-07, + "loss": 0.079, + "step": 273000 + }, + { + "epoch": 802.94, + "eval_cer": 0.06961335600017436, + "eval_loss": 0.5719471573829651, + "eval_runtime": 4.6624, + "eval_samples_per_second": 76.999, + "eval_steps_per_second": 2.574, + "eval_wer": 0.26148637755924553, + "step": 273000 + }, + { + "epoch": 803.24, + "learning_rate": 1.9994106635844225e-07, + "loss": 0.0813, + "step": 273100 + }, + { + "epoch": 803.53, + "learning_rate": 1.9847294867128608e-07, + "loss": 0.0827, + "step": 273200 + }, + { + "epoch": 803.82, + "learning_rate": 1.970101317266454e-07, + "loss": 0.0794, + "step": 273300 + }, + { + "epoch": 804.12, + "learning_rate": 1.955526171394262e-07, + "loss": 0.0853, + "step": 273400 + }, + { + "epoch": 804.41, + "learning_rate": 1.941004065186797e-07, + "loss": 0.0801, + "step": 273500 + }, + { + "epoch": 804.71, + "learning_rate": 1.9265350146760564e-07, + "loss": 0.0825, + "step": 273600 + }, + { + "epoch": 805.0, + "learning_rate": 1.9121190358354135e-07, + "loss": 0.0815, + "step": 273700 + }, + { + "epoch": 805.29, + "learning_rate": 1.8977561445796932e-07, + "loss": 0.0749, + "step": 273800 + }, + { + "epoch": 805.59, + "learning_rate": 1.8835891917292903e-07, + "loss": 0.0795, + "step": 273900 + }, + { + "epoch": 805.88, + "learning_rate": 1.8693319918830056e-07, + "loss": 0.0825, + "step": 274000 + }, + { + "epoch": 805.88, + "eval_cer": 0.0699620766313587, + "eval_loss": 0.5727930665016174, + "eval_runtime": 4.7385, + "eval_samples_per_second": 75.762, + "eval_steps_per_second": 2.532, + "eval_wer": 0.26277607609221343, + "step": 274000 + }, + { + "epoch": 806.18, + "learning_rate": 1.8551279268572586e-07, + "loss": 0.0821, + "step": 274100 + }, + { + "epoch": 806.47, + "learning_rate": 1.8409770123329118e-07, + "loss": 0.0779, + "step": 274200 + }, + { + "epoch": 806.76, + "learning_rate": 1.826879263932152e-07, + "loss": 0.0799, + "step": 274300 + }, + { + "epoch": 807.06, + "learning_rate": 1.8128346972184797e-07, + "loss": 0.0765, + "step": 274400 + }, + { + "epoch": 807.35, + "learning_rate": 1.7988433276966698e-07, + "loss": 0.0759, + "step": 274500 + }, + { + "epoch": 807.65, + "learning_rate": 1.784905170812784e-07, + "loss": 0.0778, + "step": 274600 + }, + { + "epoch": 807.94, + "learning_rate": 1.7710202419541246e-07, + "loss": 0.0823, + "step": 274700 + }, + { + "epoch": 808.24, + "learning_rate": 1.7571885564492407e-07, + "loss": 0.0776, + "step": 274800 + }, + { + "epoch": 808.53, + "learning_rate": 1.7434101295678963e-07, + "loss": 0.0765, + "step": 274900 + }, + { + "epoch": 808.82, + "learning_rate": 1.7296849765210731e-07, + "loss": 0.0799, + "step": 275000 + }, + { + "epoch": 808.82, + "eval_cer": 0.06948258576348024, + "eval_loss": 0.5712651610374451, + "eval_runtime": 5.286, + "eval_samples_per_second": 67.915, + "eval_steps_per_second": 2.27, + "eval_wer": 0.26116395292600353, + "step": 275000 + }, + { + "epoch": 809.12, + "learning_rate": 1.7160131124609237e-07, + "loss": 0.0826, + "step": 275100 + }, + { + "epoch": 809.41, + "learning_rate": 1.702394552480774e-07, + "loss": 0.0836, + "step": 275200 + }, + { + "epoch": 809.71, + "learning_rate": 1.68882931161512e-07, + "loss": 0.0807, + "step": 275300 + }, + { + "epoch": 810.0, + "learning_rate": 1.675317404839566e-07, + "loss": 0.0782, + "step": 275400 + }, + { + "epoch": 810.29, + "learning_rate": 1.6618588470708686e-07, + "loss": 0.0838, + "step": 275500 + }, + { + "epoch": 810.59, + "learning_rate": 1.648453653166865e-07, + "loss": 0.0816, + "step": 275600 + }, + { + "epoch": 810.88, + "learning_rate": 1.635101837926495e-07, + "loss": 0.0805, + "step": 275700 + }, + { + "epoch": 811.18, + "learning_rate": 1.6218034160897567e-07, + "loss": 0.0778, + "step": 275800 + }, + { + "epoch": 811.47, + "learning_rate": 1.6085584023377177e-07, + "loss": 0.0808, + "step": 275900 + }, + { + "epoch": 811.76, + "learning_rate": 1.5953668112924758e-07, + "loss": 0.0781, + "step": 276000 + }, + { + "epoch": 811.76, + "eval_cer": 0.06987489647356261, + "eval_loss": 0.5731009244918823, + "eval_runtime": 4.7801, + "eval_samples_per_second": 75.102, + "eval_steps_per_second": 2.51, + "eval_wer": 0.2619700145091085, + "step": 276000 + }, + { + "epoch": 812.06, + "learning_rate": 1.5822286575171486e-07, + "loss": 0.0751, + "step": 276100 + }, + { + "epoch": 812.35, + "learning_rate": 1.5691439555158783e-07, + "loss": 0.0798, + "step": 276200 + }, + { + "epoch": 812.65, + "learning_rate": 1.556242767386512e-07, + "loss": 0.0819, + "step": 276300 + }, + { + "epoch": 812.94, + "learning_rate": 1.5432644773326065e-07, + "loss": 0.0791, + "step": 276400 + }, + { + "epoch": 813.24, + "learning_rate": 1.5303396820680326e-07, + "loss": 0.0795, + "step": 276500 + }, + { + "epoch": 813.53, + "learning_rate": 1.517468395861388e-07, + "loss": 0.0786, + "step": 276600 + }, + { + "epoch": 813.82, + "learning_rate": 1.5046506329221833e-07, + "loss": 0.0815, + "step": 276700 + }, + { + "epoch": 814.12, + "learning_rate": 1.49188640740085e-07, + "loss": 0.0795, + "step": 276800 + }, + { + "epoch": 814.41, + "learning_rate": 1.4791757333887213e-07, + "loss": 0.077, + "step": 276900 + }, + { + "epoch": 814.71, + "learning_rate": 1.466518624917984e-07, + "loss": 0.0827, + "step": 277000 + }, + { + "epoch": 814.71, + "eval_cer": 0.06922104529009197, + "eval_loss": 0.5720049738883972, + "eval_runtime": 4.7084, + "eval_samples_per_second": 76.247, + "eval_steps_per_second": 2.549, + "eval_wer": 0.2608415282927616, + "step": 277000 + }, + { + "epoch": 815.0, + "learning_rate": 1.453915095961722e-07, + "loss": 0.0804, + "step": 277100 + }, + { + "epoch": 815.29, + "learning_rate": 1.441365160433844e-07, + "loss": 0.0796, + "step": 277200 + }, + { + "epoch": 815.59, + "learning_rate": 1.428868832189112e-07, + "loss": 0.0825, + "step": 277300 + }, + { + "epoch": 815.88, + "learning_rate": 1.4164261250231014e-07, + "loss": 0.0797, + "step": 277400 + }, + { + "epoch": 816.18, + "learning_rate": 1.4040370526721802e-07, + "loss": 0.0785, + "step": 277500 + }, + { + "epoch": 816.47, + "learning_rate": 1.391701628813519e-07, + "loss": 0.0773, + "step": 277600 + }, + { + "epoch": 816.76, + "learning_rate": 1.3794198670650572e-07, + "loss": 0.0803, + "step": 277700 + }, + { + "epoch": 817.06, + "learning_rate": 1.3671917809854996e-07, + "loss": 0.0822, + "step": 277800 + }, + { + "epoch": 817.35, + "learning_rate": 1.3550173840742753e-07, + "loss": 0.0765, + "step": 277900 + }, + { + "epoch": 817.65, + "learning_rate": 1.3428966897715667e-07, + "loss": 0.0767, + "step": 278000 + }, + { + "epoch": 817.65, + "eval_cer": 0.06952617584237827, + "eval_loss": 0.5717321038246155, + "eval_runtime": 5.4079, + "eval_samples_per_second": 66.384, + "eval_steps_per_second": 2.219, + "eval_wer": 0.2616475898758665, + "step": 278000 + }, + { + "epoch": 817.94, + "learning_rate": 1.3308297114582535e-07, + "loss": 0.0783, + "step": 278100 + }, + { + "epoch": 818.24, + "learning_rate": 1.3188164624559186e-07, + "loss": 0.0811, + "step": 278200 + }, + { + "epoch": 818.53, + "learning_rate": 1.3068569560268307e-07, + "loss": 0.0802, + "step": 278300 + }, + { + "epoch": 818.82, + "learning_rate": 1.2949512053739232e-07, + "loss": 0.0773, + "step": 278400 + }, + { + "epoch": 819.12, + "learning_rate": 1.2830992236408046e-07, + "loss": 0.0809, + "step": 278500 + }, + { + "epoch": 819.41, + "learning_rate": 1.2713010239116919e-07, + "loss": 0.0787, + "step": 278600 + }, + { + "epoch": 819.71, + "learning_rate": 1.259556619211455e-07, + "loss": 0.0758, + "step": 278700 + }, + { + "epoch": 820.0, + "learning_rate": 1.2478660225055616e-07, + "loss": 0.0862, + "step": 278800 + }, + { + "epoch": 820.29, + "learning_rate": 1.2362292467000882e-07, + "loss": 0.082, + "step": 278900 + }, + { + "epoch": 820.59, + "learning_rate": 1.2246463046416745e-07, + "loss": 0.0772, + "step": 279000 + }, + { + "epoch": 820.59, + "eval_cer": 0.06956976592127631, + "eval_loss": 0.5717667937278748, + "eval_runtime": 4.7601, + "eval_samples_per_second": 75.419, + "eval_steps_per_second": 2.521, + "eval_wer": 0.26148637755924553, + "step": 279000 + }, + { + "epoch": 820.88, + "learning_rate": 1.213117209117559e-07, + "loss": 0.0759, + "step": 279100 + }, + { + "epoch": 821.18, + "learning_rate": 1.2016419728555108e-07, + "loss": 0.0848, + "step": 279200 + }, + { + "epoch": 821.47, + "learning_rate": 1.1902206085238455e-07, + "loss": 0.0821, + "step": 279300 + }, + { + "epoch": 821.76, + "learning_rate": 1.1788531287314109e-07, + "loss": 0.0835, + "step": 279400 + }, + { + "epoch": 822.06, + "learning_rate": 1.1675395460275629e-07, + "loss": 0.083, + "step": 279500 + }, + { + "epoch": 822.35, + "learning_rate": 1.1562798729021662e-07, + "loss": 0.0793, + "step": 279600 + }, + { + "epoch": 822.65, + "learning_rate": 1.145074121785561e-07, + "loss": 0.083, + "step": 279700 + }, + { + "epoch": 822.94, + "learning_rate": 1.133922305048557e-07, + "loss": 0.0792, + "step": 279800 + }, + { + "epoch": 823.24, + "learning_rate": 1.1228244350024342e-07, + "loss": 0.0836, + "step": 279900 + }, + { + "epoch": 823.53, + "learning_rate": 1.1118906958730913e-07, + "loss": 0.0755, + "step": 280000 + }, + { + "epoch": 823.53, + "eval_cer": 0.06961335600017436, + "eval_loss": 0.5713757872581482, + "eval_runtime": 4.7516, + "eval_samples_per_second": 75.554, + "eval_steps_per_second": 2.525, + "eval_wer": 0.26132516524262456, + "step": 280000 + }, + { + "epoch": 823.82, + "learning_rate": 1.1009002161327942e-07, + "loss": 0.0798, + "step": 280100 + }, + { + "epoch": 824.12, + "learning_rate": 1.0899637195387892e-07, + "loss": 0.0788, + "step": 280200 + }, + { + "epoch": 824.41, + "learning_rate": 1.0790812181646183e-07, + "loss": 0.0808, + "step": 280300 + }, + { + "epoch": 824.71, + "learning_rate": 1.0682527240242435e-07, + "loss": 0.082, + "step": 280400 + }, + { + "epoch": 825.0, + "learning_rate": 1.0574782490720082e-07, + "loss": 0.0784, + "step": 280500 + }, + { + "epoch": 825.29, + "learning_rate": 1.0467578052026029e-07, + "loss": 0.0791, + "step": 280600 + }, + { + "epoch": 825.59, + "learning_rate": 1.0360914042510883e-07, + "loss": 0.0805, + "step": 280700 + }, + { + "epoch": 825.88, + "learning_rate": 1.0254790579928398e-07, + "loss": 0.0806, + "step": 280800 + }, + { + "epoch": 826.18, + "learning_rate": 1.0149207781435689e-07, + "loss": 0.0811, + "step": 280900 + }, + { + "epoch": 826.47, + "learning_rate": 1.0044165763593183e-07, + "loss": 0.077, + "step": 281000 + }, + { + "epoch": 826.47, + "eval_cer": 0.06956976592127631, + "eval_loss": 0.5718855857849121, + "eval_runtime": 4.6002, + "eval_samples_per_second": 78.04, + "eval_steps_per_second": 2.609, + "eval_wer": 0.2616475898758665, + "step": 281000 + }, + { + "epoch": 826.76, + "learning_rate": 9.940706975758773e-08, + "loss": 0.084, + "step": 281100 + }, + { + "epoch": 827.06, + "learning_rate": 9.836741455820143e-08, + "loss": 0.0778, + "step": 281200 + }, + { + "epoch": 827.35, + "learning_rate": 9.733317061485114e-08, + "loss": 0.0797, + "step": 281300 + }, + { + "epoch": 827.65, + "learning_rate": 9.630433906931135e-08, + "loss": 0.079, + "step": 281400 + }, + { + "epoch": 827.94, + "learning_rate": 9.528092105738129e-08, + "loss": 0.0846, + "step": 281500 + }, + { + "epoch": 828.24, + "learning_rate": 9.42629177088844e-08, + "loss": 0.0845, + "step": 281600 + }, + { + "epoch": 828.53, + "learning_rate": 9.325033014766505e-08, + "loss": 0.0766, + "step": 281700 + }, + { + "epoch": 828.82, + "learning_rate": 9.224315949158957e-08, + "loss": 0.0807, + "step": 281800 + }, + { + "epoch": 829.12, + "learning_rate": 9.124140685254579e-08, + "loss": 0.0794, + "step": 281900 + }, + { + "epoch": 829.41, + "learning_rate": 9.024507333643684e-08, + "loss": 0.0866, + "step": 282000 + }, + { + "epoch": 829.41, + "eval_cer": 0.06961335600017436, + "eval_loss": 0.5701565742492676, + "eval_runtime": 4.6728, + "eval_samples_per_second": 76.828, + "eval_steps_per_second": 2.568, + "eval_wer": 0.26116395292600353, + "step": 282000 + }, + { + "epoch": 829.71, + "learning_rate": 8.925416004318732e-08, + "loss": 0.0794, + "step": 282100 + }, + { + "epoch": 830.0, + "learning_rate": 8.826866806673329e-08, + "loss": 0.0786, + "step": 282200 + }, + { + "epoch": 830.29, + "learning_rate": 8.728859849503057e-08, + "loss": 0.0817, + "step": 282300 + }, + { + "epoch": 830.59, + "learning_rate": 8.631395241004592e-08, + "loss": 0.078, + "step": 282400 + }, + { + "epoch": 830.88, + "learning_rate": 8.534473088775919e-08, + "loss": 0.0766, + "step": 282500 + }, + { + "epoch": 831.18, + "learning_rate": 8.43809349981628e-08, + "loss": 0.0789, + "step": 282600 + }, + { + "epoch": 831.47, + "learning_rate": 8.342256580525842e-08, + "loss": 0.0821, + "step": 282700 + }, + { + "epoch": 831.76, + "learning_rate": 8.246962436705642e-08, + "loss": 0.082, + "step": 282800 + }, + { + "epoch": 832.06, + "learning_rate": 8.152211173557634e-08, + "loss": 0.0807, + "step": 282900 + }, + { + "epoch": 832.35, + "learning_rate": 8.05800289568437e-08, + "loss": 0.0791, + "step": 283000 + }, + { + "epoch": 832.35, + "eval_cer": 0.0696569460790724, + "eval_loss": 0.5718459486961365, + "eval_runtime": 4.5798, + "eval_samples_per_second": 78.388, + "eval_steps_per_second": 2.62, + "eval_wer": 0.26132516524262456, + "step": 283000 + }, + { + "epoch": 832.65, + "learning_rate": 7.964337707088987e-08, + "loss": 0.0784, + "step": 283100 + }, + { + "epoch": 832.94, + "learning_rate": 7.871215711174995e-08, + "loss": 0.0832, + "step": 283200 + }, + { + "epoch": 833.24, + "learning_rate": 7.778637010746437e-08, + "loss": 0.0796, + "step": 283300 + }, + { + "epoch": 833.53, + "learning_rate": 7.686601708007224e-08, + "loss": 0.0785, + "step": 283400 + }, + { + "epoch": 833.82, + "learning_rate": 7.595109904561748e-08, + "loss": 0.0768, + "step": 283500 + }, + { + "epoch": 834.12, + "learning_rate": 7.504161701414159e-08, + "loss": 0.079, + "step": 283600 + }, + { + "epoch": 834.41, + "learning_rate": 7.413757198968585e-08, + "loss": 0.0769, + "step": 283700 + }, + { + "epoch": 834.71, + "learning_rate": 7.32389649702897e-08, + "loss": 0.0797, + "step": 283800 + }, + { + "epoch": 835.0, + "learning_rate": 7.234579694798627e-08, + "loss": 0.0799, + "step": 283900 + }, + { + "epoch": 835.29, + "learning_rate": 7.145806890880846e-08, + "loss": 0.0781, + "step": 284000 + }, + { + "epoch": 835.29, + "eval_cer": 0.06974412623686849, + "eval_loss": 0.5719029307365417, + "eval_runtime": 4.7885, + "eval_samples_per_second": 74.971, + "eval_steps_per_second": 2.506, + "eval_wer": 0.26132516524262456, + "step": 284000 + }, + { + "epoch": 835.59, + "learning_rate": 7.057578183278069e-08, + "loss": 0.082, + "step": 284100 + }, + { + "epoch": 835.88, + "learning_rate": 6.969893669392213e-08, + "loss": 0.0802, + "step": 284200 + }, + { + "epoch": 836.18, + "learning_rate": 6.882753446024293e-08, + "loss": 0.0807, + "step": 284300 + }, + { + "epoch": 836.47, + "learning_rate": 6.79615760937452e-08, + "loss": 0.0803, + "step": 284400 + }, + { + "epoch": 836.76, + "learning_rate": 6.710106255042148e-08, + "loss": 0.0816, + "step": 284500 + }, + { + "epoch": 837.06, + "learning_rate": 6.624599478025295e-08, + "loss": 0.08, + "step": 284600 + }, + { + "epoch": 837.35, + "learning_rate": 6.539637372720897e-08, + "loss": 0.0793, + "step": 284700 + }, + { + "epoch": 837.65, + "learning_rate": 6.455220032924592e-08, + "loss": 0.0759, + "step": 284800 + }, + { + "epoch": 837.94, + "learning_rate": 6.371347551830498e-08, + "loss": 0.0752, + "step": 284900 + }, + { + "epoch": 838.24, + "learning_rate": 6.288020022031494e-08, + "loss": 0.0821, + "step": 285000 + }, + { + "epoch": 838.24, + "eval_cer": 0.06952617584237827, + "eval_loss": 0.5715811252593994, + "eval_runtime": 4.9425, + "eval_samples_per_second": 72.635, + "eval_steps_per_second": 2.428, + "eval_wer": 0.26148637755924553, + "step": 285000 + }, + { + "epoch": 838.53, + "learning_rate": 6.20523753551855e-08, + "loss": 0.0799, + "step": 285100 + }, + { + "epoch": 838.82, + "learning_rate": 6.123000183681116e-08, + "loss": 0.0764, + "step": 285200 + }, + { + "epoch": 839.12, + "learning_rate": 6.041308057306793e-08, + "loss": 0.0788, + "step": 285300 + }, + { + "epoch": 839.41, + "learning_rate": 5.96016124658122e-08, + "loss": 0.0789, + "step": 285400 + }, + { + "epoch": 839.71, + "learning_rate": 5.879559841088067e-08, + "loss": 0.0771, + "step": 285500 + }, + { + "epoch": 840.0, + "learning_rate": 5.799503929808825e-08, + "loss": 0.076, + "step": 285600 + }, + { + "epoch": 840.29, + "learning_rate": 5.7199936011229085e-08, + "loss": 0.0809, + "step": 285700 + }, + { + "epoch": 840.59, + "learning_rate": 5.6410289428073805e-08, + "loss": 0.0825, + "step": 285800 + }, + { + "epoch": 840.88, + "learning_rate": 5.5626100420367314e-08, + "loss": 0.0801, + "step": 285900 + }, + { + "epoch": 841.18, + "learning_rate": 5.484736985383155e-08, + "loss": 0.0794, + "step": 286000 + }, + { + "epoch": 841.18, + "eval_cer": 0.06943899568458219, + "eval_loss": 0.5725530385971069, + "eval_runtime": 4.3327, + "eval_samples_per_second": 82.858, + "eval_steps_per_second": 2.77, + "eval_wer": 0.2616475898758665, + "step": 286000 + }, + { + "epoch": 841.47, + "learning_rate": 5.407409858816215e-08, + "loss": 0.0761, + "step": 286100 + }, + { + "epoch": 841.76, + "learning_rate": 5.330628747702682e-08, + "loss": 0.0813, + "step": 286200 + }, + { + "epoch": 842.06, + "learning_rate": 5.254393736806696e-08, + "loss": 0.0746, + "step": 286300 + }, + { + "epoch": 842.35, + "learning_rate": 5.1787049102893226e-08, + "loss": 0.0787, + "step": 286400 + }, + { + "epoch": 842.65, + "learning_rate": 5.103562351708891e-08, + "loss": 0.0804, + "step": 286500 + }, + { + "epoch": 842.94, + "learning_rate": 5.0289661440203754e-08, + "loss": 0.0821, + "step": 286600 + }, + { + "epoch": 843.24, + "learning_rate": 4.954916369575957e-08, + "loss": 0.077, + "step": 286700 + }, + { + "epoch": 843.53, + "learning_rate": 4.8814131101243e-08, + "loss": 0.0812, + "step": 286800 + }, + { + "epoch": 843.82, + "learning_rate": 4.8084564468107163e-08, + "loss": 0.0793, + "step": 286900 + }, + { + "epoch": 844.12, + "learning_rate": 4.736046460177335e-08, + "loss": 0.084, + "step": 287000 + }, + { + "epoch": 844.12, + "eval_cer": 0.06943899568458219, + "eval_loss": 0.572623610496521, + "eval_runtime": 4.6704, + "eval_samples_per_second": 76.867, + "eval_steps_per_second": 2.569, + "eval_wer": 0.26148637755924553, + "step": 287000 + }, + { + "epoch": 844.41, + "learning_rate": 4.664899155756353e-08, + "loss": 0.0819, + "step": 287100 + }, + { + "epoch": 844.71, + "learning_rate": 4.5935772929447395e-08, + "loss": 0.0836, + "step": 287200 + }, + { + "epoch": 845.0, + "learning_rate": 4.5235073860416254e-08, + "loss": 0.0758, + "step": 287300 + }, + { + "epoch": 845.29, + "learning_rate": 4.453273958858917e-08, + "loss": 0.0788, + "step": 287400 + }, + { + "epoch": 845.59, + "learning_rate": 4.383587600467143e-08, + "loss": 0.0818, + "step": 287500 + }, + { + "epoch": 845.88, + "learning_rate": 4.314448387798098e-08, + "loss": 0.0785, + "step": 287600 + }, + { + "epoch": 846.18, + "learning_rate": 4.245856397179282e-08, + "loss": 0.081, + "step": 287700 + }, + { + "epoch": 846.47, + "learning_rate": 4.1778117043342894e-08, + "loss": 0.0748, + "step": 287800 + }, + { + "epoch": 846.76, + "learning_rate": 4.1103143843823635e-08, + "loss": 0.0754, + "step": 287900 + }, + { + "epoch": 847.06, + "learning_rate": 4.043364511838566e-08, + "loss": 0.0821, + "step": 288000 + }, + { + "epoch": 847.06, + "eval_cer": 0.06970053615797045, + "eval_loss": 0.5727963447570801, + "eval_runtime": 5.4197, + "eval_samples_per_second": 66.24, + "eval_steps_per_second": 2.214, + "eval_wer": 0.2616475898758665, + "step": 288000 + }, + { + "epoch": 847.35, + "learning_rate": 3.976962160613551e-08, + "loss": 0.0784, + "step": 288100 + }, + { + "epoch": 847.65, + "learning_rate": 3.911107404013459e-08, + "loss": 0.0837, + "step": 288200 + }, + { + "epoch": 847.94, + "learning_rate": 3.845800314740133e-08, + "loss": 0.0825, + "step": 288300 + }, + { + "epoch": 848.24, + "learning_rate": 3.78104096489057e-08, + "loss": 0.0807, + "step": 288400 + }, + { + "epoch": 848.53, + "learning_rate": 3.716829425957136e-08, + "loss": 0.0752, + "step": 288500 + }, + { + "epoch": 848.82, + "learning_rate": 3.65316576882746e-08, + "loss": 0.0849, + "step": 288600 + }, + { + "epoch": 849.12, + "learning_rate": 3.590050063784323e-08, + "loss": 0.079, + "step": 288700 + }, + { + "epoch": 849.41, + "learning_rate": 3.527482380505598e-08, + "loss": 0.0771, + "step": 288800 + }, + { + "epoch": 849.71, + "learning_rate": 3.4654627880641446e-08, + "loss": 0.0837, + "step": 288900 + }, + { + "epoch": 850.0, + "learning_rate": 3.403991354927694e-08, + "loss": 0.0781, + "step": 289000 + }, + { + "epoch": 850.0, + "eval_cer": 0.06926463536899002, + "eval_loss": 0.5718810558319092, + "eval_runtime": 4.9265, + "eval_samples_per_second": 72.871, + "eval_steps_per_second": 2.436, + "eval_wer": 0.2605191036595196, + "step": 289000 + }, + { + "epoch": 850.29, + "learning_rate": 3.343068148958906e-08, + "loss": 0.0751, + "step": 289100 + }, + { + "epoch": 850.59, + "learning_rate": 3.2826932374151464e-08, + "loss": 0.0807, + "step": 289200 + }, + { + "epoch": 850.88, + "learning_rate": 3.2228666869486e-08, + "loss": 0.0819, + "step": 289300 + }, + { + "epoch": 851.18, + "learning_rate": 3.163588563605935e-08, + "loss": 0.0802, + "step": 289400 + }, + { + "epoch": 851.47, + "learning_rate": 3.104858932828414e-08, + "loss": 0.0805, + "step": 289500 + }, + { + "epoch": 851.76, + "learning_rate": 3.046677859451841e-08, + "loss": 0.0777, + "step": 289600 + }, + { + "epoch": 852.06, + "learning_rate": 2.989045407706282e-08, + "loss": 0.0806, + "step": 289700 + }, + { + "epoch": 852.35, + "learning_rate": 2.9319616412163966e-08, + "loss": 0.0825, + "step": 289800 + }, + { + "epoch": 852.65, + "learning_rate": 2.8754266230008875e-08, + "loss": 0.0834, + "step": 289900 + }, + { + "epoch": 852.94, + "learning_rate": 2.819440415472663e-08, + "loss": 0.0822, + "step": 290000 + }, + { + "epoch": 852.94, + "eval_cer": 0.06930822544788806, + "eval_loss": 0.572381854057312, + "eval_runtime": 4.9827, + "eval_samples_per_second": 72.05, + "eval_steps_per_second": 2.408, + "eval_wer": 0.26116395292600353, + "step": 290000 + }, + { + "epoch": 853.24, + "learning_rate": 2.7640030804389485e-08, + "loss": 0.0818, + "step": 290100 + }, + { + "epoch": 853.53, + "learning_rate": 2.7091146791007883e-08, + "loss": 0.0835, + "step": 290200 + }, + { + "epoch": 853.82, + "learning_rate": 2.6547752720533782e-08, + "loss": 0.0782, + "step": 290300 + }, + { + "epoch": 854.12, + "learning_rate": 2.6009849192858428e-08, + "loss": 0.0794, + "step": 290400 + }, + { + "epoch": 854.41, + "learning_rate": 2.547743680181125e-08, + "loss": 0.0743, + "step": 290500 + }, + { + "epoch": 854.71, + "learning_rate": 2.4950516135159308e-08, + "loss": 0.0772, + "step": 290600 + }, + { + "epoch": 855.0, + "learning_rate": 2.442908777460673e-08, + "loss": 0.08, + "step": 290700 + }, + { + "epoch": 855.29, + "learning_rate": 2.391315229579638e-08, + "loss": 0.0824, + "step": 290800 + }, + { + "epoch": 855.59, + "learning_rate": 2.3402710268303762e-08, + "loss": 0.083, + "step": 290900 + }, + { + "epoch": 855.88, + "learning_rate": 2.2897762255643108e-08, + "loss": 0.0797, + "step": 291000 + }, + { + "epoch": 855.88, + "eval_cer": 0.06970053615797045, + "eval_loss": 0.5726251006126404, + "eval_runtime": 5.2315, + "eval_samples_per_second": 68.623, + "eval_steps_per_second": 2.294, + "eval_wer": 0.2616475898758665, + "step": 291000 + }, + { + "epoch": 856.18, + "learning_rate": 2.2398308815261283e-08, + "loss": 0.0801, + "step": 291100 + }, + { + "epoch": 856.47, + "learning_rate": 2.1904350498540562e-08, + "loss": 0.0867, + "step": 291200 + }, + { + "epoch": 856.76, + "learning_rate": 2.141588785079529e-08, + "loss": 0.0829, + "step": 291300 + }, + { + "epoch": 857.06, + "learning_rate": 2.093772386768278e-08, + "loss": 0.0784, + "step": 291400 + }, + { + "epoch": 857.35, + "learning_rate": 2.0460199199532904e-08, + "loss": 0.0814, + "step": 291500 + }, + { + "epoch": 857.65, + "learning_rate": 1.9988171794658728e-08, + "loss": 0.0798, + "step": 291600 + }, + { + "epoch": 857.94, + "learning_rate": 1.9521642174164522e-08, + "loss": 0.0799, + "step": 291700 + }, + { + "epoch": 858.24, + "learning_rate": 1.906061085308497e-08, + "loss": 0.0761, + "step": 291800 + }, + { + "epoch": 858.53, + "learning_rate": 1.8605078340385165e-08, + "loss": 0.0898, + "step": 291900 + }, + { + "epoch": 858.82, + "learning_rate": 1.8155045138959494e-08, + "loss": 0.0765, + "step": 292000 + }, + { + "epoch": 858.82, + "eval_cer": 0.06943899568458219, + "eval_loss": 0.5725178122520447, + "eval_runtime": 4.364, + "eval_samples_per_second": 82.263, + "eval_steps_per_second": 2.75, + "eval_wer": 0.2616475898758665, + "step": 292000 + }, + { + "epoch": 859.12, + "learning_rate": 1.7710511745630542e-08, + "loss": 0.0812, + "step": 292100 + }, + { + "epoch": 859.41, + "learning_rate": 1.72714786511502e-08, + "loss": 0.0782, + "step": 292200 + }, + { + "epoch": 859.71, + "learning_rate": 1.6837946340197976e-08, + "loss": 0.0808, + "step": 292300 + }, + { + "epoch": 860.0, + "learning_rate": 1.640991529138103e-08, + "loss": 0.0757, + "step": 292400 + }, + { + "epoch": 860.29, + "learning_rate": 1.5987385977231374e-08, + "loss": 0.0787, + "step": 292500 + }, + { + "epoch": 860.59, + "learning_rate": 1.5570358864210876e-08, + "loss": 0.0807, + "step": 292600 + }, + { + "epoch": 860.88, + "learning_rate": 1.5158834412703493e-08, + "loss": 0.083, + "step": 292700 + }, + { + "epoch": 861.18, + "learning_rate": 1.4756846048477047e-08, + "loss": 0.0832, + "step": 292800 + }, + { + "epoch": 861.47, + "learning_rate": 1.4356273239014007e-08, + "loss": 0.0783, + "step": 292900 + }, + { + "epoch": 861.76, + "learning_rate": 1.396120443137916e-08, + "loss": 0.077, + "step": 293000 + }, + { + "epoch": 861.76, + "eval_cer": 0.06939540560568415, + "eval_loss": 0.5725964903831482, + "eval_runtime": 5.0444, + "eval_samples_per_second": 71.168, + "eval_steps_per_second": 2.379, + "eval_wer": 0.2619700145091085, + "step": 293000 + }, + { + "epoch": 862.06, + "learning_rate": 1.3571640061716407e-08, + "loss": 0.0802, + "step": 293100 + }, + { + "epoch": 862.35, + "learning_rate": 1.3187580560092839e-08, + "loss": 0.0801, + "step": 293200 + }, + { + "epoch": 862.65, + "learning_rate": 1.2809026350498744e-08, + "loss": 0.0786, + "step": 293300 + }, + { + "epoch": 862.94, + "learning_rate": 1.2435977850847048e-08, + "loss": 0.0799, + "step": 293400 + }, + { + "epoch": 863.24, + "learning_rate": 1.2068435472972207e-08, + "loss": 0.0804, + "step": 293500 + }, + { + "epoch": 863.53, + "learning_rate": 1.1706399622629095e-08, + "loss": 0.082, + "step": 293600 + }, + { + "epoch": 863.82, + "learning_rate": 1.134987069949578e-08, + "loss": 0.0772, + "step": 293700 + }, + { + "epoch": 864.12, + "learning_rate": 1.0998849097169085e-08, + "loss": 0.0767, + "step": 293800 + }, + { + "epoch": 864.41, + "learning_rate": 1.0653335203165693e-08, + "loss": 0.0787, + "step": 293900 + }, + { + "epoch": 864.71, + "learning_rate": 1.0313329398923822e-08, + "loss": 0.0803, + "step": 294000 + }, + { + "epoch": 864.71, + "eval_cer": 0.06952617584237827, + "eval_loss": 0.5726108551025391, + "eval_runtime": 4.7362, + "eval_samples_per_second": 75.799, + "eval_steps_per_second": 2.534, + "eval_wer": 0.26132516524262456, + "step": 294000 + }, + { + "epoch": 865.0, + "learning_rate": 9.978832059798216e-09, + "loss": 0.0795, + "step": 294100 + }, + { + "epoch": 865.29, + "learning_rate": 9.649843555065708e-09, + "loss": 0.0814, + "step": 294200 + }, + { + "epoch": 865.59, + "learning_rate": 9.326364247918552e-09, + "loss": 0.0837, + "step": 294300 + }, + { + "epoch": 865.88, + "learning_rate": 9.00839449546831e-09, + "loss": 0.0812, + "step": 294400 + }, + { + "epoch": 866.18, + "learning_rate": 8.695934648744742e-09, + "loss": 0.0783, + "step": 294500 + }, + { + "epoch": 866.47, + "learning_rate": 8.392027271795777e-09, + "loss": 0.0805, + "step": 294600 + }, + { + "epoch": 866.76, + "learning_rate": 8.090533157728008e-09, + "loss": 0.0813, + "step": 294700 + }, + { + "epoch": 867.06, + "learning_rate": 7.794549962677479e-09, + "loss": 0.0824, + "step": 294800 + }, + { + "epoch": 867.35, + "learning_rate": 7.504078013402249e-09, + "loss": 0.0781, + "step": 294900 + }, + { + "epoch": 867.65, + "learning_rate": 7.219117630573036e-09, + "loss": 0.0826, + "step": 295000 + }, + { + "epoch": 867.65, + "eval_cer": 0.06952617584237827, + "eval_loss": 0.5726599097251892, + "eval_runtime": 4.9613, + "eval_samples_per_second": 72.36, + "eval_steps_per_second": 2.419, + "eval_wer": 0.26148637755924553, + "step": 295000 + }, + { + "epoch": 867.94, + "learning_rate": 6.9396691287787476e-09, + "loss": 0.0856, + "step": 295100 + }, + { + "epoch": 868.24, + "learning_rate": 6.6657328165214975e-09, + "loss": 0.0786, + "step": 295200 + }, + { + "epoch": 868.53, + "learning_rate": 6.397308996219375e-09, + "loss": 0.0779, + "step": 295300 + }, + { + "epoch": 868.82, + "learning_rate": 6.1343979642042305e-09, + "loss": 0.0753, + "step": 295400 + }, + { + "epoch": 869.12, + "learning_rate": 5.877000010721667e-09, + "loss": 0.079, + "step": 295500 + }, + { + "epoch": 869.41, + "learning_rate": 5.625115419931049e-09, + "loss": 0.0804, + "step": 295600 + }, + { + "epoch": 869.71, + "learning_rate": 5.3787444699060495e-09, + "loss": 0.0796, + "step": 295700 + }, + { + "epoch": 870.0, + "learning_rate": 5.137887432632438e-09, + "loss": 0.075, + "step": 295800 + }, + { + "epoch": 870.29, + "learning_rate": 4.9025445740097375e-09, + "loss": 0.0784, + "step": 295900 + }, + { + "epoch": 870.59, + "learning_rate": 4.672716153849011e-09, + "loss": 0.078, + "step": 296000 + }, + { + "epoch": 870.59, + "eval_cer": 0.06978771631576654, + "eval_loss": 0.5726059079170227, + "eval_runtime": 4.7666, + "eval_samples_per_second": 75.316, + "eval_steps_per_second": 2.518, + "eval_wer": 0.2616475898758665, + "step": 296000 + }, + { + "epoch": 870.88, + "learning_rate": 4.448402425873965e-09, + "loss": 0.0806, + "step": 296100 + }, + { + "epoch": 871.18, + "learning_rate": 4.229603637720403e-09, + "loss": 0.0785, + "step": 296200 + }, + { + "epoch": 871.47, + "learning_rate": 4.016320030935106e-09, + "loss": 0.0823, + "step": 296300 + }, + { + "epoch": 871.76, + "learning_rate": 3.808551840978058e-09, + "loss": 0.0789, + "step": 296400 + }, + { + "epoch": 872.06, + "learning_rate": 3.6062992972180076e-09, + "loss": 0.0848, + "step": 296500 + }, + { + "epoch": 872.35, + "learning_rate": 3.4095626229357914e-09, + "loss": 0.0795, + "step": 296600 + }, + { + "epoch": 872.65, + "learning_rate": 3.218342035323785e-09, + "loss": 0.0794, + "step": 296700 + }, + { + "epoch": 872.94, + "learning_rate": 3.0326377454825695e-09, + "loss": 0.0772, + "step": 296800 + }, + { + "epoch": 873.24, + "learning_rate": 2.852449958424819e-09, + "loss": 0.0818, + "step": 296900 + }, + { + "epoch": 873.53, + "learning_rate": 2.677778873072523e-09, + "loss": 0.0795, + "step": 297000 + }, + { + "epoch": 873.53, + "eval_cer": 0.06948258576348024, + "eval_loss": 0.5727548599243164, + "eval_runtime": 5.1786, + "eval_samples_per_second": 69.324, + "eval_steps_per_second": 2.317, + "eval_wer": 0.26180880219248753, + "step": 297000 + }, + { + "epoch": 873.82, + "learning_rate": 2.508624682256988e-09, + "loss": 0.0838, + "step": 297100 + }, + { + "epoch": 874.12, + "learning_rate": 2.3449875727199476e-09, + "loss": 0.0769, + "step": 297200 + }, + { + "epoch": 874.41, + "learning_rate": 2.1868677251113414e-09, + "loss": 0.0778, + "step": 297300 + }, + { + "epoch": 874.71, + "learning_rate": 2.0342653139904246e-09, + "loss": 0.0827, + "step": 297400 + }, + { + "epoch": 875.0, + "learning_rate": 1.88718050782688e-09, + "loss": 0.0773, + "step": 297500 + }, + { + "epoch": 875.29, + "learning_rate": 1.7456134689969317e-09, + "loss": 0.0825, + "step": 297600 + }, + { + "epoch": 875.59, + "learning_rate": 1.6095643537872296e-09, + "loss": 0.0776, + "step": 297700 + }, + { + "epoch": 875.88, + "learning_rate": 1.479033312390965e-09, + "loss": 0.0765, + "step": 297800 + }, + { + "epoch": 876.18, + "learning_rate": 1.3540204889106457e-09, + "loss": 0.0739, + "step": 297900 + }, + { + "epoch": 876.47, + "learning_rate": 1.235693649733194e-09, + "loss": 0.0792, + "step": 298000 + }, + { + "epoch": 876.47, + "eval_cer": 0.06943899568458219, + "eval_loss": 0.5723451972007751, + "eval_runtime": 5.0657, + "eval_samples_per_second": 70.869, + "eval_steps_per_second": 2.369, + "eval_wer": 0.26148637755924553, + "step": 298000 + }, + { + "epoch": 876.76, + "learning_rate": 1.1216624845133972e-09, + "loss": 0.084, + "step": 298100 + }, + { + "epoch": 877.06, + "learning_rate": 1.0131499317367344e-09, + "loss": 0.0804, + "step": 298200 + }, + { + "epoch": 877.35, + "learning_rate": 9.101561111979351e-10, + "loss": 0.0799, + "step": 298300 + }, + { + "epoch": 877.65, + "learning_rate": 8.126811365982701e-10, + "loss": 0.0856, + "step": 298400 + }, + { + "epoch": 877.94, + "learning_rate": 7.207251155483264e-10, + "loss": 0.0837, + "step": 298500 + }, + { + "epoch": 878.24, + "learning_rate": 6.342881495641217e-10, + "loss": 0.0811, + "step": 298600 + }, + { + "epoch": 878.53, + "learning_rate": 5.533703340693253e-10, + "loss": 0.0792, + "step": 298700 + }, + { + "epoch": 878.82, + "learning_rate": 4.77971758395257e-10, + "loss": 0.0818, + "step": 298800 + }, + { + "epoch": 879.12, + "learning_rate": 4.0809250577977797e-10, + "loss": 0.0848, + "step": 298900 + }, + { + "epoch": 879.41, + "learning_rate": 3.4373265336673514e-10, + "loss": 0.083, + "step": 299000 + }, + { + "epoch": 879.41, + "eval_cer": 0.06974412623686849, + "eval_loss": 0.5728374123573303, + "eval_runtime": 4.2557, + "eval_samples_per_second": 84.357, + "eval_steps_per_second": 2.82, + "eval_wer": 0.2621312268257295, + "step": 299000 + }, + { + "epoch": 879.71, + "learning_rate": 2.848922722081815e-10, + "loss": 0.0856, + "step": 299100 + }, + { + "epoch": 880.0, + "learning_rate": 2.315714272621561e-10, + "loss": 0.0794, + "step": 299200 + }, + { + "epoch": 880.29, + "learning_rate": 1.8377017739323876e-10, + "loss": 0.0758, + "step": 299300 + }, + { + "epoch": 880.59, + "learning_rate": 1.4148857537199522e-10, + "loss": 0.0836, + "step": 299400 + }, + { + "epoch": 880.88, + "learning_rate": 1.0472666787664232e-10, + "loss": 0.0777, + "step": 299500 + }, + { + "epoch": 881.18, + "learning_rate": 7.348449549082759e-11, + "loss": 0.0828, + "step": 299600 + }, + { + "epoch": 881.47, + "learning_rate": 4.7762092705294636e-11, + "loss": 0.0778, + "step": 299700 + }, + { + "epoch": 881.76, + "learning_rate": 2.7559487917327988e-11, + "loss": 0.078, + "step": 299800 + }, + { + "epoch": 882.06, + "learning_rate": 1.2876703428532644e-11, + "loss": 0.0842, + "step": 299900 + }, + { + "epoch": 882.35, + "learning_rate": 3.713755449830103e-12, + "loss": 0.0753, + "step": 300000 + }, + { + "epoch": 882.35, + "eval_cer": 0.0693518155267861, + "eval_loss": 0.5725403428077698, + "eval_runtime": 5.1749, + "eval_samples_per_second": 69.373, + "eval_steps_per_second": 2.319, + "eval_wer": 0.26116395292600353, + "step": 300000 + } + ], + "max_steps": 300000, + "num_train_epochs": 883, + "total_flos": 4.30858254034925e+21, + "trial_name": null, + "trial_params": null +}